/* Test harness for comparing candidate checksum/hash functions.

   Reads "GuestBytes" records from stdin, and for each record flips
   every single bit of the payload in turn, re-hashes, and reports how
   many bits of the hash changed relative to the unmodified payload.

   NOTE(review): the header names on the #include lines were missing
   from the text under review; the three below are the ones this code
   needs (assert, FILE/printf/fscanf, malloc/free). */

#include <assert.h>
#include <stdio.h>
#include <stdlib.h>

typedef  signed int              Int;
typedef  unsigned int            UInt;
typedef  unsigned long long int  Addr64;
typedef  unsigned char           UChar;
typedef  unsigned long int       UWord;

/* Rotate the 32-bit value |x| left by |n| bits.  The count is reduced
   mod 32 first and must then be nonzero, since a shift by 32 in the
   expression below would be undefined behaviour. */
static inline UInt ROL32 ( UInt x, UInt n )
{
   n &= 31;
   assert(n != 0);
   x = (x << n) | (x >> (32-n));
   return x;
}

//////////////////////////////////////////////////////////

/* One record read from the input. */
typedef
   struct {
      Addr64 ga;      /* address field of the record (first header value) */
      Int    nbytes;  /* number of payload bytes */
      UChar* bytes;   /* start of the malloc'd buffer; this is what gets freed */
      UChar* actual;  /* payload; == bytes + (ga & 3) */
   }
   GuestBytes;

/* Read one record from |f|.  The layout, as given by the fscanf
   formats below, is:

      GuestBytes <hex ga> <decimal nbytes> <nbytes hex bytes> <hex checksum>

   The checksum is verified against csum = (csum << 1) ^ byte, folded
   over the payload bytes in order.

   Returns a freshly allocated record (caller frees ->bytes and then
   the record itself), or NULL if the stream is already at EOF or
   there is no further input.  Malformed input trips an assertion. */
GuestBytes* read_one ( FILE* f )
{
   Int         r;
   UInt        i;
   UInt        esum, csum;
   UInt        misalign;
   Addr64      ga     = 0;
   Int         nbytes = 0;
   GuestBytes* gb;

   /* Check for EOF before allocating anything, so the NULL return
      path cannot leak. */
   if (feof(f))
      return NULL;
   assert(!ferror(f));

   r = fscanf(f, "GuestBytes %llx %d ", &ga, &nbytes);
   if (0) printf("r = %d\n", r);
   /* Clean end of input (eg, an empty file): nothing more to read. */
   if (r == EOF && !ferror(f))
      return NULL;
   assert(r == 2);

   assert(ga != 0);
   assert(nbytes > 0);
   assert(nbytes < 5000); // let's say

   gb = malloc(sizeof *gb);
   assert(gb);
   gb->ga     = ga;
   gb->nbytes = nbytes;

   /* Offset the payload within the buffer by the low two bits of ga.
      Presumably this is so the hash functions see the same 4-byte
      (mis)alignment as the original address. */
   misalign  = (UInt)(ga & 3);
   gb->bytes = malloc((size_t)nbytes + misalign);
   assert(gb->bytes);
   gb->actual = gb->bytes + misalign;

   csum = 0;
   for (i = 0; i < (UInt)nbytes; i++) {
      UInt b;
      r = fscanf(f, "%02x ", &b);
      assert(r == 1);
      gb->actual[i] = (UChar)b;
      csum = (csum << 1) ^ b;
   }

   r = fscanf(f, " %08x\n", &esum);
   assert(r == 1);
   assert(esum == csum);

   return gb;
}

//////////////////////////////////////////////////////////

/* Read records from |f| until the input is exhausted, calling
   fn(record, opaque) on each one and freeing the record afterwards. */
void apply_to_all ( FILE* f,
                    void(*fn)( GuestBytes*, void* ),
                    void* opaque )
{
   GuestBytes* gb;
   while ((gb = read_one(f)) != NULL) {
      if (0) printf("got %llu %d\n", gb->ga, gb->nbytes);
      fn( gb, opaque );
      free(gb->bytes);
      free(gb);
   }
}

//////////////////////////////////////////////////////////

/* Hash candidates.  Each maps the payload gb->actual[0 .. nbytes-1]
   to a 32-bit value. */

/* Always returns zero. */
UInt hash_const_zero ( GuestBytes* gb )
{
   (void)gb;
   return 0;
}

/* Plain sum of the payload bytes. */
UInt hash_sum ( GuestBytes* gb )
{
   UInt i, sum = 0;
   for (i = 0; i < (UInt)gb->nbytes; i++)
      sum += (UInt)gb->actual[i];
   return sum;
}

/* XOR each byte in, then rotate left by 7. */
UInt hash_rol ( GuestBytes* gb )
{
   UInt i, sum = 0;
   for (i = 0; i < (UInt)gb->nbytes; i++) {
      sum ^= (UInt)gb->actual[i];
      sum = ROL32(sum,7);
   }
   return sum;
}

/* Word-at-a-time XOR/rotate hash: leading bytes up to 4-alignment are
   shifted in, aligned words are mixed with rotate-by-13, trailing
   bytes with rotate-by-19. */
static UInt cand0 ( GuestBytes* gb )
{
   UWord addr = (UWord)gb->actual;
   UWord len  = gb->nbytes;
   UInt  sum  = 0;
   /* pull up to 4-alignment */
   while ((addr & 3) != 0 && len >= 1) {
      UChar* p = (UChar*)addr;
      sum = (sum << 8) | (UInt)p[0];
      addr++;
      len--;
   }
   /* vectorised + unrolled */
   while (len >= 16) {
      UInt* p = (UInt*)addr;
      sum = ROL32(sum ^ p[0], 13);
      sum = ROL32(sum ^ p[1], 13);
      sum = ROL32(sum ^ p[2], 13);
      sum = ROL32(sum ^ p[3], 13);
      addr += 16;
      len  -= 16;
   }
   /* vectorised fixup */
   while (len >= 4) {
      UInt* p = (UInt*)addr;
      sum = ROL32(sum ^ p[0], 13);
      addr += 4;
      len  -= 4;
   }
   /* scalar fixup */
   while (len >= 1) {
      UChar* p = (UChar*)addr;
      sum = ROL32(sum ^ (UInt)p[0], 19);
      addr++;
      len--;
   }
   return sum;
}

/* Like cand0 in structure, but keeps two accumulators: sum1 is
   XOR/rotate-by-31, sum2 is a plain running sum that is folded into
   sum1 after each word group.  The result is sum1 + sum2. */
static UInt cand1 ( GuestBytes* gb )
{
   UWord addr = (UWord)gb->actual;
   UWord len  = gb->nbytes;
   UInt  sum1 = 0, sum2 = 0;
   /* pull up to 4-alignment */
   while ((addr & 3) != 0 && len >= 1) {
      UChar* p = (UChar*)addr;
      sum1 = (sum1 << 8) | (UInt)p[0];
      addr++;
      len--;
   }
   /* vectorised + unrolled */
   while (len >= 16) {
      UInt* p = (UInt*)addr;
      UInt  w;
      w = p[0];  sum1 = ROL32(sum1 ^ w, 31);  sum2 += w;
      w = p[1];  sum1 = ROL32(sum1 ^ w, 31);  sum2 += w;
      w = p[2];  sum1 = ROL32(sum1 ^ w, 31);  sum2 += w;
      w = p[3];  sum1 = ROL32(sum1 ^ w, 31);  sum2 += w;
      addr += 16;
      len  -= 16;
      sum1 ^= sum2;
   }
   /* vectorised fixup */
   while (len >= 4) {
      UInt* p = (UInt*)addr;
      UInt  w = p[0];
      sum1 = ROL32(sum1 ^ w, 31);  sum2 += w;
      addr += 4;
      len  -= 4;
      sum1 ^= sum2;
   }
   /* scalar fixup */
   while (len >= 1) {
      UChar* p = (UChar*)addr;
      UInt   w = (UInt)p[0];
      sum1 = ROL32(sum1 ^ w, 31);  sum2 += w;
      addr++;
      len--;
   }
   return sum1 + sum2;
}

/* Adler-32-style pair of running sums (s1 starts at 1, s2 at 0).
   Note there is no modulo reduction here; the sums simply wrap as
   32-bit unsigned values. */
static UInt adler32 ( GuestBytes* gb )
{
   UWord  addr = (UWord)gb->actual;
   UWord  len  = gb->nbytes;
   UInt   s1   = 1;
   UInt   s2   = 0;
   UChar* buf  = (UChar*)addr;
   while (len >= 4) {
      s1 += buf[0];  s2 += s1;
      s1 += buf[1];  s2 += s1;
      s1 += buf[2];  s2 += s1;
      s1 += buf[3];  s2 += s1;
      buf += 4;
      len -= 4;
   }
   while (len > 0) {
      s1 += buf[0];  s2 += s1;
      len--;
      buf++;
   }
   return (s2 << 16) + s1;
}

//////////////////////////////////////////////////////////

/* The hash function under test.  Select a different candidate by
   moving the uncommented line. */
UInt (*theFn)(GuestBytes*) =
  //hash_const_zero;
  //hash_sum;
  //hash_rol;
  //cand0;
  cand1;
  //adler32;

/* Three-way comparison of the UInts pointed to by |p1| and |p2|:
   returns -1, 0 or 1. */
Int cmp_UInt_ps ( UInt* p1, UInt* p2 )
{
   if (*p1 < *p2) return -1;
   if (*p1 > *p2) return 1;
   return 0;
}

/* NOTE(review): in the text under review, everything from the middle
   of nSetBits up to the initialiser of nHashes in try_onebit_changes
   was missing.  The remainder of nSetBits, the three toc_* counters,
   invertBit, and the head of try_onebit_changes below are
   reconstructed from how those names are used in the surviving code.
   Please confirm against the original file. */

/* Number of 1 bits in |w|. */
Int nSetBits ( UInt w )
{
   Int i, j;
   j = 0;
   for (i = 0; i < 32; i++)
      if (w & (1u << i))   /* unsigned constant: 1 << 31 overflows int */
         j++;
   return j;
}

/* Running totals, updated by try_onebit_changes and printed by main. */
Int    toc_nblocks           = 0;    /* records processed */
Int    toc_nblocks_with_zero = 0;    /* records with >= 1 undetected flip */
double toc_sum_of_avgs       = 0.0;  /* sum of per-record average distances */

/* Flip bit |bix| of byte b[ix].  Calling it twice with the same
   arguments restores the original byte. */
void invertBit ( UChar* b, UInt ix, UInt bix )
{
   b[ix] ^= (UChar)(1u << bix);
}

/* Callback for apply_to_all.  For each of the 8 * nbytes single-bit
   flips of the payload, compute theFn and the number of hash bits
   that differ from the hash of the unmodified payload.  Prints a
   per-record summary line and updates the toc_* totals.  |opaque| is
   unused. */
void try_onebit_changes ( GuestBytes* gb, void* opaque )
{
   UInt  hashIx  = 0;
   UInt  nHashes = 8 * gb->nbytes;
   UInt* hashes  = malloc( nHashes * sizeof(UInt) );
   UInt  byteIx, bitIx;
   UInt  hInit, hFinal, hRunning;
   Int   dist, totDist = 0, nNoDist = 0;

   (void)opaque;
   assert(hashes);
   toc_nblocks++;

   hInit = theFn( gb );
   for (byteIx = 0; byteIx < (UInt)gb->nbytes; byteIx++) {
      for (bitIx = 0; bitIx < 8; bitIx++) {

         invertBit(gb->actual, byteIx, bitIx);
         //invertBit(gb->actual, byteIx, bitIx ^ 4);

         hRunning = theFn( gb );

         dist = nSetBits(hRunning ^ hInit);
         totDist += dist;
         /* A distance of zero means this flip went undetected. */
         if (dist == 0) nNoDist++;

         /* Recorded per flip; not examined further in this function. */
         hashes[hashIx++] = hRunning;

         /* Undo the flip so the next iteration starts from the
            original payload. */
         invertBit(gb->actual, byteIx, bitIx);
         //invertBit(gb->actual, byteIx, bitIx ^ 4);

         if (0) printf("  %02u.%u  %08x  %d\n",
                       byteIx, bitIx, hRunning ^ hInit, dist);
      }
   }

   /* Sanity: the payload must be back in its original state. */
   hFinal = theFn( gb );
   assert(hFinal == hInit);
   assert(hashIx == nHashes);

   if (nNoDist > 0)
      printf("%4d measurements,  %5.2f avg dist,  %2d zeroes\n",
             (Int)nHashes, (double)totDist / (double)nHashes, nNoDist);
   else
      printf("%4d measurements,  %5.2f avg dist\n",
             (Int)nHashes, (double)totDist / (double)nHashes);

   if (nNoDist > 0)
      toc_nblocks_with_zero++;

   toc_sum_of_avgs += (double)totDist / (double)nHashes;

   free(hashes);
}

//////////////////////////////////////////////////////////

/* Run the single-bit-flip experiment over every record on stdin and
   print the overall totals. */
int main ( void )
{
   FILE*  f = stdin;
   double avgOfAvgs;

   apply_to_all(f, try_onebit_changes, NULL);

   /* Avoid dividing by zero when the input contained no records. */
   avgOfAvgs = toc_nblocks > 0
                  ? toc_sum_of_avgs / (double)toc_nblocks
                  : 0.0;

   printf("\n%d blocks,  %d with a zero,  %5.2f avg avg\n\n",
          toc_nblocks, toc_nblocks_with_zero, avgOfAvgs );
   return 0;
}

//////////////////////////////////////////////////////////