2021-06-10 08:39:33 -04:00
|
|
|
/* This is a small program used in order to understand the collision rate
 * of CRC64 (ISO version) VS other stronger hashing functions in the context
 * of hashing keys for the Redis "tracking" feature (client side caching
 * assisted by the server).
 *
 * The program attempts to hash keys with common names in the form of
 *
 *  prefix:<counter>
 *
 * And counts the resulting collisions generated in the 24 bits of output
 * needed for the tracking feature invalidation table (16+ million entries).
 *
 * Compile with:
 *
 *  cc -O2 ./tracking_collisions.c ../src/crc64.c ../src/sha1.c
 *  ./a.out
 *
 * --------------------------------------------------------------------------
 *
 * Copyright (C) 2019 Salvatore Sanfilippo
 * This code is released under the BSD 2 clause license.
 */
|
|
|
|
|
|
|
|
#include <stdlib.h>
|
|
|
|
#include <stdint.h>
|
|
|
|
#include <string.h>
|
|
|
|
#include <stdio.h>
|
2019-08-02 14:24:27 -04:00
|
|
|
#include "../src/crc64.h"
|
|
|
|
#include "../src/sha1.h"
|
2019-08-02 14:13:16 -04:00
|
|
|
|
|
|
|
/* Number of buckets in the collision table: 2^24, i.e. one bucket for every
 * possible value of the 24 bits of hash output under test. */
#define TABLE_SIZE (1<<24)
|
|
|
|
/* Bucket occupancy flags, indexed by the hash value modulo TABLE_SIZE:
 * zero means no key mapped to the bucket so far, non-zero means the bucket
 * was already hit by a previous key. */
int Table[TABLE_SIZE];
|
|
|
|
|
2019-08-02 14:24:27 -04:00
|
|
|
/* Hashing callback based on crc64(): hash the 'len' bytes at 'key', passing
 * 0 as the first argument of crc64(), and return the 64 bit result. */
uint64_t crc64Hash(char *key, size_t len) {
    unsigned char *bytes = (unsigned char*)key;
    uint64_t digest = crc64(0,bytes,len);

    return digest;
}
|
|
|
|
|
|
|
|
uint64_t sha1Hash(char *key, size_t len) {
|
|
|
|
SHA1_CTX ctx;
|
|
|
|
unsigned char hash[20];
|
|
|
|
|
|
|
|
SHA1Init(&ctx);
|
|
|
|
SHA1Update(&ctx,(unsigned char*)key,len);
|
|
|
|
SHA1Final(hash,&ctx);
|
|
|
|
uint64_t hash64;
|
|
|
|
memcpy(&hash64,hash,sizeof(hash64));
|
|
|
|
return hash64;
|
|
|
|
}
|
|
|
|
|
2019-08-02 14:13:16 -04:00
|
|
|
/* Test the hashing function provided as callback and return the
|
|
|
|
* number of collisions found. */
|
|
|
|
unsigned long testHashingFunction(uint64_t (*hash)(char *, size_t)) {
|
|
|
|
unsigned long collisions = 0;
|
|
|
|
memset(Table,0,sizeof(Table));
|
|
|
|
char *prefixes[] = {"object", "message", "user", NULL};
|
2019-08-02 14:24:27 -04:00
|
|
|
for (int i = 0; prefixes[i] != NULL; i++) {
|
|
|
|
for (int j = 0; j < TABLE_SIZE/2; j++) {
|
|
|
|
char keyname[128];
|
|
|
|
size_t keylen = snprintf(keyname,sizeof(keyname),"%s:%d",
|
|
|
|
prefixes[i],j);
|
|
|
|
uint64_t bucket = hash(keyname,keylen) % TABLE_SIZE;
|
|
|
|
if (Table[bucket]) {
|
|
|
|
collisions++;
|
|
|
|
} else {
|
|
|
|
Table[bucket] = 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2019-08-02 14:13:16 -04:00
|
|
|
return collisions;
|
|
|
|
}
|
|
|
|
|
|
|
|
int main(void) {
|
|
|
|
printf("SHA1 : %lu\n", testHashingFunction(sha1Hash));
|
|
|
|
printf("CRC64: %lu\n", testHashingFunction(crc64Hash));
|
|
|
|
return 0;
|
|
|
|
}
|