mirror of
https://codeberg.org/redict/redict.git
synced 2025-01-23 08:38:27 -05:00
Improved bigkeys with progress, pipelining and summary
This commit reworks the redis-cli --bigkeys command to provide more information about our progress as well as output summary information when we're done. - We now show an approximate percentage completion as we go - Hiredis pipelining is used for TYPE and SIZE retreival - A summary of keyspace distribution and overall breakout at the end
This commit is contained in:
parent
8b8c1cd4c2
commit
806788d009
315
src/redis-cli.c
315
src/redis-cli.c
@ -1331,108 +1331,271 @@ static void pipeMode(void) {
|
|||||||
#define TYPE_SET 2
|
#define TYPE_SET 2
|
||||||
#define TYPE_HASH 3
|
#define TYPE_HASH 3
|
||||||
#define TYPE_ZSET 4
|
#define TYPE_ZSET 4
|
||||||
|
#define TYPE_NONE 5
|
||||||
|
|
||||||
static void findBigKeys(void) {
|
static redisReply *sendScan(unsigned long long *it) {
|
||||||
unsigned long long biggest[5] = {0,0,0,0,0};
|
redisReply *reply = redisCommand(context, "SCAN %llu", *it);
|
||||||
unsigned long long samples = 0;
|
|
||||||
redisReply *reply1, *reply2, *reply3 = NULL, *keys;
|
|
||||||
char *key, *sizecmd, *typename[] = {"string","list","set","hash","zset"};
|
|
||||||
char *typeunit[] = {"bytes","items","members","fields","members"};
|
|
||||||
int type, it=0, i;
|
|
||||||
|
|
||||||
printf("\n# Press ctrl+c when you have had enough of it... :)\n");
|
/* Handle any error conditions */
|
||||||
printf("# You can use -i 0.1 to sleep 0.1 sec per 100 SCANS\n");
|
if(reply == NULL) {
|
||||||
printf("# in order to reduce server load (usually not needed).\n\n");
|
|
||||||
|
|
||||||
do {
|
|
||||||
/* Grab some keys with SCAN */
|
|
||||||
reply1 = redisCommand(context, "SCAN %d", it);
|
|
||||||
if(reply1 == NULL) {
|
|
||||||
fprintf(stderr, "\nI/O error\n");
|
fprintf(stderr, "\nI/O error\n");
|
||||||
exit(1);
|
exit(1);
|
||||||
} else if(reply1->type == REDIS_REPLY_ERROR) {
|
} else if(reply->type == REDIS_REPLY_ERROR) {
|
||||||
fprintf(stderr, "SCAN error: %s\n", reply1->str);
|
fprintf(stderr, "SCAN error: %s\n", reply->str);
|
||||||
exit(1);
|
exit(1);
|
||||||
} else if(reply1->type != REDIS_REPLY_ARRAY) {
|
} else if(reply->type != REDIS_REPLY_ARRAY) {
|
||||||
fprintf(stderr, "Non ARRAY response from SCAN!\n");
|
fprintf(stderr, "Non ARRAY response from SCAN!\n");
|
||||||
exit(1);
|
exit(1);
|
||||||
} else if(reply1->elements!=2) {
|
} else if(reply->elements != 2) {
|
||||||
fprintf(stderr, "Invalid SCAN result!\n");
|
fprintf(stderr, "Invalid element count from SCAN!\n");
|
||||||
exit(1);
|
exit(1);
|
||||||
}
|
}
|
||||||
|
|
||||||
/* Validate the SCAN response */
|
/* Validate our types are correct */
|
||||||
assert(reply1->element[0]->type == REDIS_REPLY_STRING);
|
assert(reply->element[0]->type == REDIS_REPLY_STRING);
|
||||||
assert(reply1->element[1]->type == REDIS_REPLY_ARRAY);
|
assert(reply->element[1]->type == REDIS_REPLY_ARRAY);
|
||||||
|
|
||||||
/* Update iterator and grab pointer to keys */
|
/* Update iterator */
|
||||||
it = atoi(reply1->element[0]->str);
|
*it = atoi(reply->element[0]->str);
|
||||||
keys = reply1->element[1];
|
|
||||||
|
|
||||||
/* Iterate keys that SCAN returned */
|
return reply;
|
||||||
for(i=0;i<keys->elements;i++) {
|
}
|
||||||
/* Make sure we've got a string, grab it, and increment samples */
|
|
||||||
assert(keys->element[i]->type == REDIS_REPLY_STRING);
|
|
||||||
key = keys->element[i]->str;
|
|
||||||
samples++;
|
|
||||||
|
|
||||||
/* Get the key type */
|
static int getDbSize(void) {
|
||||||
reply2 = redisCommand(context, "TYPE %s", key);
|
redisReply *reply;
|
||||||
assert(reply2 && reply2->type == REDIS_REPLY_STATUS);
|
int size;
|
||||||
|
|
||||||
/* Get the key "size" */
|
reply = redisCommand(context, "DBSIZE");
|
||||||
if (!strcmp(reply2->str,"string")) {
|
|
||||||
sizecmd = "STRLEN";
|
if(reply == NULL || reply->type != REDIS_REPLY_INTEGER) {
|
||||||
type = TYPE_STRING;
|
fprintf(stderr, "Couldn't determine DBSIZE!\n");
|
||||||
} else if (!strcmp(reply2->str,"list")) {
|
exit(1);
|
||||||
sizecmd = "LLEN";
|
}
|
||||||
type = TYPE_LIST;
|
|
||||||
} else if (!strcmp(reply2->str,"set")) {
|
/* Grab the number of keys and free our reply */
|
||||||
sizecmd = "SCARD";
|
size = reply->integer;
|
||||||
type = TYPE_SET;
|
freeReplyObject(reply);
|
||||||
} else if (!strcmp(reply2->str,"hash")) {
|
|
||||||
sizecmd = "HLEN";
|
return size;
|
||||||
type = TYPE_HASH;
|
}
|
||||||
} else if (!strcmp(reply2->str,"zset")) {
|
|
||||||
sizecmd = "ZCARD";
|
static int toIntType(char *key, char *type) {
|
||||||
type = TYPE_ZSET;
|
if(!strcmp(type, "string")) {
|
||||||
} else if (!strcmp(reply2->str,"none")) {
|
return TYPE_STRING;
|
||||||
freeReplyObject(reply1);
|
} else if(!strcmp(type, "list")) {
|
||||||
freeReplyObject(reply2);
|
return TYPE_LIST;
|
||||||
continue;
|
} else if(!strcmp(type, "set")) {
|
||||||
|
return TYPE_SET;
|
||||||
|
} else if(!strcmp(type, "hash")) {
|
||||||
|
return TYPE_HASH;
|
||||||
|
} else if(!strcmp(type, "zset")) {
|
||||||
|
return TYPE_ZSET;
|
||||||
|
} else if(!strcmp(type, "none")) {
|
||||||
|
return TYPE_NONE;
|
||||||
} else {
|
} else {
|
||||||
fprintf(stderr, "Unknown key type '%s' for key '%s'\n",
|
fprintf(stderr, "Unknown type '%s' for key '%s'\n", type, key);
|
||||||
reply2->str, key);
|
exit(1);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
static void getKeyTypes(redisReply *keys, int *types) {
|
||||||
|
redisReply *reply;
|
||||||
|
int i;
|
||||||
|
|
||||||
|
/* Pipeline TYPE commands */
|
||||||
|
for(i=0;i<keys->elements;i++) {
|
||||||
|
redisAppendCommand(context, "TYPE %s", keys->element[i]->str);
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Retrieve types */
|
||||||
|
for(i=0;i<keys->elements;i++) {
|
||||||
|
if(redisGetReply(context, (void**)&reply)!=REDIS_OK) {
|
||||||
|
fprintf(stderr, "Error getting type for key '%s' (%d: %s)\n",
|
||||||
|
keys->element[i]->str, context->err, context->errstr);
|
||||||
|
exit(1);
|
||||||
|
} else if(reply->type != REDIS_REPLY_STATUS) {
|
||||||
|
fprintf(stderr, "Invalid reply type (%d) for TYPE on key '%s'!\n",
|
||||||
|
reply->type, keys->element[i]->str);
|
||||||
exit(1);
|
exit(1);
|
||||||
}
|
}
|
||||||
|
|
||||||
/* The size command */
|
types[i] = toIntType(keys->element[i]->str, reply->str);
|
||||||
reply3 = redisCommand(context,"%s %s", sizecmd, key);
|
freeReplyObject(reply);
|
||||||
if (reply3 && reply3->type == REDIS_REPLY_INTEGER) {
|
}
|
||||||
if (biggest[type] < reply3->integer) {
|
}
|
||||||
printf("Biggest %-6s found so far '%s' with %llu %s.\n",
|
|
||||||
typename[type], key,
|
static void getKeySizes(redisReply *keys, int *types,
|
||||||
(unsigned long long) reply3->integer,
|
unsigned long long *sizes)
|
||||||
|
{
|
||||||
|
redisReply *reply;
|
||||||
|
char *sizecmds[] = {"STRLEN","LLEN","SCARD","HLEN","ZCARD"};
|
||||||
|
int i;
|
||||||
|
|
||||||
|
/* Pipeline size commands */
|
||||||
|
for(i=0;i<keys->elements;i++) {
|
||||||
|
/* Skip keys that were deleted */
|
||||||
|
if(types[i]==TYPE_NONE)
|
||||||
|
continue;
|
||||||
|
|
||||||
|
redisAppendCommand(context, "%s %s", sizecmds[types[i]],
|
||||||
|
keys->element[i]->str);
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Retreive sizes */
|
||||||
|
for(i=0;i<keys->elements;i++) {
|
||||||
|
/* Skip keys that dissapeared between SCAN and TYPE */
|
||||||
|
if(types[i] == TYPE_NONE) {
|
||||||
|
sizes[i] = 0;
|
||||||
|
continue;
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Retreive size */
|
||||||
|
if(redisGetReply(context, (void**)&reply)!=REDIS_OK) {
|
||||||
|
fprintf(stderr, "Error getting size for key '%s' (%d: %s)\n",
|
||||||
|
keys->element[i]->str, context->err, context->errstr);
|
||||||
|
exit(1);
|
||||||
|
} else if(reply->type != REDIS_REPLY_INTEGER) {
|
||||||
|
/* Theoretically the key could have been removed and
|
||||||
|
* added as a different type between TYPE and SIZE */
|
||||||
|
fprintf(stderr,
|
||||||
|
"Warning: %s on '%s' failed (may have changed type)\n",
|
||||||
|
sizecmds[types[i]], keys->element[i]->str);
|
||||||
|
sizes[i] = 0;
|
||||||
|
} else {
|
||||||
|
sizes[i] = reply->integer;
|
||||||
|
}
|
||||||
|
|
||||||
|
freeReplyObject(reply);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
static void findBigKeys(void) {
|
||||||
|
unsigned long long biggest[5] = {0}, counts[5] = {0}, totalsize[5] = {0};
|
||||||
|
unsigned long long sampled = 0, total_keys, totlen=0, *sizes=NULL, it=0;
|
||||||
|
sds maxkeys[5] = {0};
|
||||||
|
char *typename[] = {"string","list","set","hash","zset"};
|
||||||
|
char *typeunit[] = {"bytes","items","members","fields","members"};
|
||||||
|
redisReply *reply, *keys;
|
||||||
|
int type, *types=NULL, arrsize=0, i;
|
||||||
|
double pct;
|
||||||
|
|
||||||
|
/* Total keys pre scanning */
|
||||||
|
total_keys = getDbSize();
|
||||||
|
|
||||||
|
/* Status message */
|
||||||
|
printf("\n# Scanning the entire keyspace to find biggest keys as well as\n");
|
||||||
|
printf("# average sizes per key type. You can use -i 0.1 to sleep 0.1 sec\n");
|
||||||
|
printf("# per 100 SCAN commands (not usually needed).\n\n");
|
||||||
|
|
||||||
|
/* New up sds strings to keep track of overall biggest per type */
|
||||||
|
for(i=0;i<TYPE_NONE; i++) {
|
||||||
|
maxkeys[i] = sdsempty();
|
||||||
|
if(!maxkeys[i]) {
|
||||||
|
fprintf(stderr, "Failed to allocate memory for largest key names!");
|
||||||
|
exit(1);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/* SCAN loop */
|
||||||
|
do {
|
||||||
|
/* Calculate approximate percentage completion */
|
||||||
|
pct = 100 * (double)sampled/total_keys;
|
||||||
|
|
||||||
|
/* Grab some keys and point to the keys array */
|
||||||
|
reply = sendScan(&it);
|
||||||
|
keys = reply->element[1];
|
||||||
|
|
||||||
|
/* Reallocate our type and size array if we need to */
|
||||||
|
if(keys->elements > arrsize) {
|
||||||
|
types = zrealloc(types, sizeof(int)*keys->elements);
|
||||||
|
sizes = zrealloc(sizes, sizeof(unsigned long long)*keys->elements);
|
||||||
|
|
||||||
|
if(!types || !sizes) {
|
||||||
|
fprintf(stderr, "Failed to allocate storage for keys!\n");
|
||||||
|
exit(1);
|
||||||
|
}
|
||||||
|
|
||||||
|
arrsize = keys->elements;
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Retreive types and then sizes */
|
||||||
|
getKeyTypes(keys, types);
|
||||||
|
getKeySizes(keys, types, sizes);
|
||||||
|
|
||||||
|
/* Now update our stats */
|
||||||
|
for(i=0;i<keys->elements;i++) {
|
||||||
|
if((type = types[i]) == TYPE_NONE)
|
||||||
|
continue;
|
||||||
|
|
||||||
|
totalsize[type] += sizes[i];
|
||||||
|
counts[type]++;
|
||||||
|
totlen += keys->element[i]->len;
|
||||||
|
sampled++;
|
||||||
|
|
||||||
|
if(biggest[type]<sizes[i]) {
|
||||||
|
printf(
|
||||||
|
"[%05.2f%%] Biggest %-6s found so far '%s' with %llu %s\n",
|
||||||
|
pct, typename[type], keys->element[i]->str, sizes[i],
|
||||||
typeunit[type]);
|
typeunit[type]);
|
||||||
biggest[type] = reply3->integer;
|
|
||||||
|
/* Keep track of biggest key name for this type */
|
||||||
|
maxkeys[type] = sdscpy(maxkeys[type], keys->element[i]->str);
|
||||||
|
if(!maxkeys[type]) {
|
||||||
|
fprintf(stderr, "Failed to allocate memory for key!\n");
|
||||||
|
exit(1);
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Keep track of the biggest size for this type */
|
||||||
|
biggest[type] = sizes[i];
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Update overall progress */
|
||||||
|
if(sampled % 1000000 == 0) {
|
||||||
|
printf("[%05.2f%%] Sampled %llu keys so far\n", pct, sampled);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
freeReplyObject(reply2);
|
/* Sleep if we've been directed to do so */
|
||||||
if(reply3) freeReplyObject(reply3);
|
if(sampled && (sampled %100) == 0 && config.interval) {
|
||||||
}
|
|
||||||
|
|
||||||
if (samples && (samples % 1000000) == 0)
|
|
||||||
printf("(%llu keys sampled)\n", samples);
|
|
||||||
|
|
||||||
if (samples && (samples % 100) == 0 && config.interval)
|
|
||||||
usleep(config.interval);
|
usleep(config.interval);
|
||||||
|
}
|
||||||
|
|
||||||
freeReplyObject(reply1);
|
freeReplyObject(reply);
|
||||||
} while(it != 0);
|
} while(it != 0);
|
||||||
|
|
||||||
/* We've finished scanning the keyspace */
|
if(types) zfree(types);
|
||||||
printf("\n# Scanned all %llu keys in the keyspace!\n", samples);
|
if(sizes) zfree(sizes);
|
||||||
|
|
||||||
|
/* We're done */
|
||||||
|
printf("\n-------- summary -------\n\n");
|
||||||
|
|
||||||
|
printf("Sampled %llu keys in the keyspace!\n", sampled);
|
||||||
|
printf("Total key length in bytes is %llu (avg len %.2f)\n\n",
|
||||||
|
totlen, totlen ? (double)totlen/sampled : 0);
|
||||||
|
|
||||||
|
/* Output the biggest keys we found, for types we did find */
|
||||||
|
for(i=0;i<TYPE_NONE;i++) {
|
||||||
|
if(sdslen(maxkeys[i])>0) {
|
||||||
|
printf("Biggest %6s found '%s' has %llu %s\n", typename[i], maxkeys[i],
|
||||||
|
biggest[i], typeunit[i]);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
printf("\n");
|
||||||
|
|
||||||
|
for(i=0;i<TYPE_NONE;i++) {
|
||||||
|
printf("%llu %ss with %llu %s (%05.2f%% of keys, avg size %.2f)\n",
|
||||||
|
counts[i], typename[i], totalsize[i], typeunit[i],
|
||||||
|
sampled ? 100 * (double)counts[i]/sampled : 0,
|
||||||
|
counts[i] ? (double)totalsize[i]/counts[i] : 0);
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Free sds strings containing max keys */
|
||||||
|
for(i=0;i<TYPE_NONE;i++) {
|
||||||
|
sdsfree(maxkeys[i]);
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Success! */
|
||||||
exit(0);
|
exit(0);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user