mirror of
https://codeberg.org/redict/redict.git
synced 2025-01-23 16:48:27 -05:00
6689 lines
241 KiB
C
6689 lines
241 KiB
C
/* Redis CLI (command line interface)
|
|
*
|
|
* Copyright (c) 2009-2012, Salvatore Sanfilippo <antirez at gmail dot com>
|
|
* All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions are met:
|
|
*
|
|
* * Redistributions of source code must retain the above copyright notice,
|
|
* this list of conditions and the following disclaimer.
|
|
* * Redistributions in binary form must reproduce the above copyright
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
* documentation and/or other materials provided with the distribution.
|
|
* * Neither the name of Redis nor the names of its contributors may be used
|
|
* to endorse or promote products derived from this software without
|
|
* specific prior written permission.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
|
* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
* ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
|
* LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
|
* POSSIBILITY OF SUCH DAMAGE.
|
|
*/
|
|
|
|
#include "fmacros.h"
|
|
#include "version.h"
|
|
|
|
#include <stdio.h>
|
|
#include <string.h>
|
|
#include <stdlib.h>
|
|
#include <signal.h>
|
|
#include <unistd.h>
|
|
#include <time.h>
|
|
#include <ctype.h>
|
|
#include <errno.h>
|
|
#include <sys/stat.h>
|
|
#include <sys/time.h>
|
|
#include <assert.h>
|
|
#include <fcntl.h>
|
|
#include <limits.h>
|
|
#include <math.h>
|
|
|
|
#include <hiredis.h>
|
|
#include <sds.h> /* use sds.h from hiredis, so that only one set of sds functions will be present in the binary */
|
|
#include "dict.h"
|
|
#include "adlist.h"
|
|
#include "zmalloc.h"
|
|
#include "linenoise.h"
|
|
#include "help.h"
|
|
#include "anet.h"
|
|
#include "ae.h"
|
|
|
|
#define UNUSED(V) ((void) V)
|
|
|
|
#define OUTPUT_STANDARD 0
|
|
#define OUTPUT_RAW 1
|
|
#define OUTPUT_CSV 2
|
|
#define REDIS_CLI_KEEPALIVE_INTERVAL 15 /* seconds */
|
|
#define REDIS_CLI_DEFAULT_PIPE_TIMEOUT 30 /* seconds */
|
|
#define REDIS_CLI_HISTFILE_ENV "REDISCLI_HISTFILE"
|
|
#define REDIS_CLI_HISTFILE_DEFAULT ".rediscli_history"
|
|
#define REDIS_CLI_RCFILE_ENV "REDISCLI_RCFILE"
|
|
#define REDIS_CLI_RCFILE_DEFAULT ".redisclirc"
|
|
|
|
#define CLUSTER_MANAGER_SLOTS 16384
|
|
#define CLUSTER_MANAGER_MIGRATE_TIMEOUT 60000
|
|
#define CLUSTER_MANAGER_MIGRATE_PIPELINE 10
|
|
#define CLUSTER_MANAGER_REBALANCE_THRESHOLD 2
|
|
|
|
#define CLUSTER_MANAGER_INVALID_HOST_ARG \
|
|
"[ERR] Invalid arguments: you need to pass either a valid " \
|
|
"address (ie. 120.0.0.1:7000) or space separated IP " \
|
|
"and port (ie. 120.0.0.1 7000)\n"
|
|
#define CLUSTER_MANAGER_MODE() (config.cluster_manager_command.name != NULL)
|
|
#define CLUSTER_MANAGER_MASTERS_COUNT(nodes, replicas) (nodes/(replicas + 1))
|
|
#define CLUSTER_MANAGER_NODE_CONNECT(n) \
|
|
(n->context = redisConnect(n->ip, n->port));
|
|
#define CLUSTER_MANAGER_COMMAND(n,...) \
|
|
(reconnectingRedisCommand(n->context, __VA_ARGS__))
|
|
|
|
#define CLUSTER_MANAGER_NODE_ARRAY_FREE(array) zfree(array->alloc)
|
|
|
|
#define CLUSTER_MANAGER_PRINT_REPLY_ERROR(n, err) \
|
|
clusterManagerLogErr("Node %s:%d replied with error:\n%s\n", \
|
|
n->ip, n->port, err);
|
|
|
|
#define clusterManagerLogInfo(...) \
|
|
clusterManagerLog(CLUSTER_MANAGER_LOG_LVL_INFO,__VA_ARGS__)
|
|
|
|
#define clusterManagerLogErr(...) \
|
|
clusterManagerLog(CLUSTER_MANAGER_LOG_LVL_ERR,__VA_ARGS__)
|
|
|
|
#define clusterManagerLogWarn(...) \
|
|
clusterManagerLog(CLUSTER_MANAGER_LOG_LVL_WARN,__VA_ARGS__)
|
|
|
|
#define clusterManagerLogOk(...) \
|
|
clusterManagerLog(CLUSTER_MANAGER_LOG_LVL_SUCCESS,__VA_ARGS__)
|
|
|
|
#define CLUSTER_MANAGER_FLAG_MYSELF 1 << 0
|
|
#define CLUSTER_MANAGER_FLAG_SLAVE 1 << 1
|
|
#define CLUSTER_MANAGER_FLAG_FRIEND 1 << 2
|
|
#define CLUSTER_MANAGER_FLAG_NOADDR 1 << 3
|
|
#define CLUSTER_MANAGER_FLAG_DISCONNECT 1 << 4
|
|
#define CLUSTER_MANAGER_FLAG_FAIL 1 << 5
|
|
|
|
#define CLUSTER_MANAGER_CMD_FLAG_FIX 1 << 0
|
|
#define CLUSTER_MANAGER_CMD_FLAG_SLAVE 1 << 1
|
|
#define CLUSTER_MANAGER_CMD_FLAG_YES 1 << 2
|
|
#define CLUSTER_MANAGER_CMD_FLAG_AUTOWEIGHTS 1 << 3
|
|
#define CLUSTER_MANAGER_CMD_FLAG_EMPTYMASTER 1 << 4
|
|
#define CLUSTER_MANAGER_CMD_FLAG_SIMULATE 1 << 5
|
|
#define CLUSTER_MANAGER_CMD_FLAG_REPLACE 1 << 6
|
|
#define CLUSTER_MANAGER_CMD_FLAG_COPY 1 << 7
|
|
#define CLUSTER_MANAGER_CMD_FLAG_COLOR 1 << 8
|
|
|
|
#define CLUSTER_MANAGER_OPT_GETFRIENDS 1 << 0
|
|
#define CLUSTER_MANAGER_OPT_COLD 1 << 1
|
|
#define CLUSTER_MANAGER_OPT_UPDATE 1 << 2
|
|
#define CLUSTER_MANAGER_OPT_QUIET 1 << 6
|
|
#define CLUSTER_MANAGER_OPT_VERBOSE 1 << 7
|
|
|
|
#define CLUSTER_MANAGER_LOG_LVL_INFO 1
|
|
#define CLUSTER_MANAGER_LOG_LVL_WARN 2
|
|
#define CLUSTER_MANAGER_LOG_LVL_ERR 3
|
|
#define CLUSTER_MANAGER_LOG_LVL_SUCCESS 4
|
|
|
|
#define LOG_COLOR_BOLD "29;1m"
|
|
#define LOG_COLOR_RED "31;1m"
|
|
#define LOG_COLOR_GREEN "32;1m"
|
|
#define LOG_COLOR_YELLOW "33;1m"
|
|
#define LOG_COLOR_RESET "0m"
|
|
|
|
/* --latency-dist palettes. */
|
|
int spectrum_palette_color_size = 19;
|
|
int spectrum_palette_color[] = {0,233,234,235,237,239,241,243,245,247,144,143,142,184,226,214,208,202,196};
|
|
|
|
int spectrum_palette_mono_size = 13;
|
|
int spectrum_palette_mono[] = {0,233,234,235,237,239,241,243,245,247,249,251,253};
|
|
|
|
/* The actual palette in use. */
|
|
int *spectrum_palette;
|
|
int spectrum_palette_size;
|
|
|
|
/* Dict Helpers */
|
|
|
|
static uint64_t dictSdsHash(const void *key);
|
|
static int dictSdsKeyCompare(void *privdata, const void *key1,
|
|
const void *key2);
|
|
static void dictSdsDestructor(void *privdata, void *val);
|
|
static void dictListDestructor(void *privdata, void *val);
|
|
|
|
/* Cluster Manager Command Info */
|
|
typedef struct clusterManagerCommand {
|
|
char *name;
|
|
int argc;
|
|
char **argv;
|
|
int flags;
|
|
int replicas;
|
|
char *from;
|
|
char *to;
|
|
char **weight;
|
|
char *master_id;
|
|
int weight_argc;
|
|
int slots;
|
|
int timeout;
|
|
int pipeline;
|
|
float threshold;
|
|
} clusterManagerCommand;
|
|
|
|
static void createClusterManagerCommand(char *cmdname, int argc, char **argv);
|
|
|
|
|
|
static redisContext *context;
|
|
static struct config {
|
|
char *hostip;
|
|
int hostport;
|
|
char *hostsocket;
|
|
long repeat;
|
|
long interval;
|
|
int dbnum;
|
|
int interactive;
|
|
int shutdown;
|
|
int monitor_mode;
|
|
int pubsub_mode;
|
|
int latency_mode;
|
|
int latency_dist_mode;
|
|
int latency_history;
|
|
int lru_test_mode;
|
|
long long lru_test_sample_size;
|
|
int cluster_mode;
|
|
int cluster_reissue_command;
|
|
int slave_mode;
|
|
int pipe_mode;
|
|
int pipe_timeout;
|
|
int getrdb_mode;
|
|
int stat_mode;
|
|
int scan_mode;
|
|
int intrinsic_latency_mode;
|
|
int intrinsic_latency_duration;
|
|
char *pattern;
|
|
char *rdb_filename;
|
|
int bigkeys;
|
|
int hotkeys;
|
|
int stdinarg; /* get last arg from stdin. (-x option) */
|
|
char *auth;
|
|
int output; /* output mode, see OUTPUT_* defines */
|
|
sds mb_delim;
|
|
char prompt[128];
|
|
char *eval;
|
|
int eval_ldb;
|
|
int eval_ldb_sync; /* Ask for synchronous mode of the Lua debugger. */
|
|
int eval_ldb_end; /* Lua debugging session ended. */
|
|
int enable_ldb_on_eval; /* Handle manual SCRIPT DEBUG + EVAL commands. */
|
|
int last_cmd_type;
|
|
int verbose;
|
|
clusterManagerCommand cluster_manager_command;
|
|
int no_auth_warning;
|
|
} config;
|
|
|
|
/* User preferences. */
|
|
static struct pref {
|
|
int hints;
|
|
} pref;
|
|
|
|
static volatile sig_atomic_t force_cancel_loop = 0;
|
|
static void usage(void);
|
|
static void slaveMode(void);
|
|
char *redisGitSHA1(void);
|
|
char *redisGitDirty(void);
|
|
static int cliConnect(int force);
|
|
|
|
static char *getInfoField(char *info, char *field);
|
|
static long getLongInfoField(char *info, char *field);
|
|
|
|
/*------------------------------------------------------------------------------
|
|
* Utility functions
|
|
*--------------------------------------------------------------------------- */
|
|
|
|
uint16_t crc16(const char *buf, int len);
|
|
|
|
static long long ustime(void) {
|
|
struct timeval tv;
|
|
long long ust;
|
|
|
|
gettimeofday(&tv, NULL);
|
|
ust = ((long long)tv.tv_sec)*1000000;
|
|
ust += tv.tv_usec;
|
|
return ust;
|
|
}
|
|
|
|
static long long mstime(void) {
|
|
return ustime()/1000;
|
|
}
|
|
|
|
static void cliRefreshPrompt(void) {
|
|
if (config.eval_ldb) return;
|
|
|
|
sds prompt = sdsempty();
|
|
if (config.hostsocket != NULL) {
|
|
prompt = sdscatfmt(prompt,"redis %s",config.hostsocket);
|
|
} else {
|
|
char addr[256];
|
|
anetFormatAddr(addr, sizeof(addr), config.hostip, config.hostport);
|
|
prompt = sdscatlen(prompt,addr,strlen(addr));
|
|
}
|
|
|
|
/* Add [dbnum] if needed */
|
|
if (config.dbnum != 0)
|
|
prompt = sdscatfmt(prompt,"[%i]",config.dbnum);
|
|
|
|
/* Copy the prompt in the static buffer. */
|
|
prompt = sdscatlen(prompt,"> ",2);
|
|
snprintf(config.prompt,sizeof(config.prompt),"%s",prompt);
|
|
sdsfree(prompt);
|
|
}
|
|
|
|
/* Return the name of the dotfile for the specified 'dotfilename'.
|
|
* Normally it just concatenates user $HOME to the file specified
|
|
* in 'dotfilename'. However if the environment varialbe 'envoverride'
|
|
* is set, its value is taken as the path.
|
|
*
|
|
* The function returns NULL (if the file is /dev/null or cannot be
|
|
* obtained for some error), or an SDS string that must be freed by
|
|
* the user. */
|
|
static sds getDotfilePath(char *envoverride, char *dotfilename) {
|
|
char *path = NULL;
|
|
sds dotPath = NULL;
|
|
|
|
/* Check the env for a dotfile override. */
|
|
path = getenv(envoverride);
|
|
if (path != NULL && *path != '\0') {
|
|
if (!strcmp("/dev/null", path)) {
|
|
return NULL;
|
|
}
|
|
|
|
/* If the env is set, return it. */
|
|
dotPath = sdsnew(path);
|
|
} else {
|
|
char *home = getenv("HOME");
|
|
if (home != NULL && *home != '\0') {
|
|
/* If no override is set use $HOME/<dotfilename>. */
|
|
dotPath = sdscatprintf(sdsempty(), "%s/%s", home, dotfilename);
|
|
}
|
|
}
|
|
return dotPath;
|
|
}
|
|
|
|
/* URL-style percent decoding. */
|
|
#define isHexChar(c) (isdigit(c) || (c >= 'a' && c <= 'f'))
|
|
#define decodeHexChar(c) (isdigit(c) ? c - '0' : c - 'a' + 10)
|
|
#define decodeHex(h, l) ((decodeHexChar(h) << 4) + decodeHexChar(l))
|
|
|
|
static sds percentDecode(const char *pe, size_t len) {
|
|
const char *end = pe + len;
|
|
sds ret = sdsempty();
|
|
const char *curr = pe;
|
|
|
|
while (curr < end) {
|
|
if (*curr == '%') {
|
|
if ((end - curr) < 2) {
|
|
fprintf(stderr, "Incomplete URI encoding\n");
|
|
exit(1);
|
|
}
|
|
|
|
char h = tolower(*(++curr));
|
|
char l = tolower(*(++curr));
|
|
if (!isHexChar(h) || !isHexChar(l)) {
|
|
fprintf(stderr, "Illegal character in URI encoding\n");
|
|
exit(1);
|
|
}
|
|
char c = decodeHex(h, l);
|
|
ret = sdscatlen(ret, &c, 1);
|
|
curr++;
|
|
} else {
|
|
ret = sdscatlen(ret, curr++, 1);
|
|
}
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
/* Parse a URI and extract the server connection information.
|
|
* URI scheme is based on the the provisional specification[1] excluding support
|
|
* for query parameters. Valid URIs are:
|
|
* scheme: "redis://"
|
|
* authority: [<username> ":"] <password> "@"] [<hostname> [":" <port>]]
|
|
* path: ["/" [<db>]]
|
|
*
|
|
* [1]: https://www.iana.org/assignments/uri-schemes/prov/redis */
|
|
static void parseRedisUri(const char *uri) {
|
|
|
|
const char *scheme = "redis://";
|
|
const char *curr = uri;
|
|
const char *end = uri + strlen(uri);
|
|
const char *userinfo, *username, *port, *host, *path;
|
|
|
|
/* URI must start with a valid scheme. */
|
|
if (strncasecmp(scheme, curr, strlen(scheme))) {
|
|
fprintf(stderr,"Invalid URI scheme\n");
|
|
exit(1);
|
|
}
|
|
curr += strlen(scheme);
|
|
if (curr == end) return;
|
|
|
|
/* Extract user info. */
|
|
if ((userinfo = strchr(curr,'@'))) {
|
|
if ((username = strchr(curr, ':')) && username < userinfo) {
|
|
/* If provided, username is ignored. */
|
|
curr = username + 1;
|
|
}
|
|
|
|
config.auth = percentDecode(curr, userinfo - curr);
|
|
curr = userinfo + 1;
|
|
}
|
|
if (curr == end) return;
|
|
|
|
/* Extract host and port. */
|
|
path = strchr(curr, '/');
|
|
if (*curr != '/') {
|
|
host = path ? path - 1 : end;
|
|
if ((port = strchr(curr, ':'))) {
|
|
config.hostport = atoi(port + 1);
|
|
host = port - 1;
|
|
}
|
|
config.hostip = sdsnewlen(curr, host - curr + 1);
|
|
}
|
|
curr = path ? path + 1 : end;
|
|
if (curr == end) return;
|
|
|
|
/* Extract database number. */
|
|
config.dbnum = atoi(curr);
|
|
}
|
|
|
|
static uint64_t dictSdsHash(const void *key) {
|
|
return dictGenHashFunction((unsigned char*)key, sdslen((char*)key));
|
|
}
|
|
|
|
static int dictSdsKeyCompare(void *privdata, const void *key1,
|
|
const void *key2)
|
|
{
|
|
int l1,l2;
|
|
DICT_NOTUSED(privdata);
|
|
|
|
l1 = sdslen((sds)key1);
|
|
l2 = sdslen((sds)key2);
|
|
if (l1 != l2) return 0;
|
|
return memcmp(key1, key2, l1) == 0;
|
|
}
|
|
|
|
static void dictSdsDestructor(void *privdata, void *val)
|
|
{
|
|
DICT_NOTUSED(privdata);
|
|
sdsfree(val);
|
|
}
|
|
|
|
void dictListDestructor(void *privdata, void *val)
|
|
{
|
|
DICT_NOTUSED(privdata);
|
|
listRelease((list*)val);
|
|
}
|
|
|
|
/* _serverAssert is needed by dict */
|
|
void _serverAssert(const char *estr, const char *file, int line) {
|
|
fprintf(stderr, "=== ASSERTION FAILED ===");
|
|
fprintf(stderr, "==> %s:%d '%s' is not true",file,line,estr);
|
|
*((char*)-1) = 'x';
|
|
}
|
|
|
|
/*------------------------------------------------------------------------------
|
|
* Help functions
|
|
*--------------------------------------------------------------------------- */
|
|
|
|
#define CLI_HELP_COMMAND 1
|
|
#define CLI_HELP_GROUP 2
|
|
|
|
typedef struct {
|
|
int type;
|
|
int argc;
|
|
sds *argv;
|
|
sds full;
|
|
|
|
/* Only used for help on commands */
|
|
struct commandHelp *org;
|
|
} helpEntry;
|
|
|
|
static helpEntry *helpEntries;
|
|
static int helpEntriesLen;
|
|
|
|
static sds cliVersion(void) {
|
|
sds version;
|
|
version = sdscatprintf(sdsempty(), "%s", REDIS_VERSION);
|
|
|
|
/* Add git commit and working tree status when available */
|
|
if (strtoll(redisGitSHA1(),NULL,16)) {
|
|
version = sdscatprintf(version, " (git:%s", redisGitSHA1());
|
|
if (strtoll(redisGitDirty(),NULL,10))
|
|
version = sdscatprintf(version, "-dirty");
|
|
version = sdscat(version, ")");
|
|
}
|
|
return version;
|
|
}
|
|
|
|
static void cliInitHelp(void) {
|
|
int commandslen = sizeof(commandHelp)/sizeof(struct commandHelp);
|
|
int groupslen = sizeof(commandGroups)/sizeof(char*);
|
|
int i, len, pos = 0;
|
|
helpEntry tmp;
|
|
|
|
helpEntriesLen = len = commandslen+groupslen;
|
|
helpEntries = zmalloc(sizeof(helpEntry)*len);
|
|
|
|
for (i = 0; i < groupslen; i++) {
|
|
tmp.argc = 1;
|
|
tmp.argv = zmalloc(sizeof(sds));
|
|
tmp.argv[0] = sdscatprintf(sdsempty(),"@%s",commandGroups[i]);
|
|
tmp.full = tmp.argv[0];
|
|
tmp.type = CLI_HELP_GROUP;
|
|
tmp.org = NULL;
|
|
helpEntries[pos++] = tmp;
|
|
}
|
|
|
|
for (i = 0; i < commandslen; i++) {
|
|
tmp.argv = sdssplitargs(commandHelp[i].name,&tmp.argc);
|
|
tmp.full = sdsnew(commandHelp[i].name);
|
|
tmp.type = CLI_HELP_COMMAND;
|
|
tmp.org = &commandHelp[i];
|
|
helpEntries[pos++] = tmp;
|
|
}
|
|
}
|
|
|
|
/* cliInitHelp() setups the helpEntries array with the command and group
|
|
* names from the help.h file. However the Redis instance we are connecting
|
|
* to may support more commands, so this function integrates the previous
|
|
* entries with additional entries obtained using the COMMAND command
|
|
* available in recent versions of Redis. */
|
|
static void cliIntegrateHelp(void) {
|
|
if (cliConnect(0) == REDIS_ERR) return;
|
|
|
|
redisReply *reply = redisCommand(context, "COMMAND");
|
|
if(reply == NULL || reply->type != REDIS_REPLY_ARRAY) return;
|
|
|
|
/* Scan the array reported by COMMAND and fill only the entries that
|
|
* don't already match what we have. */
|
|
for (size_t j = 0; j < reply->elements; j++) {
|
|
redisReply *entry = reply->element[j];
|
|
if (entry->type != REDIS_REPLY_ARRAY || entry->elements < 4 ||
|
|
entry->element[0]->type != REDIS_REPLY_STRING ||
|
|
entry->element[1]->type != REDIS_REPLY_INTEGER ||
|
|
entry->element[3]->type != REDIS_REPLY_INTEGER) return;
|
|
char *cmdname = entry->element[0]->str;
|
|
int i;
|
|
|
|
for (i = 0; i < helpEntriesLen; i++) {
|
|
helpEntry *he = helpEntries+i;
|
|
if (!strcasecmp(he->argv[0],cmdname))
|
|
break;
|
|
}
|
|
if (i != helpEntriesLen) continue;
|
|
|
|
helpEntriesLen++;
|
|
helpEntries = zrealloc(helpEntries,sizeof(helpEntry)*helpEntriesLen);
|
|
helpEntry *new = helpEntries+(helpEntriesLen-1);
|
|
|
|
new->argc = 1;
|
|
new->argv = zmalloc(sizeof(sds));
|
|
new->argv[0] = sdsnew(cmdname);
|
|
new->full = new->argv[0];
|
|
new->type = CLI_HELP_COMMAND;
|
|
sdstoupper(new->argv[0]);
|
|
|
|
struct commandHelp *ch = zmalloc(sizeof(*ch));
|
|
ch->name = new->argv[0];
|
|
ch->params = sdsempty();
|
|
int args = llabs(entry->element[1]->integer);
|
|
if (entry->element[3]->integer == 1) {
|
|
ch->params = sdscat(ch->params,"key ");
|
|
args--;
|
|
}
|
|
while(args--) ch->params = sdscat(ch->params,"arg ");
|
|
if (entry->element[1]->integer < 0)
|
|
ch->params = sdscat(ch->params,"...options...");
|
|
ch->summary = "Help not available";
|
|
ch->group = 0;
|
|
ch->since = "not known";
|
|
new->org = ch;
|
|
}
|
|
freeReplyObject(reply);
|
|
}
|
|
|
|
/* Output command help to stdout. */
|
|
static void cliOutputCommandHelp(struct commandHelp *help, int group) {
|
|
printf("\r\n \x1b[1m%s\x1b[0m \x1b[90m%s\x1b[0m\r\n", help->name, help->params);
|
|
printf(" \x1b[33msummary:\x1b[0m %s\r\n", help->summary);
|
|
printf(" \x1b[33msince:\x1b[0m %s\r\n", help->since);
|
|
if (group) {
|
|
printf(" \x1b[33mgroup:\x1b[0m %s\r\n", commandGroups[help->group]);
|
|
}
|
|
}
|
|
|
|
/* Print generic help. */
|
|
static void cliOutputGenericHelp(void) {
|
|
sds version = cliVersion();
|
|
printf(
|
|
"redis-cli %s\n"
|
|
"To get help about Redis commands type:\n"
|
|
" \"help @<group>\" to get a list of commands in <group>\n"
|
|
" \"help <command>\" for help on <command>\n"
|
|
" \"help <tab>\" to get a list of possible help topics\n"
|
|
" \"quit\" to exit\n"
|
|
"\n"
|
|
"To set redis-cli preferences:\n"
|
|
" \":set hints\" enable online hints\n"
|
|
" \":set nohints\" disable online hints\n"
|
|
"Set your preferences in ~/.redisclirc\n",
|
|
version
|
|
);
|
|
sdsfree(version);
|
|
}
|
|
|
|
/* Output all command help, filtering by group or command name. */
|
|
static void cliOutputHelp(int argc, char **argv) {
|
|
int i, j, len;
|
|
int group = -1;
|
|
helpEntry *entry;
|
|
struct commandHelp *help;
|
|
|
|
if (argc == 0) {
|
|
cliOutputGenericHelp();
|
|
return;
|
|
} else if (argc > 0 && argv[0][0] == '@') {
|
|
len = sizeof(commandGroups)/sizeof(char*);
|
|
for (i = 0; i < len; i++) {
|
|
if (strcasecmp(argv[0]+1,commandGroups[i]) == 0) {
|
|
group = i;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
assert(argc > 0);
|
|
for (i = 0; i < helpEntriesLen; i++) {
|
|
entry = &helpEntries[i];
|
|
if (entry->type != CLI_HELP_COMMAND) continue;
|
|
|
|
help = entry->org;
|
|
if (group == -1) {
|
|
/* Compare all arguments */
|
|
if (argc == entry->argc) {
|
|
for (j = 0; j < argc; j++) {
|
|
if (strcasecmp(argv[j],entry->argv[j]) != 0) break;
|
|
}
|
|
if (j == argc) {
|
|
cliOutputCommandHelp(help,1);
|
|
}
|
|
}
|
|
} else {
|
|
if (group == help->group) {
|
|
cliOutputCommandHelp(help,0);
|
|
}
|
|
}
|
|
}
|
|
printf("\r\n");
|
|
}
|
|
|
|
/* Linenoise completion callback. */
|
|
static void completionCallback(const char *buf, linenoiseCompletions *lc) {
|
|
size_t startpos = 0;
|
|
int mask;
|
|
int i;
|
|
size_t matchlen;
|
|
sds tmp;
|
|
|
|
if (strncasecmp(buf,"help ",5) == 0) {
|
|
startpos = 5;
|
|
while (isspace(buf[startpos])) startpos++;
|
|
mask = CLI_HELP_COMMAND | CLI_HELP_GROUP;
|
|
} else {
|
|
mask = CLI_HELP_COMMAND;
|
|
}
|
|
|
|
for (i = 0; i < helpEntriesLen; i++) {
|
|
if (!(helpEntries[i].type & mask)) continue;
|
|
|
|
matchlen = strlen(buf+startpos);
|
|
if (strncasecmp(buf+startpos,helpEntries[i].full,matchlen) == 0) {
|
|
tmp = sdsnewlen(buf,startpos);
|
|
tmp = sdscat(tmp,helpEntries[i].full);
|
|
linenoiseAddCompletion(lc,tmp);
|
|
sdsfree(tmp);
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Linenoise hints callback. */
|
|
static char *hintsCallback(const char *buf, int *color, int *bold) {
|
|
if (!pref.hints) return NULL;
|
|
|
|
int i, argc, buflen = strlen(buf);
|
|
sds *argv = sdssplitargs(buf,&argc);
|
|
int endspace = buflen && isspace(buf[buflen-1]);
|
|
|
|
/* Check if the argument list is empty and return ASAP. */
|
|
if (argc == 0) {
|
|
sdsfreesplitres(argv,argc);
|
|
return NULL;
|
|
}
|
|
|
|
for (i = 0; i < helpEntriesLen; i++) {
|
|
if (!(helpEntries[i].type & CLI_HELP_COMMAND)) continue;
|
|
|
|
if (strcasecmp(argv[0],helpEntries[i].full) == 0)
|
|
{
|
|
*color = 90;
|
|
*bold = 0;
|
|
sds hint = sdsnew(helpEntries[i].org->params);
|
|
|
|
/* Remove arguments from the returned hint to show only the
|
|
* ones the user did not yet typed. */
|
|
int toremove = argc-1;
|
|
while(toremove > 0 && sdslen(hint)) {
|
|
if (hint[0] == '[') break;
|
|
if (hint[0] == ' ') toremove--;
|
|
sdsrange(hint,1,-1);
|
|
}
|
|
|
|
/* Add an initial space if needed. */
|
|
if (!endspace) {
|
|
sds newhint = sdsnewlen(" ",1);
|
|
newhint = sdscatsds(newhint,hint);
|
|
sdsfree(hint);
|
|
hint = newhint;
|
|
}
|
|
|
|
sdsfreesplitres(argv,argc);
|
|
return hint;
|
|
}
|
|
}
|
|
sdsfreesplitres(argv,argc);
|
|
return NULL;
|
|
}
|
|
|
|
static void freeHintsCallback(void *ptr) {
|
|
sdsfree(ptr);
|
|
}
|
|
|
|
/*------------------------------------------------------------------------------
|
|
* Networking / parsing
|
|
*--------------------------------------------------------------------------- */
|
|
|
|
/* Send AUTH command to the server */
|
|
static int cliAuth(void) {
|
|
redisReply *reply;
|
|
if (config.auth == NULL) return REDIS_OK;
|
|
|
|
reply = redisCommand(context,"AUTH %s",config.auth);
|
|
if (reply != NULL) {
|
|
freeReplyObject(reply);
|
|
return REDIS_OK;
|
|
}
|
|
return REDIS_ERR;
|
|
}
|
|
|
|
/* Send SELECT dbnum to the server */
|
|
static int cliSelect(void) {
|
|
redisReply *reply;
|
|
if (config.dbnum == 0) return REDIS_OK;
|
|
|
|
reply = redisCommand(context,"SELECT %d",config.dbnum);
|
|
if (reply != NULL) {
|
|
int result = REDIS_OK;
|
|
if (reply->type == REDIS_REPLY_ERROR) result = REDIS_ERR;
|
|
freeReplyObject(reply);
|
|
return result;
|
|
}
|
|
return REDIS_ERR;
|
|
}
|
|
|
|
/* Connect to the server. If force is not zero the connection is performed
|
|
* even if there is already a connected socket. */
|
|
static int cliConnect(int force) {
|
|
if (context == NULL || force) {
|
|
if (context != NULL) {
|
|
redisFree(context);
|
|
}
|
|
|
|
if (config.hostsocket == NULL) {
|
|
context = redisConnect(config.hostip,config.hostport);
|
|
} else {
|
|
context = redisConnectUnix(config.hostsocket);
|
|
}
|
|
|
|
if (context->err) {
|
|
fprintf(stderr,"Could not connect to Redis at ");
|
|
if (config.hostsocket == NULL)
|
|
fprintf(stderr,"%s:%d: %s\n",config.hostip,config.hostport,context->errstr);
|
|
else
|
|
fprintf(stderr,"%s: %s\n",config.hostsocket,context->errstr);
|
|
redisFree(context);
|
|
context = NULL;
|
|
return REDIS_ERR;
|
|
}
|
|
|
|
/* Set aggressive KEEP_ALIVE socket option in the Redis context socket
|
|
* in order to prevent timeouts caused by the execution of long
|
|
* commands. At the same time this improves the detection of real
|
|
* errors. */
|
|
anetKeepAlive(NULL, context->fd, REDIS_CLI_KEEPALIVE_INTERVAL);
|
|
|
|
/* Do AUTH and select the right DB. */
|
|
if (cliAuth() != REDIS_OK)
|
|
return REDIS_ERR;
|
|
if (cliSelect() != REDIS_OK)
|
|
return REDIS_ERR;
|
|
}
|
|
return REDIS_OK;
|
|
}
|
|
|
|
static void cliPrintContextError(void) {
|
|
if (context == NULL) return;
|
|
fprintf(stderr,"Error: %s\n",context->errstr);
|
|
}
|
|
|
|
static sds cliFormatReplyTTY(redisReply *r, char *prefix) {
|
|
sds out = sdsempty();
|
|
switch (r->type) {
|
|
case REDIS_REPLY_ERROR:
|
|
out = sdscatprintf(out,"(error) %s\n", r->str);
|
|
break;
|
|
case REDIS_REPLY_STATUS:
|
|
out = sdscat(out,r->str);
|
|
out = sdscat(out,"\n");
|
|
break;
|
|
case REDIS_REPLY_INTEGER:
|
|
out = sdscatprintf(out,"(integer) %lld\n",r->integer);
|
|
break;
|
|
case REDIS_REPLY_STRING:
|
|
/* If you are producing output for the standard output we want
|
|
* a more interesting output with quoted characters and so forth */
|
|
out = sdscatrepr(out,r->str,r->len);
|
|
out = sdscat(out,"\n");
|
|
break;
|
|
case REDIS_REPLY_NIL:
|
|
out = sdscat(out,"(nil)\n");
|
|
break;
|
|
case REDIS_REPLY_ARRAY:
|
|
if (r->elements == 0) {
|
|
out = sdscat(out,"(empty list or set)\n");
|
|
} else {
|
|
unsigned int i, idxlen = 0;
|
|
char _prefixlen[16];
|
|
char _prefixfmt[16];
|
|
sds _prefix;
|
|
sds tmp;
|
|
|
|
/* Calculate chars needed to represent the largest index */
|
|
i = r->elements;
|
|
do {
|
|
idxlen++;
|
|
i /= 10;
|
|
} while(i);
|
|
|
|
/* Prefix for nested multi bulks should grow with idxlen+2 spaces */
|
|
memset(_prefixlen,' ',idxlen+2);
|
|
_prefixlen[idxlen+2] = '\0';
|
|
_prefix = sdscat(sdsnew(prefix),_prefixlen);
|
|
|
|
/* Setup prefix format for every entry */
|
|
snprintf(_prefixfmt,sizeof(_prefixfmt),"%%s%%%ud) ",idxlen);
|
|
|
|
for (i = 0; i < r->elements; i++) {
|
|
/* Don't use the prefix for the first element, as the parent
|
|
* caller already prepended the index number. */
|
|
out = sdscatprintf(out,_prefixfmt,i == 0 ? "" : prefix,i+1);
|
|
|
|
/* Format the multi bulk entry */
|
|
tmp = cliFormatReplyTTY(r->element[i],_prefix);
|
|
out = sdscatlen(out,tmp,sdslen(tmp));
|
|
sdsfree(tmp);
|
|
}
|
|
sdsfree(_prefix);
|
|
}
|
|
break;
|
|
default:
|
|
fprintf(stderr,"Unknown reply type: %d\n", r->type);
|
|
exit(1);
|
|
}
|
|
return out;
|
|
}
|
|
|
|
int isColorTerm(void) {
|
|
char *t = getenv("TERM");
|
|
return t != NULL && strstr(t,"xterm") != NULL;
|
|
}
|
|
|
|
/* Helper function for sdsCatColorizedLdbReply() appending colorize strings
|
|
* to an SDS string. */
|
|
sds sdscatcolor(sds o, char *s, size_t len, char *color) {
|
|
if (!isColorTerm()) return sdscatlen(o,s,len);
|
|
|
|
int bold = strstr(color,"bold") != NULL;
|
|
int ccode = 37; /* Defaults to white. */
|
|
if (strstr(color,"red")) ccode = 31;
|
|
else if (strstr(color,"green")) ccode = 32;
|
|
else if (strstr(color,"yellow")) ccode = 33;
|
|
else if (strstr(color,"blue")) ccode = 34;
|
|
else if (strstr(color,"magenta")) ccode = 35;
|
|
else if (strstr(color,"cyan")) ccode = 36;
|
|
else if (strstr(color,"white")) ccode = 37;
|
|
|
|
o = sdscatfmt(o,"\033[%i;%i;49m",bold,ccode);
|
|
o = sdscatlen(o,s,len);
|
|
o = sdscat(o,"\033[0m");
|
|
return o;
|
|
}
|
|
|
|
/* Colorize Lua debugger status replies according to the prefix they
|
|
* have. */
|
|
sds sdsCatColorizedLdbReply(sds o, char *s, size_t len) {
|
|
char *color = "white";
|
|
|
|
if (strstr(s,"<debug>")) color = "bold";
|
|
if (strstr(s,"<redis>")) color = "green";
|
|
if (strstr(s,"<reply>")) color = "cyan";
|
|
if (strstr(s,"<error>")) color = "red";
|
|
if (strstr(s,"<hint>")) color = "bold";
|
|
if (strstr(s,"<value>") || strstr(s,"<retval>")) color = "magenta";
|
|
if (len > 4 && isdigit(s[3])) {
|
|
if (s[1] == '>') color = "yellow"; /* Current line. */
|
|
else if (s[2] == '#') color = "bold"; /* Break point. */
|
|
}
|
|
return sdscatcolor(o,s,len,color);
|
|
}
|
|
|
|
static sds cliFormatReplyRaw(redisReply *r) {
|
|
sds out = sdsempty(), tmp;
|
|
size_t i;
|
|
|
|
switch (r->type) {
|
|
case REDIS_REPLY_NIL:
|
|
/* Nothing... */
|
|
break;
|
|
case REDIS_REPLY_ERROR:
|
|
out = sdscatlen(out,r->str,r->len);
|
|
out = sdscatlen(out,"\n",1);
|
|
break;
|
|
case REDIS_REPLY_STATUS:
|
|
case REDIS_REPLY_STRING:
|
|
if (r->type == REDIS_REPLY_STATUS && config.eval_ldb) {
|
|
/* The Lua debugger replies with arrays of simple (status)
|
|
* strings. We colorize the output for more fun if this
|
|
* is a debugging session. */
|
|
|
|
/* Detect the end of a debugging session. */
|
|
if (strstr(r->str,"<endsession>") == r->str) {
|
|
config.enable_ldb_on_eval = 0;
|
|
config.eval_ldb = 0;
|
|
config.eval_ldb_end = 1; /* Signal the caller session ended. */
|
|
config.output = OUTPUT_STANDARD;
|
|
cliRefreshPrompt();
|
|
} else {
|
|
out = sdsCatColorizedLdbReply(out,r->str,r->len);
|
|
}
|
|
} else {
|
|
out = sdscatlen(out,r->str,r->len);
|
|
}
|
|
break;
|
|
case REDIS_REPLY_INTEGER:
|
|
out = sdscatprintf(out,"%lld",r->integer);
|
|
break;
|
|
case REDIS_REPLY_ARRAY:
|
|
for (i = 0; i < r->elements; i++) {
|
|
if (i > 0) out = sdscat(out,config.mb_delim);
|
|
tmp = cliFormatReplyRaw(r->element[i]);
|
|
out = sdscatlen(out,tmp,sdslen(tmp));
|
|
sdsfree(tmp);
|
|
}
|
|
break;
|
|
default:
|
|
fprintf(stderr,"Unknown reply type: %d\n", r->type);
|
|
exit(1);
|
|
}
|
|
return out;
|
|
}
|
|
|
|
static sds cliFormatReplyCSV(redisReply *r) {
|
|
unsigned int i;
|
|
|
|
sds out = sdsempty();
|
|
switch (r->type) {
|
|
case REDIS_REPLY_ERROR:
|
|
out = sdscat(out,"ERROR,");
|
|
out = sdscatrepr(out,r->str,strlen(r->str));
|
|
break;
|
|
case REDIS_REPLY_STATUS:
|
|
out = sdscatrepr(out,r->str,r->len);
|
|
break;
|
|
case REDIS_REPLY_INTEGER:
|
|
out = sdscatprintf(out,"%lld",r->integer);
|
|
break;
|
|
case REDIS_REPLY_STRING:
|
|
out = sdscatrepr(out,r->str,r->len);
|
|
break;
|
|
case REDIS_REPLY_NIL:
|
|
out = sdscat(out,"NIL");
|
|
break;
|
|
case REDIS_REPLY_ARRAY:
|
|
for (i = 0; i < r->elements; i++) {
|
|
sds tmp = cliFormatReplyCSV(r->element[i]);
|
|
out = sdscatlen(out,tmp,sdslen(tmp));
|
|
if (i != r->elements-1) out = sdscat(out,",");
|
|
sdsfree(tmp);
|
|
}
|
|
break;
|
|
default:
|
|
fprintf(stderr,"Unknown reply type: %d\n", r->type);
|
|
exit(1);
|
|
}
|
|
return out;
|
|
}
|
|
|
|
static int cliReadReply(int output_raw_strings) {
|
|
void *_reply;
|
|
redisReply *reply;
|
|
sds out = NULL;
|
|
int output = 1;
|
|
|
|
if (redisGetReply(context,&_reply) != REDIS_OK) {
|
|
if (config.shutdown) {
|
|
redisFree(context);
|
|
context = NULL;
|
|
return REDIS_OK;
|
|
}
|
|
if (config.interactive) {
|
|
/* Filter cases where we should reconnect */
|
|
if (context->err == REDIS_ERR_IO &&
|
|
(errno == ECONNRESET || errno == EPIPE))
|
|
return REDIS_ERR;
|
|
if (context->err == REDIS_ERR_EOF)
|
|
return REDIS_ERR;
|
|
}
|
|
cliPrintContextError();
|
|
exit(1);
|
|
return REDIS_ERR; /* avoid compiler warning */
|
|
}
|
|
|
|
reply = (redisReply*)_reply;
|
|
|
|
config.last_cmd_type = reply->type;
|
|
|
|
/* Check if we need to connect to a different node and reissue the
|
|
* request. */
|
|
if (config.cluster_mode && reply->type == REDIS_REPLY_ERROR &&
|
|
(!strncmp(reply->str,"MOVED",5) || !strcmp(reply->str,"ASK")))
|
|
{
|
|
char *p = reply->str, *s;
|
|
int slot;
|
|
|
|
output = 0;
|
|
/* Comments show the position of the pointer as:
|
|
*
|
|
* [S] for pointer 's'
|
|
* [P] for pointer 'p'
|
|
*/
|
|
s = strchr(p,' '); /* MOVED[S]3999 127.0.0.1:6381 */
|
|
p = strchr(s+1,' '); /* MOVED[S]3999[P]127.0.0.1:6381 */
|
|
*p = '\0';
|
|
slot = atoi(s+1);
|
|
s = strrchr(p+1,':'); /* MOVED 3999[P]127.0.0.1[S]6381 */
|
|
*s = '\0';
|
|
sdsfree(config.hostip);
|
|
config.hostip = sdsnew(p+1);
|
|
config.hostport = atoi(s+1);
|
|
if (config.interactive)
|
|
printf("-> Redirected to slot [%d] located at %s:%d\n",
|
|
slot, config.hostip, config.hostport);
|
|
config.cluster_reissue_command = 1;
|
|
cliRefreshPrompt();
|
|
}
|
|
|
|
if (output) {
|
|
if (output_raw_strings) {
|
|
out = cliFormatReplyRaw(reply);
|
|
} else {
|
|
if (config.output == OUTPUT_RAW) {
|
|
out = cliFormatReplyRaw(reply);
|
|
out = sdscat(out,"\n");
|
|
} else if (config.output == OUTPUT_STANDARD) {
|
|
out = cliFormatReplyTTY(reply,"");
|
|
} else if (config.output == OUTPUT_CSV) {
|
|
out = cliFormatReplyCSV(reply);
|
|
out = sdscat(out,"\n");
|
|
}
|
|
}
|
|
fwrite(out,sdslen(out),1,stdout);
|
|
sdsfree(out);
|
|
}
|
|
freeReplyObject(reply);
|
|
return REDIS_OK;
|
|
}
|
|
|
|
static int cliSendCommand(int argc, char **argv, long repeat) {
|
|
char *command = argv[0];
|
|
size_t *argvlen;
|
|
int j, output_raw;
|
|
|
|
if (!config.eval_ldb && /* In debugging mode, let's pass "help" to Redis. */
|
|
(!strcasecmp(command,"help") || !strcasecmp(command,"?"))) {
|
|
cliOutputHelp(--argc, ++argv);
|
|
return REDIS_OK;
|
|
}
|
|
|
|
if (context == NULL) return REDIS_ERR;
|
|
|
|
output_raw = 0;
|
|
if (!strcasecmp(command,"info") ||
|
|
(argc >= 2 && !strcasecmp(command,"debug") &&
|
|
!strcasecmp(argv[1],"htstats")) ||
|
|
(argc >= 2 && !strcasecmp(command,"debug") &&
|
|
!strcasecmp(argv[1],"htstats-key")) ||
|
|
(argc >= 2 && !strcasecmp(command,"memory") &&
|
|
(!strcasecmp(argv[1],"malloc-stats") ||
|
|
!strcasecmp(argv[1],"doctor"))) ||
|
|
(argc == 2 && !strcasecmp(command,"cluster") &&
|
|
(!strcasecmp(argv[1],"nodes") ||
|
|
!strcasecmp(argv[1],"info"))) ||
|
|
(argc >= 2 && !strcasecmp(command,"client") &&
|
|
!strcasecmp(argv[1],"list")) ||
|
|
(argc == 3 && !strcasecmp(command,"latency") &&
|
|
!strcasecmp(argv[1],"graph")) ||
|
|
(argc == 2 && !strcasecmp(command,"latency") &&
|
|
!strcasecmp(argv[1],"doctor")))
|
|
{
|
|
output_raw = 1;
|
|
}
|
|
|
|
if (!strcasecmp(command,"shutdown")) config.shutdown = 1;
|
|
if (!strcasecmp(command,"monitor")) config.monitor_mode = 1;
|
|
if (!strcasecmp(command,"subscribe") ||
|
|
!strcasecmp(command,"psubscribe")) config.pubsub_mode = 1;
|
|
if (!strcasecmp(command,"sync") ||
|
|
!strcasecmp(command,"psync")) config.slave_mode = 1;
|
|
|
|
/* When the user manually calls SCRIPT DEBUG, setup the activation of
|
|
* debugging mode on the next eval if needed. */
|
|
if (argc == 3 && !strcasecmp(argv[0],"script") &&
|
|
!strcasecmp(argv[1],"debug"))
|
|
{
|
|
if (!strcasecmp(argv[2],"yes") || !strcasecmp(argv[2],"sync")) {
|
|
config.enable_ldb_on_eval = 1;
|
|
} else {
|
|
config.enable_ldb_on_eval = 0;
|
|
}
|
|
}
|
|
|
|
/* Actually activate LDB on EVAL if needed. */
|
|
if (!strcasecmp(command,"eval") && config.enable_ldb_on_eval) {
|
|
config.eval_ldb = 1;
|
|
config.output = OUTPUT_RAW;
|
|
}
|
|
|
|
/* Setup argument length */
|
|
argvlen = zmalloc(argc*sizeof(size_t));
|
|
for (j = 0; j < argc; j++)
|
|
argvlen[j] = sdslen(argv[j]);
|
|
|
|
while(repeat-- > 0) {
|
|
redisAppendCommandArgv(context,argc,(const char**)argv,argvlen);
|
|
while (config.monitor_mode) {
|
|
if (cliReadReply(output_raw) != REDIS_OK) exit(1);
|
|
fflush(stdout);
|
|
}
|
|
|
|
if (config.pubsub_mode) {
|
|
if (config.output != OUTPUT_RAW)
|
|
printf("Reading messages... (press Ctrl-C to quit)\n");
|
|
while (1) {
|
|
if (cliReadReply(output_raw) != REDIS_OK) exit(1);
|
|
}
|
|
}
|
|
|
|
if (config.slave_mode) {
|
|
printf("Entering slave output mode... (press Ctrl-C to quit)\n");
|
|
slaveMode();
|
|
config.slave_mode = 0;
|
|
zfree(argvlen);
|
|
return REDIS_ERR; /* Error = slaveMode lost connection to master */
|
|
}
|
|
|
|
if (cliReadReply(output_raw) != REDIS_OK) {
|
|
zfree(argvlen);
|
|
return REDIS_ERR;
|
|
} else {
|
|
/* Store database number when SELECT was successfully executed. */
|
|
if (!strcasecmp(command,"select") && argc == 2 && config.last_cmd_type != REDIS_REPLY_ERROR) {
|
|
config.dbnum = atoi(argv[1]);
|
|
cliRefreshPrompt();
|
|
} else if (!strcasecmp(command,"auth") && argc == 2) {
|
|
cliSelect();
|
|
}
|
|
}
|
|
if (config.interval) usleep(config.interval);
|
|
fflush(stdout); /* Make it grep friendly */
|
|
}
|
|
|
|
zfree(argvlen);
|
|
return REDIS_OK;
|
|
}
|
|
|
|
/* Send a command reconnecting the link if needed. */
|
|
static redisReply *reconnectingRedisCommand(redisContext *c, const char *fmt, ...) {
|
|
redisReply *reply = NULL;
|
|
int tries = 0;
|
|
va_list ap;
|
|
|
|
assert(!c->err);
|
|
while(reply == NULL) {
|
|
while (c->err & (REDIS_ERR_IO | REDIS_ERR_EOF)) {
|
|
printf("\r\x1b[0K"); /* Cursor to left edge + clear line. */
|
|
printf("Reconnecting... %d\r", ++tries);
|
|
fflush(stdout);
|
|
|
|
redisFree(c);
|
|
c = redisConnect(config.hostip,config.hostport);
|
|
usleep(1000000);
|
|
}
|
|
|
|
va_start(ap,fmt);
|
|
reply = redisvCommand(c,fmt,ap);
|
|
va_end(ap);
|
|
|
|
if (c->err && !(c->err & (REDIS_ERR_IO | REDIS_ERR_EOF))) {
|
|
fprintf(stderr, "Error: %s\n", c->errstr);
|
|
exit(1);
|
|
} else if (tries > 0) {
|
|
printf("\r\x1b[0K"); /* Cursor to left edge + clear line. */
|
|
}
|
|
}
|
|
|
|
context = c;
|
|
return reply;
|
|
}
|
|
|
|
/*------------------------------------------------------------------------------
|
|
* User interface
|
|
*--------------------------------------------------------------------------- */
|
|
|
|
static int parseOptions(int argc, char **argv) {
|
|
int i;
|
|
|
|
for (i = 1; i < argc; i++) {
|
|
int lastarg = i==argc-1;
|
|
|
|
if (!strcmp(argv[i],"-h") && !lastarg) {
|
|
sdsfree(config.hostip);
|
|
config.hostip = sdsnew(argv[++i]);
|
|
} else if (!strcmp(argv[i],"-h") && lastarg) {
|
|
usage();
|
|
} else if (!strcmp(argv[i],"--help")) {
|
|
usage();
|
|
} else if (!strcmp(argv[i],"-x")) {
|
|
config.stdinarg = 1;
|
|
} else if (!strcmp(argv[i],"-p") && !lastarg) {
|
|
config.hostport = atoi(argv[++i]);
|
|
} else if (!strcmp(argv[i],"-s") && !lastarg) {
|
|
config.hostsocket = argv[++i];
|
|
} else if (!strcmp(argv[i],"-r") && !lastarg) {
|
|
config.repeat = strtoll(argv[++i],NULL,10);
|
|
} else if (!strcmp(argv[i],"-i") && !lastarg) {
|
|
double seconds = atof(argv[++i]);
|
|
config.interval = seconds*1000000;
|
|
} else if (!strcmp(argv[i],"-n") && !lastarg) {
|
|
config.dbnum = atoi(argv[++i]);
|
|
} else if (!strcmp(argv[i], "--no-auth-warning")) {
|
|
config.no_auth_warning = 1;
|
|
} else if (!strcmp(argv[i],"-a") && !lastarg) {
|
|
config.auth = argv[++i];
|
|
} else if (!strcmp(argv[i],"-u") && !lastarg) {
|
|
parseRedisUri(argv[++i]);
|
|
} else if (!strcmp(argv[i],"--raw")) {
|
|
config.output = OUTPUT_RAW;
|
|
} else if (!strcmp(argv[i],"--no-raw")) {
|
|
config.output = OUTPUT_STANDARD;
|
|
} else if (!strcmp(argv[i],"--csv")) {
|
|
config.output = OUTPUT_CSV;
|
|
} else if (!strcmp(argv[i],"--latency")) {
|
|
config.latency_mode = 1;
|
|
} else if (!strcmp(argv[i],"--latency-dist")) {
|
|
config.latency_dist_mode = 1;
|
|
} else if (!strcmp(argv[i],"--mono")) {
|
|
spectrum_palette = spectrum_palette_mono;
|
|
spectrum_palette_size = spectrum_palette_mono_size;
|
|
} else if (!strcmp(argv[i],"--latency-history")) {
|
|
config.latency_mode = 1;
|
|
config.latency_history = 1;
|
|
} else if (!strcmp(argv[i],"--lru-test") && !lastarg) {
|
|
config.lru_test_mode = 1;
|
|
config.lru_test_sample_size = strtoll(argv[++i],NULL,10);
|
|
} else if (!strcmp(argv[i],"--slave")) {
|
|
config.slave_mode = 1;
|
|
} else if (!strcmp(argv[i],"--stat")) {
|
|
config.stat_mode = 1;
|
|
} else if (!strcmp(argv[i],"--scan")) {
|
|
config.scan_mode = 1;
|
|
} else if (!strcmp(argv[i],"--pattern") && !lastarg) {
|
|
config.pattern = argv[++i];
|
|
} else if (!strcmp(argv[i],"--intrinsic-latency") && !lastarg) {
|
|
config.intrinsic_latency_mode = 1;
|
|
config.intrinsic_latency_duration = atoi(argv[++i]);
|
|
} else if (!strcmp(argv[i],"--rdb") && !lastarg) {
|
|
config.getrdb_mode = 1;
|
|
config.rdb_filename = argv[++i];
|
|
} else if (!strcmp(argv[i],"--pipe")) {
|
|
config.pipe_mode = 1;
|
|
} else if (!strcmp(argv[i],"--pipe-timeout") && !lastarg) {
|
|
config.pipe_timeout = atoi(argv[++i]);
|
|
} else if (!strcmp(argv[i],"--bigkeys")) {
|
|
config.bigkeys = 1;
|
|
} else if (!strcmp(argv[i],"--hotkeys")) {
|
|
config.hotkeys = 1;
|
|
} else if (!strcmp(argv[i],"--eval") && !lastarg) {
|
|
config.eval = argv[++i];
|
|
} else if (!strcmp(argv[i],"--ldb")) {
|
|
config.eval_ldb = 1;
|
|
config.output = OUTPUT_RAW;
|
|
} else if (!strcmp(argv[i],"--ldb-sync-mode")) {
|
|
config.eval_ldb = 1;
|
|
config.eval_ldb_sync = 1;
|
|
config.output = OUTPUT_RAW;
|
|
} else if (!strcmp(argv[i],"-c")) {
|
|
config.cluster_mode = 1;
|
|
} else if (!strcmp(argv[i],"-d") && !lastarg) {
|
|
sdsfree(config.mb_delim);
|
|
config.mb_delim = sdsnew(argv[++i]);
|
|
} else if (!strcmp(argv[i],"--verbose")) {
|
|
config.verbose = 1;
|
|
} else if (!strcmp(argv[i],"--cluster") && !lastarg) {
|
|
if (CLUSTER_MANAGER_MODE()) usage();
|
|
char *cmd = argv[++i];
|
|
int j = i;
|
|
while (j < argc && argv[j][0] != '-') j++;
|
|
if (j > i) j--;
|
|
createClusterManagerCommand(cmd, j - i, argv + i + 1);
|
|
i = j;
|
|
} else if (!strcmp(argv[i],"--cluster") && lastarg) {
|
|
usage();
|
|
} else if (!strcmp(argv[i],"--cluster-replicas") && !lastarg) {
|
|
config.cluster_manager_command.replicas = atoi(argv[++i]);
|
|
} else if (!strcmp(argv[i],"--cluster-master-id") && !lastarg) {
|
|
config.cluster_manager_command.master_id = argv[++i];
|
|
} else if (!strcmp(argv[i],"--cluster-from") && !lastarg) {
|
|
config.cluster_manager_command.from = argv[++i];
|
|
} else if (!strcmp(argv[i],"--cluster-to") && !lastarg) {
|
|
config.cluster_manager_command.to = argv[++i];
|
|
} else if (!strcmp(argv[i],"--cluster-weight") && !lastarg) {
|
|
int widx = i + 1;
|
|
char **weight = argv + widx;
|
|
int wargc = 0;
|
|
for (; widx < argc; widx++) {
|
|
if (strstr(argv[widx], "--") == argv[widx]) break;
|
|
wargc++;
|
|
}
|
|
if (wargc > 0) {
|
|
config.cluster_manager_command.weight = weight;
|
|
config.cluster_manager_command.weight_argc = wargc;
|
|
i += wargc;
|
|
}
|
|
} else if (!strcmp(argv[i],"--cluster-slots") && !lastarg) {
|
|
config.cluster_manager_command.slots = atoi(argv[++i]);
|
|
} else if (!strcmp(argv[i],"--cluster-timeout") && !lastarg) {
|
|
config.cluster_manager_command.timeout = atoi(argv[++i]);
|
|
} else if (!strcmp(argv[i],"--cluster-pipeline") && !lastarg) {
|
|
config.cluster_manager_command.pipeline = atoi(argv[++i]);
|
|
} else if (!strcmp(argv[i],"--cluster-threshold") && !lastarg) {
|
|
config.cluster_manager_command.threshold = atof(argv[++i]);
|
|
} else if (!strcmp(argv[i],"--cluster-yes")) {
|
|
config.cluster_manager_command.flags |=
|
|
CLUSTER_MANAGER_CMD_FLAG_YES;
|
|
} else if (!strcmp(argv[i],"--cluster-simulate")) {
|
|
config.cluster_manager_command.flags |=
|
|
CLUSTER_MANAGER_CMD_FLAG_SIMULATE;
|
|
} else if (!strcmp(argv[i],"--cluster-replace")) {
|
|
config.cluster_manager_command.flags |=
|
|
CLUSTER_MANAGER_CMD_FLAG_REPLACE;
|
|
} else if (!strcmp(argv[i],"--cluster-copy")) {
|
|
config.cluster_manager_command.flags |=
|
|
CLUSTER_MANAGER_CMD_FLAG_COPY;
|
|
} else if (!strcmp(argv[i],"--cluster-slave")) {
|
|
config.cluster_manager_command.flags |=
|
|
CLUSTER_MANAGER_CMD_FLAG_SLAVE;
|
|
} else if (!strcmp(argv[i],"--cluster-use-empty-masters")) {
|
|
config.cluster_manager_command.flags |=
|
|
CLUSTER_MANAGER_CMD_FLAG_EMPTYMASTER;
|
|
} else if (!strcmp(argv[i],"-v") || !strcmp(argv[i], "--version")) {
|
|
sds version = cliVersion();
|
|
printf("redis-cli %s\n", version);
|
|
sdsfree(version);
|
|
exit(0);
|
|
} else if (CLUSTER_MANAGER_MODE() && argv[i][0] != '-') {
|
|
if (config.cluster_manager_command.argc == 0) {
|
|
int j = i + 1;
|
|
while (j < argc && argv[j][0] != '-') j++;
|
|
int cmd_argc = j - i;
|
|
config.cluster_manager_command.argc = cmd_argc;
|
|
config.cluster_manager_command.argv = argv + i;
|
|
if (cmd_argc > 1) i = j - 1;
|
|
}
|
|
} else {
|
|
if (argv[i][0] == '-') {
|
|
fprintf(stderr,
|
|
"Unrecognized option or bad number of args for: '%s'\n",
|
|
argv[i]);
|
|
exit(1);
|
|
} else {
|
|
/* Likely the command name, stop here. */
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
/* --ldb requires --eval. */
|
|
if (config.eval_ldb && config.eval == NULL) {
|
|
fprintf(stderr,"Options --ldb and --ldb-sync-mode require --eval.\n");
|
|
fprintf(stderr,"Try %s --help for more information.\n", argv[0]);
|
|
exit(1);
|
|
}
|
|
|
|
if (!config.no_auth_warning && config.auth != NULL) {
|
|
fputs("Warning: Using a password with '-a' or '-u' option on the command"
|
|
" line interface may not be safe.\n", stderr);
|
|
}
|
|
|
|
return i;
|
|
}
|
|
|
|
static sds readArgFromStdin(void) {
|
|
char buf[1024];
|
|
sds arg = sdsempty();
|
|
|
|
while(1) {
|
|
int nread = read(fileno(stdin),buf,1024);
|
|
|
|
if (nread == 0) break;
|
|
else if (nread == -1) {
|
|
perror("Reading from standard input");
|
|
exit(1);
|
|
}
|
|
arg = sdscatlen(arg,buf,nread);
|
|
}
|
|
return arg;
|
|
}
|
|
|
|
static void usage(void) {
|
|
sds version = cliVersion();
|
|
fprintf(stderr,
|
|
"redis-cli %s\n"
|
|
"\n"
|
|
"Usage: redis-cli [OPTIONS] [cmd [arg [arg ...]]]\n"
|
|
" -h <hostname> Server hostname (default: 127.0.0.1).\n"
|
|
" -p <port> Server port (default: 6379).\n"
|
|
" -s <socket> Server socket (overrides hostname and port).\n"
|
|
" -a <password> Password to use when connecting to the server.\n"
|
|
" -u <uri> Server URI.\n"
|
|
" -r <repeat> Execute specified command N times.\n"
|
|
" -i <interval> When -r is used, waits <interval> seconds per command.\n"
|
|
" It is possible to specify sub-second times like -i 0.1.\n"
|
|
" -n <db> Database number.\n"
|
|
" -x Read last argument from STDIN.\n"
|
|
" -d <delimiter> Multi-bulk delimiter in for raw formatting (default: \\n).\n"
|
|
" -c Enable cluster mode (follow -ASK and -MOVED redirections).\n"
|
|
" --raw Use raw formatting for replies (default when STDOUT is\n"
|
|
" not a tty).\n"
|
|
" --no-raw Force formatted output even when STDOUT is not a tty.\n"
|
|
" --csv Output in CSV format.\n"
|
|
" --stat Print rolling stats about server: mem, clients, ...\n"
|
|
" --latency Enter a special mode continuously sampling latency.\n"
|
|
" If you use this mode in an interactive session it runs\n"
|
|
" forever displaying real-time stats. Otherwise if --raw or\n"
|
|
" --csv is specified, or if you redirect the output to a non\n"
|
|
" TTY, it samples the latency for 1 second (you can use\n"
|
|
" -i to change the interval), then produces a single output\n"
|
|
" and exits.\n"
|
|
" --latency-history Like --latency but tracking latency changes over time.\n"
|
|
" Default time interval is 15 sec. Change it using -i.\n"
|
|
" --latency-dist Shows latency as a spectrum, requires xterm 256 colors.\n"
|
|
" Default time interval is 1 sec. Change it using -i.\n"
|
|
" --lru-test <keys> Simulate a cache workload with an 80-20 distribution.\n"
|
|
" --slave Simulate a slave showing commands received from the master.\n"
|
|
" --rdb <filename> Transfer an RDB dump from remote server to local file.\n"
|
|
" --pipe Transfer raw Redis protocol from stdin to server.\n"
|
|
" --pipe-timeout <n> In --pipe mode, abort with error if after sending all data.\n"
|
|
" no reply is received within <n> seconds.\n"
|
|
" Default timeout: %d. Use 0 to wait forever.\n"
|
|
" --bigkeys Sample Redis keys looking for big keys.\n"
|
|
" --hotkeys Sample Redis keys looking for hot keys.\n"
|
|
" only works when maxmemory-policy is *lfu.\n"
|
|
" --scan List all keys using the SCAN command.\n"
|
|
" --pattern <pat> Useful with --scan to specify a SCAN pattern.\n"
|
|
" --intrinsic-latency <sec> Run a test to measure intrinsic system latency.\n"
|
|
" The test will run for the specified amount of seconds.\n"
|
|
" --eval <file> Send an EVAL command using the Lua script at <file>.\n"
|
|
" --ldb Used with --eval enable the Redis Lua debugger.\n"
|
|
" --ldb-sync-mode Like --ldb but uses the synchronous Lua debugger, in\n"
|
|
" this mode the server is blocked and script changes are\n"
|
|
" are not rolled back from the server memory.\n"
|
|
" --cluster <command> [args...] [opts...]\n"
|
|
" Cluster Manager command and arguments (see below).\n"
|
|
" --verbose Verbose mode.\n"
|
|
" --no-auth-warning Don't show warning message when using password on command\n"
|
|
" line interface.\n"
|
|
" --help Output this help and exit.\n"
|
|
" --version Output version and exit.\n"
|
|
"\n",
|
|
version, REDIS_CLI_DEFAULT_PIPE_TIMEOUT);
|
|
/* Using another fprintf call to avoid -Woverlength-strings compile warning */
|
|
fprintf(stderr,
|
|
"Cluster Manager Commands:\n"
|
|
" Use --cluster help to list all available cluster manager commands.\n"
|
|
"\n"
|
|
"Examples:\n"
|
|
" cat /etc/passwd | redis-cli -x set mypasswd\n"
|
|
" redis-cli get mypasswd\n"
|
|
" redis-cli -r 100 lpush mylist x\n"
|
|
" redis-cli -r 100 -i 1 info | grep used_memory_human:\n"
|
|
" redis-cli --eval myscript.lua key1 key2 , arg1 arg2 arg3\n"
|
|
" redis-cli --scan --pattern '*:12345*'\n"
|
|
"\n"
|
|
" (Note: when using --eval the comma separates KEYS[] from ARGV[] items)\n"
|
|
"\n"
|
|
"When no command is given, redis-cli starts in interactive mode.\n"
|
|
"Type \"help\" in interactive mode for information on available commands\n"
|
|
"and settings.\n"
|
|
"\n");
|
|
sdsfree(version);
|
|
exit(1);
|
|
}
|
|
|
|
static int confirmWithYes(char *msg) {
|
|
printf("%s (type 'yes' to accept): ", msg);
|
|
fflush(stdout);
|
|
char buf[4];
|
|
int nread = read(fileno(stdin),buf,4);
|
|
buf[3] = '\0';
|
|
return (nread != 0 && !strcmp("yes", buf));
|
|
}
|
|
|
|
/* Turn the plain C strings into Sds strings */
|
|
static char **convertToSds(int count, char** args) {
|
|
int j;
|
|
char **sds = zmalloc(sizeof(char*)*count);
|
|
|
|
for(j = 0; j < count; j++)
|
|
sds[j] = sdsnew(args[j]);
|
|
|
|
return sds;
|
|
}
|
|
|
|
static int issueCommandRepeat(int argc, char **argv, long repeat) {
|
|
while (1) {
|
|
config.cluster_reissue_command = 0;
|
|
if (cliSendCommand(argc,argv,repeat) != REDIS_OK) {
|
|
cliConnect(1);
|
|
|
|
/* If we still cannot send the command print error.
|
|
* We'll try to reconnect the next time. */
|
|
if (cliSendCommand(argc,argv,repeat) != REDIS_OK) {
|
|
cliPrintContextError();
|
|
return REDIS_ERR;
|
|
}
|
|
}
|
|
/* Issue the command again if we got redirected in cluster mode */
|
|
if (config.cluster_mode && config.cluster_reissue_command) {
|
|
cliConnect(1);
|
|
} else {
|
|
break;
|
|
}
|
|
}
|
|
return REDIS_OK;
|
|
}
|
|
|
|
static int issueCommand(int argc, char **argv) {
|
|
return issueCommandRepeat(argc, argv, config.repeat);
|
|
}
|
|
|
|
/* Split the user provided command into multiple SDS arguments.
|
|
* This function normally uses sdssplitargs() from sds.c which is able
|
|
* to understand "quoted strings", escapes and so forth. However when
|
|
* we are in Lua debugging mode and the "eval" command is used, we want
|
|
* the remaining Lua script (after "e " or "eval ") to be passed verbatim
|
|
* as a single big argument. */
|
|
static sds *cliSplitArgs(char *line, int *argc) {
|
|
if (config.eval_ldb && (strstr(line,"eval ") == line ||
|
|
strstr(line,"e ") == line))
|
|
{
|
|
sds *argv = sds_malloc(sizeof(sds)*2);
|
|
*argc = 2;
|
|
int len = strlen(line);
|
|
int elen = line[1] == ' ' ? 2 : 5; /* "e " or "eval "? */
|
|
argv[0] = sdsnewlen(line,elen-1);
|
|
argv[1] = sdsnewlen(line+elen,len-elen);
|
|
return argv;
|
|
} else {
|
|
return sdssplitargs(line,argc);
|
|
}
|
|
}
|
|
|
|
/* Set the CLI preferences. This function is invoked when an interactive
|
|
* ":command" is called, or when reading ~/.redisclirc file, in order to
|
|
* set user preferences. */
|
|
void cliSetPreferences(char **argv, int argc, int interactive) {
|
|
if (!strcasecmp(argv[0],":set") && argc >= 2) {
|
|
if (!strcasecmp(argv[1],"hints")) pref.hints = 1;
|
|
else if (!strcasecmp(argv[1],"nohints")) pref.hints = 0;
|
|
else {
|
|
printf("%sunknown redis-cli preference '%s'\n",
|
|
interactive ? "" : ".redisclirc: ",
|
|
argv[1]);
|
|
}
|
|
} else {
|
|
printf("%sunknown redis-cli internal command '%s'\n",
|
|
interactive ? "" : ".redisclirc: ",
|
|
argv[0]);
|
|
}
|
|
}
|
|
|
|
/* Load the ~/.redisclirc file if any. */
|
|
void cliLoadPreferences(void) {
|
|
sds rcfile = getDotfilePath(REDIS_CLI_RCFILE_ENV,REDIS_CLI_RCFILE_DEFAULT);
|
|
if (rcfile == NULL) return;
|
|
FILE *fp = fopen(rcfile,"r");
|
|
char buf[1024];
|
|
|
|
if (fp) {
|
|
while(fgets(buf,sizeof(buf),fp) != NULL) {
|
|
sds *argv;
|
|
int argc;
|
|
|
|
argv = sdssplitargs(buf,&argc);
|
|
if (argc > 0) cliSetPreferences(argv,argc,0);
|
|
sdsfreesplitres(argv,argc);
|
|
}
|
|
fclose(fp);
|
|
}
|
|
sdsfree(rcfile);
|
|
}
|
|
|
|
static void repl(void) {
|
|
sds historyfile = NULL;
|
|
int history = 0;
|
|
char *line;
|
|
int argc;
|
|
sds *argv;
|
|
|
|
/* Initialize the help and, if possible, use the COMMAND command in order
|
|
* to retrieve missing entries. */
|
|
cliInitHelp();
|
|
cliIntegrateHelp();
|
|
|
|
config.interactive = 1;
|
|
linenoiseSetMultiLine(1);
|
|
linenoiseSetCompletionCallback(completionCallback);
|
|
linenoiseSetHintsCallback(hintsCallback);
|
|
linenoiseSetFreeHintsCallback(freeHintsCallback);
|
|
|
|
/* Only use history and load the rc file when stdin is a tty. */
|
|
if (isatty(fileno(stdin))) {
|
|
historyfile = getDotfilePath(REDIS_CLI_HISTFILE_ENV,REDIS_CLI_HISTFILE_DEFAULT);
|
|
//keep in-memory history always regardless if history file can be determined
|
|
history = 1;
|
|
if (historyfile != NULL) {
|
|
linenoiseHistoryLoad(historyfile);
|
|
}
|
|
cliLoadPreferences();
|
|
}
|
|
|
|
cliRefreshPrompt();
|
|
while((line = linenoise(context ? config.prompt : "not connected> ")) != NULL) {
|
|
if (line[0] != '\0') {
|
|
long repeat = 1;
|
|
int skipargs = 0;
|
|
char *endptr = NULL;
|
|
|
|
argv = cliSplitArgs(line,&argc);
|
|
|
|
/* check if we have a repeat command option and
|
|
* need to skip the first arg */
|
|
if (argv && argc > 0) {
|
|
errno = 0;
|
|
repeat = strtol(argv[0], &endptr, 10);
|
|
if (argc > 1 && *endptr == '\0') {
|
|
if (errno == ERANGE || errno == EINVAL || repeat <= 0) {
|
|
fputs("Invalid redis-cli repeat command option value.\n", stdout);
|
|
sdsfreesplitres(argv, argc);
|
|
linenoiseFree(line);
|
|
continue;
|
|
}
|
|
skipargs = 1;
|
|
} else {
|
|
repeat = 1;
|
|
}
|
|
}
|
|
|
|
/* Won't save auth command in history file */
|
|
if (!(argv && argc > 0 && !strcasecmp(argv[0+skipargs], "auth"))) {
|
|
if (history) linenoiseHistoryAdd(line);
|
|
if (historyfile) linenoiseHistorySave(historyfile);
|
|
}
|
|
|
|
if (argv == NULL) {
|
|
printf("Invalid argument(s)\n");
|
|
linenoiseFree(line);
|
|
continue;
|
|
} else if (argc > 0) {
|
|
if (strcasecmp(argv[0],"quit") == 0 ||
|
|
strcasecmp(argv[0],"exit") == 0)
|
|
{
|
|
exit(0);
|
|
} else if (argv[0][0] == ':') {
|
|
cliSetPreferences(argv,argc,1);
|
|
sdsfreesplitres(argv,argc);
|
|
linenoiseFree(line);
|
|
continue;
|
|
} else if (strcasecmp(argv[0],"restart") == 0) {
|
|
if (config.eval) {
|
|
config.eval_ldb = 1;
|
|
config.output = OUTPUT_RAW;
|
|
return; /* Return to evalMode to restart the session. */
|
|
} else {
|
|
printf("Use 'restart' only in Lua debugging mode.");
|
|
}
|
|
} else if (argc == 3 && !strcasecmp(argv[0],"connect")) {
|
|
sdsfree(config.hostip);
|
|
config.hostip = sdsnew(argv[1]);
|
|
config.hostport = atoi(argv[2]);
|
|
cliRefreshPrompt();
|
|
cliConnect(1);
|
|
} else if (argc == 1 && !strcasecmp(argv[0],"clear")) {
|
|
linenoiseClearScreen();
|
|
} else {
|
|
long long start_time = mstime(), elapsed;
|
|
|
|
issueCommandRepeat(argc-skipargs, argv+skipargs, repeat);
|
|
|
|
/* If our debugging session ended, show the EVAL final
|
|
* reply. */
|
|
if (config.eval_ldb_end) {
|
|
config.eval_ldb_end = 0;
|
|
cliReadReply(0);
|
|
printf("\n(Lua debugging session ended%s)\n\n",
|
|
config.eval_ldb_sync ? "" :
|
|
" -- dataset changes rolled back");
|
|
}
|
|
|
|
elapsed = mstime()-start_time;
|
|
if (elapsed >= 500 &&
|
|
config.output == OUTPUT_STANDARD)
|
|
{
|
|
printf("(%.2fs)\n",(double)elapsed/1000);
|
|
}
|
|
}
|
|
}
|
|
/* Free the argument vector */
|
|
sdsfreesplitres(argv,argc);
|
|
}
|
|
/* linenoise() returns malloc-ed lines like readline() */
|
|
linenoiseFree(line);
|
|
}
|
|
exit(0);
|
|
}
|
|
|
|
static int noninteractive(int argc, char **argv) {
|
|
int retval = 0;
|
|
if (config.stdinarg) {
|
|
argv = zrealloc(argv, (argc+1)*sizeof(char*));
|
|
argv[argc] = readArgFromStdin();
|
|
retval = issueCommand(argc+1, argv);
|
|
} else {
|
|
retval = issueCommand(argc, argv);
|
|
}
|
|
return retval;
|
|
}
|
|
|
|
/*------------------------------------------------------------------------------
|
|
* Eval mode
|
|
*--------------------------------------------------------------------------- */
|
|
|
|
static int evalMode(int argc, char **argv) {
|
|
sds script = NULL;
|
|
FILE *fp;
|
|
char buf[1024];
|
|
size_t nread;
|
|
char **argv2;
|
|
int j, got_comma, keys;
|
|
int retval = REDIS_OK;
|
|
|
|
while(1) {
|
|
if (config.eval_ldb) {
|
|
printf(
|
|
"Lua debugging session started, please use:\n"
|
|
"quit -- End the session.\n"
|
|
"restart -- Restart the script in debug mode again.\n"
|
|
"help -- Show Lua script debugging commands.\n\n"
|
|
);
|
|
}
|
|
|
|
sdsfree(script);
|
|
script = sdsempty();
|
|
got_comma = 0;
|
|
keys = 0;
|
|
|
|
/* Load the script from the file, as an sds string. */
|
|
fp = fopen(config.eval,"r");
|
|
if (!fp) {
|
|
fprintf(stderr,
|
|
"Can't open file '%s': %s\n", config.eval, strerror(errno));
|
|
exit(1);
|
|
}
|
|
while((nread = fread(buf,1,sizeof(buf),fp)) != 0) {
|
|
script = sdscatlen(script,buf,nread);
|
|
}
|
|
fclose(fp);
|
|
|
|
/* If we are debugging a script, enable the Lua debugger. */
|
|
if (config.eval_ldb) {
|
|
redisReply *reply = redisCommand(context,
|
|
config.eval_ldb_sync ?
|
|
"SCRIPT DEBUG sync": "SCRIPT DEBUG yes");
|
|
if (reply) freeReplyObject(reply);
|
|
}
|
|
|
|
/* Create our argument vector */
|
|
argv2 = zmalloc(sizeof(sds)*(argc+3));
|
|
argv2[0] = sdsnew("EVAL");
|
|
argv2[1] = script;
|
|
for (j = 0; j < argc; j++) {
|
|
if (!got_comma && argv[j][0] == ',' && argv[j][1] == 0) {
|
|
got_comma = 1;
|
|
continue;
|
|
}
|
|
argv2[j+3-got_comma] = sdsnew(argv[j]);
|
|
if (!got_comma) keys++;
|
|
}
|
|
argv2[2] = sdscatprintf(sdsempty(),"%d",keys);
|
|
|
|
/* Call it */
|
|
int eval_ldb = config.eval_ldb; /* Save it, may be reverteed. */
|
|
retval = issueCommand(argc+3-got_comma, argv2);
|
|
if (eval_ldb) {
|
|
if (!config.eval_ldb) {
|
|
/* If the debugging session ended immediately, there was an
|
|
* error compiling the script. Show it and don't enter
|
|
* the REPL at all. */
|
|
printf("Eval debugging session can't start:\n");
|
|
cliReadReply(0);
|
|
break; /* Return to the caller. */
|
|
} else {
|
|
strncpy(config.prompt,"lua debugger> ",sizeof(config.prompt));
|
|
repl();
|
|
/* Restart the session if repl() returned. */
|
|
cliConnect(1);
|
|
printf("\n");
|
|
}
|
|
} else {
|
|
break; /* Return to the caller. */
|
|
}
|
|
}
|
|
return retval;
|
|
}
|
|
|
|
/*------------------------------------------------------------------------------
|
|
* Cluster Manager
|
|
*--------------------------------------------------------------------------- */
|
|
|
|
/* The Cluster Manager global structure */
|
|
static struct clusterManager {
|
|
list *nodes; /* List of nodes in the configuration. */
|
|
list *errors;
|
|
} cluster_manager;
|
|
|
|
/* Used by clusterManagerFixSlotsCoverage */
|
|
dict *clusterManagerUncoveredSlots = NULL;
|
|
|
|
typedef struct clusterManagerNode {
|
|
redisContext *context;
|
|
sds name;
|
|
char *ip;
|
|
int port;
|
|
uint64_t current_epoch;
|
|
time_t ping_sent;
|
|
time_t ping_recv;
|
|
int flags;
|
|
list *flags_str; /* Flags string representations */
|
|
sds replicate; /* Master ID if node is a slave */
|
|
list replicas;
|
|
int dirty; /* Node has changes that can be flushed */
|
|
uint8_t slots[CLUSTER_MANAGER_SLOTS];
|
|
int slots_count;
|
|
int replicas_count;
|
|
list *friends;
|
|
sds *migrating; /* An array of sds where even strings are slots and odd
|
|
* strings are the destination node IDs. */
|
|
sds *importing; /* An array of sds where even strings are slots and odd
|
|
* strings are the source node IDs. */
|
|
int migrating_count; /* Length of the migrating array (migrating slots*2) */
|
|
int importing_count; /* Length of the importing array (importing slots*2) */
|
|
float weight; /* Weight used by rebalance */
|
|
int balance; /* Used by rebalance */
|
|
} clusterManagerNode;
|
|
|
|
/* Data structure used to represent a sequence of cluster nodes. */
|
|
typedef struct clusterManagerNodeArray {
|
|
clusterManagerNode **nodes; /* Actual nodes array */
|
|
clusterManagerNode **alloc; /* Pointer to the allocated memory */
|
|
int len; /* Actual length of the array */
|
|
int count; /* Non-NULL nodes count */
|
|
} clusterManagerNodeArray;
|
|
|
|
/* Used for the reshard table. */
|
|
typedef struct clusterManagerReshardTableItem {
|
|
clusterManagerNode *source;
|
|
int slot;
|
|
} clusterManagerReshardTableItem;
|
|
|
|
static dictType clusterManagerDictType = {
|
|
dictSdsHash, /* hash function */
|
|
NULL, /* key dup */
|
|
NULL, /* val dup */
|
|
dictSdsKeyCompare, /* key compare */
|
|
NULL, /* key destructor */
|
|
dictSdsDestructor /* val destructor */
|
|
};
|
|
|
|
typedef int clusterManagerCommandProc(int argc, char **argv);
|
|
|
|
/* Cluster Manager helper functions */
|
|
|
|
static clusterManagerNode *clusterManagerNewNode(char *ip, int port);
|
|
static clusterManagerNode *clusterManagerNodeByName(const char *name);
|
|
static clusterManagerNode *clusterManagerNodeByAbbreviatedName(const char *n);
|
|
static void clusterManagerNodeResetSlots(clusterManagerNode *node);
|
|
static int clusterManagerNodeIsCluster(clusterManagerNode *node, char **err);
|
|
static void clusterManagerPrintNotClusterNodeError(clusterManagerNode *node,
|
|
char *err);
|
|
static int clusterManagerNodeLoadInfo(clusterManagerNode *node, int opts,
|
|
char **err);
|
|
static int clusterManagerLoadInfoFromNode(clusterManagerNode *node, int opts);
|
|
static int clusterManagerNodeIsEmpty(clusterManagerNode *node, char **err);
|
|
static int clusterManagerGetAntiAffinityScore(clusterManagerNodeArray *ipnodes,
|
|
int ip_count, clusterManagerNode ***offending, int *offending_len);
|
|
static void clusterManagerOptimizeAntiAffinity(clusterManagerNodeArray *ipnodes,
|
|
int ip_count);
|
|
static sds clusterManagerNodeInfo(clusterManagerNode *node, int indent);
|
|
static void clusterManagerShowNodes(void);
|
|
static void clusterManagerShowClusterInfo(void);
|
|
static int clusterManagerFlushNodeConfig(clusterManagerNode *node, char **err);
|
|
static void clusterManagerWaitForClusterJoin(void);
|
|
static int clusterManagerCheckCluster(int quiet);
|
|
static void clusterManagerLog(int level, const char* fmt, ...);
|
|
static int clusterManagerIsConfigConsistent(void);
|
|
static void clusterManagerOnError(sds err);
|
|
static void clusterManagerNodeArrayInit(clusterManagerNodeArray *array,
|
|
int len);
|
|
static void clusterManagerNodeArrayReset(clusterManagerNodeArray *array);
|
|
static void clusterManagerNodeArrayShift(clusterManagerNodeArray *array,
|
|
clusterManagerNode **nodeptr);
|
|
static void clusterManagerNodeArrayAdd(clusterManagerNodeArray *array,
|
|
clusterManagerNode *node);
|
|
|
|
/* Cluster Manager commands. */
|
|
|
|
static int clusterManagerCommandCreate(int argc, char **argv);
|
|
static int clusterManagerCommandAddNode(int argc, char **argv);
|
|
static int clusterManagerCommandDeleteNode(int argc, char **argv);
|
|
static int clusterManagerCommandInfo(int argc, char **argv);
|
|
static int clusterManagerCommandCheck(int argc, char **argv);
|
|
static int clusterManagerCommandFix(int argc, char **argv);
|
|
static int clusterManagerCommandReshard(int argc, char **argv);
|
|
static int clusterManagerCommandRebalance(int argc, char **argv);
|
|
static int clusterManagerCommandSetTimeout(int argc, char **argv);
|
|
static int clusterManagerCommandImport(int argc, char **argv);
|
|
static int clusterManagerCommandCall(int argc, char **argv);
|
|
static int clusterManagerCommandHelp(int argc, char **argv);
|
|
|
|
typedef struct clusterManagerCommandDef {
|
|
char *name;
|
|
clusterManagerCommandProc *proc;
|
|
int arity;
|
|
char *args;
|
|
char *options;
|
|
} clusterManagerCommandDef;
|
|
|
|
clusterManagerCommandDef clusterManagerCommands[] = {
|
|
{"create", clusterManagerCommandCreate, -2, "host1:port1 ... hostN:portN",
|
|
"replicas <arg>"},
|
|
{"check", clusterManagerCommandCheck, -1, "host:port", NULL},
|
|
{"info", clusterManagerCommandInfo, -1, "host:port", NULL},
|
|
{"fix", clusterManagerCommandFix, -1, "host:port", NULL},
|
|
{"reshard", clusterManagerCommandReshard, -1, "host:port",
|
|
"from <arg>,to <arg>,slots <arg>,yes,timeout <arg>,pipeline <arg>"},
|
|
{"rebalance", clusterManagerCommandRebalance, -1, "host:port",
|
|
"weight <node1=w1...nodeN=wN>,use-empty-masters,"
|
|
"timeout <arg>,simulate,pipeline <arg>,threshold <arg>"},
|
|
{"add-node", clusterManagerCommandAddNode, 2,
|
|
"new_host:new_port existing_host:existing_port", "slave,master-id <arg>"},
|
|
{"del-node", clusterManagerCommandDeleteNode, 2, "host:port node_id",NULL},
|
|
{"call", clusterManagerCommandCall, -2,
|
|
"host:port command arg arg .. arg", NULL},
|
|
{"set-timeout", clusterManagerCommandSetTimeout, 2,
|
|
"host:port milliseconds", NULL},
|
|
{"import", clusterManagerCommandImport, 1, "host:port",
|
|
"from <arg>,copy,replace"},
|
|
{"help", clusterManagerCommandHelp, 0, NULL, NULL}
|
|
};
|
|
|
|
|
|
static void createClusterManagerCommand(char *cmdname, int argc, char **argv) {
|
|
clusterManagerCommand *cmd = &config.cluster_manager_command;
|
|
cmd->name = cmdname;
|
|
cmd->argc = argc;
|
|
cmd->argv = argc ? argv : NULL;
|
|
if (isColorTerm()) cmd->flags |= CLUSTER_MANAGER_CMD_FLAG_COLOR;
|
|
}
|
|
|
|
|
|
static clusterManagerCommandProc *validateClusterManagerCommand(void) {
|
|
int i, commands_count = sizeof(clusterManagerCommands) /
|
|
sizeof(clusterManagerCommandDef);
|
|
clusterManagerCommandProc *proc = NULL;
|
|
char *cmdname = config.cluster_manager_command.name;
|
|
int argc = config.cluster_manager_command.argc;
|
|
for (i = 0; i < commands_count; i++) {
|
|
clusterManagerCommandDef cmddef = clusterManagerCommands[i];
|
|
if (!strcmp(cmddef.name, cmdname)) {
|
|
if ((cmddef.arity > 0 && argc != cmddef.arity) ||
|
|
(cmddef.arity < 0 && argc < (cmddef.arity * -1))) {
|
|
fprintf(stderr, "[ERR] Wrong number of arguments for "
|
|
"specified --cluster sub command\n");
|
|
return NULL;
|
|
}
|
|
proc = cmddef.proc;
|
|
}
|
|
}
|
|
if (!proc) fprintf(stderr, "Unknown --cluster subcommand\n");
|
|
return proc;
|
|
}
|
|
|
|
/* Get host ip and port from command arguments. If only one argument has
|
|
* been provided it must be in the form of 'ip:port', elsewhere
|
|
* the first argument must be the ip and the second one the port.
|
|
* If host and port can be detected, it returns 1 and it stores host and
|
|
* port into variables referenced by'ip_ptr' and 'port_ptr' pointers,
|
|
* elsewhere it returns 0. */
|
|
static int getClusterHostFromCmdArgs(int argc, char **argv,
|
|
char **ip_ptr, int *port_ptr) {
|
|
int port = 0;
|
|
char *ip = NULL;
|
|
if (argc == 1) {
|
|
char *addr = argv[0];
|
|
char *c = strrchr(addr, '@');
|
|
if (c != NULL) *c = '\0';
|
|
c = strrchr(addr, ':');
|
|
if (c != NULL) {
|
|
*c = '\0';
|
|
ip = addr;
|
|
port = atoi(++c);
|
|
} else return 0;
|
|
} else {
|
|
ip = argv[0];
|
|
port = atoi(argv[1]);
|
|
}
|
|
if (!ip || !port) return 0;
|
|
else {
|
|
*ip_ptr = ip;
|
|
*port_ptr = port;
|
|
}
|
|
return 1;
|
|
}
|
|
|
|
static void freeClusterManagerNodeFlags(list *flags) {
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(flags, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
sds flag = ln->value;
|
|
sdsfree(flag);
|
|
}
|
|
listRelease(flags);
|
|
}
|
|
|
|
static void freeClusterManagerNode(clusterManagerNode *node) {
|
|
if (node->context != NULL) redisFree(node->context);
|
|
if (node->friends != NULL) {
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(node->friends,&li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *fn = ln->value;
|
|
freeClusterManagerNode(fn);
|
|
}
|
|
listRelease(node->friends);
|
|
node->friends = NULL;
|
|
}
|
|
if (node->name != NULL) sdsfree(node->name);
|
|
if (node->replicate != NULL) sdsfree(node->replicate);
|
|
if ((node->flags & CLUSTER_MANAGER_FLAG_FRIEND) && node->ip)
|
|
sdsfree(node->ip);
|
|
int i;
|
|
if (node->migrating != NULL) {
|
|
for (i = 0; i < node->migrating_count; i++) sdsfree(node->migrating[i]);
|
|
zfree(node->migrating);
|
|
}
|
|
if (node->importing != NULL) {
|
|
for (i = 0; i < node->importing_count; i++) sdsfree(node->importing[i]);
|
|
zfree(node->importing);
|
|
}
|
|
if (node->flags_str != NULL) {
|
|
freeClusterManagerNodeFlags(node->flags_str);
|
|
node->flags_str = NULL;
|
|
}
|
|
zfree(node);
|
|
}
|
|
|
|
static void freeClusterManager(void) {
|
|
listIter li;
|
|
listNode *ln;
|
|
if (cluster_manager.nodes != NULL) {
|
|
listRewind(cluster_manager.nodes,&li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
freeClusterManagerNode(n);
|
|
}
|
|
listRelease(cluster_manager.nodes);
|
|
cluster_manager.nodes = NULL;
|
|
}
|
|
if (cluster_manager.errors != NULL) {
|
|
listRewind(cluster_manager.errors,&li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
sds err = ln->value;
|
|
sdsfree(err);
|
|
}
|
|
listRelease(cluster_manager.errors);
|
|
cluster_manager.errors = NULL;
|
|
}
|
|
if (clusterManagerUncoveredSlots != NULL)
|
|
dictRelease(clusterManagerUncoveredSlots);
|
|
}
|
|
|
|
static clusterManagerNode *clusterManagerNewNode(char *ip, int port) {
|
|
clusterManagerNode *node = zmalloc(sizeof(*node));
|
|
node->context = NULL;
|
|
node->name = NULL;
|
|
node->ip = ip;
|
|
node->port = port;
|
|
node->current_epoch = 0;
|
|
node->ping_sent = 0;
|
|
node->ping_recv = 0;
|
|
node->flags = 0;
|
|
node->flags_str = NULL;
|
|
node->replicate = NULL;
|
|
node->dirty = 0;
|
|
node->friends = NULL;
|
|
node->migrating = NULL;
|
|
node->importing = NULL;
|
|
node->migrating_count = 0;
|
|
node->importing_count = 0;
|
|
node->replicas_count = 0;
|
|
node->weight = 1.0f;
|
|
node->balance = 0;
|
|
clusterManagerNodeResetSlots(node);
|
|
return node;
|
|
}
|
|
|
|
/* Check whether reply is NULL or its type is REDIS_REPLY_ERROR. In the
|
|
* latest case, if the 'err' arg is not NULL, it gets allocated with a copy
|
|
* of reply error (it's up to the caller function to free it), elsewhere
|
|
* the error is directly printed. */
|
|
static int clusterManagerCheckRedisReply(clusterManagerNode *n,
|
|
redisReply *r, char **err)
|
|
{
|
|
int is_err = 0;
|
|
if (!r || (is_err = (r->type == REDIS_REPLY_ERROR))) {
|
|
if (is_err) {
|
|
if (err != NULL) {
|
|
*err = zmalloc((r->len + 1) * sizeof(char));
|
|
strcpy(*err, r->str);
|
|
} else CLUSTER_MANAGER_PRINT_REPLY_ERROR(n, r->str);
|
|
}
|
|
return 0;
|
|
}
|
|
return 1;
|
|
}
|
|
|
|
static void clusterManagerRemoveNodeFromList(list *nodelist,
|
|
clusterManagerNode *node) {
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(nodelist, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
if (node == ln->value) {
|
|
listDelNode(nodelist, ln);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Return the node with the specified name (ID) or NULL. */
|
|
static clusterManagerNode *clusterManagerNodeByName(const char *name) {
|
|
if (cluster_manager.nodes == NULL) return NULL;
|
|
clusterManagerNode *found = NULL;
|
|
sds lcname = sdsempty();
|
|
lcname = sdscpy(lcname, name);
|
|
sdstolower(lcname);
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (n->name && !sdscmp(n->name, lcname)) {
|
|
found = n;
|
|
break;
|
|
}
|
|
}
|
|
sdsfree(lcname);
|
|
return found;
|
|
}
|
|
|
|
/* Like clusterManagerNodeByName but the specified name can be just the first
|
|
* part of the node ID as long as the prefix in unique across the
|
|
* cluster.
|
|
*/
|
|
static clusterManagerNode *clusterManagerNodeByAbbreviatedName(const char*name)
|
|
{
|
|
if (cluster_manager.nodes == NULL) return NULL;
|
|
clusterManagerNode *found = NULL;
|
|
sds lcname = sdsempty();
|
|
lcname = sdscpy(lcname, name);
|
|
sdstolower(lcname);
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (n->name &&
|
|
strstr(n->name, lcname) == n->name) {
|
|
found = n;
|
|
break;
|
|
}
|
|
}
|
|
sdsfree(lcname);
|
|
return found;
|
|
}
|
|
|
|
static void clusterManagerNodeResetSlots(clusterManagerNode *node) {
|
|
memset(node->slots, 0, sizeof(node->slots));
|
|
node->slots_count = 0;
|
|
}
|
|
|
|
/* Call "INFO" redis command on the specified node and return the reply. */
|
|
static redisReply *clusterManagerGetNodeRedisInfo(clusterManagerNode *node,
|
|
char **err)
|
|
{
|
|
redisReply *info = CLUSTER_MANAGER_COMMAND(node, "INFO");
|
|
if (err != NULL) *err = NULL;
|
|
if (info == NULL) return NULL;
|
|
if (info->type == REDIS_REPLY_ERROR) {
|
|
if (err != NULL) {
|
|
*err = zmalloc((info->len + 1) * sizeof(char));
|
|
strcpy(*err, info->str);
|
|
}
|
|
freeReplyObject(info);
|
|
return NULL;
|
|
}
|
|
return info;
|
|
}
|
|
|
|
static int clusterManagerNodeIsCluster(clusterManagerNode *node, char **err) {
|
|
redisReply *info = clusterManagerGetNodeRedisInfo(node, err);
|
|
if (info == NULL) return 0;
|
|
int is_cluster = (int) getLongInfoField(info->str, "cluster_enabled");
|
|
freeReplyObject(info);
|
|
return is_cluster;
|
|
}
|
|
|
|
/* Checks whether the node is empty. Node is considered not-empty if it has
|
|
* some key or if it already knows other nodes */
|
|
static int clusterManagerNodeIsEmpty(clusterManagerNode *node, char **err) {
|
|
redisReply *info = clusterManagerGetNodeRedisInfo(node, err);
|
|
int is_empty = 1;
|
|
if (info == NULL) return 0;
|
|
if (strstr(info->str, "db0:") != NULL) {
|
|
is_empty = 0;
|
|
goto result;
|
|
}
|
|
freeReplyObject(info);
|
|
info = CLUSTER_MANAGER_COMMAND(node, "CLUSTER INFO");
|
|
if (err != NULL) *err = NULL;
|
|
if (!clusterManagerCheckRedisReply(node, info, err)) {
|
|
is_empty = 0;
|
|
goto result;
|
|
}
|
|
long known_nodes = getLongInfoField(info->str, "cluster_known_nodes");
|
|
is_empty = (known_nodes == 1);
|
|
result:
|
|
freeReplyObject(info);
|
|
return is_empty;
|
|
}
|
|
|
|
/* Return the anti-affinity score, which is a measure of the amount of
|
|
* violations of anti-affinity in the current cluster layout, that is, how
|
|
* badly the masters and slaves are distributed in the different IP
|
|
* addresses so that slaves of the same master are not in the master
|
|
* host and are also in different hosts.
|
|
*
|
|
* The score is calculated as follows:
|
|
*
|
|
* SAME_AS_MASTER = 10000 * each slave in the same IP of its master.
|
|
* SAME_AS_SLAVE = 1 * each slave having the same IP as another slave
|
|
of the same master.
|
|
* FINAL_SCORE = SAME_AS_MASTER + SAME_AS_SLAVE
|
|
*
|
|
* So a greater score means a worse anti-affinity level, while zero
|
|
* means perfect anti-affinity.
|
|
*
|
|
* The anti affinity optimizator will try to get a score as low as
|
|
* possible. Since we do not want to sacrifice the fact that slaves should
|
|
* not be in the same host as the master, we assign 10000 times the score
|
|
* to this violation, so that we'll optimize for the second factor only
|
|
* if it does not impact the first one.
|
|
*
|
|
* The ipnodes argument is an array of clusterManagerNodeArray, one for
|
|
* each IP, while ip_count is the total number of IPs in the configuration.
|
|
*
|
|
* The function returns the above score, and the list of
|
|
* offending slaves can be stored into the 'offending' argument,
|
|
* so that the optimizer can try changing the configuration of the
|
|
* slaves violating the anti-affinity goals. */
|
|
static int clusterManagerGetAntiAffinityScore(clusterManagerNodeArray *ipnodes,
|
|
int ip_count, clusterManagerNode ***offending, int *offending_len)
|
|
{
|
|
int score = 0, i, j;
|
|
int node_len = cluster_manager.nodes->len;
|
|
clusterManagerNode **offending_p = NULL;
|
|
if (offending != NULL) {
|
|
*offending = zcalloc(node_len * sizeof(clusterManagerNode*));
|
|
offending_p = *offending;
|
|
}
|
|
/* For each set of nodes in the same host, split by
|
|
* related nodes (masters and slaves which are involved in
|
|
* replication of each other) */
|
|
for (i = 0; i < ip_count; i++) {
|
|
clusterManagerNodeArray *node_array = &(ipnodes[i]);
|
|
dict *related = dictCreate(&clusterManagerDictType, NULL);
|
|
char *ip = NULL;
|
|
for (j = 0; j < node_array->len; j++) {
|
|
clusterManagerNode *node = node_array->nodes[j];
|
|
if (node == NULL) continue;
|
|
if (!ip) ip = node->ip;
|
|
sds types, otypes;
|
|
// We always use the Master ID as key
|
|
sds key = (!node->replicate ? node->name : node->replicate);
|
|
assert(key != NULL);
|
|
dictEntry *entry = dictFind(related, key);
|
|
if (entry) otypes = (sds) dictGetVal(entry);
|
|
else {
|
|
otypes = sdsempty();
|
|
dictAdd(related, key, otypes);
|
|
}
|
|
// Master type 'm' is always set as the first character of the
|
|
// types string.
|
|
if (!node->replicate) types = sdscatprintf(otypes, "m%s", otypes);
|
|
else types = sdscat(otypes, "s");
|
|
if (types != otypes) dictReplace(related, key, types);
|
|
}
|
|
/* Now it's trivial to check, for each related group having the
|
|
* same host, what is their local score. */
|
|
dictIterator *iter = dictGetIterator(related);
|
|
dictEntry *entry;
|
|
while ((entry = dictNext(iter)) != NULL) {
|
|
sds types = (sds) dictGetVal(entry);
|
|
sds name = (sds) dictGetKey(entry);
|
|
int typeslen = sdslen(types);
|
|
if (typeslen < 2) continue;
|
|
if (types[0] == 'm') score += (10000 * (typeslen - 1));
|
|
else score += (1 * typeslen);
|
|
if (offending == NULL) continue;
|
|
/* Populate the list of offending nodes. */
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (n->replicate == NULL) continue;
|
|
if (!strcmp(n->replicate, name) && !strcmp(n->ip, ip)) {
|
|
*(offending_p++) = n;
|
|
if (offending_len != NULL) (*offending_len)++;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
//if (offending_len != NULL) *offending_len = offending_p - *offending;
|
|
dictReleaseIterator(iter);
|
|
dictRelease(related);
|
|
}
|
|
return score;
|
|
}
|
|
|
|
static void clusterManagerOptimizeAntiAffinity(clusterManagerNodeArray *ipnodes,
|
|
int ip_count)
|
|
{
|
|
clusterManagerNode **offenders = NULL;
|
|
int score = clusterManagerGetAntiAffinityScore(ipnodes, ip_count,
|
|
NULL, NULL);
|
|
if (score == 0) goto cleanup;
|
|
clusterManagerLogInfo(">>> Trying to optimize slaves allocation "
|
|
"for anti-affinity\n");
|
|
int node_len = cluster_manager.nodes->len;
|
|
int maxiter = 500 * node_len; // Effort is proportional to cluster size...
|
|
srand(time(NULL));
|
|
while (maxiter > 0) {
|
|
int offending_len = 0;
|
|
if (offenders != NULL) {
|
|
zfree(offenders);
|
|
offenders = NULL;
|
|
}
|
|
score = clusterManagerGetAntiAffinityScore(ipnodes,
|
|
ip_count,
|
|
&offenders,
|
|
&offending_len);
|
|
if (score == 0) break; // Optimal anti affinity reached
|
|
/* We'll try to randomly swap a slave's assigned master causing
|
|
* an affinity problem with another random slave, to see if we
|
|
* can improve the affinity. */
|
|
int rand_idx = rand() % offending_len;
|
|
clusterManagerNode *first = offenders[rand_idx],
|
|
*second = NULL;
|
|
clusterManagerNode **other_replicas = zcalloc((node_len - 1) *
|
|
sizeof(*other_replicas));
|
|
int other_replicas_count = 0;
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (n != first && n->replicate != NULL)
|
|
other_replicas[other_replicas_count++] = n;
|
|
}
|
|
if (other_replicas_count == 0) {
|
|
zfree(other_replicas);
|
|
break;
|
|
}
|
|
rand_idx = rand() % other_replicas_count;
|
|
second = other_replicas[rand_idx];
|
|
char *first_master = first->replicate,
|
|
*second_master = second->replicate;
|
|
first->replicate = second_master, first->dirty = 1;
|
|
second->replicate = first_master, second->dirty = 1;
|
|
int new_score = clusterManagerGetAntiAffinityScore(ipnodes,
|
|
ip_count,
|
|
NULL, NULL);
|
|
/* If the change actually makes thing worse, revert. Otherwise
|
|
* leave as it is because the best solution may need a few
|
|
* combined swaps. */
|
|
if (new_score > score) {
|
|
first->replicate = first_master;
|
|
second->replicate = second_master;
|
|
}
|
|
zfree(other_replicas);
|
|
maxiter--;
|
|
}
|
|
score = clusterManagerGetAntiAffinityScore(ipnodes, ip_count, NULL, NULL);
|
|
char *msg;
|
|
int perfect = (score == 0);
|
|
int log_level = (perfect ? CLUSTER_MANAGER_LOG_LVL_SUCCESS :
|
|
CLUSTER_MANAGER_LOG_LVL_WARN);
|
|
if (perfect) msg = "[OK] Perfect anti-affinity obtained!";
|
|
else if (score >= 10000)
|
|
msg = ("[WARNING] Some slaves are in the same host as their master");
|
|
else
|
|
msg=("[WARNING] Some slaves of the same master are in the same host");
|
|
clusterManagerLog(log_level, "%s\n", msg);
|
|
cleanup:
|
|
zfree(offenders);
|
|
}
|
|
|
|
/* Return a representable string of the node's flags */
|
|
static sds clusterManagerNodeFlagString(clusterManagerNode *node) {
|
|
sds flags = sdsempty();
|
|
if (!node->flags_str) return flags;
|
|
int empty = 1;
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(node->flags_str, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
sds flag = ln->value;
|
|
if (strcmp(flag, "myself") == 0) continue;
|
|
if (!empty) flags = sdscat(flags, ",");
|
|
flags = sdscatfmt(flags, "%S", flag);
|
|
empty = 0;
|
|
}
|
|
return flags;
|
|
}
|
|
|
|
/* Return a representable string of the node's slots */
|
|
static sds clusterManagerNodeSlotsString(clusterManagerNode *node) {
|
|
sds slots = sdsempty();
|
|
int first_range_idx = -1, last_slot_idx = -1, i;
|
|
for (i = 0; i < CLUSTER_MANAGER_SLOTS; i++) {
|
|
int has_slot = node->slots[i];
|
|
if (has_slot) {
|
|
if (first_range_idx == -1) {
|
|
if (sdslen(slots)) slots = sdscat(slots, ",");
|
|
first_range_idx = i;
|
|
slots = sdscatfmt(slots, "[%u", i);
|
|
}
|
|
last_slot_idx = i;
|
|
} else {
|
|
if (last_slot_idx >= 0) {
|
|
if (first_range_idx == last_slot_idx)
|
|
slots = sdscat(slots, "]");
|
|
else slots = sdscatfmt(slots, "-%u]", last_slot_idx);
|
|
}
|
|
last_slot_idx = -1;
|
|
first_range_idx = -1;
|
|
}
|
|
}
|
|
if (last_slot_idx >= 0) {
|
|
if (first_range_idx == last_slot_idx) slots = sdscat(slots, "]");
|
|
else slots = sdscatfmt(slots, "-%u]", last_slot_idx);
|
|
}
|
|
return slots;
|
|
}
|
|
|
|
/* -----------------------------------------------------------------------------
|
|
* Key space handling
|
|
* -------------------------------------------------------------------------- */
|
|
|
|
/* We have 16384 hash slots. The hash slot of a given key is obtained
|
|
* as the least significant 14 bits of the crc16 of the key.
|
|
*
|
|
* However if the key contains the {...} pattern, only the part between
|
|
* { and } is hashed. This may be useful in the future to force certain
|
|
* keys to be in the same node (assuming no resharding is in progress). */
|
|
static unsigned int clusterManagerKeyHashSlot(char *key, int keylen) {
|
|
int s, e; /* start-end indexes of { and } */
|
|
|
|
for (s = 0; s < keylen; s++)
|
|
if (key[s] == '{') break;
|
|
|
|
/* No '{' ? Hash the whole key. This is the base case. */
|
|
if (s == keylen) return crc16(key,keylen) & 0x3FFF;
|
|
|
|
/* '{' found? Check if we have the corresponding '}'. */
|
|
for (e = s+1; e < keylen; e++)
|
|
if (key[e] == '}') break;
|
|
|
|
/* No '}' or nothing between {} ? Hash the whole key. */
|
|
if (e == keylen || e == s+1) return crc16(key,keylen) & 0x3FFF;
|
|
|
|
/* If we are here there is both a { and a } on its right. Hash
|
|
* what is in the middle between { and }. */
|
|
return crc16(key+s+1,e-s-1) & 0x3FFF;
|
|
}
|
|
|
|
/* Return a string representation of the cluster node. */
|
|
static sds clusterManagerNodeInfo(clusterManagerNode *node, int indent) {
|
|
sds info = sdsempty();
|
|
sds spaces = sdsempty();
|
|
int i;
|
|
for (i = 0; i < indent; i++) spaces = sdscat(spaces, " ");
|
|
if (indent) info = sdscat(info, spaces);
|
|
int is_master = !(node->flags & CLUSTER_MANAGER_FLAG_SLAVE);
|
|
char *role = (is_master ? "M" : "S");
|
|
sds slots = NULL;
|
|
if (node->dirty && node->replicate != NULL)
|
|
info = sdscatfmt(info, "S: %S %s:%u", node->name, node->ip, node->port);
|
|
else {
|
|
slots = clusterManagerNodeSlotsString(node);
|
|
sds flags = clusterManagerNodeFlagString(node);
|
|
info = sdscatfmt(info, "%s: %S %s:%u\n"
|
|
"%s slots:%S (%u slots) "
|
|
"%S",
|
|
role, node->name, node->ip, node->port, spaces,
|
|
slots, node->slots_count, flags);
|
|
sdsfree(slots);
|
|
sdsfree(flags);
|
|
}
|
|
if (node->replicate != NULL)
|
|
info = sdscatfmt(info, "\n%s replicates %S", spaces, node->replicate);
|
|
else if (node->replicas_count)
|
|
info = sdscatfmt(info, "\n%s %U additional replica(s)",
|
|
spaces, node->replicas_count);
|
|
sdsfree(spaces);
|
|
return info;
|
|
}
|
|
|
|
static void clusterManagerShowNodes(void) {
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *node = ln->value;
|
|
sds info = clusterManagerNodeInfo(node, 0);
|
|
printf("%s\n", (char *) info);
|
|
sdsfree(info);
|
|
}
|
|
}
|
|
|
|
static void clusterManagerShowClusterInfo(void) {
|
|
int masters = 0;
|
|
int keys = 0;
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *node = ln->value;
|
|
if (!(node->flags & CLUSTER_MANAGER_FLAG_SLAVE)) {
|
|
if (!node->name) continue;
|
|
int replicas = 0;
|
|
int dbsize = -1;
|
|
char name[9];
|
|
memcpy(name, node->name, 8);
|
|
name[8] = '\0';
|
|
listIter ri;
|
|
listNode *rn;
|
|
listRewind(cluster_manager.nodes, &ri);
|
|
while ((rn = listNext(&ri)) != NULL) {
|
|
clusterManagerNode *n = rn->value;
|
|
if (n == node || !(n->flags & CLUSTER_MANAGER_FLAG_SLAVE))
|
|
continue;
|
|
if (n->replicate && !strcmp(n->replicate, node->name))
|
|
replicas++;
|
|
}
|
|
redisReply *reply = CLUSTER_MANAGER_COMMAND(node, "DBSIZE");
|
|
if (reply != NULL || reply->type == REDIS_REPLY_INTEGER)
|
|
dbsize = reply->integer;
|
|
if (dbsize < 0) {
|
|
char *err = "";
|
|
if (reply != NULL && reply->type == REDIS_REPLY_ERROR)
|
|
err = reply->str;
|
|
CLUSTER_MANAGER_PRINT_REPLY_ERROR(node, err);
|
|
if (reply != NULL) freeReplyObject(reply);
|
|
return;
|
|
};
|
|
if (reply != NULL) freeReplyObject(reply);
|
|
printf("%s:%d (%s...) -> %d keys | %d slots | %d slaves.\n",
|
|
node->ip, node->port, name, dbsize,
|
|
node->slots_count, replicas);
|
|
masters++;
|
|
keys += dbsize;
|
|
}
|
|
}
|
|
clusterManagerLogOk("[OK] %d keys in %d masters.\n", keys, masters);
|
|
float keys_per_slot = keys / (float) CLUSTER_MANAGER_SLOTS;
|
|
printf("%.2f keys per slot on average.\n", keys_per_slot);
|
|
}
|
|
|
|
/* Flush dirty slots configuration of the node by calling CLUSTER ADDSLOTS */
|
|
static int clusterManagerAddSlots(clusterManagerNode *node, char**err)
|
|
{
|
|
redisReply *reply = NULL;
|
|
void *_reply = NULL;
|
|
int success = 1;
|
|
/* First two args are used for the command itself. */
|
|
int argc = node->slots_count + 2;
|
|
sds *argv = zmalloc(argc * sizeof(*argv));
|
|
size_t *argvlen = zmalloc(argc * sizeof(*argvlen));
|
|
argv[0] = "CLUSTER";
|
|
argv[1] = "ADDSLOTS";
|
|
argvlen[0] = 7;
|
|
argvlen[1] = 8;
|
|
*err = NULL;
|
|
int i, argv_idx = 2;
|
|
for (i = 0; i < CLUSTER_MANAGER_SLOTS; i++) {
|
|
if (argv_idx >= argc) break;
|
|
if (node->slots[i]) {
|
|
argv[argv_idx] = sdsfromlonglong((long long) i);
|
|
argvlen[argv_idx] = sdslen(argv[argv_idx]);
|
|
argv_idx++;
|
|
}
|
|
}
|
|
if (!argv_idx) {
|
|
success = 0;
|
|
goto cleanup;
|
|
}
|
|
redisAppendCommandArgv(node->context,argc,(const char**)argv,argvlen);
|
|
if (redisGetReply(node->context, &_reply) != REDIS_OK) {
|
|
success = 0;
|
|
goto cleanup;
|
|
}
|
|
reply = (redisReply*) _reply;
|
|
success = clusterManagerCheckRedisReply(node, reply, err);
|
|
cleanup:
|
|
zfree(argvlen);
|
|
if (argv != NULL) {
|
|
for (i = 2; i < argc; i++) sdsfree(argv[i]);
|
|
zfree(argv);
|
|
}
|
|
if (reply != NULL) freeReplyObject(reply);
|
|
return success;
|
|
}
|
|
|
|
/* Set slot status to "importing" or "migrating" */
|
|
static int clusterManagerSetSlot(clusterManagerNode *node1,
|
|
clusterManagerNode *node2,
|
|
int slot, const char *status, char **err) {
|
|
redisReply *reply = CLUSTER_MANAGER_COMMAND(node1, "CLUSTER "
|
|
"SETSLOT %d %s %s",
|
|
slot, status,
|
|
(char *) node2->name);
|
|
if (err != NULL) *err = NULL;
|
|
if (!reply) return 0;
|
|
int success = 1;
|
|
if (reply->type == REDIS_REPLY_ERROR) {
|
|
success = 0;
|
|
if (err != NULL) {
|
|
*err = zmalloc((reply->len + 1) * sizeof(char));
|
|
strcpy(*err, reply->str);
|
|
CLUSTER_MANAGER_PRINT_REPLY_ERROR(node1, err);
|
|
}
|
|
goto cleanup;
|
|
}
|
|
cleanup:
|
|
freeReplyObject(reply);
|
|
return success;
|
|
}
|
|
|
|
/* Migrate keys taken from reply->elements. It returns the reply from the
|
|
* MIGRATE command, or NULL if something goes wrong. If the argument 'dots'
|
|
* is not NULL, a dot will be printed for every migrated key. */
|
|
static redisReply *clusterManagerMigrateKeysInReply(clusterManagerNode *source,
|
|
clusterManagerNode *target,
|
|
redisReply *reply,
|
|
int replace, int timeout,
|
|
char *dots)
|
|
{
|
|
redisReply *migrate_reply = NULL;
|
|
char **argv = NULL;
|
|
size_t *argv_len = NULL;
|
|
int c = (replace ? 8 : 7);
|
|
size_t argc = c + reply->elements;
|
|
size_t i, offset = 6; // Keys Offset
|
|
argv = zcalloc(argc * sizeof(char *));
|
|
argv_len = zcalloc(argc * sizeof(size_t));
|
|
char portstr[255];
|
|
char timeoutstr[255];
|
|
snprintf(portstr, 10, "%d", target->port);
|
|
snprintf(timeoutstr, 10, "%d", timeout);
|
|
argv[0] = "MIGRATE";
|
|
argv_len[0] = 7;
|
|
argv[1] = target->ip;
|
|
argv_len[1] = strlen(target->ip);
|
|
argv[2] = portstr;
|
|
argv_len[2] = strlen(portstr);
|
|
argv[3] = "";
|
|
argv_len[3] = 0;
|
|
argv[4] = "0";
|
|
argv_len[4] = 1;
|
|
argv[5] = timeoutstr;
|
|
argv_len[5] = strlen(timeoutstr);
|
|
if (replace) {
|
|
argv[offset] = "REPLACE";
|
|
argv_len[offset] = 7;
|
|
offset++;
|
|
}
|
|
argv[offset] = "KEYS";
|
|
argv_len[offset] = 4;
|
|
offset++;
|
|
for (i = 0; i < reply->elements; i++) {
|
|
redisReply *entry = reply->element[i];
|
|
size_t idx = i + offset;
|
|
assert(entry->type == REDIS_REPLY_STRING);
|
|
argv[idx] = (char *) sdsnew(entry->str);
|
|
argv_len[idx] = entry->len;
|
|
if (dots) dots[i] = '.';
|
|
}
|
|
if (dots) dots[reply->elements] = '\0';
|
|
void *_reply = NULL;
|
|
redisAppendCommandArgv(source->context,argc,
|
|
(const char**)argv,argv_len);
|
|
int success = (redisGetReply(source->context, &_reply) == REDIS_OK);
|
|
for (i = 0; i < reply->elements; i++) sdsfree(argv[i + offset]);
|
|
if (!success) goto cleanup;
|
|
migrate_reply = (redisReply *) _reply;
|
|
cleanup:
|
|
zfree(argv);
|
|
zfree(argv_len);
|
|
return migrate_reply;
|
|
}
|
|
|
|
/* Migrate all keys in the given slot from source to target.*/
|
|
static int clusterManagerMigrateKeysInSlot(clusterManagerNode *source,
|
|
clusterManagerNode *target,
|
|
int slot, int timeout,
|
|
int pipeline, int verbose,
|
|
char **err)
|
|
{
|
|
int success = 1;
|
|
int do_fix = (config.cluster_manager_command.flags &
|
|
CLUSTER_MANAGER_CMD_FLAG_FIX);
|
|
while (1) {
|
|
char *dots = NULL;
|
|
redisReply *reply = NULL, *migrate_reply = NULL;
|
|
reply = CLUSTER_MANAGER_COMMAND(source, "CLUSTER "
|
|
"GETKEYSINSLOT %d %d", slot,
|
|
pipeline);
|
|
success = (reply != NULL);
|
|
if (!success) return 0;
|
|
if (reply->type == REDIS_REPLY_ERROR) {
|
|
success = 0;
|
|
if (err != NULL) {
|
|
*err = zmalloc((reply->len + 1) * sizeof(char));
|
|
strcpy(*err, reply->str);
|
|
CLUSTER_MANAGER_PRINT_REPLY_ERROR(source, err);
|
|
}
|
|
goto next;
|
|
}
|
|
assert(reply->type == REDIS_REPLY_ARRAY);
|
|
size_t count = reply->elements;
|
|
if (count == 0) {
|
|
freeReplyObject(reply);
|
|
break;
|
|
}
|
|
if (verbose) dots = zmalloc((count+1) * sizeof(char));
|
|
/* Calling MIGRATE command. */
|
|
migrate_reply = clusterManagerMigrateKeysInReply(source, target,
|
|
reply, 0, timeout,
|
|
dots);
|
|
if (migrate_reply == NULL) goto next;
|
|
if (migrate_reply->type == REDIS_REPLY_ERROR) {
|
|
if (do_fix && strstr(migrate_reply->str, "BUSYKEY")) {
|
|
clusterManagerLogWarn("*** Target key exists. "
|
|
"Replacing it for FIX.\n");
|
|
freeReplyObject(migrate_reply);
|
|
/* Try to migrate keys adding REPLACE option. */
|
|
migrate_reply = clusterManagerMigrateKeysInReply(source,
|
|
target,
|
|
reply,
|
|
1, timeout,
|
|
NULL);
|
|
success = (migrate_reply != NULL &&
|
|
migrate_reply->type != REDIS_REPLY_ERROR);
|
|
} else success = 0;
|
|
if (!success) {
|
|
if (migrate_reply != NULL) {
|
|
if (err) {
|
|
*err = zmalloc((migrate_reply->len + 1) * sizeof(char));
|
|
strcpy(*err, migrate_reply->str);
|
|
}
|
|
printf("\n");
|
|
CLUSTER_MANAGER_PRINT_REPLY_ERROR(source,
|
|
migrate_reply->str);
|
|
}
|
|
goto next;
|
|
}
|
|
}
|
|
if (verbose) {
|
|
printf("%s", dots);
|
|
fflush(stdout);
|
|
}
|
|
next:
|
|
if (reply != NULL) freeReplyObject(reply);
|
|
if (migrate_reply != NULL) freeReplyObject(migrate_reply);
|
|
if (dots) zfree(dots);
|
|
if (!success) break;
|
|
}
|
|
return success;
|
|
}
|
|
|
|
/* Move slots between source and target nodes using MIGRATE.
|
|
*
|
|
* Options:
|
|
* CLUSTER_MANAGER_OPT_VERBOSE -- Print a dot for every moved key.
|
|
* CLUSTER_MANAGER_OPT_COLD -- Move keys without opening slots /
|
|
* reconfiguring the nodes.
|
|
* CLUSTER_MANAGER_OPT_UPDATE -- Update node->slots for source/target nodes.
|
|
* CLUSTER_MANAGER_OPT_QUIET -- Don't print info messages.
|
|
*/
|
|
static int clusterManagerMoveSlot(clusterManagerNode *source,
|
|
clusterManagerNode *target,
|
|
int slot, int opts, char**err)
|
|
{
|
|
if (!(opts & CLUSTER_MANAGER_OPT_QUIET)) {
|
|
printf("Moving slot %d from %s:%d to %s:%d: ", slot, source->ip,
|
|
source->port, target->ip, target->port);
|
|
fflush(stdout);
|
|
}
|
|
if (err != NULL) *err = NULL;
|
|
int pipeline = config.cluster_manager_command.pipeline,
|
|
timeout = config.cluster_manager_command.timeout,
|
|
print_dots = (opts & CLUSTER_MANAGER_OPT_VERBOSE),
|
|
option_cold = (opts & CLUSTER_MANAGER_OPT_COLD),
|
|
success = 1;
|
|
if (!option_cold) {
|
|
success = clusterManagerSetSlot(target, source, slot,
|
|
"importing", err);
|
|
if (!success) return 0;
|
|
success = clusterManagerSetSlot(source, target, slot,
|
|
"migrating", err);
|
|
if (!success) return 0;
|
|
}
|
|
success = clusterManagerMigrateKeysInSlot(source, target, slot, timeout,
|
|
pipeline, print_dots, err);
|
|
if (!(opts & CLUSTER_MANAGER_OPT_QUIET)) printf("\n");
|
|
if (!success) return 0;
|
|
/* Set the new node as the owner of the slot in all the known nodes. */
|
|
if (!option_cold) {
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (n->flags & CLUSTER_MANAGER_FLAG_SLAVE) continue;
|
|
redisReply *r = CLUSTER_MANAGER_COMMAND(n, "CLUSTER "
|
|
"SETSLOT %d %s %s",
|
|
slot, "node",
|
|
target->name);
|
|
success = (r != NULL);
|
|
if (!success) return 0;
|
|
if (r->type == REDIS_REPLY_ERROR) {
|
|
success = 0;
|
|
if (err != NULL) {
|
|
*err = zmalloc((r->len + 1) * sizeof(char));
|
|
strcpy(*err, r->str);
|
|
CLUSTER_MANAGER_PRINT_REPLY_ERROR(n, err);
|
|
}
|
|
}
|
|
freeReplyObject(r);
|
|
if (!success) return 0;
|
|
}
|
|
}
|
|
/* Update the node logical config */
|
|
if (opts & CLUSTER_MANAGER_OPT_UPDATE) {
|
|
source->slots[slot] = 0;
|
|
target->slots[slot] = 1;
|
|
}
|
|
return 1;
|
|
}
|
|
|
|
/* Flush the dirty node configuration by calling replicate for slaves or
|
|
* adding the slots defined in the masters. */
|
|
static int clusterManagerFlushNodeConfig(clusterManagerNode *node, char **err) {
|
|
if (!node->dirty) return 0;
|
|
redisReply *reply = NULL;
|
|
int is_err = 0, success = 1;
|
|
if (err != NULL) *err = NULL;
|
|
if (node->replicate != NULL) {
|
|
reply = CLUSTER_MANAGER_COMMAND(node, "CLUSTER REPLICATE %s",
|
|
node->replicate);
|
|
if (reply == NULL || (is_err = (reply->type == REDIS_REPLY_ERROR))) {
|
|
if (is_err && err != NULL) {
|
|
*err = zmalloc((reply->len + 1) * sizeof(char));
|
|
strcpy(*err, reply->str);
|
|
}
|
|
success = 0;
|
|
/* If the cluster did not already joined it is possible that
|
|
* the slave does not know the master node yet. So on errors
|
|
* we return ASAP leaving the dirty flag set, to flush the
|
|
* config later. */
|
|
goto cleanup;
|
|
}
|
|
} else {
|
|
int added = clusterManagerAddSlots(node, err);
|
|
if (!added || *err != NULL) success = 0;
|
|
}
|
|
node->dirty = 0;
|
|
cleanup:
|
|
if (reply != NULL) freeReplyObject(reply);
|
|
return success;
|
|
}
|
|
|
|
/* Wait until the cluster configuration is consistent. */
|
|
static void clusterManagerWaitForClusterJoin(void) {
|
|
printf("Waiting for the cluster to join\n");
|
|
while(!clusterManagerIsConfigConsistent()) {
|
|
printf(".");
|
|
fflush(stdout);
|
|
sleep(1);
|
|
}
|
|
printf("\n");
|
|
}
|
|
|
|
/* Load node's cluster configuration by calling "CLUSTER NODES" command.
|
|
* Node's configuration (name, replicate, slots, ...) is then updated.
|
|
* If CLUSTER_MANAGER_OPT_GETFRIENDS flag is set into 'opts' argument,
|
|
* and node already knows other nodes, the node's friends list is populated
|
|
* with the other nodes info. */
|
|
static int clusterManagerNodeLoadInfo(clusterManagerNode *node, int opts,
|
|
char **err)
|
|
{
|
|
redisReply *reply = CLUSTER_MANAGER_COMMAND(node, "CLUSTER NODES");
|
|
int success = 1;
|
|
*err = NULL;
|
|
if (!clusterManagerCheckRedisReply(node, reply, err)) {
|
|
success = 0;
|
|
goto cleanup;
|
|
}
|
|
int getfriends = (opts & CLUSTER_MANAGER_OPT_GETFRIENDS);
|
|
char *lines = reply->str, *p, *line;
|
|
while ((p = strstr(lines, "\n")) != NULL) {
|
|
*p = '\0';
|
|
line = lines;
|
|
lines = p + 1;
|
|
char *name = NULL, *addr = NULL, *flags = NULL, *master_id = NULL,
|
|
*ping_sent = NULL, *ping_recv = NULL, *config_epoch = NULL,
|
|
*link_status = NULL;
|
|
UNUSED(link_status);
|
|
int i = 0;
|
|
while ((p = strchr(line, ' ')) != NULL) {
|
|
*p = '\0';
|
|
char *token = line;
|
|
line = p + 1;
|
|
switch(i++){
|
|
case 0: name = token; break;
|
|
case 1: addr = token; break;
|
|
case 2: flags = token; break;
|
|
case 3: master_id = token; break;
|
|
case 4: ping_sent = token; break;
|
|
case 5: ping_recv = token; break;
|
|
case 6: config_epoch = token; break;
|
|
case 7: link_status = token; break;
|
|
}
|
|
if (i == 8) break; // Slots
|
|
}
|
|
if (!flags) {
|
|
success = 0;
|
|
goto cleanup;
|
|
}
|
|
int myself = (strstr(flags, "myself") != NULL);
|
|
clusterManagerNode *currentNode = NULL;
|
|
if (myself) {
|
|
node->flags |= CLUSTER_MANAGER_FLAG_MYSELF;
|
|
currentNode = node;
|
|
clusterManagerNodeResetSlots(node);
|
|
if (i == 8) {
|
|
int remaining = strlen(line);
|
|
while (remaining > 0) {
|
|
p = strchr(line, ' ');
|
|
if (p == NULL) p = line + remaining;
|
|
remaining -= (p - line);
|
|
|
|
char *slotsdef = line;
|
|
*p = '\0';
|
|
if (remaining) {
|
|
line = p + 1;
|
|
remaining--;
|
|
} else line = p;
|
|
char *dash = NULL;
|
|
if (slotsdef[0] == '[') {
|
|
slotsdef++;
|
|
if ((p = strstr(slotsdef, "->-"))) { // Migrating
|
|
*p = '\0';
|
|
p += 3;
|
|
char *closing_bracket = strchr(p, ']');
|
|
if (closing_bracket) *closing_bracket = '\0';
|
|
sds slot = sdsnew(slotsdef);
|
|
sds dst = sdsnew(p);
|
|
node->migrating_count += 2;
|
|
node->migrating = zrealloc(node->migrating,
|
|
(node->migrating_count * sizeof(sds)));
|
|
node->migrating[node->migrating_count - 2] =
|
|
slot;
|
|
node->migrating[node->migrating_count - 1] =
|
|
dst;
|
|
} else if ((p = strstr(slotsdef, "-<-"))) {//Importing
|
|
*p = '\0';
|
|
p += 3;
|
|
char *closing_bracket = strchr(p, ']');
|
|
if (closing_bracket) *closing_bracket = '\0';
|
|
sds slot = sdsnew(slotsdef);
|
|
sds src = sdsnew(p);
|
|
node->importing_count += 2;
|
|
node->importing = zrealloc(node->importing,
|
|
(node->importing_count * sizeof(sds)));
|
|
node->importing[node->importing_count - 2] =
|
|
slot;
|
|
node->importing[node->importing_count - 1] =
|
|
src;
|
|
}
|
|
} else if ((dash = strchr(slotsdef, '-')) != NULL) {
|
|
p = dash;
|
|
int start, stop;
|
|
*p = '\0';
|
|
start = atoi(slotsdef);
|
|
stop = atoi(p + 1);
|
|
node->slots_count += (stop - (start - 1));
|
|
while (start <= stop) node->slots[start++] = 1;
|
|
} else if (p > slotsdef) {
|
|
node->slots[atoi(slotsdef)] = 1;
|
|
node->slots_count++;
|
|
}
|
|
}
|
|
}
|
|
node->dirty = 0;
|
|
} else if (!getfriends) {
|
|
if (!(node->flags & CLUSTER_MANAGER_FLAG_MYSELF)) continue;
|
|
else break;
|
|
} else {
|
|
if (addr == NULL) {
|
|
fprintf(stderr, "Error: invalid CLUSTER NODES reply\n");
|
|
success = 0;
|
|
goto cleanup;
|
|
}
|
|
char *c = strrchr(addr, '@');
|
|
if (c != NULL) *c = '\0';
|
|
c = strrchr(addr, ':');
|
|
if (c == NULL) {
|
|
fprintf(stderr, "Error: invalid CLUSTER NODES reply\n");
|
|
success = 0;
|
|
goto cleanup;
|
|
}
|
|
*c = '\0';
|
|
int port = atoi(++c);
|
|
currentNode = clusterManagerNewNode(sdsnew(addr), port);
|
|
currentNode->flags |= CLUSTER_MANAGER_FLAG_FRIEND;
|
|
if (node->friends == NULL) node->friends = listCreate();
|
|
listAddNodeTail(node->friends, currentNode);
|
|
}
|
|
if (name != NULL) {
|
|
if (currentNode->name) sdsfree(currentNode->name);
|
|
currentNode->name = sdsnew(name);
|
|
}
|
|
if (currentNode->flags_str != NULL)
|
|
freeClusterManagerNodeFlags(currentNode->flags_str);
|
|
currentNode->flags_str = listCreate();
|
|
int flag_len;
|
|
while ((flag_len = strlen(flags)) > 0) {
|
|
sds flag = NULL;
|
|
char *fp = strchr(flags, ',');
|
|
if (fp) {
|
|
*fp = '\0';
|
|
flag = sdsnew(flags);
|
|
flags = fp + 1;
|
|
} else {
|
|
flag = sdsnew(flags);
|
|
flags += flag_len;
|
|
}
|
|
if (strcmp(flag, "noaddr") == 0)
|
|
currentNode->flags |= CLUSTER_MANAGER_FLAG_NOADDR;
|
|
else if (strcmp(flag, "disconnected") == 0)
|
|
currentNode->flags |= CLUSTER_MANAGER_FLAG_DISCONNECT;
|
|
else if (strcmp(flag, "fail") == 0)
|
|
currentNode->flags |= CLUSTER_MANAGER_FLAG_FAIL;
|
|
else if (strcmp(flag, "slave") == 0) {
|
|
currentNode->flags |= CLUSTER_MANAGER_FLAG_SLAVE;
|
|
if (master_id != NULL) {
|
|
if (currentNode->replicate) sdsfree(currentNode->replicate);
|
|
currentNode->replicate = sdsnew(master_id);
|
|
}
|
|
}
|
|
listAddNodeTail(currentNode->flags_str, flag);
|
|
}
|
|
if (config_epoch != NULL)
|
|
currentNode->current_epoch = atoll(config_epoch);
|
|
if (ping_sent != NULL) currentNode->ping_sent = atoll(ping_sent);
|
|
if (ping_recv != NULL) currentNode->ping_recv = atoll(ping_recv);
|
|
if (!getfriends && myself) break;
|
|
}
|
|
cleanup:
|
|
if (reply) freeReplyObject(reply);
|
|
return success;
|
|
}
|
|
|
|
/* Retrieves info about the cluster using argument 'node' as the starting
|
|
* point. All nodes will be loaded inside the cluster_manager.nodes list.
|
|
* Warning: if something goes wrong, it will free the starting node before
|
|
* returning 0. */
|
|
static int clusterManagerLoadInfoFromNode(clusterManagerNode *node, int opts) {
|
|
if (node->context == NULL)
|
|
CLUSTER_MANAGER_NODE_CONNECT(node);
|
|
if (node->context->err) {
|
|
fprintf(stderr,"Could not connect to Redis at ");
|
|
fprintf(stderr,"%s:%d: %s\n", node->ip, node->port,
|
|
node->context->errstr);
|
|
freeClusterManagerNode(node);
|
|
return 0;
|
|
}
|
|
opts |= CLUSTER_MANAGER_OPT_GETFRIENDS;
|
|
char *e = NULL;
|
|
if (!clusterManagerNodeIsCluster(node, &e)) {
|
|
clusterManagerPrintNotClusterNodeError(node, e);
|
|
if (e) zfree(e);
|
|
freeClusterManagerNode(node);
|
|
return 0;
|
|
}
|
|
e = NULL;
|
|
if (!clusterManagerNodeLoadInfo(node, opts, &e)) {
|
|
if (e) {
|
|
CLUSTER_MANAGER_PRINT_REPLY_ERROR(node, e);
|
|
zfree(e);
|
|
}
|
|
freeClusterManagerNode(node);
|
|
return 0;
|
|
}
|
|
listIter li;
|
|
listNode *ln;
|
|
if (cluster_manager.nodes != NULL) {
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL)
|
|
freeClusterManagerNode((clusterManagerNode *) ln->value);
|
|
listRelease(cluster_manager.nodes);
|
|
}
|
|
cluster_manager.nodes = listCreate();
|
|
listAddNodeTail(cluster_manager.nodes, node);
|
|
if (node->friends != NULL) {
|
|
listRewind(node->friends, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *friend = ln->value;
|
|
if (!friend->ip || !friend->port) goto invalid_friend;
|
|
if (!friend->context)
|
|
CLUSTER_MANAGER_NODE_CONNECT(friend);
|
|
if (friend->context->err) goto invalid_friend;
|
|
e = NULL;
|
|
if (clusterManagerNodeLoadInfo(friend, 0, &e)) {
|
|
if (friend->flags & (CLUSTER_MANAGER_FLAG_NOADDR |
|
|
CLUSTER_MANAGER_FLAG_DISCONNECT |
|
|
CLUSTER_MANAGER_FLAG_FAIL))
|
|
goto invalid_friend;
|
|
listAddNodeTail(cluster_manager.nodes, friend);
|
|
} else {
|
|
clusterManagerLogErr("[ERR] Unable to load info for "
|
|
"node %s:%d\n",
|
|
friend->ip, friend->port);
|
|
goto invalid_friend;
|
|
}
|
|
continue;
|
|
invalid_friend:
|
|
freeClusterManagerNode(friend);
|
|
}
|
|
listRelease(node->friends);
|
|
node->friends = NULL;
|
|
}
|
|
// Count replicas for each node
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (n->replicate != NULL) {
|
|
clusterManagerNode *master = clusterManagerNodeByName(n->replicate);
|
|
if (master == NULL) {
|
|
clusterManagerLogWarn("*** WARNING: %s:%d claims to be "
|
|
"slave of unknown node ID %s.\n",
|
|
n->ip, n->port, n->replicate);
|
|
} else master->replicas_count++;
|
|
}
|
|
}
|
|
return 1;
|
|
}
|
|
|
|
/* Compare functions used by various sorting operations. */
|
|
int clusterManagerSlotCompare(const void *slot1, const void *slot2) {
|
|
const char **i1 = (const char **)slot1;
|
|
const char **i2 = (const char **)slot2;
|
|
return strcmp(*i1, *i2);
|
|
}
|
|
|
|
int clusterManagerSlotCountCompareDesc(const void *n1, const void *n2) {
|
|
clusterManagerNode *node1 = *((clusterManagerNode **) n1);
|
|
clusterManagerNode *node2 = *((clusterManagerNode **) n2);
|
|
return node2->slots_count - node1->slots_count;
|
|
}
|
|
|
|
int clusterManagerCompareNodeBalance(const void *n1, const void *n2) {
|
|
clusterManagerNode *node1 = *((clusterManagerNode **) n1);
|
|
clusterManagerNode *node2 = *((clusterManagerNode **) n2);
|
|
return node1->balance - node2->balance;
|
|
}
|
|
|
|
static sds clusterManagerGetConfigSignature(clusterManagerNode *node) {
|
|
sds signature = NULL;
|
|
int node_count = 0, i = 0, name_len = 0;
|
|
char **node_configs = NULL;
|
|
redisReply *reply = CLUSTER_MANAGER_COMMAND(node, "CLUSTER NODES");
|
|
if (reply == NULL || reply->type == REDIS_REPLY_ERROR)
|
|
goto cleanup;
|
|
char *lines = reply->str, *p, *line;
|
|
while ((p = strstr(lines, "\n")) != NULL) {
|
|
i = 0;
|
|
*p = '\0';
|
|
line = lines;
|
|
lines = p + 1;
|
|
char *nodename = NULL;
|
|
int tot_size = 0;
|
|
while ((p = strchr(line, ' ')) != NULL) {
|
|
*p = '\0';
|
|
char *token = line;
|
|
line = p + 1;
|
|
if (i == 0) {
|
|
nodename = token;
|
|
tot_size = (p - token);
|
|
name_len = tot_size++; // Make room for ':' in tot_size
|
|
} else if (i == 8) break;
|
|
i++;
|
|
}
|
|
if (i != 8) continue;
|
|
if (nodename == NULL) continue;
|
|
int remaining = strlen(line);
|
|
if (remaining == 0) continue;
|
|
char **slots = NULL;
|
|
int c = 0;
|
|
while (remaining > 0) {
|
|
p = strchr(line, ' ');
|
|
if (p == NULL) p = line + remaining;
|
|
int size = (p - line);
|
|
remaining -= size;
|
|
tot_size += size;
|
|
char *slotsdef = line;
|
|
*p = '\0';
|
|
if (remaining) {
|
|
line = p + 1;
|
|
remaining--;
|
|
} else line = p;
|
|
if (slotsdef[0] != '[') {
|
|
c++;
|
|
slots = zrealloc(slots, (c * sizeof(char *)));
|
|
slots[c - 1] = slotsdef;
|
|
}
|
|
}
|
|
if (c > 0) {
|
|
if (c > 1)
|
|
qsort(slots, c, sizeof(char *), clusterManagerSlotCompare);
|
|
node_count++;
|
|
node_configs =
|
|
zrealloc(node_configs, (node_count * sizeof(char *)));
|
|
/* Make room for '|' separators. */
|
|
tot_size += (sizeof(char) * (c - 1));
|
|
char *cfg = zmalloc((sizeof(char) * tot_size) + 1);
|
|
memcpy(cfg, nodename, name_len);
|
|
char *sp = cfg + name_len;
|
|
*(sp++) = ':';
|
|
for (i = 0; i < c; i++) {
|
|
if (i > 0) *(sp++) = '|';
|
|
int slen = strlen(slots[i]);
|
|
memcpy(sp, slots[i], slen);
|
|
sp += slen;
|
|
}
|
|
*(sp++) = '\0';
|
|
node_configs[node_count - 1] = cfg;
|
|
}
|
|
zfree(slots);
|
|
}
|
|
if (node_count > 0) {
|
|
if (node_count > 1) {
|
|
qsort(node_configs, node_count, sizeof(char *),
|
|
clusterManagerSlotCompare);
|
|
}
|
|
signature = sdsempty();
|
|
for (i = 0; i < node_count; i++) {
|
|
if (i > 0) signature = sdscatprintf(signature, "%c", '|');
|
|
signature = sdscatfmt(signature, "%s", node_configs[i]);
|
|
}
|
|
}
|
|
cleanup:
|
|
if (reply != NULL) freeReplyObject(reply);
|
|
if (node_configs != NULL) {
|
|
for (i = 0; i < node_count; i++) zfree(node_configs[i]);
|
|
zfree(node_configs);
|
|
}
|
|
return signature;
|
|
}
|
|
|
|
static int clusterManagerIsConfigConsistent(void) {
|
|
if (cluster_manager.nodes == NULL) return 0;
|
|
int consistent = (listLength(cluster_manager.nodes) <= 1);
|
|
// If the Cluster has only one node, it's always consistent
|
|
if (consistent) return 1;
|
|
sds first_cfg = NULL;
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *node = ln->value;
|
|
sds cfg = clusterManagerGetConfigSignature(node);
|
|
if (cfg == NULL) {
|
|
consistent = 0;
|
|
break;
|
|
}
|
|
if (first_cfg == NULL) first_cfg = cfg;
|
|
else {
|
|
consistent = !sdscmp(first_cfg, cfg);
|
|
sdsfree(cfg);
|
|
if (!consistent) break;
|
|
}
|
|
}
|
|
if (first_cfg != NULL) sdsfree(first_cfg);
|
|
return consistent;
|
|
}
|
|
|
|
/* Add the error string to cluster_manager.errors and print it. */
|
|
static void clusterManagerOnError(sds err) {
|
|
if (cluster_manager.errors == NULL)
|
|
cluster_manager.errors = listCreate();
|
|
listAddNodeTail(cluster_manager.errors, err);
|
|
clusterManagerLogErr("%s\n", (char *) err);
|
|
}
|
|
|
|
/* Check the slots coverage of the cluster. The 'all_slots' argument must be
|
|
* and array of 16384 bytes. Every covered slot will be set to 1 in the
|
|
* 'all_slots' array. The function returns the total number if covered slots.*/
|
|
static int clusterManagerGetCoveredSlots(char *all_slots) {
|
|
if (cluster_manager.nodes == NULL) return 0;
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
int totslots = 0, i;
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *node = ln->value;
|
|
for (i = 0; i < CLUSTER_MANAGER_SLOTS; i++) {
|
|
if (node->slots[i] && !all_slots[i]) {
|
|
all_slots[i] = 1;
|
|
totslots++;
|
|
}
|
|
}
|
|
}
|
|
return totslots;
|
|
}
|
|
|
|
static void clusterManagerPrintSlotsList(list *slots) {
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(slots, &li);
|
|
sds first = NULL;
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
sds slot = ln->value;
|
|
if (!first) first = slot;
|
|
else printf(", ");
|
|
printf("%s", slot);
|
|
}
|
|
printf("\n");
|
|
}
|
|
|
|
/* Return the node, among 'nodes' with the greatest number of keys
|
|
* in the specified slot. */
|
|
static clusterManagerNode * clusterManagerGetNodeWithMostKeysInSlot(list *nodes,
|
|
int slot,
|
|
char **err)
|
|
{
|
|
clusterManagerNode *node = NULL;
|
|
int numkeys = 0;
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(nodes, &li);
|
|
if (err) *err = NULL;
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (n->flags & CLUSTER_MANAGER_FLAG_SLAVE || n->replicate)
|
|
continue;
|
|
redisReply *r =
|
|
CLUSTER_MANAGER_COMMAND(n, "CLUSTER COUNTKEYSINSLOT %d", slot);
|
|
int success = clusterManagerCheckRedisReply(n, r, err);
|
|
if (success) {
|
|
if (r->integer > numkeys || node == NULL) {
|
|
numkeys = r->integer;
|
|
node = n;
|
|
}
|
|
}
|
|
if (r != NULL) freeReplyObject(r);
|
|
/* If the reply contains errors */
|
|
if (!success) {
|
|
if (err != NULL && *err != NULL)
|
|
CLUSTER_MANAGER_PRINT_REPLY_ERROR(n, err);
|
|
node = NULL;
|
|
break;
|
|
}
|
|
}
|
|
return node;
|
|
}
|
|
|
|
/* This function returns the master that has the least number of replicas
|
|
* in the cluster. If there are multiple masters with the same smaller
|
|
* number of replicas, one at random is returned. */
|
|
|
|
static clusterManagerNode *clusterManagerNodeWithLeastReplicas() {
|
|
clusterManagerNode *node = NULL;
|
|
int lowest_count = 0;
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (n->flags & CLUSTER_MANAGER_FLAG_SLAVE) continue;
|
|
if (node == NULL || n->replicas_count < lowest_count) {
|
|
node = n;
|
|
lowest_count = n->replicas_count;
|
|
}
|
|
}
|
|
return node;
|
|
}
|
|
|
|
static int clusterManagerFixSlotsCoverage(char *all_slots) {
|
|
int i, fixed = 0;
|
|
list *none = NULL, *single = NULL, *multi = NULL;
|
|
clusterManagerLogInfo(">>> Fixing slots coverage...\n");
|
|
printf("List of not covered slots: \n");
|
|
int uncovered_count = 0;
|
|
sds log = sdsempty();
|
|
for (i = 0; i < CLUSTER_MANAGER_SLOTS; i++) {
|
|
int covered = all_slots[i];
|
|
if (!covered) {
|
|
sds key = sdsfromlonglong((long long) i);
|
|
if (uncovered_count++ > 0) printf(",");
|
|
printf("%s", (char *) key);
|
|
list *slot_nodes = listCreate();
|
|
sds slot_nodes_str = sdsempty();
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (n->flags & CLUSTER_MANAGER_FLAG_SLAVE || n->replicate)
|
|
continue;
|
|
redisReply *reply = CLUSTER_MANAGER_COMMAND(n,
|
|
"CLUSTER GETKEYSINSLOT %d %d", i, 1);
|
|
if (!clusterManagerCheckRedisReply(n, reply, NULL)) {
|
|
fixed = -1;
|
|
if (reply) freeReplyObject(reply);
|
|
goto cleanup;
|
|
}
|
|
assert(reply->type == REDIS_REPLY_ARRAY);
|
|
if (reply->elements > 0) {
|
|
listAddNodeTail(slot_nodes, n);
|
|
if (listLength(slot_nodes) > 1)
|
|
slot_nodes_str = sdscat(slot_nodes_str, ", ");
|
|
slot_nodes_str = sdscatfmt(slot_nodes_str,
|
|
"%s:%u", n->ip, n->port);
|
|
}
|
|
freeReplyObject(reply);
|
|
}
|
|
log = sdscatfmt(log, "\nSlot %S has keys in %u nodes: %S",
|
|
key, listLength(slot_nodes), slot_nodes_str);
|
|
sdsfree(slot_nodes_str);
|
|
dictAdd(clusterManagerUncoveredSlots, key, slot_nodes);
|
|
}
|
|
}
|
|
printf("\n%s\n", log);
|
|
/* For every slot, take action depending on the actual condition:
|
|
* 1) No node has keys for this slot.
|
|
* 2) A single node has keys for this slot.
|
|
* 3) Multiple nodes have keys for this slot. */
|
|
none = listCreate();
|
|
single = listCreate();
|
|
multi = listCreate();
|
|
dictIterator *iter = dictGetIterator(clusterManagerUncoveredSlots);
|
|
dictEntry *entry;
|
|
while ((entry = dictNext(iter)) != NULL) {
|
|
sds slot = (sds) dictGetKey(entry);
|
|
list *nodes = (list *) dictGetVal(entry);
|
|
switch (listLength(nodes)){
|
|
case 0: listAddNodeTail(none, slot); break;
|
|
case 1: listAddNodeTail(single, slot); break;
|
|
default: listAddNodeTail(multi, slot); break;
|
|
}
|
|
}
|
|
dictReleaseIterator(iter);
|
|
|
|
/* Handle case "1": keys in no node. */
|
|
if (listLength(none) > 0) {
|
|
printf("The following uncovered slots have no keys "
|
|
"across the cluster:\n");
|
|
clusterManagerPrintSlotsList(none);
|
|
if (confirmWithYes("Fix these slots by covering with a random node?")){
|
|
srand(time(NULL));
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(none, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
sds slot = ln->value;
|
|
long idx = (long) (rand() % listLength(cluster_manager.nodes));
|
|
listNode *node_n = listIndex(cluster_manager.nodes, idx);
|
|
assert(node_n != NULL);
|
|
clusterManagerNode *n = node_n->value;
|
|
clusterManagerLogInfo(">>> Covering slot %s with %s:%d\n",
|
|
slot, n->ip, n->port);
|
|
redisReply *r = CLUSTER_MANAGER_COMMAND(n,
|
|
"CLUSTER ADDSLOTS %s", slot);
|
|
if (!clusterManagerCheckRedisReply(n, r, NULL)) fixed = -1;
|
|
if (r) freeReplyObject(r);
|
|
if (fixed < 0) goto cleanup;
|
|
/* Since CLUSTER ADDSLOTS succeeded, we also update the slot
|
|
* info into the node struct, in order to keep it synced */
|
|
n->slots[atoi(slot)] = 1;
|
|
fixed++;
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Handle case "2": keys only in one node. */
|
|
if (listLength(single) > 0) {
|
|
printf("The following uncovered slots have keys in just one node:\n");
|
|
clusterManagerPrintSlotsList(single);
|
|
if (confirmWithYes("Fix these slots by covering with those nodes?")){
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(single, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
sds slot = ln->value;
|
|
dictEntry *entry = dictFind(clusterManagerUncoveredSlots, slot);
|
|
assert(entry != NULL);
|
|
list *nodes = (list *) dictGetVal(entry);
|
|
listNode *fn = listFirst(nodes);
|
|
assert(fn != NULL);
|
|
clusterManagerNode *n = fn->value;
|
|
clusterManagerLogInfo(">>> Covering slot %s with %s:%d\n",
|
|
slot, n->ip, n->port);
|
|
redisReply *r = CLUSTER_MANAGER_COMMAND(n,
|
|
"CLUSTER ADDSLOTS %s", slot);
|
|
if (!clusterManagerCheckRedisReply(n, r, NULL)) fixed = -1;
|
|
if (r) freeReplyObject(r);
|
|
if (fixed < 0) goto cleanup;
|
|
/* Since CLUSTER ADDSLOTS succeeded, we also update the slot
|
|
* info into the node struct, in order to keep it synced */
|
|
n->slots[atoi(slot)] = 1;
|
|
fixed++;
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Handle case "3": keys in multiple nodes. */
|
|
if (listLength(multi) > 0) {
|
|
printf("The following uncovered slots have keys in multiple nodes:\n");
|
|
clusterManagerPrintSlotsList(multi);
|
|
if (confirmWithYes("Fix these slots by moving keys "
|
|
"into a single node?")) {
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(multi, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
sds slot = ln->value;
|
|
dictEntry *entry = dictFind(clusterManagerUncoveredSlots, slot);
|
|
assert(entry != NULL);
|
|
list *nodes = (list *) dictGetVal(entry);
|
|
int s = atoi(slot);
|
|
clusterManagerNode *target =
|
|
clusterManagerGetNodeWithMostKeysInSlot(nodes, s, NULL);
|
|
if (target == NULL) {
|
|
fixed = -1;
|
|
goto cleanup;
|
|
}
|
|
clusterManagerLogInfo(">>> Covering slot %s moving keys "
|
|
"to %s:%d\n", slot,
|
|
target->ip, target->port);
|
|
redisReply *r = CLUSTER_MANAGER_COMMAND(target,
|
|
"CLUSTER ADDSLOTS %s", slot);
|
|
if (!clusterManagerCheckRedisReply(target, r, NULL)) fixed = -1;
|
|
if (r) freeReplyObject(r);
|
|
if (fixed < 0) goto cleanup;
|
|
r = CLUSTER_MANAGER_COMMAND(target,
|
|
"CLUSTER SETSLOT %s %s", slot, "STABLE");
|
|
if (!clusterManagerCheckRedisReply(target, r, NULL)) fixed = -1;
|
|
if (r) freeReplyObject(r);
|
|
if (fixed < 0) goto cleanup;
|
|
/* Since CLUSTER ADDSLOTS succeeded, we also update the slot
|
|
* info into the node struct, in order to keep it synced */
|
|
target->slots[atoi(slot)] = 1;
|
|
listIter nli;
|
|
listNode *nln;
|
|
listRewind(nodes, &nli);
|
|
while ((nln = listNext(&nli)) != NULL) {
|
|
clusterManagerNode *src = nln->value;
|
|
if (src == target) continue;
|
|
/* Set the source node in 'importing' state
|
|
* (even if we will actually migrate keys away)
|
|
* in order to avoid receiving redirections
|
|
* for MIGRATE. */
|
|
redisReply *r = CLUSTER_MANAGER_COMMAND(src,
|
|
"CLUSTER SETSLOT %s %s %s", slot,
|
|
"IMPORTING", target->name);
|
|
if (!clusterManagerCheckRedisReply(target, r, NULL))
|
|
fixed = -1;
|
|
if (r) freeReplyObject(r);
|
|
if (fixed < 0) goto cleanup;
|
|
int opts = CLUSTER_MANAGER_OPT_VERBOSE |
|
|
CLUSTER_MANAGER_OPT_COLD;
|
|
if (!clusterManagerMoveSlot(src, target, s, opts, NULL)) {
|
|
fixed = -1;
|
|
goto cleanup;
|
|
}
|
|
}
|
|
fixed++;
|
|
}
|
|
}
|
|
}
|
|
cleanup:
|
|
sdsfree(log);
|
|
if (none) listRelease(none);
|
|
if (single) listRelease(single);
|
|
if (multi) listRelease(multi);
|
|
return fixed;
|
|
}
|
|
|
|
/* Slot 'slot' was found to be in importing or migrating state in one or
|
|
* more nodes. This function fixes this condition by migrating keys where
|
|
* it seems more sensible. */
|
|
static int clusterManagerFixOpenSlot(int slot) {
|
|
clusterManagerLogInfo(">>> Fixing open slot %d\n", slot);
|
|
/* Try to obtain the current slot owner, according to the current
|
|
* nodes configuration. */
|
|
int success = 1;
|
|
list *owners = listCreate();
|
|
list *migrating = listCreate();
|
|
list *importing = listCreate();
|
|
sds migrating_str = sdsempty();
|
|
sds importing_str = sdsempty();
|
|
clusterManagerNode *owner = NULL;
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (n->flags & CLUSTER_MANAGER_FLAG_SLAVE) continue;
|
|
if (n->slots[slot]) {
|
|
if (owner == NULL) owner = n;
|
|
listAddNodeTail(owners, n);
|
|
}
|
|
}
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (n->flags & CLUSTER_MANAGER_FLAG_SLAVE) continue;
|
|
if (n->migrating) {
|
|
for (int i = 0; i < n->migrating_count; i += 2) {
|
|
sds migrating_slot = n->migrating[i];
|
|
if (atoi(migrating_slot) == slot) {
|
|
char *sep = (listLength(migrating) == 0 ? "" : ",");
|
|
migrating_str = sdscatfmt(migrating_str, "%s%S:%u",
|
|
sep, n->ip, n->port);
|
|
listAddNodeTail(migrating, n);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
if (n->importing) {
|
|
for (int i = 0; i < n->importing_count; i += 2) {
|
|
sds importing_slot = n->importing[i];
|
|
if (atoi(importing_slot) == slot) {
|
|
char *sep = (listLength(importing) == 0 ? "" : ",");
|
|
importing_str = sdscatfmt(importing_str, "%s%S:%u",
|
|
sep, n->ip, n->port);
|
|
listAddNodeTail(importing, n);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
printf("Set as migrating in: %s\n", migrating_str);
|
|
printf("Set as importing in: %s\n", importing_str);
|
|
/* If there is no slot owner, set as owner the slot with the biggest
|
|
* number of keys, among the set of migrating / importing nodes. */
|
|
if (owner == NULL) {
|
|
clusterManagerLogInfo(">>> Nobody claims ownership, "
|
|
"selecting an owner...\n");
|
|
owner = clusterManagerGetNodeWithMostKeysInSlot(cluster_manager.nodes,
|
|
slot, NULL);
|
|
// If we still don't have an owner, we can't fix it.
|
|
if (owner == NULL) {
|
|
clusterManagerLogErr("[ERR] Can't select a slot owner. "
|
|
"Impossible to fix.\n");
|
|
success = 0;
|
|
goto cleanup;
|
|
}
|
|
|
|
// Use ADDSLOTS to assign the slot.
|
|
clusterManagerLogWarn("*** Configuring %s:%d as the slot owner\n",
|
|
owner->ip, owner->port);
|
|
redisReply *reply = CLUSTER_MANAGER_COMMAND(owner, "CLUSTER "
|
|
"SETSLOT %d %s",
|
|
slot, "STABLE");
|
|
success = clusterManagerCheckRedisReply(owner, reply, NULL);
|
|
if (reply) freeReplyObject(reply);
|
|
if (!success) goto cleanup;
|
|
reply = CLUSTER_MANAGER_COMMAND(owner, "CLUSTER ADDSLOTS %d", slot);
|
|
success = clusterManagerCheckRedisReply(owner, reply, NULL);
|
|
if (reply) freeReplyObject(reply);
|
|
if (!success) goto cleanup;
|
|
/* Since CLUSTER ADDSLOTS succeeded, we also update the slot
|
|
* info into the node struct, in order to keep it synced */
|
|
owner->slots[slot] = 1;
|
|
/* Make sure this information will propagate. Not strictly needed
|
|
* since there is no past owner, so all the other nodes will accept
|
|
* whatever epoch this node will claim the slot with. */
|
|
reply = CLUSTER_MANAGER_COMMAND(owner, "CLUSTER BUMPEPOCH");
|
|
success = clusterManagerCheckRedisReply(owner, reply, NULL);
|
|
if (reply) freeReplyObject(reply);
|
|
if (!success) goto cleanup;
|
|
/* Remove the owner from the list of migrating/importing
|
|
* nodes. */
|
|
clusterManagerRemoveNodeFromList(migrating, owner);
|
|
clusterManagerRemoveNodeFromList(importing, owner);
|
|
}
|
|
/* If there are multiple owners of the slot, we need to fix it
|
|
* so that a single node is the owner and all the other nodes
|
|
* are in importing state. Later the fix can be handled by one
|
|
* of the base cases above.
|
|
*
|
|
* Note that this case also covers multiple nodes having the slot
|
|
* in migrating state, since migrating is a valid state only for
|
|
* slot owners. */
|
|
if (listLength(owners) > 1) {
|
|
owner = clusterManagerGetNodeWithMostKeysInSlot(owners, slot, NULL);
|
|
listRewind(owners, &li);
|
|
redisReply *reply = NULL;
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (n == owner) continue;
|
|
reply = CLUSTER_MANAGER_COMMAND(n, "CLUSTER DELSLOT %d", slot);
|
|
success = clusterManagerCheckRedisReply(n, reply, NULL);
|
|
if (reply) freeReplyObject(reply);
|
|
if (!success) goto cleanup;
|
|
success = clusterManagerSetSlot(n, owner, slot, "importing", NULL);
|
|
if (!success) goto cleanup;
|
|
clusterManagerRemoveNodeFromList(importing, n); //Avoid duplicates
|
|
listAddNodeTail(importing, n);
|
|
}
|
|
reply = CLUSTER_MANAGER_COMMAND(owner, "CLUSTER BUMPEPOCH");
|
|
success = clusterManagerCheckRedisReply(owner, reply, NULL);
|
|
if (reply) freeReplyObject(reply);
|
|
if (!success) goto cleanup;
|
|
}
|
|
int move_opts = CLUSTER_MANAGER_OPT_VERBOSE;
|
|
/* Case 1: The slot is in migrating state in one slot, and in
|
|
* importing state in 1 slot. That's trivial to address. */
|
|
if (listLength(migrating) == 1 && listLength(importing) == 1) {
|
|
clusterManagerNode *src = listFirst(migrating)->value;
|
|
clusterManagerNode *dst = listFirst(importing)->value;
|
|
success = clusterManagerMoveSlot(src, dst, slot, move_opts, NULL);
|
|
}
|
|
/* Case 2: There are multiple nodes that claim the slot as importing,
|
|
* they probably got keys about the slot after a restart so opened
|
|
* the slot. In this case we just move all the keys to the owner
|
|
* according to the configuration. */
|
|
else if (listLength(migrating) == 0 && listLength(importing) > 0) {
|
|
clusterManagerLogInfo(">>> Moving all the %d slot keys to its "
|
|
"owner %s:%d\n", slot, owner->ip, owner->port);
|
|
move_opts |= CLUSTER_MANAGER_OPT_COLD;
|
|
listRewind(importing, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (n == owner) continue;
|
|
success = clusterManagerMoveSlot(n, owner, slot, move_opts, NULL);
|
|
if (!success) goto cleanup;
|
|
clusterManagerLogInfo(">>> Setting %d as STABLE in "
|
|
"%s:%d\n", slot, n->ip, n->port);
|
|
|
|
redisReply *r = CLUSTER_MANAGER_COMMAND(n, "CLUSTER SETSLOT %d %s",
|
|
slot, "STABLE");
|
|
success = clusterManagerCheckRedisReply(n, r, NULL);
|
|
if (r) freeReplyObject(r);
|
|
if (!success) goto cleanup;
|
|
}
|
|
} else {
|
|
int try_to_close_slot = (listLength(importing) == 0 &&
|
|
listLength(migrating) == 1);
|
|
if (try_to_close_slot) {
|
|
clusterManagerNode *n = listFirst(migrating)->value;
|
|
redisReply *r = CLUSTER_MANAGER_COMMAND(n,
|
|
"CLUSTER GETKEYSINSLOT %d %d", slot, 10);
|
|
success = clusterManagerCheckRedisReply(n, r, NULL);
|
|
if (r) {
|
|
if (success) try_to_close_slot = (r->elements == 0);
|
|
freeReplyObject(r);
|
|
}
|
|
if (!success) goto cleanup;
|
|
}
|
|
/* Case 3: There are no slots claiming to be in importing state, but
|
|
* there is a migrating node that actually don't have any key. We
|
|
* can just close the slot, probably a reshard interrupted in the middle. */
|
|
if (try_to_close_slot) {
|
|
clusterManagerNode *n = listFirst(migrating)->value;
|
|
redisReply *r = CLUSTER_MANAGER_COMMAND(n, "CLUSTER SETSLOT %d %s",
|
|
slot, "STABLE");
|
|
success = clusterManagerCheckRedisReply(n, r, NULL);
|
|
if (r) freeReplyObject(r);
|
|
if (!success) goto cleanup;
|
|
} else {
|
|
success = 0;
|
|
clusterManagerLogErr("[ERR] Sorry, redis-cli can't fix this slot "
|
|
"yet (work in progress). Slot is set as "
|
|
"migrating in %s, as importing in %s, "
|
|
"owner is %s:%d\n", migrating_str,
|
|
importing_str, owner->ip, owner->port);
|
|
}
|
|
}
|
|
cleanup:
|
|
listRelease(owners);
|
|
listRelease(migrating);
|
|
listRelease(importing);
|
|
sdsfree(migrating_str);
|
|
sdsfree(importing_str);
|
|
return success;
|
|
}
|
|
|
|
static int clusterManagerCheckCluster(int quiet) {
|
|
listNode *ln = listFirst(cluster_manager.nodes);
|
|
if (!ln) return 0;
|
|
int result = 1;
|
|
int do_fix = config.cluster_manager_command.flags &
|
|
CLUSTER_MANAGER_CMD_FLAG_FIX;
|
|
clusterManagerNode *node = ln->value;
|
|
clusterManagerLogInfo(">>> Performing Cluster Check (using node %s:%d)\n",
|
|
node->ip, node->port);
|
|
if (!quiet) clusterManagerShowNodes();
|
|
if (!clusterManagerIsConfigConsistent()) {
|
|
sds err = sdsnew("[ERR] Nodes don't agree about configuration!");
|
|
clusterManagerOnError(err);
|
|
result = 0;
|
|
} else {
|
|
clusterManagerLogOk("[OK] All nodes agree about slots "
|
|
"configuration.\n");
|
|
}
|
|
// Check open slots
|
|
clusterManagerLogInfo(">>> Check for open slots...\n");
|
|
listIter li;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
int i;
|
|
dict *open_slots = NULL;
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (n->migrating != NULL) {
|
|
if (open_slots == NULL)
|
|
open_slots = dictCreate(&clusterManagerDictType, NULL);
|
|
sds errstr = sdsempty();
|
|
errstr = sdscatprintf(errstr,
|
|
"[WARNING] Node %s:%d has slots in "
|
|
"migrating state ",
|
|
n->ip,
|
|
n->port);
|
|
for (i = 0; i < n->migrating_count; i += 2) {
|
|
sds slot = n->migrating[i];
|
|
dictAdd(open_slots, slot, sdsdup(n->migrating[i + 1]));
|
|
char *fmt = (i > 0 ? ",%S" : "%S");
|
|
errstr = sdscatfmt(errstr, fmt, slot);
|
|
}
|
|
errstr = sdscat(errstr, ".");
|
|
clusterManagerOnError(errstr);
|
|
}
|
|
if (n->importing != NULL) {
|
|
if (open_slots == NULL)
|
|
open_slots = dictCreate(&clusterManagerDictType, NULL);
|
|
sds errstr = sdsempty();
|
|
errstr = sdscatprintf(errstr,
|
|
"[WARNING] Node %s:%d has slots in "
|
|
"importing state ",
|
|
n->ip,
|
|
n->port);
|
|
for (i = 0; i < n->importing_count; i += 2) {
|
|
sds slot = n->importing[i];
|
|
dictAdd(open_slots, slot, sdsdup(n->importing[i + 1]));
|
|
char *fmt = (i > 0 ? ",%S" : "%S");
|
|
errstr = sdscatfmt(errstr, fmt, slot);
|
|
}
|
|
errstr = sdscat(errstr, ".");
|
|
clusterManagerOnError(errstr);
|
|
}
|
|
}
|
|
if (open_slots != NULL) {
|
|
result = 0;
|
|
dictIterator *iter = dictGetIterator(open_slots);
|
|
dictEntry *entry;
|
|
sds errstr = sdsnew("[WARNING] The following slots are open: ");
|
|
i = 0;
|
|
while ((entry = dictNext(iter)) != NULL) {
|
|
sds slot = (sds) dictGetKey(entry);
|
|
char *fmt = (i++ > 0 ? ",%S" : "%S");
|
|
errstr = sdscatfmt(errstr, fmt, slot);
|
|
}
|
|
clusterManagerLogErr("%s.\n", (char *) errstr);
|
|
sdsfree(errstr);
|
|
if (do_fix) {
|
|
// Fix open slots.
|
|
dictReleaseIterator(iter);
|
|
iter = dictGetIterator(open_slots);
|
|
while ((entry = dictNext(iter)) != NULL) {
|
|
sds slot = (sds) dictGetKey(entry);
|
|
result = clusterManagerFixOpenSlot(atoi(slot));
|
|
if (!result) break;
|
|
}
|
|
}
|
|
dictReleaseIterator(iter);
|
|
dictRelease(open_slots);
|
|
}
|
|
clusterManagerLogInfo(">>> Check slots coverage...\n");
|
|
char slots[CLUSTER_MANAGER_SLOTS];
|
|
memset(slots, 0, CLUSTER_MANAGER_SLOTS);
|
|
int coverage = clusterManagerGetCoveredSlots(slots);
|
|
if (coverage == CLUSTER_MANAGER_SLOTS) {
|
|
clusterManagerLogOk("[OK] All %d slots covered.\n",
|
|
CLUSTER_MANAGER_SLOTS);
|
|
} else {
|
|
sds err = sdsempty();
|
|
err = sdscatprintf(err, "[ERR] Not all %d slots are "
|
|
"covered by nodes.\n",
|
|
CLUSTER_MANAGER_SLOTS);
|
|
clusterManagerOnError(err);
|
|
result = 0;
|
|
if (do_fix/* && result*/) {
|
|
dictType dtype = clusterManagerDictType;
|
|
dtype.valDestructor = dictListDestructor;
|
|
clusterManagerUncoveredSlots = dictCreate(&dtype, NULL);
|
|
int fixed = clusterManagerFixSlotsCoverage(slots);
|
|
if (fixed > 0) result = 1;
|
|
}
|
|
}
|
|
return result;
|
|
}
|
|
|
|
static clusterManagerNode *clusterNodeForResharding(char *id,
|
|
clusterManagerNode *target,
|
|
int *raise_err)
|
|
{
|
|
clusterManagerNode *node = NULL;
|
|
const char *invalid_node_msg = "*** The specified node (%s) is not known "
|
|
"or not a master, please retry.\n";
|
|
node = clusterManagerNodeByName(id);
|
|
*raise_err = 0;
|
|
if (!node || node->flags & CLUSTER_MANAGER_FLAG_SLAVE) {
|
|
clusterManagerLogErr(invalid_node_msg, id);
|
|
*raise_err = 1;
|
|
return NULL;
|
|
} else if (node != NULL && target != NULL) {
|
|
if (!strcmp(node->name, target->name)) {
|
|
clusterManagerLogErr( "*** It is not possible to use "
|
|
"the target node as "
|
|
"source node.\n");
|
|
return NULL;
|
|
}
|
|
}
|
|
return node;
|
|
}
|
|
|
|
static list *clusterManagerComputeReshardTable(list *sources, int numslots) {
|
|
list *moved = listCreate();
|
|
int src_count = listLength(sources), i = 0, tot_slots = 0, j;
|
|
clusterManagerNode **sorted = zmalloc(src_count * sizeof(**sorted));
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(sources, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *node = ln->value;
|
|
tot_slots += node->slots_count;
|
|
sorted[i++] = node;
|
|
}
|
|
qsort(sorted, src_count, sizeof(clusterManagerNode *),
|
|
clusterManagerSlotCountCompareDesc);
|
|
for (i = 0; i < src_count; i++) {
|
|
clusterManagerNode *node = sorted[i];
|
|
float n = ((float) numslots / tot_slots * node->slots_count);
|
|
if (i == 0) n = ceil(n);
|
|
else n = floor(n);
|
|
int max = (int) n, count = 0;
|
|
for (j = 0; j < CLUSTER_MANAGER_SLOTS; j++) {
|
|
int slot = node->slots[j];
|
|
if (!slot) continue;
|
|
if (count >= max || (int)listLength(moved) >= numslots) break;
|
|
clusterManagerReshardTableItem *item = zmalloc(sizeof(*item));
|
|
item->source = node;
|
|
item->slot = j;
|
|
listAddNodeTail(moved, item);
|
|
count++;
|
|
}
|
|
}
|
|
zfree(sorted);
|
|
return moved;
|
|
}
|
|
|
|
static void clusterManagerShowReshardTable(list *table) {
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(table, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerReshardTableItem *item = ln->value;
|
|
clusterManagerNode *n = item->source;
|
|
printf(" Moving slot %d from %s\n", item->slot, (char *) n->name);
|
|
}
|
|
}
|
|
|
|
static void clusterManagerReleaseReshardTable(list *table) {
|
|
if (table != NULL) {
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(table, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerReshardTableItem *item = ln->value;
|
|
zfree(item);
|
|
}
|
|
listRelease(table);
|
|
}
|
|
}
|
|
|
|
static void clusterManagerLog(int level, const char* fmt, ...) {
|
|
int use_colors =
|
|
(config.cluster_manager_command.flags & CLUSTER_MANAGER_CMD_FLAG_COLOR);
|
|
if (use_colors) {
|
|
printf("\033[");
|
|
switch (level) {
|
|
case CLUSTER_MANAGER_LOG_LVL_INFO: printf(LOG_COLOR_BOLD); break;
|
|
case CLUSTER_MANAGER_LOG_LVL_WARN: printf(LOG_COLOR_YELLOW); break;
|
|
case CLUSTER_MANAGER_LOG_LVL_ERR: printf(LOG_COLOR_RED); break;
|
|
case CLUSTER_MANAGER_LOG_LVL_SUCCESS: printf(LOG_COLOR_GREEN); break;
|
|
default: printf(LOG_COLOR_RESET); break;
|
|
}
|
|
}
|
|
va_list ap;
|
|
va_start(ap, fmt);
|
|
vprintf(fmt, ap);
|
|
va_end(ap);
|
|
if (use_colors) printf("\033[" LOG_COLOR_RESET);
|
|
}
|
|
|
|
static void clusterManagerNodeArrayInit(clusterManagerNodeArray *array,
|
|
int alloc_len)
|
|
{
|
|
array->nodes = zcalloc(alloc_len * sizeof(clusterManagerNode*));
|
|
array->alloc = array->nodes;
|
|
array->len = alloc_len;
|
|
array->count = 0;
|
|
}
|
|
|
|
/* Reset array->nodes to the original array allocation and re-count non-NULL
|
|
* nodes. */
|
|
static void clusterManagerNodeArrayReset(clusterManagerNodeArray *array) {
|
|
if (array->nodes > array->alloc) {
|
|
array->len = array->nodes - array->alloc;
|
|
array->nodes = array->alloc;
|
|
array->count = 0;
|
|
int i = 0;
|
|
for(; i < array->len; i++) {
|
|
if (array->nodes[i] != NULL) array->count++;
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Shift array->nodes and store the shifted node into 'nodeptr'. */
|
|
static void clusterManagerNodeArrayShift(clusterManagerNodeArray *array,
|
|
clusterManagerNode **nodeptr)
|
|
{
|
|
assert(array->nodes < (array->nodes + array->len));
|
|
/* If the first node to be shifted is not NULL, decrement count. */
|
|
if (*array->nodes != NULL) array->count--;
|
|
/* Store the first node to be shifted into 'nodeptr'. */
|
|
*nodeptr = *array->nodes;
|
|
/* Shift the nodes array and decrement length. */
|
|
array->nodes++;
|
|
array->len--;
|
|
}
|
|
|
|
static void clusterManagerNodeArrayAdd(clusterManagerNodeArray *array,
|
|
clusterManagerNode *node)
|
|
{
|
|
assert(array->nodes < (array->nodes + array->len));
|
|
assert(node != NULL);
|
|
assert(array->count < array->len);
|
|
array->nodes[array->count++] = node;
|
|
}
|
|
|
|
static void clusterManagerPrintNotEmptyNodeError(clusterManagerNode *node,
|
|
char *err)
|
|
{
|
|
char *msg;
|
|
if (err) msg = err;
|
|
else {
|
|
msg = "is not empty. Either the node already knows other "
|
|
"nodes (check with CLUSTER NODES) or contains some "
|
|
"key in database 0.";
|
|
}
|
|
clusterManagerLogErr("[ERR] Node %s:%d %s\n", node->ip, node->port, msg);
|
|
}
|
|
|
|
static void clusterManagerPrintNotClusterNodeError(clusterManagerNode *node,
|
|
char *err)
|
|
{
|
|
char *msg = (err ? err : "is not configured as a cluster node.");
|
|
clusterManagerLogErr("[ERR] Node %s:%d %s\n", node->ip, node->port, msg);
|
|
}
|
|
|
|
/* Execute redis-cli in Cluster Manager mode */
|
|
static void clusterManagerMode(clusterManagerCommandProc *proc) {
|
|
int argc = config.cluster_manager_command.argc;
|
|
char **argv = config.cluster_manager_command.argv;
|
|
cluster_manager.nodes = NULL;
|
|
if (!proc(argc, argv)) goto cluster_manager_err;
|
|
freeClusterManager();
|
|
exit(0);
|
|
cluster_manager_err:
|
|
freeClusterManager();
|
|
sdsfree(config.hostip);
|
|
sdsfree(config.mb_delim);
|
|
exit(1);
|
|
}
|
|
|
|
/* Cluster Manager Commands */
|
|
|
|
static int clusterManagerCommandCreate(int argc, char **argv) {
|
|
int i, j, success = 1;
|
|
cluster_manager.nodes = listCreate();
|
|
for (i = 0; i < argc; i++) {
|
|
char *addr = argv[i];
|
|
char *c = strrchr(addr, '@');
|
|
if (c != NULL) *c = '\0';
|
|
c = strrchr(addr, ':');
|
|
if (c == NULL) {
|
|
fprintf(stderr, "Invalid address format: %s\n", addr);
|
|
return 0;
|
|
}
|
|
*c = '\0';
|
|
char *ip = addr;
|
|
int port = atoi(++c);
|
|
clusterManagerNode *node = clusterManagerNewNode(ip, port);
|
|
CLUSTER_MANAGER_NODE_CONNECT(node);
|
|
if (node->context->err) {
|
|
fprintf(stderr,"Could not connect to Redis at ");
|
|
fprintf(stderr,"%s:%d: %s\n", ip, port, node->context->errstr);
|
|
freeClusterManagerNode(node);
|
|
return 0;
|
|
}
|
|
char *err = NULL;
|
|
if (!clusterManagerNodeIsCluster(node, &err)) {
|
|
clusterManagerPrintNotClusterNodeError(node, err);
|
|
if (err) zfree(err);
|
|
freeClusterManagerNode(node);
|
|
return 0;
|
|
}
|
|
err = NULL;
|
|
if (!clusterManagerNodeLoadInfo(node, 0, &err)) {
|
|
if (err) {
|
|
CLUSTER_MANAGER_PRINT_REPLY_ERROR(node, err);
|
|
zfree(err);
|
|
}
|
|
freeClusterManagerNode(node);
|
|
return 0;
|
|
}
|
|
err = NULL;
|
|
if (!clusterManagerNodeIsEmpty(node, &err)) {
|
|
clusterManagerPrintNotEmptyNodeError(node, err);
|
|
if (err) zfree(err);
|
|
freeClusterManagerNode(node);
|
|
return 0;
|
|
}
|
|
listAddNodeTail(cluster_manager.nodes, node);
|
|
}
|
|
int node_len = cluster_manager.nodes->len;
|
|
int replicas = config.cluster_manager_command.replicas;
|
|
int masters_count = CLUSTER_MANAGER_MASTERS_COUNT(node_len, replicas);
|
|
if (masters_count < 3) {
|
|
clusterManagerLogErr(
|
|
"*** ERROR: Invalid configuration for cluster creation.\n"
|
|
"*** Redis Cluster requires at least 3 master nodes.\n"
|
|
"*** This is not possible with %d nodes and %d replicas per node.",
|
|
node_len, replicas);
|
|
clusterManagerLogErr("\n*** At least %d nodes are required.\n",
|
|
3 * (replicas + 1));
|
|
return 0;
|
|
}
|
|
clusterManagerLogInfo(">>> Performing hash slots allocation "
|
|
"on %d nodes...\n", node_len);
|
|
int interleaved_len = 0, ip_count = 0;
|
|
clusterManagerNode **interleaved = zcalloc(node_len*sizeof(**interleaved));
|
|
char **ips = zcalloc(node_len * sizeof(char*));
|
|
clusterManagerNodeArray *ip_nodes = zcalloc(node_len * sizeof(*ip_nodes));
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
int found = 0;
|
|
for (i = 0; i < ip_count; i++) {
|
|
char *ip = ips[i];
|
|
if (!strcmp(ip, n->ip)) {
|
|
found = 1;
|
|
break;
|
|
}
|
|
}
|
|
if (!found) {
|
|
ips[ip_count++] = n->ip;
|
|
}
|
|
clusterManagerNodeArray *node_array = &(ip_nodes[i]);
|
|
if (node_array->nodes == NULL)
|
|
clusterManagerNodeArrayInit(node_array, node_len);
|
|
clusterManagerNodeArrayAdd(node_array, n);
|
|
}
|
|
while (interleaved_len < node_len) {
|
|
for (i = 0; i < ip_count; i++) {
|
|
clusterManagerNodeArray *node_array = &(ip_nodes[i]);
|
|
if (node_array->count > 0) {
|
|
clusterManagerNode *n = NULL;
|
|
clusterManagerNodeArrayShift(node_array, &n);
|
|
interleaved[interleaved_len++] = n;
|
|
}
|
|
}
|
|
}
|
|
clusterManagerNode **masters = interleaved;
|
|
interleaved += masters_count;
|
|
interleaved_len -= masters_count;
|
|
float slots_per_node = CLUSTER_MANAGER_SLOTS / (float) masters_count;
|
|
long first = 0;
|
|
float cursor = 0.0f;
|
|
for (i = 0; i < masters_count; i++) {
|
|
clusterManagerNode *master = masters[i];
|
|
long last = lround(cursor + slots_per_node - 1);
|
|
if (last > CLUSTER_MANAGER_SLOTS || i == (masters_count - 1))
|
|
last = CLUSTER_MANAGER_SLOTS - 1;
|
|
if (last < first) last = first;
|
|
printf("Master[%d] -> Slots %lu - %lu\n", i, first, last);
|
|
master->slots_count = 0;
|
|
for (j = first; j <= last; j++) {
|
|
master->slots[j] = 1;
|
|
master->slots_count++;
|
|
}
|
|
master->dirty = 1;
|
|
first = last + 1;
|
|
cursor += slots_per_node;
|
|
}
|
|
|
|
int assign_unused = 0, available_count = interleaved_len;
|
|
assign_replicas:
|
|
for (i = 0; i < masters_count; i++) {
|
|
clusterManagerNode *master = masters[i];
|
|
int assigned_replicas = 0;
|
|
while (assigned_replicas < replicas) {
|
|
if (available_count == 0) break;
|
|
clusterManagerNode *found = NULL, *slave = NULL;
|
|
int firstNodeIdx = -1;
|
|
for (j = 0; j < interleaved_len; j++) {
|
|
clusterManagerNode *n = interleaved[j];
|
|
if (n == NULL) continue;
|
|
if (strcmp(n->ip, master->ip)) {
|
|
found = n;
|
|
interleaved[j] = NULL;
|
|
break;
|
|
}
|
|
if (firstNodeIdx < 0) firstNodeIdx = j;
|
|
}
|
|
if (found) slave = found;
|
|
else if (firstNodeIdx >= 0) {
|
|
slave = interleaved[firstNodeIdx];
|
|
interleaved_len -= (interleaved - (interleaved + firstNodeIdx));
|
|
interleaved += (firstNodeIdx + 1);
|
|
}
|
|
if (slave != NULL) {
|
|
assigned_replicas++;
|
|
available_count--;
|
|
if (slave->replicate) sdsfree(slave->replicate);
|
|
slave->replicate = sdsnew(master->name);
|
|
slave->dirty = 1;
|
|
} else break;
|
|
printf("Adding replica %s:%d to %s:%d\n", slave->ip, slave->port,
|
|
master->ip, master->port);
|
|
if (assign_unused) break;
|
|
}
|
|
}
|
|
if (!assign_unused && available_count > 0) {
|
|
assign_unused = 1;
|
|
printf("Adding extra replicas...\n");
|
|
goto assign_replicas;
|
|
}
|
|
for (i = 0; i < ip_count; i++) {
|
|
clusterManagerNodeArray *node_array = ip_nodes + i;
|
|
clusterManagerNodeArrayReset(node_array);
|
|
}
|
|
clusterManagerOptimizeAntiAffinity(ip_nodes, ip_count);
|
|
clusterManagerShowNodes();
|
|
if (confirmWithYes("Can I set the above configuration?")) {
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *node = ln->value;
|
|
char *err = NULL;
|
|
int flushed = clusterManagerFlushNodeConfig(node, &err);
|
|
if (!flushed && node->dirty && !node->replicate) {
|
|
if (err != NULL) {
|
|
CLUSTER_MANAGER_PRINT_REPLY_ERROR(node, err);
|
|
zfree(err);
|
|
}
|
|
success = 0;
|
|
goto cleanup;
|
|
} else if (err != NULL) zfree(err);
|
|
}
|
|
clusterManagerLogInfo(">>> Nodes configuration updated\n");
|
|
clusterManagerLogInfo(">>> Assign a different config epoch to "
|
|
"each node\n");
|
|
int config_epoch = 1;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *node = ln->value;
|
|
redisReply *reply = NULL;
|
|
reply = CLUSTER_MANAGER_COMMAND(node,
|
|
"cluster set-config-epoch %d",
|
|
config_epoch++);
|
|
if (reply != NULL) freeReplyObject(reply);
|
|
}
|
|
clusterManagerLogInfo(">>> Sending CLUSTER MEET messages to join "
|
|
"the cluster\n");
|
|
clusterManagerNode *first = NULL;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *node = ln->value;
|
|
if (first == NULL) {
|
|
first = node;
|
|
continue;
|
|
}
|
|
redisReply *reply = NULL;
|
|
reply = CLUSTER_MANAGER_COMMAND(node, "cluster meet %s %d",
|
|
first->ip, first->port);
|
|
int is_err = 0;
|
|
if (reply != NULL) {
|
|
if ((is_err = reply->type == REDIS_REPLY_ERROR))
|
|
CLUSTER_MANAGER_PRINT_REPLY_ERROR(node, reply->str);
|
|
freeReplyObject(reply);
|
|
} else {
|
|
is_err = 1;
|
|
fprintf(stderr, "Failed to send CLUSTER MEET command.\n");
|
|
}
|
|
if (is_err) {
|
|
success = 0;
|
|
goto cleanup;
|
|
}
|
|
}
|
|
/* Give one second for the join to start, in order to avoid that
|
|
* waiting for cluster join will find all the nodes agree about
|
|
* the config as they are still empty with unassigned slots. */
|
|
sleep(1);
|
|
clusterManagerWaitForClusterJoin();
|
|
/* Useful for the replicas */
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *node = ln->value;
|
|
if (!node->dirty) continue;
|
|
char *err = NULL;
|
|
int flushed = clusterManagerFlushNodeConfig(node, &err);
|
|
if (!flushed && !node->replicate) {
|
|
if (err != NULL) {
|
|
CLUSTER_MANAGER_PRINT_REPLY_ERROR(node, err);
|
|
zfree(err);
|
|
}
|
|
success = 0;
|
|
goto cleanup;
|
|
}
|
|
}
|
|
// Reset Nodes
|
|
listRewind(cluster_manager.nodes, &li);
|
|
clusterManagerNode *first_node = NULL;
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *node = ln->value;
|
|
if (!first_node) first_node = node;
|
|
else freeClusterManagerNode(node);
|
|
}
|
|
listEmpty(cluster_manager.nodes);
|
|
if (!clusterManagerLoadInfoFromNode(first_node, 0)) {
|
|
success = 0;
|
|
goto cleanup;
|
|
}
|
|
clusterManagerCheckCluster(0);
|
|
}
|
|
cleanup:
|
|
/* Free everything */
|
|
zfree(masters);
|
|
zfree(ips);
|
|
for (i = 0; i < node_len; i++) {
|
|
clusterManagerNodeArray *node_array = ip_nodes + i;
|
|
CLUSTER_MANAGER_NODE_ARRAY_FREE(node_array);
|
|
}
|
|
zfree(ip_nodes);
|
|
return success;
|
|
}
|
|
|
|
static int clusterManagerCommandAddNode(int argc, char **argv) {
|
|
int success = 1;
|
|
redisReply *reply = NULL;
|
|
char *ref_ip = NULL, *ip = NULL;
|
|
int ref_port = 0, port = 0;
|
|
if (!getClusterHostFromCmdArgs(argc - 1, argv + 1, &ref_ip, &ref_port))
|
|
goto invalid_args;
|
|
if (!getClusterHostFromCmdArgs(1, argv, &ip, &port))
|
|
goto invalid_args;
|
|
clusterManagerLogInfo(">>> Adding node %s:%d to cluster %s:%d\n", ip, port,
|
|
ref_ip, ref_port);
|
|
// Check the existing cluster
|
|
clusterManagerNode *refnode = clusterManagerNewNode(ref_ip, ref_port);
|
|
if (!clusterManagerLoadInfoFromNode(refnode, 0)) return 0;
|
|
if (!clusterManagerCheckCluster(0)) return 0;
|
|
|
|
/* If --cluster-master-id was specified, try to resolve it now so that we
|
|
* abort before starting with the node configuration. */
|
|
clusterManagerNode *master_node = NULL;
|
|
if (config.cluster_manager_command.flags & CLUSTER_MANAGER_CMD_FLAG_SLAVE) {
|
|
char *master_id = config.cluster_manager_command.master_id;
|
|
if (master_id != NULL) {
|
|
master_node = clusterManagerNodeByName(master_id);
|
|
if (master_node == NULL) {
|
|
clusterManagerLogErr("[ERR] No such master ID %s\n", master_id);
|
|
return 0;
|
|
}
|
|
} else {
|
|
master_node = clusterManagerNodeWithLeastReplicas();
|
|
assert(master_node != NULL);
|
|
printf("Automatically selected master %s:%d\n", master_node->ip,
|
|
master_node->port);
|
|
}
|
|
}
|
|
|
|
// Add the new node
|
|
clusterManagerNode *new_node = clusterManagerNewNode(ip, port);
|
|
int added = 0;
|
|
CLUSTER_MANAGER_NODE_CONNECT(new_node);
|
|
if (new_node->context->err) {
|
|
clusterManagerLogErr("[ERR] Sorry, can't connect to node %s:%d\n",
|
|
ip, port);
|
|
success = 0;
|
|
goto cleanup;
|
|
}
|
|
char *err = NULL;
|
|
if (!(success = clusterManagerNodeIsCluster(new_node, &err))) {
|
|
clusterManagerPrintNotClusterNodeError(new_node, err);
|
|
if (err) zfree(err);
|
|
goto cleanup;
|
|
}
|
|
if (!clusterManagerNodeLoadInfo(new_node, 0, &err)) {
|
|
if (err) {
|
|
CLUSTER_MANAGER_PRINT_REPLY_ERROR(new_node, err);
|
|
zfree(err);
|
|
}
|
|
success = 0;
|
|
goto cleanup;
|
|
}
|
|
if (!(success = clusterManagerNodeIsEmpty(new_node, &err))) {
|
|
clusterManagerPrintNotEmptyNodeError(new_node, err);
|
|
if (err) zfree(err);
|
|
goto cleanup;
|
|
}
|
|
clusterManagerNode *first = listFirst(cluster_manager.nodes)->value;
|
|
listAddNodeTail(cluster_manager.nodes, new_node);
|
|
added = 1;
|
|
|
|
// Send CLUSTER MEET command to the new node
|
|
clusterManagerLogInfo(">>> Send CLUSTER MEET to node %s:%d to make it "
|
|
"join the cluster.\n", ip, port);
|
|
reply = CLUSTER_MANAGER_COMMAND(new_node, "CLUSTER MEET %s %d",
|
|
first->ip, first->port);
|
|
if (!(success = clusterManagerCheckRedisReply(new_node, reply, NULL)))
|
|
goto cleanup;
|
|
|
|
/* Additional configuration is needed if the node is added as a slave. */
|
|
if (master_node) {
|
|
sleep(1);
|
|
clusterManagerWaitForClusterJoin();
|
|
clusterManagerLogInfo(">>> Configure node as replica of %s:%d.\n",
|
|
master_node->ip, master_node->port);
|
|
freeReplyObject(reply);
|
|
reply = CLUSTER_MANAGER_COMMAND(new_node, "CLUSTER REPLICATE %s",
|
|
master_node->name);
|
|
if (!(success = clusterManagerCheckRedisReply(new_node, reply, NULL)))
|
|
goto cleanup;
|
|
}
|
|
clusterManagerLogOk("[OK] New node added correctly.\n");
|
|
cleanup:
|
|
if (!added && new_node) freeClusterManagerNode(new_node);
|
|
if (reply) freeReplyObject(reply);
|
|
return success;
|
|
invalid_args:
|
|
fprintf(stderr, CLUSTER_MANAGER_INVALID_HOST_ARG);
|
|
return 0;
|
|
}
|
|
|
|
static int clusterManagerCommandDeleteNode(int argc, char **argv) {
|
|
UNUSED(argc);
|
|
int success = 1;
|
|
int port = 0;
|
|
char *ip = NULL;
|
|
if (!getClusterHostFromCmdArgs(1, argv, &ip, &port)) goto invalid_args;
|
|
char *node_id = argv[1];
|
|
clusterManagerLogInfo(">>> Removing node %s from cluster %s:%d\n",
|
|
node_id, ip, port);
|
|
clusterManagerNode *ref_node = clusterManagerNewNode(ip, port);
|
|
clusterManagerNode *node = NULL;
|
|
|
|
// Load cluster information
|
|
if (!clusterManagerLoadInfoFromNode(ref_node, 0)) return 0;
|
|
|
|
// Check if the node exists and is not empty
|
|
node = clusterManagerNodeByName(node_id);
|
|
if (node == NULL) {
|
|
clusterManagerLogErr("[ERR] No such node ID %s\n", node_id);
|
|
return 0;
|
|
}
|
|
if (node->slots_count != 0) {
|
|
clusterManagerLogErr("[ERR] Node %s:%d is not empty! Reshard data "
|
|
"away and try again.\n", node->ip, node->port);
|
|
return 0;
|
|
}
|
|
|
|
// Send CLUSTER FORGET to all the nodes but the node to remove
|
|
clusterManagerLogInfo(">>> Sending CLUSTER FORGET messages to the "
|
|
"cluster...\n");
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (n == node) continue;
|
|
if (n->replicate && !strcasecmp(n->replicate, node_id)) {
|
|
// Reconfigure the slave to replicate with some other node
|
|
clusterManagerNode *master = clusterManagerNodeWithLeastReplicas();
|
|
assert(master != NULL);
|
|
clusterManagerLogInfo(">>> %s:%d as replica of %s:%d\n",
|
|
n->ip, n->port, master->ip, master->port);
|
|
redisReply *r = CLUSTER_MANAGER_COMMAND(n, "CLUSTER REPLICATE %s",
|
|
master->name);
|
|
success = clusterManagerCheckRedisReply(n, r, NULL);
|
|
if (r) freeReplyObject(r);
|
|
if (!success) return 0;
|
|
}
|
|
redisReply *r = CLUSTER_MANAGER_COMMAND(n, "CLUSTER FORGET %s",
|
|
node_id);
|
|
success = clusterManagerCheckRedisReply(n, r, NULL);
|
|
if (r) freeReplyObject(r);
|
|
if (!success) return 0;
|
|
}
|
|
|
|
// Finally shutdown the node
|
|
clusterManagerLogInfo(">>> SHUTDOWN the node.\n");
|
|
redisReply *r = redisCommand(node->context, "SHUTDOWN");
|
|
success = clusterManagerCheckRedisReply(node, r, NULL);
|
|
if (r) freeReplyObject(r);
|
|
return success;
|
|
invalid_args:
|
|
fprintf(stderr, CLUSTER_MANAGER_INVALID_HOST_ARG);
|
|
return 0;
|
|
}
|
|
|
|
static int clusterManagerCommandInfo(int argc, char **argv) {
|
|
int port = 0;
|
|
char *ip = NULL;
|
|
if (!getClusterHostFromCmdArgs(argc, argv, &ip, &port)) goto invalid_args;
|
|
clusterManagerNode *node = clusterManagerNewNode(ip, port);
|
|
if (!clusterManagerLoadInfoFromNode(node, 0)) return 0;
|
|
clusterManagerShowClusterInfo();
|
|
return 1;
|
|
invalid_args:
|
|
fprintf(stderr, CLUSTER_MANAGER_INVALID_HOST_ARG);
|
|
return 0;
|
|
}
|
|
|
|
static int clusterManagerCommandCheck(int argc, char **argv) {
|
|
int port = 0;
|
|
char *ip = NULL;
|
|
if (!getClusterHostFromCmdArgs(argc, argv, &ip, &port)) goto invalid_args;
|
|
clusterManagerNode *node = clusterManagerNewNode(ip, port);
|
|
if (!clusterManagerLoadInfoFromNode(node, 0)) return 0;
|
|
clusterManagerShowClusterInfo();
|
|
return clusterManagerCheckCluster(0);
|
|
invalid_args:
|
|
fprintf(stderr, CLUSTER_MANAGER_INVALID_HOST_ARG);
|
|
return 0;
|
|
}
|
|
|
|
static int clusterManagerCommandFix(int argc, char **argv) {
|
|
config.cluster_manager_command.flags |= CLUSTER_MANAGER_CMD_FLAG_FIX;
|
|
return clusterManagerCommandCheck(argc, argv);
|
|
}
|
|
|
|
static int clusterManagerCommandReshard(int argc, char **argv) {
|
|
int port = 0;
|
|
char *ip = NULL;
|
|
if (!getClusterHostFromCmdArgs(argc, argv, &ip, &port)) goto invalid_args;
|
|
clusterManagerNode *node = clusterManagerNewNode(ip, port);
|
|
if (!clusterManagerLoadInfoFromNode(node, 0)) return 0;
|
|
clusterManagerCheckCluster(0);
|
|
if (cluster_manager.errors && listLength(cluster_manager.errors) > 0) {
|
|
fflush(stdout);
|
|
fprintf(stderr,
|
|
"*** Please fix your cluster problems before resharding\n");
|
|
return 0;
|
|
}
|
|
int slots = config.cluster_manager_command.slots;
|
|
if (!slots) {
|
|
while (slots <= 0 || slots > CLUSTER_MANAGER_SLOTS) {
|
|
printf("How many slots do you want to move (from 1 to %d)? ",
|
|
CLUSTER_MANAGER_SLOTS);
|
|
fflush(stdout);
|
|
char buf[6];
|
|
int nread = read(fileno(stdin),buf,6);
|
|
if (nread <= 0) continue;
|
|
int last_idx = nread - 1;
|
|
if (buf[last_idx] != '\n') {
|
|
int ch;
|
|
while ((ch = getchar()) != '\n' && ch != EOF) {}
|
|
}
|
|
buf[last_idx] = '\0';
|
|
slots = atoi(buf);
|
|
}
|
|
}
|
|
char buf[255];
|
|
char *to = config.cluster_manager_command.to,
|
|
*from = config.cluster_manager_command.from;
|
|
while (to == NULL) {
|
|
printf("What is the receiving node ID? ");
|
|
fflush(stdout);
|
|
int nread = read(fileno(stdin),buf,255);
|
|
if (nread <= 0) continue;
|
|
int last_idx = nread - 1;
|
|
if (buf[last_idx] != '\n') {
|
|
int ch;
|
|
while ((ch = getchar()) != '\n' && ch != EOF) {}
|
|
}
|
|
buf[last_idx] = '\0';
|
|
if (strlen(buf) > 0) to = buf;
|
|
}
|
|
int raise_err = 0;
|
|
clusterManagerNode *target = clusterNodeForResharding(to, NULL, &raise_err);
|
|
if (target == NULL) return 0;
|
|
list *sources = listCreate();
|
|
list *table = NULL;
|
|
int all = 0, result = 1;
|
|
if (from == NULL) {
|
|
printf("Please enter all the source node IDs.\n");
|
|
printf(" Type 'all' to use all the nodes as source nodes for "
|
|
"the hash slots.\n");
|
|
printf(" Type 'done' once you entered all the source nodes IDs.\n");
|
|
while (1) {
|
|
printf("Source node #%lu: ", listLength(sources) + 1);
|
|
fflush(stdout);
|
|
int nread = read(fileno(stdin),buf,255);
|
|
if (nread <= 0) continue;
|
|
int last_idx = nread - 1;
|
|
if (buf[last_idx] != '\n') {
|
|
int ch;
|
|
while ((ch = getchar()) != '\n' && ch != EOF) {}
|
|
}
|
|
buf[last_idx] = '\0';
|
|
if (!strcmp(buf, "done")) break;
|
|
else if (!strcmp(buf, "all")) {
|
|
all = 1;
|
|
break;
|
|
} else {
|
|
clusterManagerNode *src =
|
|
clusterNodeForResharding(buf, target, &raise_err);
|
|
if (src != NULL) listAddNodeTail(sources, src);
|
|
else if (raise_err) {
|
|
result = 0;
|
|
goto cleanup;
|
|
}
|
|
}
|
|
}
|
|
} else {
|
|
char *p;
|
|
while((p = strchr(from, ',')) != NULL) {
|
|
*p = '\0';
|
|
if (!strcmp(from, "all")) {
|
|
all = 1;
|
|
break;
|
|
} else {
|
|
clusterManagerNode *src =
|
|
clusterNodeForResharding(from, target, &raise_err);
|
|
if (src != NULL) listAddNodeTail(sources, src);
|
|
else if (raise_err) {
|
|
result = 0;
|
|
goto cleanup;
|
|
}
|
|
}
|
|
from = p + 1;
|
|
}
|
|
/* Check if there's still another source to process. */
|
|
if (!all && strlen(from) > 0) {
|
|
if (!strcmp(from, "all")) all = 1;
|
|
if (!all) {
|
|
clusterManagerNode *src =
|
|
clusterNodeForResharding(from, target, &raise_err);
|
|
if (src != NULL) listAddNodeTail(sources, src);
|
|
else if (raise_err) {
|
|
result = 0;
|
|
goto cleanup;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
listIter li;
|
|
listNode *ln;
|
|
if (all) {
|
|
listEmpty(sources);
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (n->flags & CLUSTER_MANAGER_FLAG_SLAVE || n->replicate)
|
|
continue;
|
|
if (!sdscmp(n->name, target->name)) continue;
|
|
listAddNodeTail(sources, n);
|
|
}
|
|
}
|
|
if (listLength(sources) == 0) {
|
|
fprintf(stderr, "*** No source nodes given, operation aborted.\n");
|
|
result = 0;
|
|
goto cleanup;
|
|
}
|
|
printf("\nReady to move %d slots.\n", slots);
|
|
printf(" Source nodes:\n");
|
|
listRewind(sources, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *src = ln->value;
|
|
sds info = clusterManagerNodeInfo(src, 4);
|
|
printf("%s\n", info);
|
|
sdsfree(info);
|
|
}
|
|
printf(" Destination node:\n");
|
|
sds info = clusterManagerNodeInfo(target, 4);
|
|
printf("%s\n", info);
|
|
sdsfree(info);
|
|
table = clusterManagerComputeReshardTable(sources, slots);
|
|
printf(" Resharding plan:\n");
|
|
clusterManagerShowReshardTable(table);
|
|
if (!(config.cluster_manager_command.flags &
|
|
CLUSTER_MANAGER_CMD_FLAG_YES))
|
|
{
|
|
printf("Do you want to proceed with the proposed "
|
|
"reshard plan (yes/no)? ");
|
|
fflush(stdout);
|
|
char buf[4];
|
|
int nread = read(fileno(stdin),buf,4);
|
|
buf[3] = '\0';
|
|
if (nread <= 0 || strcmp("yes", buf) != 0) {
|
|
result = 0;
|
|
goto cleanup;
|
|
}
|
|
}
|
|
int opts = CLUSTER_MANAGER_OPT_VERBOSE;
|
|
listRewind(table, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerReshardTableItem *item = ln->value;
|
|
char *err = NULL;
|
|
result = clusterManagerMoveSlot(item->source, target, item->slot,
|
|
opts, &err);
|
|
if (!result) {
|
|
if (err != NULL) {
|
|
//clusterManagerLogErr("\n%s\n", err);
|
|
zfree(err);
|
|
}
|
|
goto cleanup;
|
|
}
|
|
}
|
|
cleanup:
|
|
listRelease(sources);
|
|
clusterManagerReleaseReshardTable(table);
|
|
return result;
|
|
invalid_args:
|
|
fprintf(stderr, CLUSTER_MANAGER_INVALID_HOST_ARG);
|
|
return 0;
|
|
}
|
|
|
|
static int clusterManagerCommandRebalance(int argc, char **argv) {
|
|
int port = 0;
|
|
char *ip = NULL;
|
|
clusterManagerNode **weightedNodes = NULL;
|
|
list *involved = NULL;
|
|
if (!getClusterHostFromCmdArgs(argc, argv, &ip, &port)) goto invalid_args;
|
|
clusterManagerNode *node = clusterManagerNewNode(ip, port);
|
|
if (!clusterManagerLoadInfoFromNode(node, 0)) return 0;
|
|
int result = 1, i;
|
|
if (config.cluster_manager_command.weight != NULL) {
|
|
for (i = 0; i < config.cluster_manager_command.weight_argc; i++) {
|
|
char *name = config.cluster_manager_command.weight[i];
|
|
char *p = strchr(name, '=');
|
|
if (p == NULL) {
|
|
result = 0;
|
|
goto cleanup;
|
|
}
|
|
*p = '\0';
|
|
float w = atof(++p);
|
|
clusterManagerNode *n = clusterManagerNodeByAbbreviatedName(name);
|
|
if (n == NULL) {
|
|
clusterManagerLogErr("*** No such master node %s\n", name);
|
|
result = 0;
|
|
goto cleanup;
|
|
}
|
|
n->weight = w;
|
|
}
|
|
}
|
|
float total_weight = 0;
|
|
int nodes_involved = 0;
|
|
int use_empty = config.cluster_manager_command.flags &
|
|
CLUSTER_MANAGER_CMD_FLAG_EMPTYMASTER;
|
|
involved = listCreate();
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
/* Compute the total cluster weight. */
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (n->flags & CLUSTER_MANAGER_FLAG_SLAVE || n->replicate)
|
|
continue;
|
|
if (!use_empty && n->slots_count == 0) {
|
|
n->weight = 0;
|
|
continue;
|
|
}
|
|
total_weight += n->weight;
|
|
nodes_involved++;
|
|
listAddNodeTail(involved, n);
|
|
}
|
|
weightedNodes = zmalloc(nodes_involved * sizeof(clusterManagerNode *));
|
|
if (weightedNodes == NULL) goto cleanup;
|
|
/* Check cluster, only proceed if it looks sane. */
|
|
clusterManagerCheckCluster(1);
|
|
if (cluster_manager.errors && listLength(cluster_manager.errors) > 0) {
|
|
clusterManagerLogErr("*** Please fix your cluster problems "
|
|
"before rebalancing" );
|
|
result = 0;
|
|
goto cleanup;
|
|
}
|
|
/* Calculate the slots balance for each node. It's the number of
|
|
* slots the node should lose (if positive) or gain (if negative)
|
|
* in order to be balanced. */
|
|
int threshold_reached = 0, total_balance = 0;
|
|
float threshold = config.cluster_manager_command.threshold;
|
|
i = 0;
|
|
listRewind(involved, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
weightedNodes[i++] = n;
|
|
int expected = (int) (((float)CLUSTER_MANAGER_SLOTS / total_weight) *
|
|
n->weight);
|
|
n->balance = n->slots_count - expected;
|
|
total_balance += n->balance;
|
|
/* Compute the percentage of difference between the
|
|
* expected number of slots and the real one, to see
|
|
* if it's over the threshold specified by the user. */
|
|
int over_threshold = 0;
|
|
if (threshold > 0) {
|
|
if (n->slots_count > 0) {
|
|
float err_perc = fabs((100-(100.0*expected/n->slots_count)));
|
|
if (err_perc > threshold) over_threshold = 1;
|
|
} else if (expected > 1) {
|
|
over_threshold = 1;
|
|
}
|
|
}
|
|
if (over_threshold) threshold_reached = 1;
|
|
}
|
|
if (!threshold_reached) {
|
|
clusterManagerLogWarn("*** No rebalancing needed! "
|
|
"All nodes are within the %.2f%% threshold.\n",
|
|
config.cluster_manager_command.threshold);
|
|
goto cleanup;
|
|
}
|
|
/* Because of rounding, it is possible that the balance of all nodes
|
|
* summed does not give 0. Make sure that nodes that have to provide
|
|
* slots are always matched by nodes receiving slots. */
|
|
while (total_balance > 0) {
|
|
listRewind(involved, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (n->balance <= 0 && total_balance > 0) {
|
|
n->balance--;
|
|
total_balance--;
|
|
}
|
|
}
|
|
}
|
|
/* Sort nodes by their slots balance. */
|
|
qsort(weightedNodes, nodes_involved, sizeof(clusterManagerNode *),
|
|
clusterManagerCompareNodeBalance);
|
|
clusterManagerLogInfo(">>> Rebalancing across %d nodes. "
|
|
"Total weight = %.2f\n",
|
|
nodes_involved, total_weight);
|
|
if (config.verbose) {
|
|
for (i = 0; i < nodes_involved; i++) {
|
|
clusterManagerNode *n = weightedNodes[i];
|
|
printf("%s:%d balance is %d slots\n", n->ip, n->port, n->balance);
|
|
}
|
|
}
|
|
/* Now we have at the start of the 'sn' array nodes that should get
|
|
* slots, at the end nodes that must give slots.
|
|
* We take two indexes, one at the start, and one at the end,
|
|
* incrementing or decrementing the indexes accordingly til we
|
|
* find nodes that need to get/provide slots. */
|
|
int dst_idx = 0;
|
|
int src_idx = nodes_involved - 1;
|
|
int simulate = config.cluster_manager_command.flags &
|
|
CLUSTER_MANAGER_CMD_FLAG_SIMULATE;
|
|
while (dst_idx < src_idx) {
|
|
clusterManagerNode *dst = weightedNodes[dst_idx];
|
|
clusterManagerNode *src = weightedNodes[src_idx];
|
|
int db = abs(dst->balance);
|
|
int sb = abs(src->balance);
|
|
int numslots = (db < sb ? db : sb);
|
|
if (numslots > 0) {
|
|
printf("Moving %d slots from %s:%d to %s:%d\n", numslots,
|
|
src->ip,
|
|
src->port,
|
|
dst->ip,
|
|
dst->port);
|
|
/* Actually move the slots. */
|
|
list *lsrc = listCreate(), *table = NULL;
|
|
listAddNodeTail(lsrc, src);
|
|
table = clusterManagerComputeReshardTable(lsrc, numslots);
|
|
listRelease(lsrc);
|
|
int table_len = (int) listLength(table);
|
|
if (!table || table_len != numslots) {
|
|
clusterManagerLogErr("*** Assertion failed: Reshard table "
|
|
"!= number of slots");
|
|
result = 0;
|
|
goto end_move;
|
|
}
|
|
if (simulate) {
|
|
for (i = 0; i < table_len; i++) printf("#");
|
|
} else {
|
|
int opts = CLUSTER_MANAGER_OPT_QUIET |
|
|
CLUSTER_MANAGER_OPT_UPDATE;
|
|
listRewind(table, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerReshardTableItem *item = ln->value;
|
|
result = clusterManagerMoveSlot(item->source,
|
|
dst,
|
|
item->slot,
|
|
opts, NULL);
|
|
if (!result) goto end_move;
|
|
printf("#");
|
|
fflush(stdout);
|
|
}
|
|
|
|
}
|
|
printf("\n");
|
|
end_move:
|
|
clusterManagerReleaseReshardTable(table);
|
|
if (!result) goto cleanup;
|
|
}
|
|
/* Update nodes balance. */
|
|
dst->balance += numslots;
|
|
src->balance -= numslots;
|
|
if (dst->balance == 0) dst_idx++;
|
|
if (src->balance == 0) src_idx --;
|
|
}
|
|
cleanup:
|
|
if (involved != NULL) listRelease(involved);
|
|
if (weightedNodes != NULL) zfree(weightedNodes);
|
|
return result;
|
|
invalid_args:
|
|
fprintf(stderr, CLUSTER_MANAGER_INVALID_HOST_ARG);
|
|
return 0;
|
|
}
|
|
|
|
static int clusterManagerCommandSetTimeout(int argc, char **argv) {
|
|
UNUSED(argc);
|
|
int port = 0;
|
|
char *ip = NULL;
|
|
if (!getClusterHostFromCmdArgs(1, argv, &ip, &port)) goto invalid_args;
|
|
int timeout = atoi(argv[1]);
|
|
if (timeout < 100) {
|
|
fprintf(stderr, "Setting a node timeout of less than 100 "
|
|
"milliseconds is a bad idea.\n");
|
|
return 0;
|
|
}
|
|
// Load cluster information
|
|
clusterManagerNode *node = clusterManagerNewNode(ip, port);
|
|
if (!clusterManagerLoadInfoFromNode(node, 0)) return 0;
|
|
int ok_count = 0, err_count = 0;
|
|
|
|
clusterManagerLogInfo(">>> Reconfiguring node timeout in every "
|
|
"cluster node...\n");
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
char *err = NULL;
|
|
redisReply *reply = CLUSTER_MANAGER_COMMAND(n, "CONFIG %s %s %d",
|
|
"SET",
|
|
"cluster-node-timeout",
|
|
timeout);
|
|
if (reply == NULL) goto reply_err;
|
|
int ok = clusterManagerCheckRedisReply(n, reply, &err);
|
|
freeReplyObject(reply);
|
|
if (!ok) goto reply_err;
|
|
reply = CLUSTER_MANAGER_COMMAND(n, "CONFIG %s", "REWRITE");
|
|
if (reply == NULL) goto reply_err;
|
|
ok = clusterManagerCheckRedisReply(n, reply, &err);
|
|
freeReplyObject(reply);
|
|
if (!ok) goto reply_err;
|
|
clusterManagerLogWarn("*** New timeout set for %s:%d\n", n->ip,
|
|
n->port);
|
|
ok_count++;
|
|
continue;
|
|
reply_err:
|
|
if (err == NULL) err = "";
|
|
clusterManagerLogErr("ERR setting node-timeot for %s:%d: %s\n", n->ip,
|
|
n->port, err);
|
|
err_count++;
|
|
}
|
|
clusterManagerLogInfo(">>> New node timeout set. %d OK, %d ERR.\n",
|
|
ok_count, err_count);
|
|
return 1;
|
|
invalid_args:
|
|
fprintf(stderr, CLUSTER_MANAGER_INVALID_HOST_ARG);
|
|
return 0;
|
|
}
|
|
|
|
static int clusterManagerCommandImport(int argc, char **argv) {
|
|
int success = 1;
|
|
int port = 0, src_port = 0;
|
|
char *ip = NULL, *src_ip = NULL;
|
|
char *invalid_args_msg = NULL;
|
|
if (!getClusterHostFromCmdArgs(argc, argv, &ip, &port)) {
|
|
invalid_args_msg = CLUSTER_MANAGER_INVALID_HOST_ARG;
|
|
goto invalid_args;
|
|
}
|
|
if (config.cluster_manager_command.from == NULL) {
|
|
invalid_args_msg = "[ERR] Option '--cluster-from' is required for "
|
|
"subcommand 'import'.\n";
|
|
goto invalid_args;
|
|
}
|
|
char *src_host[] = {config.cluster_manager_command.from};
|
|
if (!getClusterHostFromCmdArgs(1, src_host, &src_ip, &src_port)) {
|
|
invalid_args_msg = "[ERR] Invalid --cluster-from host. You need to "
|
|
"pass a valid address (ie. 120.0.0.1:7000).\n";
|
|
goto invalid_args;
|
|
}
|
|
clusterManagerLogInfo(">>> Importing data from %s:%d to cluster %s:%d\n",
|
|
src_ip, src_port, ip, port);
|
|
|
|
clusterManagerNode *refnode = clusterManagerNewNode(ip, port);
|
|
if (!clusterManagerLoadInfoFromNode(refnode, 0)) return 0;
|
|
if (!clusterManagerCheckCluster(0)) return 0;
|
|
char *reply_err = NULL;
|
|
redisReply *src_reply = NULL;
|
|
// Connect to the source node.
|
|
redisContext *src_ctx = redisConnect(src_ip, src_port);
|
|
if (src_ctx->err) {
|
|
success = 0;
|
|
fprintf(stderr,"Could not connect to Redis at %s:%d: %s.\n", src_ip,
|
|
src_port, src_ctx->errstr);
|
|
goto cleanup;
|
|
}
|
|
src_reply = reconnectingRedisCommand(src_ctx, "INFO");
|
|
if (!src_reply || src_reply->type == REDIS_REPLY_ERROR) {
|
|
if (src_reply && src_reply->str) reply_err = src_reply->str;
|
|
success = 0;
|
|
goto cleanup;
|
|
}
|
|
if (getLongInfoField(src_reply->str, "cluster_enabled")) {
|
|
clusterManagerLogErr("[ERR] The source node should not be a "
|
|
"cluster node.\n");
|
|
success = 0;
|
|
goto cleanup;
|
|
}
|
|
freeReplyObject(src_reply);
|
|
src_reply = reconnectingRedisCommand(src_ctx, "DBSIZE");
|
|
if (!src_reply || src_reply->type == REDIS_REPLY_ERROR) {
|
|
if (src_reply && src_reply->str) reply_err = src_reply->str;
|
|
success = 0;
|
|
goto cleanup;
|
|
}
|
|
int size = src_reply->integer, i;
|
|
clusterManagerLogWarn("*** Importing %d keys from DB 0\n", size);
|
|
|
|
// Build a slot -> node map
|
|
clusterManagerNode *slots_map[CLUSTER_MANAGER_SLOTS];
|
|
memset(slots_map, 0, sizeof(slots_map));
|
|
listIter li;
|
|
listNode *ln;
|
|
for (i = 0; i < CLUSTER_MANAGER_SLOTS; i++) {
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (n->flags & CLUSTER_MANAGER_FLAG_SLAVE) continue;
|
|
if (n->slots_count == 0) continue;
|
|
if (n->slots[i]) {
|
|
slots_map[i] = n;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
char cmdfmt[50] = "MIGRATE %s %d %s %d %d";
|
|
if (config.cluster_manager_command.flags & CLUSTER_MANAGER_CMD_FLAG_COPY)
|
|
strcat(cmdfmt, " %s");
|
|
if (config.cluster_manager_command.flags & CLUSTER_MANAGER_CMD_FLAG_REPLACE)
|
|
strcat(cmdfmt, " %s");
|
|
|
|
/* Use SCAN to iterate over the keys, migrating to the
|
|
* right node as needed. */
|
|
int cursor = -999, timeout = config.cluster_manager_command.timeout;
|
|
while (cursor != 0) {
|
|
if (cursor < 0) cursor = 0;
|
|
freeReplyObject(src_reply);
|
|
src_reply = reconnectingRedisCommand(src_ctx, "SCAN %d COUNT %d",
|
|
cursor, 1000);
|
|
if (!src_reply || src_reply->type == REDIS_REPLY_ERROR) {
|
|
if (src_reply && src_reply->str) reply_err = src_reply->str;
|
|
success = 0;
|
|
goto cleanup;
|
|
}
|
|
assert(src_reply->type == REDIS_REPLY_ARRAY);
|
|
assert(src_reply->elements >= 2);
|
|
assert(src_reply->element[1]->type == REDIS_REPLY_ARRAY);
|
|
if (src_reply->element[0]->type == REDIS_REPLY_STRING)
|
|
cursor = atoi(src_reply->element[0]->str);
|
|
else if (src_reply->element[0]->type == REDIS_REPLY_INTEGER)
|
|
cursor = src_reply->element[0]->integer;
|
|
int keycount = src_reply->element[1]->elements;
|
|
for (i = 0; i < keycount; i++) {
|
|
redisReply *kr = src_reply->element[1]->element[i];
|
|
assert(kr->type == REDIS_REPLY_STRING);
|
|
char *key = kr->str;
|
|
uint16_t slot = clusterManagerKeyHashSlot(key, kr->len);
|
|
clusterManagerNode *target = slots_map[slot];
|
|
printf("Migrating %s to %s:%d: ", key, target->ip, target->port);
|
|
redisReply *r = reconnectingRedisCommand(src_ctx, cmdfmt,
|
|
target->ip, target->port,
|
|
key, 0, timeout,
|
|
"COPY", "REPLACE");
|
|
if (!r || r->type == REDIS_REPLY_ERROR) {
|
|
if (r && r->str) {
|
|
clusterManagerLogErr("Source %s:%d replied with "
|
|
"error:\n%s\n", src_ip, src_port,
|
|
r->str);
|
|
}
|
|
success = 0;
|
|
}
|
|
freeReplyObject(r);
|
|
if (!success) goto cleanup;
|
|
clusterManagerLogOk("OK\n");
|
|
}
|
|
}
|
|
cleanup:
|
|
if (reply_err)
|
|
clusterManagerLogErr("Source %s:%d replied with error:\n%s\n",
|
|
src_ip, src_port, reply_err);
|
|
if (src_ctx) redisFree(src_ctx);
|
|
if (src_reply) freeReplyObject(src_reply);
|
|
return success;
|
|
invalid_args:
|
|
fprintf(stderr, "%s", invalid_args_msg);
|
|
return 0;
|
|
}
|
|
|
|
static int clusterManagerCommandCall(int argc, char **argv) {
|
|
int port = 0, i;
|
|
char *ip = NULL;
|
|
if (!getClusterHostFromCmdArgs(1, argv, &ip, &port)) goto invalid_args;
|
|
clusterManagerNode *refnode = clusterManagerNewNode(ip, port);
|
|
if (!clusterManagerLoadInfoFromNode(refnode, 0)) return 0;
|
|
argc--;
|
|
argv++;
|
|
size_t *argvlen = zmalloc(argc*sizeof(size_t));
|
|
clusterManagerLogInfo(">>> Calling");
|
|
for (i = 0; i < argc; i++) {
|
|
argvlen[i] = strlen(argv[i]);
|
|
printf(" %s", argv[i]);
|
|
}
|
|
printf("\n");
|
|
listIter li;
|
|
listNode *ln;
|
|
listRewind(cluster_manager.nodes, &li);
|
|
while ((ln = listNext(&li)) != NULL) {
|
|
clusterManagerNode *n = ln->value;
|
|
if (!n->context) CLUSTER_MANAGER_NODE_CONNECT(n);
|
|
redisReply *reply = NULL;
|
|
redisAppendCommandArgv(n->context, argc, (const char **) argv, argvlen);
|
|
int status = redisGetReply(n->context, (void **)(&reply));
|
|
if (status != REDIS_OK || reply == NULL )
|
|
printf("%s:%d: Failed!\n", n->ip, n->port);
|
|
else {
|
|
sds formatted_reply = cliFormatReplyTTY(reply, "");
|
|
printf("%s:%d: %s\n", n->ip, n->port, (char *) formatted_reply);
|
|
sdsfree(formatted_reply);
|
|
}
|
|
if (reply != NULL) freeReplyObject(reply);
|
|
}
|
|
zfree(argvlen);
|
|
return 1;
|
|
invalid_args:
|
|
fprintf(stderr, CLUSTER_MANAGER_INVALID_HOST_ARG);
|
|
return 0;
|
|
}
|
|
|
|
static int clusterManagerCommandHelp(int argc, char **argv) {
|
|
UNUSED(argc);
|
|
UNUSED(argv);
|
|
int commands_count = sizeof(clusterManagerCommands) /
|
|
sizeof(clusterManagerCommandDef);
|
|
int i = 0, j;
|
|
fprintf(stderr, "Cluster Manager Commands:\n");
|
|
int padding = 15;
|
|
for (; i < commands_count; i++) {
|
|
clusterManagerCommandDef *def = &(clusterManagerCommands[i]);
|
|
int namelen = strlen(def->name), padlen = padding - namelen;
|
|
fprintf(stderr, " %s", def->name);
|
|
for (j = 0; j < padlen; j++) fprintf(stderr, " ");
|
|
fprintf(stderr, "%s\n", (def->args ? def->args : ""));
|
|
if (def->options != NULL) {
|
|
int optslen = strlen(def->options);
|
|
char *p = def->options, *eos = p + optslen;
|
|
char *comma = NULL;
|
|
while ((comma = strchr(p, ',')) != NULL) {
|
|
int deflen = (int)(comma - p);
|
|
char buf[255];
|
|
memcpy(buf, p, deflen);
|
|
buf[deflen] = '\0';
|
|
for (j = 0; j < padding; j++) fprintf(stderr, " ");
|
|
fprintf(stderr, " --cluster-%s\n", buf);
|
|
p = comma + 1;
|
|
if (p >= eos) break;
|
|
}
|
|
if (p < eos) {
|
|
for (j = 0; j < padding; j++) fprintf(stderr, " ");
|
|
fprintf(stderr, " --cluster-%s\n", p);
|
|
}
|
|
}
|
|
}
|
|
fprintf(stderr, "\nFor check, fix, reshard, del-node, set-timeout you "
|
|
"can specify the host and port of any working node in "
|
|
"the cluster.\n\n");
|
|
return 0;
|
|
}
|
|
|
|
/*------------------------------------------------------------------------------
|
|
* Latency and latency history modes
|
|
*--------------------------------------------------------------------------- */
|
|
|
|
static void latencyModePrint(long long min, long long max, double avg, long long count) {
|
|
if (config.output == OUTPUT_STANDARD) {
|
|
printf("min: %lld, max: %lld, avg: %.2f (%lld samples)",
|
|
min, max, avg, count);
|
|
fflush(stdout);
|
|
} else if (config.output == OUTPUT_CSV) {
|
|
printf("%lld,%lld,%.2f,%lld\n", min, max, avg, count);
|
|
} else if (config.output == OUTPUT_RAW) {
|
|
printf("%lld %lld %.2f %lld\n", min, max, avg, count);
|
|
}
|
|
}
|
|
|
|
#define LATENCY_SAMPLE_RATE 10 /* milliseconds. */
|
|
#define LATENCY_HISTORY_DEFAULT_INTERVAL 15000 /* milliseconds. */
|
|
static void latencyMode(void) {
|
|
redisReply *reply;
|
|
long long start, latency, min = 0, max = 0, tot = 0, count = 0;
|
|
long long history_interval =
|
|
config.interval ? config.interval/1000 :
|
|
LATENCY_HISTORY_DEFAULT_INTERVAL;
|
|
double avg;
|
|
long long history_start = mstime();
|
|
|
|
/* Set a default for the interval in case of --latency option
|
|
* with --raw, --csv or when it is redirected to non tty. */
|
|
if (config.interval == 0) {
|
|
config.interval = 1000;
|
|
} else {
|
|
config.interval /= 1000; /* We need to convert to milliseconds. */
|
|
}
|
|
|
|
if (!context) exit(1);
|
|
while(1) {
|
|
start = mstime();
|
|
reply = reconnectingRedisCommand(context,"PING");
|
|
if (reply == NULL) {
|
|
fprintf(stderr,"\nI/O error\n");
|
|
exit(1);
|
|
}
|
|
latency = mstime()-start;
|
|
freeReplyObject(reply);
|
|
count++;
|
|
if (count == 1) {
|
|
min = max = tot = latency;
|
|
avg = (double) latency;
|
|
} else {
|
|
if (latency < min) min = latency;
|
|
if (latency > max) max = latency;
|
|
tot += latency;
|
|
avg = (double) tot/count;
|
|
}
|
|
|
|
if (config.output == OUTPUT_STANDARD) {
|
|
printf("\x1b[0G\x1b[2K"); /* Clear the line. */
|
|
latencyModePrint(min,max,avg,count);
|
|
} else {
|
|
if (config.latency_history) {
|
|
latencyModePrint(min,max,avg,count);
|
|
} else if (mstime()-history_start > config.interval) {
|
|
latencyModePrint(min,max,avg,count);
|
|
exit(0);
|
|
}
|
|
}
|
|
|
|
if (config.latency_history && mstime()-history_start > history_interval)
|
|
{
|
|
printf(" -- %.2f seconds range\n", (float)(mstime()-history_start)/1000);
|
|
history_start = mstime();
|
|
min = max = tot = count = 0;
|
|
}
|
|
usleep(LATENCY_SAMPLE_RATE * 1000);
|
|
}
|
|
}
|
|
|
|
/*------------------------------------------------------------------------------
|
|
* Latency distribution mode -- requires 256 colors xterm
|
|
*--------------------------------------------------------------------------- */
|
|
|
|
#define LATENCY_DIST_DEFAULT_INTERVAL 1000 /* milliseconds. */
|
|
|
|
/* Structure to store samples distribution. */
|
|
struct distsamples {
|
|
long long max; /* Max latency to fit into this interval (usec). */
|
|
long long count; /* Number of samples in this interval. */
|
|
int character; /* Associated character in visualization. */
|
|
};
|
|
|
|
/* Helper function for latencyDistMode(). Performs the spectrum visualization
|
|
* of the collected samples targeting an xterm 256 terminal.
|
|
*
|
|
* Takes an array of distsamples structures, ordered from smaller to bigger
|
|
* 'max' value. Last sample max must be 0, to mean that it olds all the
|
|
* samples greater than the previous one, and is also the stop sentinel.
|
|
*
|
|
* "tot' is the total number of samples in the different buckets, so it
|
|
* is the SUM(samples[i].conut) for i to 0 up to the max sample.
|
|
*
|
|
* As a side effect the function sets all the buckets count to 0. */
|
|
void showLatencyDistSamples(struct distsamples *samples, long long tot) {
|
|
int j;
|
|
|
|
/* We convert samples into a index inside the palette
|
|
* proportional to the percentage a given bucket represents.
|
|
* This way intensity of the different parts of the spectrum
|
|
* don't change relative to the number of requests, which avoids to
|
|
* pollute the visualization with non-latency related info. */
|
|
printf("\033[38;5;0m"); /* Set foreground color to black. */
|
|
for (j = 0; ; j++) {
|
|
int coloridx =
|
|
ceil((float) samples[j].count / tot * (spectrum_palette_size-1));
|
|
int color = spectrum_palette[coloridx];
|
|
printf("\033[48;5;%dm%c", (int)color, samples[j].character);
|
|
samples[j].count = 0;
|
|
if (samples[j].max == 0) break; /* Last sample. */
|
|
}
|
|
printf("\033[0m\n");
|
|
fflush(stdout);
|
|
}
|
|
|
|
/* Show the legend: different buckets values and colors meaning, so
|
|
* that the spectrum is more easily readable. */
|
|
void showLatencyDistLegend(void) {
|
|
int j;
|
|
|
|
printf("---------------------------------------------\n");
|
|
printf(". - * # .01 .125 .25 .5 milliseconds\n");
|
|
printf("1,2,3,...,9 from 1 to 9 milliseconds\n");
|
|
printf("A,B,C,D,E 10,20,30,40,50 milliseconds\n");
|
|
printf("F,G,H,I,J .1,.2,.3,.4,.5 seconds\n");
|
|
printf("K,L,M,N,O,P,Q,? 1,2,4,8,16,30,60,>60 seconds\n");
|
|
printf("From 0 to 100%%: ");
|
|
for (j = 0; j < spectrum_palette_size; j++) {
|
|
printf("\033[48;5;%dm ", spectrum_palette[j]);
|
|
}
|
|
printf("\033[0m\n");
|
|
printf("---------------------------------------------\n");
|
|
}
|
|
|
|
static void latencyDistMode(void) {
|
|
redisReply *reply;
|
|
long long start, latency, count = 0;
|
|
long long history_interval =
|
|
config.interval ? config.interval/1000 :
|
|
LATENCY_DIST_DEFAULT_INTERVAL;
|
|
long long history_start = ustime();
|
|
int j, outputs = 0;
|
|
|
|
struct distsamples samples[] = {
|
|
/* We use a mostly logarithmic scale, with certain linear intervals
|
|
* which are more interesting than others, like 1-10 milliseconds
|
|
* range. */
|
|
{10,0,'.'}, /* 0.01 ms */
|
|
{125,0,'-'}, /* 0.125 ms */
|
|
{250,0,'*'}, /* 0.25 ms */
|
|
{500,0,'#'}, /* 0.5 ms */
|
|
{1000,0,'1'}, /* 1 ms */
|
|
{2000,0,'2'}, /* 2 ms */
|
|
{3000,0,'3'}, /* 3 ms */
|
|
{4000,0,'4'}, /* 4 ms */
|
|
{5000,0,'5'}, /* 5 ms */
|
|
{6000,0,'6'}, /* 6 ms */
|
|
{7000,0,'7'}, /* 7 ms */
|
|
{8000,0,'8'}, /* 8 ms */
|
|
{9000,0,'9'}, /* 9 ms */
|
|
{10000,0,'A'}, /* 10 ms */
|
|
{20000,0,'B'}, /* 20 ms */
|
|
{30000,0,'C'}, /* 30 ms */
|
|
{40000,0,'D'}, /* 40 ms */
|
|
{50000,0,'E'}, /* 50 ms */
|
|
{100000,0,'F'}, /* 0.1 s */
|
|
{200000,0,'G'}, /* 0.2 s */
|
|
{300000,0,'H'}, /* 0.3 s */
|
|
{400000,0,'I'}, /* 0.4 s */
|
|
{500000,0,'J'}, /* 0.5 s */
|
|
{1000000,0,'K'}, /* 1 s */
|
|
{2000000,0,'L'}, /* 2 s */
|
|
{4000000,0,'M'}, /* 4 s */
|
|
{8000000,0,'N'}, /* 8 s */
|
|
{16000000,0,'O'}, /* 16 s */
|
|
{30000000,0,'P'}, /* 30 s */
|
|
{60000000,0,'Q'}, /* 1 minute */
|
|
{0,0,'?'}, /* > 1 minute */
|
|
};
|
|
|
|
if (!context) exit(1);
|
|
while(1) {
|
|
start = ustime();
|
|
reply = reconnectingRedisCommand(context,"PING");
|
|
if (reply == NULL) {
|
|
fprintf(stderr,"\nI/O error\n");
|
|
exit(1);
|
|
}
|
|
latency = ustime()-start;
|
|
freeReplyObject(reply);
|
|
count++;
|
|
|
|
/* Populate the relevant bucket. */
|
|
for (j = 0; ; j++) {
|
|
if (samples[j].max == 0 || latency <= samples[j].max) {
|
|
samples[j].count++;
|
|
break;
|
|
}
|
|
}
|
|
|
|
/* From time to time show the spectrum. */
|
|
if (count && (ustime()-history_start)/1000 > history_interval) {
|
|
if ((outputs++ % 20) == 0)
|
|
showLatencyDistLegend();
|
|
showLatencyDistSamples(samples,count);
|
|
history_start = ustime();
|
|
count = 0;
|
|
}
|
|
usleep(LATENCY_SAMPLE_RATE * 1000);
|
|
}
|
|
}
|
|
|
|
/*------------------------------------------------------------------------------
|
|
* Slave mode
|
|
*--------------------------------------------------------------------------- */
|
|
|
|
/* Sends SYNC and reads the number of bytes in the payload. Used both by
|
|
* slaveMode() and getRDB(). */
|
|
unsigned long long sendSync(int fd) {
|
|
/* To start we need to send the SYNC command and return the payload.
|
|
* The hiredis client lib does not understand this part of the protocol
|
|
* and we don't want to mess with its buffers, so everything is performed
|
|
* using direct low-level I/O. */
|
|
char buf[4096], *p;
|
|
ssize_t nread;
|
|
|
|
/* Send the SYNC command. */
|
|
if (write(fd,"SYNC\r\n",6) != 6) {
|
|
fprintf(stderr,"Error writing to master\n");
|
|
exit(1);
|
|
}
|
|
|
|
/* Read $<payload>\r\n, making sure to read just up to "\n" */
|
|
p = buf;
|
|
while(1) {
|
|
nread = read(fd,p,1);
|
|
if (nread <= 0) {
|
|
fprintf(stderr,"Error reading bulk length while SYNCing\n");
|
|
exit(1);
|
|
}
|
|
if (*p == '\n' && p != buf) break;
|
|
if (*p != '\n') p++;
|
|
}
|
|
*p = '\0';
|
|
if (buf[0] == '-') {
|
|
printf("SYNC with master failed: %s\n", buf);
|
|
exit(1);
|
|
}
|
|
return strtoull(buf+1,NULL,10);
|
|
}
|
|
|
|
static void slaveMode(void) {
|
|
int fd = context->fd;
|
|
unsigned long long payload = sendSync(fd);
|
|
char buf[1024];
|
|
int original_output = config.output;
|
|
|
|
fprintf(stderr,"SYNC with master, discarding %llu "
|
|
"bytes of bulk transfer...\n", payload);
|
|
|
|
/* Discard the payload. */
|
|
while(payload) {
|
|
ssize_t nread;
|
|
|
|
nread = read(fd,buf,(payload > sizeof(buf)) ? sizeof(buf) : payload);
|
|
if (nread <= 0) {
|
|
fprintf(stderr,"Error reading RDB payload while SYNCing\n");
|
|
exit(1);
|
|
}
|
|
payload -= nread;
|
|
}
|
|
fprintf(stderr,"SYNC done. Logging commands from master.\n");
|
|
|
|
/* Now we can use hiredis to read the incoming protocol. */
|
|
config.output = OUTPUT_CSV;
|
|
while (cliReadReply(0) == REDIS_OK);
|
|
config.output = original_output;
|
|
}
|
|
|
|
/*------------------------------------------------------------------------------
|
|
* RDB transfer mode
|
|
*--------------------------------------------------------------------------- */
|
|
|
|
/* This function implements --rdb, so it uses the replication protocol in order
|
|
* to fetch the RDB file from a remote server. */
|
|
static void getRDB(void) {
|
|
int s = context->fd;
|
|
int fd;
|
|
unsigned long long payload = sendSync(s);
|
|
char buf[4096];
|
|
|
|
fprintf(stderr,"SYNC sent to master, writing %llu bytes to '%s'\n",
|
|
payload, config.rdb_filename);
|
|
|
|
/* Write to file. */
|
|
if (!strcmp(config.rdb_filename,"-")) {
|
|
fd = STDOUT_FILENO;
|
|
} else {
|
|
fd = open(config.rdb_filename, O_CREAT|O_WRONLY, 0644);
|
|
if (fd == -1) {
|
|
fprintf(stderr, "Error opening '%s': %s\n", config.rdb_filename,
|
|
strerror(errno));
|
|
exit(1);
|
|
}
|
|
}
|
|
|
|
while(payload) {
|
|
ssize_t nread, nwritten;
|
|
|
|
nread = read(s,buf,(payload > sizeof(buf)) ? sizeof(buf) : payload);
|
|
if (nread <= 0) {
|
|
fprintf(stderr,"I/O Error reading RDB payload from socket\n");
|
|
exit(1);
|
|
}
|
|
nwritten = write(fd, buf, nread);
|
|
if (nwritten != nread) {
|
|
fprintf(stderr,"Error writing data to file: %s\n",
|
|
(nwritten == -1) ? strerror(errno) : "short write");
|
|
exit(1);
|
|
}
|
|
payload -= nread;
|
|
}
|
|
close(s); /* Close the file descriptor ASAP as fsync() may take time. */
|
|
fsync(fd);
|
|
close(fd);
|
|
fprintf(stderr,"Transfer finished with success.\n");
|
|
exit(0);
|
|
}
|
|
|
|
/*------------------------------------------------------------------------------
|
|
* Bulk import (pipe) mode
|
|
*--------------------------------------------------------------------------- */
|
|
|
|
#define PIPEMODE_WRITE_LOOP_MAX_BYTES (128*1024)
|
|
static void pipeMode(void) {
|
|
int fd = context->fd;
|
|
long long errors = 0, replies = 0, obuf_len = 0, obuf_pos = 0;
|
|
char ibuf[1024*16], obuf[1024*16]; /* Input and output buffers */
|
|
char aneterr[ANET_ERR_LEN];
|
|
redisReader *reader = redisReaderCreate();
|
|
redisReply *reply;
|
|
int eof = 0; /* True once we consumed all the standard input. */
|
|
int done = 0;
|
|
char magic[20]; /* Special reply we recognize. */
|
|
time_t last_read_time = time(NULL);
|
|
|
|
srand(time(NULL));
|
|
|
|
/* Use non blocking I/O. */
|
|
if (anetNonBlock(aneterr,fd) == ANET_ERR) {
|
|
fprintf(stderr, "Can't set the socket in non blocking mode: %s\n",
|
|
aneterr);
|
|
exit(1);
|
|
}
|
|
|
|
/* Transfer raw protocol and read replies from the server at the same
|
|
* time. */
|
|
while(!done) {
|
|
int mask = AE_READABLE;
|
|
|
|
if (!eof || obuf_len != 0) mask |= AE_WRITABLE;
|
|
mask = aeWait(fd,mask,1000);
|
|
|
|
/* Handle the readable state: we can read replies from the server. */
|
|
if (mask & AE_READABLE) {
|
|
ssize_t nread;
|
|
|
|
/* Read from socket and feed the hiredis reader. */
|
|
do {
|
|
nread = read(fd,ibuf,sizeof(ibuf));
|
|
if (nread == -1 && errno != EAGAIN && errno != EINTR) {
|
|
fprintf(stderr, "Error reading from the server: %s\n",
|
|
strerror(errno));
|
|
exit(1);
|
|
}
|
|
if (nread > 0) {
|
|
redisReaderFeed(reader,ibuf,nread);
|
|
last_read_time = time(NULL);
|
|
}
|
|
} while(nread > 0);
|
|
|
|
/* Consume replies. */
|
|
do {
|
|
if (redisReaderGetReply(reader,(void**)&reply) == REDIS_ERR) {
|
|
fprintf(stderr, "Error reading replies from server\n");
|
|
exit(1);
|
|
}
|
|
if (reply) {
|
|
if (reply->type == REDIS_REPLY_ERROR) {
|
|
fprintf(stderr,"%s\n", reply->str);
|
|
errors++;
|
|
} else if (eof && reply->type == REDIS_REPLY_STRING &&
|
|
reply->len == 20) {
|
|
/* Check if this is the reply to our final ECHO
|
|
* command. If so everything was received
|
|
* from the server. */
|
|
if (memcmp(reply->str,magic,20) == 0) {
|
|
printf("Last reply received from server.\n");
|
|
done = 1;
|
|
replies--;
|
|
}
|
|
}
|
|
replies++;
|
|
freeReplyObject(reply);
|
|
}
|
|
} while(reply);
|
|
}
|
|
|
|
/* Handle the writable state: we can send protocol to the server. */
|
|
if (mask & AE_WRITABLE) {
|
|
ssize_t loop_nwritten = 0;
|
|
|
|
while(1) {
|
|
/* Transfer current buffer to server. */
|
|
if (obuf_len != 0) {
|
|
ssize_t nwritten = write(fd,obuf+obuf_pos,obuf_len);
|
|
|
|
if (nwritten == -1) {
|
|
if (errno != EAGAIN && errno != EINTR) {
|
|
fprintf(stderr, "Error writing to the server: %s\n",
|
|
strerror(errno));
|
|
exit(1);
|
|
} else {
|
|
nwritten = 0;
|
|
}
|
|
}
|
|
obuf_len -= nwritten;
|
|
obuf_pos += nwritten;
|
|
loop_nwritten += nwritten;
|
|
if (obuf_len != 0) break; /* Can't accept more data. */
|
|
}
|
|
/* If buffer is empty, load from stdin. */
|
|
if (obuf_len == 0 && !eof) {
|
|
ssize_t nread = read(STDIN_FILENO,obuf,sizeof(obuf));
|
|
|
|
if (nread == 0) {
|
|
/* The ECHO sequence starts with a "\r\n" so that if there
|
|
* is garbage in the protocol we read from stdin, the ECHO
|
|
* will likely still be properly formatted.
|
|
* CRLF is ignored by Redis, so it has no effects. */
|
|
char echo[] =
|
|
"\r\n*2\r\n$4\r\nECHO\r\n$20\r\n01234567890123456789\r\n";
|
|
int j;
|
|
|
|
eof = 1;
|
|
/* Everything transferred, so we queue a special
|
|
* ECHO command that we can match in the replies
|
|
* to make sure everything was read from the server. */
|
|
for (j = 0; j < 20; j++)
|
|
magic[j] = rand() & 0xff;
|
|
memcpy(echo+21,magic,20);
|
|
memcpy(obuf,echo,sizeof(echo)-1);
|
|
obuf_len = sizeof(echo)-1;
|
|
obuf_pos = 0;
|
|
printf("All data transferred. Waiting for the last reply...\n");
|
|
} else if (nread == -1) {
|
|
fprintf(stderr, "Error reading from stdin: %s\n",
|
|
strerror(errno));
|
|
exit(1);
|
|
} else {
|
|
obuf_len = nread;
|
|
obuf_pos = 0;
|
|
}
|
|
}
|
|
if ((obuf_len == 0 && eof) ||
|
|
loop_nwritten > PIPEMODE_WRITE_LOOP_MAX_BYTES) break;
|
|
}
|
|
}
|
|
|
|
/* Handle timeout, that is, we reached EOF, and we are not getting
|
|
* replies from the server for a few seconds, nor the final ECHO is
|
|
* received. */
|
|
if (eof && config.pipe_timeout > 0 &&
|
|
time(NULL)-last_read_time > config.pipe_timeout)
|
|
{
|
|
fprintf(stderr,"No replies for %d seconds: exiting.\n",
|
|
config.pipe_timeout);
|
|
errors++;
|
|
break;
|
|
}
|
|
}
|
|
redisReaderFree(reader);
|
|
printf("errors: %lld, replies: %lld\n", errors, replies);
|
|
if (errors)
|
|
exit(1);
|
|
else
|
|
exit(0);
|
|
}
|
|
|
|
/*------------------------------------------------------------------------------
|
|
* Find big keys
|
|
*--------------------------------------------------------------------------- */
|
|
|
|
#define TYPE_STRING 0
|
|
#define TYPE_LIST 1
|
|
#define TYPE_SET 2
|
|
#define TYPE_HASH 3
|
|
#define TYPE_ZSET 4
|
|
#define TYPE_STREAM 5
|
|
#define TYPE_NONE 6
|
|
#define TYPE_COUNT 7
|
|
|
|
static redisReply *sendScan(unsigned long long *it) {
|
|
redisReply *reply = redisCommand(context, "SCAN %llu", *it);
|
|
|
|
/* Handle any error conditions */
|
|
if(reply == NULL) {
|
|
fprintf(stderr, "\nI/O error\n");
|
|
exit(1);
|
|
} else if(reply->type == REDIS_REPLY_ERROR) {
|
|
fprintf(stderr, "SCAN error: %s\n", reply->str);
|
|
exit(1);
|
|
} else if(reply->type != REDIS_REPLY_ARRAY) {
|
|
fprintf(stderr, "Non ARRAY response from SCAN!\n");
|
|
exit(1);
|
|
} else if(reply->elements != 2) {
|
|
fprintf(stderr, "Invalid element count from SCAN!\n");
|
|
exit(1);
|
|
}
|
|
|
|
/* Validate our types are correct */
|
|
assert(reply->element[0]->type == REDIS_REPLY_STRING);
|
|
assert(reply->element[1]->type == REDIS_REPLY_ARRAY);
|
|
|
|
/* Update iterator */
|
|
*it = strtoull(reply->element[0]->str, NULL, 10);
|
|
|
|
return reply;
|
|
}
|
|
|
|
static int getDbSize(void) {
|
|
redisReply *reply;
|
|
int size;
|
|
|
|
reply = redisCommand(context, "DBSIZE");
|
|
|
|
if(reply == NULL || reply->type != REDIS_REPLY_INTEGER) {
|
|
fprintf(stderr, "Couldn't determine DBSIZE!\n");
|
|
exit(1);
|
|
}
|
|
|
|
/* Grab the number of keys and free our reply */
|
|
size = reply->integer;
|
|
freeReplyObject(reply);
|
|
|
|
return size;
|
|
}
|
|
|
|
static int toIntType(char *key, char *type) {
|
|
if(!strcmp(type, "string")) {
|
|
return TYPE_STRING;
|
|
} else if(!strcmp(type, "list")) {
|
|
return TYPE_LIST;
|
|
} else if(!strcmp(type, "set")) {
|
|
return TYPE_SET;
|
|
} else if(!strcmp(type, "hash")) {
|
|
return TYPE_HASH;
|
|
} else if(!strcmp(type, "zset")) {
|
|
return TYPE_ZSET;
|
|
} else if(!strcmp(type, "stream")) {
|
|
return TYPE_STREAM;
|
|
} else if(!strcmp(type, "none")) {
|
|
return TYPE_NONE;
|
|
} else {
|
|
fprintf(stderr, "Unknown type '%s' for key '%s'\n", type, key);
|
|
exit(1);
|
|
}
|
|
}
|
|
|
|
static void getKeyTypes(redisReply *keys, int *types) {
|
|
redisReply *reply;
|
|
unsigned int i;
|
|
|
|
/* Pipeline TYPE commands */
|
|
for(i=0;i<keys->elements;i++) {
|
|
redisAppendCommand(context, "TYPE %s", keys->element[i]->str);
|
|
}
|
|
|
|
/* Retrieve types */
|
|
for(i=0;i<keys->elements;i++) {
|
|
if(redisGetReply(context, (void**)&reply)!=REDIS_OK) {
|
|
fprintf(stderr, "Error getting type for key '%s' (%d: %s)\n",
|
|
keys->element[i]->str, context->err, context->errstr);
|
|
exit(1);
|
|
} else if(reply->type != REDIS_REPLY_STATUS) {
|
|
if(reply->type == REDIS_REPLY_ERROR) {
|
|
fprintf(stderr, "TYPE returned an error: %s\n", reply->str);
|
|
} else {
|
|
fprintf(stderr,
|
|
"Invalid reply type (%d) for TYPE on key '%s'!\n",
|
|
reply->type, keys->element[i]->str);
|
|
}
|
|
exit(1);
|
|
}
|
|
|
|
types[i] = toIntType(keys->element[i]->str, reply->str);
|
|
freeReplyObject(reply);
|
|
}
|
|
}
|
|
|
|
static void getKeySizes(redisReply *keys, int *types,
|
|
unsigned long long *sizes)
|
|
{
|
|
redisReply *reply;
|
|
char *sizecmds[] = {"STRLEN","LLEN","SCARD","HLEN","ZCARD"};
|
|
unsigned int i;
|
|
|
|
/* Pipeline size commands */
|
|
for(i=0;i<keys->elements;i++) {
|
|
/* Skip keys that were deleted */
|
|
if(types[i]==TYPE_NONE)
|
|
continue;
|
|
|
|
redisAppendCommand(context, "%s %s", sizecmds[types[i]],
|
|
keys->element[i]->str);
|
|
}
|
|
|
|
/* Retrieve sizes */
|
|
for(i=0;i<keys->elements;i++) {
|
|
/* Skip keys that disappeared between SCAN and TYPE */
|
|
if(types[i] == TYPE_NONE) {
|
|
sizes[i] = 0;
|
|
continue;
|
|
}
|
|
|
|
/* Retrieve size */
|
|
if(redisGetReply(context, (void**)&reply)!=REDIS_OK) {
|
|
fprintf(stderr, "Error getting size for key '%s' (%d: %s)\n",
|
|
keys->element[i]->str, context->err, context->errstr);
|
|
exit(1);
|
|
} else if(reply->type != REDIS_REPLY_INTEGER) {
|
|
/* Theoretically the key could have been removed and
|
|
* added as a different type between TYPE and SIZE */
|
|
fprintf(stderr,
|
|
"Warning: %s on '%s' failed (may have changed type)\n",
|
|
sizecmds[types[i]], keys->element[i]->str);
|
|
sizes[i] = 0;
|
|
} else {
|
|
sizes[i] = reply->integer;
|
|
}
|
|
|
|
freeReplyObject(reply);
|
|
}
|
|
}
|
|
|
|
static void findBigKeys(void) {
|
|
unsigned long long biggest[TYPE_COUNT] = {0}, counts[TYPE_COUNT] = {0}, totalsize[TYPE_COUNT] = {0};
|
|
unsigned long long sampled = 0, total_keys, totlen=0, *sizes=NULL, it=0;
|
|
sds maxkeys[TYPE_COUNT] = {0};
|
|
char *typename[] = {"string","list","set","hash","zset","stream","none"};
|
|
char *typeunit[] = {"bytes","items","members","fields","members","entries",""};
|
|
redisReply *reply, *keys;
|
|
unsigned int arrsize=0, i;
|
|
int type, *types=NULL;
|
|
double pct;
|
|
|
|
/* Total keys pre scanning */
|
|
total_keys = getDbSize();
|
|
|
|
/* Status message */
|
|
printf("\n# Scanning the entire keyspace to find biggest keys as well as\n");
|
|
printf("# average sizes per key type. You can use -i 0.1 to sleep 0.1 sec\n");
|
|
printf("# per 100 SCAN commands (not usually needed).\n\n");
|
|
|
|
/* New up sds strings to keep track of overall biggest per type */
|
|
for(i=0;i<TYPE_NONE; i++) {
|
|
maxkeys[i] = sdsempty();
|
|
if(!maxkeys[i]) {
|
|
fprintf(stderr, "Failed to allocate memory for largest key names!\n");
|
|
exit(1);
|
|
}
|
|
}
|
|
|
|
/* SCAN loop */
|
|
do {
|
|
/* Calculate approximate percentage completion */
|
|
pct = 100 * (double)sampled/total_keys;
|
|
|
|
/* Grab some keys and point to the keys array */
|
|
reply = sendScan(&it);
|
|
keys = reply->element[1];
|
|
|
|
/* Reallocate our type and size array if we need to */
|
|
if(keys->elements > arrsize) {
|
|
types = zrealloc(types, sizeof(int)*keys->elements);
|
|
sizes = zrealloc(sizes, sizeof(unsigned long long)*keys->elements);
|
|
|
|
if(!types || !sizes) {
|
|
fprintf(stderr, "Failed to allocate storage for keys!\n");
|
|
exit(1);
|
|
}
|
|
|
|
arrsize = keys->elements;
|
|
}
|
|
|
|
/* Retrieve types and then sizes */
|
|
getKeyTypes(keys, types);
|
|
getKeySizes(keys, types, sizes);
|
|
|
|
/* Now update our stats */
|
|
for(i=0;i<keys->elements;i++) {
|
|
if((type = types[i]) == TYPE_NONE)
|
|
continue;
|
|
|
|
totalsize[type] += sizes[i];
|
|
counts[type]++;
|
|
totlen += keys->element[i]->len;
|
|
sampled++;
|
|
|
|
if(biggest[type]<sizes[i]) {
|
|
printf(
|
|
"[%05.2f%%] Biggest %-6s found so far '%s' with %llu %s\n",
|
|
pct, typename[type], keys->element[i]->str, sizes[i],
|
|
typeunit[type]);
|
|
|
|
/* Keep track of biggest key name for this type */
|
|
maxkeys[type] = sdscpy(maxkeys[type], keys->element[i]->str);
|
|
if(!maxkeys[type]) {
|
|
fprintf(stderr, "Failed to allocate memory for key!\n");
|
|
exit(1);
|
|
}
|
|
|
|
/* Keep track of the biggest size for this type */
|
|
biggest[type] = sizes[i];
|
|
}
|
|
|
|
/* Update overall progress */
|
|
if(sampled % 1000000 == 0) {
|
|
printf("[%05.2f%%] Sampled %llu keys so far\n", pct, sampled);
|
|
}
|
|
}
|
|
|
|
/* Sleep if we've been directed to do so */
|
|
if(sampled && (sampled %100) == 0 && config.interval) {
|
|
usleep(config.interval);
|
|
}
|
|
|
|
freeReplyObject(reply);
|
|
} while(it != 0);
|
|
|
|
if(types) zfree(types);
|
|
if(sizes) zfree(sizes);
|
|
|
|
/* We're done */
|
|
printf("\n-------- summary -------\n\n");
|
|
|
|
printf("Sampled %llu keys in the keyspace!\n", sampled);
|
|
printf("Total key length in bytes is %llu (avg len %.2f)\n\n",
|
|
totlen, totlen ? (double)totlen/sampled : 0);
|
|
|
|
/* Output the biggest keys we found, for types we did find */
|
|
for(i=0;i<TYPE_NONE;i++) {
|
|
if(sdslen(maxkeys[i])>0) {
|
|
printf("Biggest %6s found '%s' has %llu %s\n", typename[i], maxkeys[i],
|
|
biggest[i], typeunit[i]);
|
|
}
|
|
}
|
|
|
|
printf("\n");
|
|
|
|
for(i=0;i<TYPE_NONE;i++) {
|
|
printf("%llu %ss with %llu %s (%05.2f%% of keys, avg size %.2f)\n",
|
|
counts[i], typename[i], totalsize[i], typeunit[i],
|
|
sampled ? 100 * (double)counts[i]/sampled : 0,
|
|
counts[i] ? (double)totalsize[i]/counts[i] : 0);
|
|
}
|
|
|
|
/* Free sds strings containing max keys */
|
|
for(i=0;i<TYPE_NONE;i++) {
|
|
sdsfree(maxkeys[i]);
|
|
}
|
|
|
|
/* Success! */
|
|
exit(0);
|
|
}
|
|
|
|
static void getKeyFreqs(redisReply *keys, unsigned long long *freqs) {
|
|
redisReply *reply;
|
|
unsigned int i;
|
|
|
|
/* Pipeline OBJECT freq commands */
|
|
for(i=0;i<keys->elements;i++) {
|
|
redisAppendCommand(context, "OBJECT freq %s", keys->element[i]->str);
|
|
}
|
|
|
|
/* Retrieve freqs */
|
|
for(i=0;i<keys->elements;i++) {
|
|
if(redisGetReply(context, (void**)&reply)!=REDIS_OK) {
|
|
fprintf(stderr, "Error getting freq for key '%s' (%d: %s)\n",
|
|
keys->element[i]->str, context->err, context->errstr);
|
|
exit(1);
|
|
} else if(reply->type != REDIS_REPLY_INTEGER) {
|
|
if(reply->type == REDIS_REPLY_ERROR) {
|
|
fprintf(stderr, "Error: %s\n", reply->str);
|
|
exit(1);
|
|
} else {
|
|
fprintf(stderr, "Warning: OBJECT freq on '%s' failed (may have been deleted)\n", keys->element[i]->str);
|
|
freqs[i] = 0;
|
|
}
|
|
} else {
|
|
freqs[i] = reply->integer;
|
|
}
|
|
freeReplyObject(reply);
|
|
}
|
|
}
|
|
|
|
#define HOTKEYS_SAMPLE 16
|
|
static void findHotKeys(void) {
|
|
redisReply *keys, *reply;
|
|
unsigned long long counters[HOTKEYS_SAMPLE] = {0};
|
|
sds hotkeys[HOTKEYS_SAMPLE] = {NULL};
|
|
unsigned long long sampled = 0, total_keys, *freqs = NULL, it = 0;
|
|
unsigned int arrsize = 0, i, k;
|
|
double pct;
|
|
|
|
/* Total keys pre scanning */
|
|
total_keys = getDbSize();
|
|
|
|
/* Status message */
|
|
printf("\n# Scanning the entire keyspace to find hot keys as well as\n");
|
|
printf("# average sizes per key type. You can use -i 0.1 to sleep 0.1 sec\n");
|
|
printf("# per 100 SCAN commands (not usually needed).\n\n");
|
|
|
|
/* SCAN loop */
|
|
do {
|
|
/* Calculate approximate percentage completion */
|
|
pct = 100 * (double)sampled/total_keys;
|
|
|
|
/* Grab some keys and point to the keys array */
|
|
reply = sendScan(&it);
|
|
keys = reply->element[1];
|
|
|
|
/* Reallocate our freqs array if we need to */
|
|
if(keys->elements > arrsize) {
|
|
freqs = zrealloc(freqs, sizeof(unsigned long long)*keys->elements);
|
|
|
|
if(!freqs) {
|
|
fprintf(stderr, "Failed to allocate storage for keys!\n");
|
|
exit(1);
|
|
}
|
|
|
|
arrsize = keys->elements;
|
|
}
|
|
|
|
getKeyFreqs(keys, freqs);
|
|
|
|
/* Now update our stats */
|
|
for(i=0;i<keys->elements;i++) {
|
|
sampled++;
|
|
/* Update overall progress */
|
|
if(sampled % 1000000 == 0) {
|
|
printf("[%05.2f%%] Sampled %llu keys so far\n", pct, sampled);
|
|
}
|
|
|
|
/* Use eviction pool here */
|
|
k = 0;
|
|
while (k < HOTKEYS_SAMPLE && freqs[i] > counters[k]) k++;
|
|
if (k == 0) continue;
|
|
k--;
|
|
if (k == 0 || counters[k] == 0) {
|
|
sdsfree(hotkeys[k]);
|
|
} else {
|
|
sdsfree(hotkeys[0]);
|
|
memmove(counters,counters+1,sizeof(counters[0])*k);
|
|
memmove(hotkeys,hotkeys+1,sizeof(hotkeys[0])*k);
|
|
}
|
|
counters[k] = freqs[i];
|
|
hotkeys[k] = sdsnew(keys->element[i]->str);
|
|
printf(
|
|
"[%05.2f%%] Hot key '%s' found so far with counter %llu\n",
|
|
pct, keys->element[i]->str, freqs[i]);
|
|
}
|
|
|
|
/* Sleep if we've been directed to do so */
|
|
if(sampled && (sampled %100) == 0 && config.interval) {
|
|
usleep(config.interval);
|
|
}
|
|
|
|
freeReplyObject(reply);
|
|
} while(it != 0);
|
|
|
|
if (freqs) zfree(freqs);
|
|
|
|
/* We're done */
|
|
printf("\n-------- summary -------\n\n");
|
|
|
|
printf("Sampled %llu keys in the keyspace!\n", sampled);
|
|
|
|
for (i=1; i<= HOTKEYS_SAMPLE; i++) {
|
|
k = HOTKEYS_SAMPLE - i;
|
|
if(counters[k]>0) {
|
|
printf("hot key found with counter: %llu\tkeyname: %s\n", counters[k], hotkeys[k]);
|
|
sdsfree(hotkeys[k]);
|
|
}
|
|
}
|
|
|
|
exit(0);
|
|
}
|
|
|
|
/*------------------------------------------------------------------------------
|
|
* Stats mode
|
|
*--------------------------------------------------------------------------- */
|
|
|
|
/* Return the specified INFO field from the INFO command output "info".
|
|
* A new buffer is allocated for the result, that needs to be free'd.
|
|
* If the field is not found NULL is returned. */
|
|
static char *getInfoField(char *info, char *field) {
|
|
char *p = strstr(info,field);
|
|
char *n1, *n2;
|
|
char *result;
|
|
|
|
if (!p) return NULL;
|
|
p += strlen(field)+1;
|
|
n1 = strchr(p,'\r');
|
|
n2 = strchr(p,',');
|
|
if (n2 && n2 < n1) n1 = n2;
|
|
result = zmalloc(sizeof(char)*(n1-p)+1);
|
|
memcpy(result,p,(n1-p));
|
|
result[n1-p] = '\0';
|
|
return result;
|
|
}
|
|
|
|
/* Like the above function but automatically convert the result into
|
|
* a long. On error (missing field) LONG_MIN is returned. */
|
|
static long getLongInfoField(char *info, char *field) {
|
|
char *value = getInfoField(info,field);
|
|
long l;
|
|
|
|
if (!value) return LONG_MIN;
|
|
l = strtol(value,NULL,10);
|
|
zfree(value);
|
|
return l;
|
|
}
|
|
|
|
/* Convert number of bytes into a human readable string of the form:
|
|
* 100B, 2G, 100M, 4K, and so forth. */
|
|
void bytesToHuman(char *s, long long n) {
|
|
double d;
|
|
|
|
if (n < 0) {
|
|
*s = '-';
|
|
s++;
|
|
n = -n;
|
|
}
|
|
if (n < 1024) {
|
|
/* Bytes */
|
|
sprintf(s,"%lldB",n);
|
|
return;
|
|
} else if (n < (1024*1024)) {
|
|
d = (double)n/(1024);
|
|
sprintf(s,"%.2fK",d);
|
|
} else if (n < (1024LL*1024*1024)) {
|
|
d = (double)n/(1024*1024);
|
|
sprintf(s,"%.2fM",d);
|
|
} else if (n < (1024LL*1024*1024*1024)) {
|
|
d = (double)n/(1024LL*1024*1024);
|
|
sprintf(s,"%.2fG",d);
|
|
}
|
|
}
|
|
|
|
static void statMode(void) {
|
|
redisReply *reply;
|
|
long aux, requests = 0;
|
|
int i = 0;
|
|
|
|
while(1) {
|
|
char buf[64];
|
|
int j;
|
|
|
|
reply = reconnectingRedisCommand(context,"INFO");
|
|
if (reply->type == REDIS_REPLY_ERROR) {
|
|
printf("ERROR: %s\n", reply->str);
|
|
exit(1);
|
|
}
|
|
|
|
if ((i++ % 20) == 0) {
|
|
printf(
|
|
"------- data ------ --------------------- load -------------------- - child -\n"
|
|
"keys mem clients blocked requests connections \n");
|
|
}
|
|
|
|
/* Keys */
|
|
aux = 0;
|
|
for (j = 0; j < 20; j++) {
|
|
long k;
|
|
|
|
sprintf(buf,"db%d:keys",j);
|
|
k = getLongInfoField(reply->str,buf);
|
|
if (k == LONG_MIN) continue;
|
|
aux += k;
|
|
}
|
|
sprintf(buf,"%ld",aux);
|
|
printf("%-11s",buf);
|
|
|
|
/* Used memory */
|
|
aux = getLongInfoField(reply->str,"used_memory");
|
|
bytesToHuman(buf,aux);
|
|
printf("%-8s",buf);
|
|
|
|
/* Clients */
|
|
aux = getLongInfoField(reply->str,"connected_clients");
|
|
sprintf(buf,"%ld",aux);
|
|
printf(" %-8s",buf);
|
|
|
|
/* Blocked (BLPOPPING) Clients */
|
|
aux = getLongInfoField(reply->str,"blocked_clients");
|
|
sprintf(buf,"%ld",aux);
|
|
printf("%-8s",buf);
|
|
|
|
/* Requests */
|
|
aux = getLongInfoField(reply->str,"total_commands_processed");
|
|
sprintf(buf,"%ld (+%ld)",aux,requests == 0 ? 0 : aux-requests);
|
|
printf("%-19s",buf);
|
|
requests = aux;
|
|
|
|
/* Connections */
|
|
aux = getLongInfoField(reply->str,"total_connections_received");
|
|
sprintf(buf,"%ld",aux);
|
|
printf(" %-12s",buf);
|
|
|
|
/* Children */
|
|
aux = getLongInfoField(reply->str,"bgsave_in_progress");
|
|
aux |= getLongInfoField(reply->str,"aof_rewrite_in_progress") << 1;
|
|
aux |= getLongInfoField(reply->str,"loading") << 2;
|
|
switch(aux) {
|
|
case 0: break;
|
|
case 1:
|
|
printf("SAVE");
|
|
break;
|
|
case 2:
|
|
printf("AOF");
|
|
break;
|
|
case 3:
|
|
printf("SAVE+AOF");
|
|
break;
|
|
case 4:
|
|
printf("LOAD");
|
|
break;
|
|
}
|
|
|
|
printf("\n");
|
|
freeReplyObject(reply);
|
|
usleep(config.interval);
|
|
}
|
|
}
|
|
|
|
/*------------------------------------------------------------------------------
|
|
* Scan mode
|
|
*--------------------------------------------------------------------------- */
|
|
|
|
static void scanMode(void) {
|
|
redisReply *reply;
|
|
unsigned long long cur = 0;
|
|
|
|
do {
|
|
if (config.pattern)
|
|
reply = redisCommand(context,"SCAN %llu MATCH %s",
|
|
cur,config.pattern);
|
|
else
|
|
reply = redisCommand(context,"SCAN %llu",cur);
|
|
if (reply == NULL) {
|
|
printf("I/O error\n");
|
|
exit(1);
|
|
} else if (reply->type == REDIS_REPLY_ERROR) {
|
|
printf("ERROR: %s\n", reply->str);
|
|
exit(1);
|
|
} else {
|
|
unsigned int j;
|
|
|
|
cur = strtoull(reply->element[0]->str,NULL,10);
|
|
for (j = 0; j < reply->element[1]->elements; j++)
|
|
printf("%s\n", reply->element[1]->element[j]->str);
|
|
}
|
|
freeReplyObject(reply);
|
|
} while(cur != 0);
|
|
|
|
exit(0);
|
|
}
|
|
|
|
/*------------------------------------------------------------------------------
|
|
* LRU test mode
|
|
*--------------------------------------------------------------------------- */
|
|
|
|
/* Return an integer from min to max (both inclusive) using a power-law
|
|
* distribution, depending on the value of alpha: the greater the alpha
|
|
* the more bias towards lower values.
|
|
*
|
|
* With alpha = 6.2 the output follows the 80-20 rule where 20% of
|
|
* the returned numbers will account for 80% of the frequency. */
|
|
long long powerLawRand(long long min, long long max, double alpha) {
|
|
double pl, r;
|
|
|
|
max += 1;
|
|
r = ((double)rand()) / RAND_MAX;
|
|
pl = pow(
|
|
((pow(max,alpha+1) - pow(min,alpha+1))*r + pow(min,alpha+1)),
|
|
(1.0/(alpha+1)));
|
|
return (max-1-(long long)pl)+min;
|
|
}
|
|
|
|
/* Generates a key name among a set of lru_test_sample_size keys, using
|
|
* an 80-20 distribution. */
|
|
void LRUTestGenKey(char *buf, size_t buflen) {
|
|
snprintf(buf, buflen, "lru:%lld",
|
|
powerLawRand(1, config.lru_test_sample_size, 6.2));
|
|
}
|
|
|
|
#define LRU_CYCLE_PERIOD 1000 /* 1000 milliseconds. */
|
|
#define LRU_CYCLE_PIPELINE_SIZE 250
|
|
static void LRUTestMode(void) {
|
|
redisReply *reply;
|
|
char key[128];
|
|
long long start_cycle;
|
|
int j;
|
|
|
|
srand(time(NULL)^getpid());
|
|
while(1) {
|
|
/* Perform cycles of 1 second with 50% writes and 50% reads.
|
|
* We use pipelining batching writes / reads N times per cycle in order
|
|
* to fill the target instance easily. */
|
|
start_cycle = mstime();
|
|
long long hits = 0, misses = 0;
|
|
while(mstime() - start_cycle < 1000) {
|
|
/* Write cycle. */
|
|
for (j = 0; j < LRU_CYCLE_PIPELINE_SIZE; j++) {
|
|
char val[6];
|
|
val[5] = '\0';
|
|
for (int i = 0; i < 5; i++) val[i] = 'A'+rand()%('z'-'A');
|
|
LRUTestGenKey(key,sizeof(key));
|
|
redisAppendCommand(context, "SET %s %s",key,val);
|
|
}
|
|
for (j = 0; j < LRU_CYCLE_PIPELINE_SIZE; j++)
|
|
redisGetReply(context, (void**)&reply);
|
|
|
|
/* Read cycle. */
|
|
for (j = 0; j < LRU_CYCLE_PIPELINE_SIZE; j++) {
|
|
LRUTestGenKey(key,sizeof(key));
|
|
redisAppendCommand(context, "GET %s",key);
|
|
}
|
|
for (j = 0; j < LRU_CYCLE_PIPELINE_SIZE; j++) {
|
|
if (redisGetReply(context, (void**)&reply) == REDIS_OK) {
|
|
switch(reply->type) {
|
|
case REDIS_REPLY_ERROR:
|
|
printf("%s\n", reply->str);
|
|
break;
|
|
case REDIS_REPLY_NIL:
|
|
misses++;
|
|
break;
|
|
default:
|
|
hits++;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
if (context->err) {
|
|
fprintf(stderr,"I/O error during LRU test\n");
|
|
exit(1);
|
|
}
|
|
}
|
|
/* Print stats. */
|
|
printf(
|
|
"%lld Gets/sec | Hits: %lld (%.2f%%) | Misses: %lld (%.2f%%)\n",
|
|
hits+misses,
|
|
hits, (double)hits/(hits+misses)*100,
|
|
misses, (double)misses/(hits+misses)*100);
|
|
}
|
|
exit(0);
|
|
}
|
|
|
|
/*------------------------------------------------------------------------------
|
|
* Intrisic latency mode.
|
|
*
|
|
* Measure max latency of a running process that does not result from
|
|
* syscalls. Basically this software should provide an hint about how much
|
|
* time the kernel leaves the process without a chance to run.
|
|
*--------------------------------------------------------------------------- */
|
|
|
|
/* This is just some computation the compiler can't optimize out.
|
|
* Should run in less than 100-200 microseconds even using very
|
|
* slow hardware. Runs in less than 10 microseconds in modern HW. */
|
|
unsigned long compute_something_fast(void) {
|
|
unsigned char s[256], i, j, t;
|
|
int count = 1000, k;
|
|
unsigned long output = 0;
|
|
|
|
for (k = 0; k < 256; k++) s[k] = k;
|
|
|
|
i = 0;
|
|
j = 0;
|
|
while(count--) {
|
|
i++;
|
|
j = j + s[i];
|
|
t = s[i];
|
|
s[i] = s[j];
|
|
s[j] = t;
|
|
output += s[(s[i]+s[j])&255];
|
|
}
|
|
return output;
|
|
}
|
|
|
|
static void intrinsicLatencyModeStop(int s) {
|
|
UNUSED(s);
|
|
force_cancel_loop = 1;
|
|
}
|
|
|
|
static void intrinsicLatencyMode(void) {
|
|
long long test_end, run_time, max_latency = 0, runs = 0;
|
|
|
|
run_time = config.intrinsic_latency_duration*1000000;
|
|
test_end = ustime() + run_time;
|
|
signal(SIGINT, intrinsicLatencyModeStop);
|
|
|
|
while(1) {
|
|
long long start, end, latency;
|
|
|
|
start = ustime();
|
|
compute_something_fast();
|
|
end = ustime();
|
|
latency = end-start;
|
|
runs++;
|
|
if (latency <= 0) continue;
|
|
|
|
/* Reporting */
|
|
if (latency > max_latency) {
|
|
max_latency = latency;
|
|
printf("Max latency so far: %lld microseconds.\n", max_latency);
|
|
}
|
|
|
|
double avg_us = (double)run_time/runs;
|
|
double avg_ns = avg_us * 1e3;
|
|
if (force_cancel_loop || end > test_end) {
|
|
printf("\n%lld total runs "
|
|
"(avg latency: "
|
|
"%.4f microseconds / %.2f nanoseconds per run).\n",
|
|
runs, avg_us, avg_ns);
|
|
printf("Worst run took %.0fx longer than the average latency.\n",
|
|
max_latency / avg_us);
|
|
exit(0);
|
|
}
|
|
}
|
|
}
|
|
|
|
/*------------------------------------------------------------------------------
|
|
* Program main()
|
|
*--------------------------------------------------------------------------- */
|
|
|
|
int main(int argc, char **argv) {
|
|
int firstarg;
|
|
|
|
config.hostip = sdsnew("127.0.0.1");
|
|
config.hostport = 6379;
|
|
config.hostsocket = NULL;
|
|
config.repeat = 1;
|
|
config.interval = 0;
|
|
config.dbnum = 0;
|
|
config.interactive = 0;
|
|
config.shutdown = 0;
|
|
config.monitor_mode = 0;
|
|
config.pubsub_mode = 0;
|
|
config.latency_mode = 0;
|
|
config.latency_dist_mode = 0;
|
|
config.latency_history = 0;
|
|
config.lru_test_mode = 0;
|
|
config.lru_test_sample_size = 0;
|
|
config.cluster_mode = 0;
|
|
config.slave_mode = 0;
|
|
config.getrdb_mode = 0;
|
|
config.stat_mode = 0;
|
|
config.scan_mode = 0;
|
|
config.intrinsic_latency_mode = 0;
|
|
config.pattern = NULL;
|
|
config.rdb_filename = NULL;
|
|
config.pipe_mode = 0;
|
|
config.pipe_timeout = REDIS_CLI_DEFAULT_PIPE_TIMEOUT;
|
|
config.bigkeys = 0;
|
|
config.hotkeys = 0;
|
|
config.stdinarg = 0;
|
|
config.auth = NULL;
|
|
config.eval = NULL;
|
|
config.eval_ldb = 0;
|
|
config.eval_ldb_end = 0;
|
|
config.eval_ldb_sync = 0;
|
|
config.enable_ldb_on_eval = 0;
|
|
config.last_cmd_type = -1;
|
|
config.verbose = 0;
|
|
config.no_auth_warning = 0;
|
|
config.cluster_manager_command.name = NULL;
|
|
config.cluster_manager_command.argc = 0;
|
|
config.cluster_manager_command.argv = NULL;
|
|
config.cluster_manager_command.flags = 0;
|
|
config.cluster_manager_command.replicas = 0;
|
|
config.cluster_manager_command.from = NULL;
|
|
config.cluster_manager_command.to = NULL;
|
|
config.cluster_manager_command.weight = NULL;
|
|
config.cluster_manager_command.slots = 0;
|
|
config.cluster_manager_command.timeout = CLUSTER_MANAGER_MIGRATE_TIMEOUT;
|
|
config.cluster_manager_command.pipeline = CLUSTER_MANAGER_MIGRATE_PIPELINE;
|
|
config.cluster_manager_command.threshold =
|
|
CLUSTER_MANAGER_REBALANCE_THRESHOLD;
|
|
pref.hints = 1;
|
|
|
|
spectrum_palette = spectrum_palette_color;
|
|
spectrum_palette_size = spectrum_palette_color_size;
|
|
|
|
if (!isatty(fileno(stdout)) && (getenv("FAKETTY") == NULL))
|
|
config.output = OUTPUT_RAW;
|
|
else
|
|
config.output = OUTPUT_STANDARD;
|
|
config.mb_delim = sdsnew("\n");
|
|
|
|
firstarg = parseOptions(argc,argv);
|
|
argc -= firstarg;
|
|
argv += firstarg;
|
|
|
|
/* Cluster Manager mode */
|
|
if (CLUSTER_MANAGER_MODE()) {
|
|
clusterManagerCommandProc *proc = validateClusterManagerCommand();
|
|
if (!proc) {
|
|
sdsfree(config.hostip);
|
|
sdsfree(config.mb_delim);
|
|
exit(1);
|
|
}
|
|
clusterManagerMode(proc);
|
|
}
|
|
|
|
/* Latency mode */
|
|
if (config.latency_mode) {
|
|
if (cliConnect(0) == REDIS_ERR) exit(1);
|
|
latencyMode();
|
|
}
|
|
|
|
/* Latency distribution mode */
|
|
if (config.latency_dist_mode) {
|
|
if (cliConnect(0) == REDIS_ERR) exit(1);
|
|
latencyDistMode();
|
|
}
|
|
|
|
/* Slave mode */
|
|
if (config.slave_mode) {
|
|
if (cliConnect(0) == REDIS_ERR) exit(1);
|
|
slaveMode();
|
|
}
|
|
|
|
/* Get RDB mode. */
|
|
if (config.getrdb_mode) {
|
|
if (cliConnect(0) == REDIS_ERR) exit(1);
|
|
getRDB();
|
|
}
|
|
|
|
/* Pipe mode */
|
|
if (config.pipe_mode) {
|
|
if (cliConnect(0) == REDIS_ERR) exit(1);
|
|
pipeMode();
|
|
}
|
|
|
|
/* Find big keys */
|
|
if (config.bigkeys) {
|
|
if (cliConnect(0) == REDIS_ERR) exit(1);
|
|
findBigKeys();
|
|
}
|
|
|
|
/* Find hot keys */
|
|
if (config.hotkeys) {
|
|
if (cliConnect(0) == REDIS_ERR) exit(1);
|
|
findHotKeys();
|
|
}
|
|
|
|
/* Stat mode */
|
|
if (config.stat_mode) {
|
|
if (cliConnect(0) == REDIS_ERR) exit(1);
|
|
if (config.interval == 0) config.interval = 1000000;
|
|
statMode();
|
|
}
|
|
|
|
/* Scan mode */
|
|
if (config.scan_mode) {
|
|
if (cliConnect(0) == REDIS_ERR) exit(1);
|
|
scanMode();
|
|
}
|
|
|
|
/* LRU test mode */
|
|
if (config.lru_test_mode) {
|
|
if (cliConnect(0) == REDIS_ERR) exit(1);
|
|
LRUTestMode();
|
|
}
|
|
|
|
/* Intrinsic latency mode */
|
|
if (config.intrinsic_latency_mode) intrinsicLatencyMode();
|
|
|
|
/* Start interactive mode when no command is provided */
|
|
if (argc == 0 && !config.eval) {
|
|
/* Ignore SIGPIPE in interactive mode to force a reconnect */
|
|
signal(SIGPIPE, SIG_IGN);
|
|
|
|
/* Note that in repl mode we don't abort on connection error.
|
|
* A new attempt will be performed for every command send. */
|
|
cliConnect(0);
|
|
repl();
|
|
}
|
|
|
|
/* Otherwise, we have some arguments to execute */
|
|
if (cliConnect(0) != REDIS_OK) exit(1);
|
|
if (config.eval) {
|
|
return evalMode(argc,argv);
|
|
} else {
|
|
return noninteractive(argc,convertToSds(argc,argv));
|
|
}
|
|
}
|