]> git.saurik.com Git - redis.git/blame - src/redis.c
Comments about security of slave-read-only in redis.coinf.
[redis.git] / src / redis.c
CommitLineData
e2641e09 1/*
2 * Copyright (c) 2009-2010, Salvatore Sanfilippo <antirez at gmail dot com>
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are met:
7 *
8 * * Redistributions of source code must retain the above copyright notice,
9 * this list of conditions and the following disclaimer.
10 * * Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
13 * * Neither the name of Redis nor the names of its contributors may be used
14 * to endorse or promote products derived from this software without
15 * specific prior written permission.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
18 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
21 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
22 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
23 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
24 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
25 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
26 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
27 * POSSIBILITY OF SUCH DAMAGE.
28 */
29
30#include "redis.h"
daa70b17 31#include "slowlog.h"
8f61a72f 32#include "bio.h"
e2641e09 33
e2641e09 34#include <time.h>
35#include <signal.h>
36#include <sys/wait.h>
37#include <errno.h>
38#include <assert.h>
39#include <ctype.h>
40#include <stdarg.h>
e2641e09 41#include <arpa/inet.h>
42#include <sys/stat.h>
43#include <fcntl.h>
44#include <sys/time.h>
45#include <sys/resource.h>
46#include <sys/uio.h>
47#include <limits.h>
48#include <float.h>
49#include <math.h>
2b00385d 50#include <sys/resource.h>
e2641e09 51
52/* Our shared "common" objects */
53
54struct sharedObjectsStruct shared;
55
c74b7c77 56/* Global vars that are actually used as constants. The following double
e2641e09 57 * values are used for double on-disk serialization, and are initialized
58 * at runtime to avoid strange compiler optimizations. */
59
60double R_Zero, R_PosInf, R_NegInf, R_Nan;
61
62/*================================= Globals ================================= */
63
64/* Global vars */
65struct redisServer server; /* server global state */
66struct redisCommand *commandTable;
5d02b00f 67
7501c66f 68/* Our command table.
69 *
70 * Every entry is composed of the following fields:
71 *
72 * name: a string representing the command name.
73 * function: pointer to the C function implementing the command.
74 * arity: number of arguments, it is possible to use -N to say >= N
75 * sflags: command flags as string. See below for a table of flags.
76 * flags: flags as bitmask. Computed by Redis using the 'sflags' field.
77 * get_keys_proc: an optional function to get key arguments from a command.
78 * This is only used when the following three fields are not
79 * enough to specify what arguments are keys.
80 * first_key_index: first argument that is a key
81 * last_key_index: last argument that is a key
82 * key_step: step to get all the keys from first to last argument. For instance
83 * in MSET the step is two since arguments are key,val,key,val,...
84 * microseconds: microseconds of total execution time for this command.
85 * calls: total number of calls of this command.
86 *
87 * The flags, microseconds and calls fields are computed by Redis and should
88 * always be set to zero.
89 *
90 * Command flags are expressed using strings where every character represents
91 * a flag. Later the populateCommandTable() function will take care of
92 * populating the real 'flags' field using this characters.
5d02b00f 93 *
94 * This is the meaning of the flags:
95 *
96 * w: write command (may modify the key space).
97 * r: read command (will never modify the key space).
98 * m: may increase memory usage once called. Don't allow if out of memory.
99 * a: admin command, like SAVE or SHUTDOWN.
100 * p: Pub/Sub related command.
b60ed6e8 101 * f: force replication of this command, regarless of server.dirty.
102 * s: command not allowed in scripts.
7e14a208 103 * R: random command. Command is not deterministic, that is, the same command
b60ed6e8 104 * with the same arguments, with the same key space, may have different
548efd91 105 * results. For instance SPOP and RANDOMKEY are two random commands.
106 * S: Sort command output array if called from script, so that the output
107 * is deterministic.
108 */
d7ed7fd2 109struct redisCommand redisCommandTable[] = {
5d02b00f 110 {"get",getCommand,2,"r",0,NULL,1,1,1,0,0},
111 {"set",setCommand,3,"wm",0,noPreloadGetKeys,1,1,1,0,0},
112 {"setnx",setnxCommand,3,"wm",0,noPreloadGetKeys,1,1,1,0,0},
39da5d1f 113 {"setex",setexCommand,4,"wm",0,noPreloadGetKeys,1,1,1,0,0},
114 {"psetex",psetexCommand,4,"wm",0,noPreloadGetKeys,1,1,1,0,0},
5d02b00f 115 {"append",appendCommand,3,"wm",0,NULL,1,1,1,0,0},
116 {"strlen",strlenCommand,2,"r",0,NULL,1,1,1,0,0},
117 {"del",delCommand,-2,"w",0,noPreloadGetKeys,1,-1,1,0,0},
118 {"exists",existsCommand,2,"r",0,NULL,1,1,1,0,0},
119 {"setbit",setbitCommand,4,"wm",0,NULL,1,1,1,0,0},
120 {"getbit",getbitCommand,3,"r",0,NULL,1,1,1,0,0},
121 {"setrange",setrangeCommand,4,"wm",0,NULL,1,1,1,0,0},
122 {"getrange",getrangeCommand,4,"r",0,NULL,1,1,1,0,0},
123 {"substr",getrangeCommand,4,"r",0,NULL,1,1,1,0,0},
124 {"incr",incrCommand,2,"wm",0,NULL,1,1,1,0,0},
125 {"decr",decrCommand,2,"wm",0,NULL,1,1,1,0,0},
126 {"mget",mgetCommand,-2,"r",0,NULL,1,-1,1,0,0},
127 {"rpush",rpushCommand,-3,"wm",0,NULL,1,1,1,0,0},
128 {"lpush",lpushCommand,-3,"wm",0,NULL,1,1,1,0,0},
129 {"rpushx",rpushxCommand,3,"wm",0,NULL,1,1,1,0,0},
130 {"lpushx",lpushxCommand,3,"wm",0,NULL,1,1,1,0,0},
131 {"linsert",linsertCommand,5,"wm",0,NULL,1,1,1,0,0},
132 {"rpop",rpopCommand,2,"w",0,NULL,1,1,1,0,0},
133 {"lpop",lpopCommand,2,"w",0,NULL,1,1,1,0,0},
e41677b4 134 {"brpop",brpopCommand,-3,"ws",0,NULL,1,1,1,0,0},
135 {"brpoplpush",brpoplpushCommand,4,"wms",0,NULL,1,2,1,0,0},
136 {"blpop",blpopCommand,-3,"ws",0,NULL,1,-2,1,0,0},
5d02b00f 137 {"llen",llenCommand,2,"r",0,NULL,1,1,1,0,0},
138 {"lindex",lindexCommand,3,"r",0,NULL,1,1,1,0,0},
139 {"lset",lsetCommand,4,"wm",0,NULL,1,1,1,0,0},
140 {"lrange",lrangeCommand,4,"r",0,NULL,1,1,1,0,0},
141 {"ltrim",ltrimCommand,4,"w",0,NULL,1,1,1,0,0},
142 {"lrem",lremCommand,4,"w",0,NULL,1,1,1,0,0},
143 {"rpoplpush",rpoplpushCommand,3,"wm",0,NULL,1,2,1,0,0},
144 {"sadd",saddCommand,-3,"wm",0,NULL,1,1,1,0,0},
145 {"srem",sremCommand,-3,"w",0,NULL,1,1,1,0,0},
146 {"smove",smoveCommand,4,"w",0,NULL,1,2,1,0,0},
147 {"sismember",sismemberCommand,3,"r",0,NULL,1,1,1,0,0},
148 {"scard",scardCommand,2,"r",0,NULL,1,1,1,0,0},
15ef6053 149 {"spop",spopCommand,2,"wRs",0,NULL,1,1,1,0,0},
b60ed6e8 150 {"srandmember",srandmemberCommand,2,"rR",0,NULL,1,1,1,0,0},
548efd91 151 {"sinter",sinterCommand,-2,"rS",0,NULL,1,-1,1,0,0},
1bcfa0f6 152 {"sinterstore",sinterstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
548efd91 153 {"sunion",sunionCommand,-2,"rS",0,NULL,1,-1,1,0,0},
1bcfa0f6 154 {"sunionstore",sunionstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
548efd91 155 {"sdiff",sdiffCommand,-2,"rS",0,NULL,1,-1,1,0,0},
1bcfa0f6 156 {"sdiffstore",sdiffstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
548efd91 157 {"smembers",sinterCommand,2,"rS",0,NULL,1,1,1,0,0},
5d02b00f 158 {"zadd",zaddCommand,-4,"wm",0,NULL,1,1,1,0,0},
159 {"zincrby",zincrbyCommand,4,"wm",0,NULL,1,1,1,0,0},
160 {"zrem",zremCommand,-3,"w",0,NULL,1,1,1,0,0},
161 {"zremrangebyscore",zremrangebyscoreCommand,4,"w",0,NULL,1,1,1,0,0},
162 {"zremrangebyrank",zremrangebyrankCommand,4,"w",0,NULL,1,1,1,0,0},
163 {"zunionstore",zunionstoreCommand,-4,"wm",0,zunionInterGetKeys,0,0,0,0,0},
164 {"zinterstore",zinterstoreCommand,-4,"wm",0,zunionInterGetKeys,0,0,0,0,0},
165 {"zrange",zrangeCommand,-4,"r",0,NULL,1,1,1,0,0},
166 {"zrangebyscore",zrangebyscoreCommand,-4,"r",0,NULL,1,1,1,0,0},
167 {"zrevrangebyscore",zrevrangebyscoreCommand,-4,"r",0,NULL,1,1,1,0,0},
168 {"zcount",zcountCommand,4,"r",0,NULL,1,1,1,0,0},
169 {"zrevrange",zrevrangeCommand,-4,"r",0,NULL,1,1,1,0,0},
170 {"zcard",zcardCommand,2,"r",0,NULL,1,1,1,0,0},
171 {"zscore",zscoreCommand,3,"r",0,NULL,1,1,1,0,0},
172 {"zrank",zrankCommand,3,"r",0,NULL,1,1,1,0,0},
173 {"zrevrank",zrevrankCommand,3,"r",0,NULL,1,1,1,0,0},
174 {"hset",hsetCommand,4,"wm",0,NULL,1,1,1,0,0},
175 {"hsetnx",hsetnxCommand,4,"wm",0,NULL,1,1,1,0,0},
176 {"hget",hgetCommand,3,"r",0,NULL,1,1,1,0,0},
177 {"hmset",hmsetCommand,-4,"wm",0,NULL,1,1,1,0,0},
178 {"hmget",hmgetCommand,-3,"r",0,NULL,1,1,1,0,0},
179 {"hincrby",hincrbyCommand,4,"wm",0,NULL,1,1,1,0,0},
68bfe993 180 {"hincrbyfloat",hincrbyfloatCommand,4,"wm",0,NULL,1,1,1,0,0},
5d02b00f 181 {"hdel",hdelCommand,-3,"w",0,NULL,1,1,1,0,0},
182 {"hlen",hlenCommand,2,"r",0,NULL,1,1,1,0,0},
548efd91 183 {"hkeys",hkeysCommand,2,"rS",0,NULL,1,1,1,0,0},
184 {"hvals",hvalsCommand,2,"rS",0,NULL,1,1,1,0,0},
5d02b00f 185 {"hgetall",hgetallCommand,2,"r",0,NULL,1,1,1,0,0},
186 {"hexists",hexistsCommand,3,"r",0,NULL,1,1,1,0,0},
187 {"incrby",incrbyCommand,3,"wm",0,NULL,1,1,1,0,0},
188 {"decrby",decrbyCommand,3,"wm",0,NULL,1,1,1,0,0},
5574b53e 189 {"incrbyfloat",incrbyfloatCommand,3,"wm",0,NULL,1,1,1,0,0},
5d02b00f 190 {"getset",getsetCommand,3,"wm",0,NULL,1,1,1,0,0},
191 {"mset",msetCommand,-3,"wm",0,NULL,1,-1,2,0,0},
192 {"msetnx",msetnxCommand,-3,"wm",0,NULL,1,-1,2,0,0},
b60ed6e8 193 {"randomkey",randomkeyCommand,1,"rR",0,NULL,0,0,0,0,0},
5d02b00f 194 {"select",selectCommand,2,"r",0,NULL,0,0,0,0,0},
195 {"move",moveCommand,3,"w",0,NULL,1,1,1,0,0},
196 {"rename",renameCommand,3,"w",0,renameGetKeys,1,2,1,0,0},
197 {"renamenx",renamenxCommand,3,"w",0,renameGetKeys,1,2,1,0,0},
12d293ca 198 {"expire",expireCommand,3,"w",0,NULL,1,1,1,0,0},
199 {"expireat",expireatCommand,3,"w",0,NULL,1,1,1,0,0},
200 {"pexpire",pexpireCommand,3,"w",0,NULL,1,1,1,0,0},
201 {"pexpireat",pexpireatCommand,3,"w",0,NULL,1,1,1,0,0},
548efd91 202 {"keys",keysCommand,2,"rS",0,NULL,0,0,0,0,0},
5d02b00f 203 {"dbsize",dbsizeCommand,1,"r",0,NULL,0,0,0,0,0},
e41677b4 204 {"auth",authCommand,2,"rs",0,NULL,0,0,0,0,0},
5d02b00f 205 {"ping",pingCommand,1,"r",0,NULL,0,0,0,0,0},
206 {"echo",echoCommand,2,"r",0,NULL,0,0,0,0,0},
e41677b4 207 {"save",saveCommand,1,"ars",0,NULL,0,0,0,0,0},
5d02b00f 208 {"bgsave",bgsaveCommand,1,"ar",0,NULL,0,0,0,0,0},
209 {"bgrewriteaof",bgrewriteaofCommand,1,"ar",0,NULL,0,0,0,0,0},
4ab8695d 210 {"shutdown",shutdownCommand,-1,"ar",0,NULL,0,0,0,0,0},
5d02b00f 211 {"lastsave",lastsaveCommand,1,"r",0,NULL,0,0,0,0,0},
212 {"type",typeCommand,2,"r",0,NULL,1,1,1,0,0},
b60ed6e8 213 {"multi",multiCommand,1,"rs",0,NULL,0,0,0,0,0},
05406168 214 {"exec",execCommand,1,"s",0,NULL,0,0,0,0,0},
b60ed6e8 215 {"discard",discardCommand,1,"rs",0,NULL,0,0,0,0,0},
216 {"sync",syncCommand,1,"ars",0,NULL,0,0,0,0,0},
5d02b00f 217 {"flushdb",flushdbCommand,1,"w",0,NULL,0,0,0,0,0},
218 {"flushall",flushallCommand,1,"w",0,NULL,0,0,0,0,0},
2c861050 219 {"sort",sortCommand,-2,"wmS",0,NULL,1,1,1,0,0},
5d02b00f 220 {"info",infoCommand,-1,"r",0,NULL,0,0,0,0,0},
b60ed6e8 221 {"monitor",monitorCommand,1,"ars",0,NULL,0,0,0,0,0},
12d293ca 222 {"ttl",ttlCommand,2,"r",0,NULL,1,1,1,0,0},
223 {"pttl",pttlCommand,2,"r",0,NULL,1,1,1,0,0},
5d02b00f 224 {"persist",persistCommand,2,"w",0,NULL,1,1,1,0,0},
b60ed6e8 225 {"slaveof",slaveofCommand,3,"aws",0,NULL,0,0,0,0,0},
38bb4522 226 {"debug",debugCommand,-2,"as",0,NULL,0,0,0,0,0},
5d02b00f 227 {"config",configCommand,-2,"ar",0,NULL,0,0,0,0,0},
b60ed6e8 228 {"subscribe",subscribeCommand,-2,"rps",0,NULL,0,0,0,0,0},
229 {"unsubscribe",unsubscribeCommand,-1,"rps",0,NULL,0,0,0,0,0},
230 {"psubscribe",psubscribeCommand,-2,"rps",0,NULL,0,0,0,0,0},
231 {"punsubscribe",punsubscribeCommand,-1,"rps",0,NULL,0,0,0,0,0},
6e6bbac7 232 {"publish",publishCommand,3,"pf",0,NULL,0,0,0,0,0},
b60ed6e8 233 {"watch",watchCommand,-2,"rs",0,noPreloadGetKeys,1,-1,1,0,0},
234 {"unwatch",unwatchCommand,1,"rs",0,NULL,0,0,0,0,0},
7afc3a96 235 {"restore",restoreCommand,4,"awm",0,NULL,1,1,1,0,0},
5d02b00f 236 {"migrate",migrateCommand,6,"aw",0,NULL,0,0,0,0,0},
1bcfa0f6 237 {"dump",dumpCommand,2,"ar",0,NULL,1,1,1,0,0},
238 {"object",objectCommand,-2,"r",0,NULL,2,2,2,0,0},
5d02b00f 239 {"client",clientCommand,-2,"ar",0,NULL,0,0,0,0,0},
05406168 240 {"eval",evalCommand,-3,"s",0,zunionInterGetKeys,0,0,0,0,0},
241 {"evalsha",evalShaCommand,-3,"s",0,zunionInterGetKeys,0,0,0,0,0},
070e3945 242 {"slowlog",slowlogCommand,-2,"r",0,NULL,0,0,0,0,0},
9494f1f1 243 {"script",scriptCommand,-2,"ras",0,NULL,0,0,0,0,0},
244 {"time",timeCommand,1,"rR",0,NULL,0,0,0,0,0}
e2641e09 245};
246
247/*============================ Utility functions ============================ */
248
9c104c68 249/* Low level logging. To use only for very big messages, otherwise
250 * redisLog() is to prefer. */
251void redisLogRaw(int level, const char *msg) {
e1a586ee
JH
252 const int syslogLevelMap[] = { LOG_DEBUG, LOG_INFO, LOG_NOTICE, LOG_WARNING };
253 const char *c = ".-*#";
254 time_t now = time(NULL);
e2641e09 255 FILE *fp;
23072961 256 char buf[64];
996d503d 257 int rawmode = (level & REDIS_LOG_RAW);
23072961 258
996d503d 259 level &= 0xff; /* clear flags */
23072961 260 if (level < server.verbosity) return;
e2641e09 261
262 fp = (server.logfile == NULL) ? stdout : fopen(server.logfile,"a");
263 if (!fp) return;
264
996d503d 265 if (rawmode) {
266 fprintf(fp,"%s",msg);
267 } else {
268 strftime(buf,sizeof(buf),"%d %b %H:%M:%S",localtime(&now));
269 fprintf(fp,"[%d] %s %c %s\n",(int)getpid(),buf,c[level],msg);
270 }
e1a586ee
JH
271 fflush(fp);
272
e2641e09 273 if (server.logfile) fclose(fp);
e1a586ee
JH
274
275 if (server.syslog_enabled) syslog(syslogLevelMap[level], "%s", msg);
e2641e09 276}
277
9c104c68 278/* Like redisLogRaw() but with printf-alike support. This is the funciton that
279 * is used across the code. The raw version is only used in order to dump
280 * the INFO output on crash. */
281void redisLog(int level, const char *fmt, ...) {
282 va_list ap;
283 char msg[REDIS_MAX_LOGMSG_LEN];
284
996d503d 285 if ((level&0xff) < server.verbosity) return;
9c104c68 286
287 va_start(ap, fmt);
288 vsnprintf(msg, sizeof(msg), fmt, ap);
289 va_end(ap);
290
291 redisLogRaw(level,msg);
292}
293
e2641e09 294/* Redis generally does not try to recover from out of memory conditions
295 * when allocating objects or strings, it is not clear if it will be possible
296 * to report this condition to the client since the networking layer itself
297 * is based on heap allocation for send buffers, so we simply abort.
298 * At least the code will be simpler to read... */
299void oom(const char *msg) {
300 redisLog(REDIS_WARNING, "%s: Out of memory\n",msg);
301 sleep(1);
302 abort();
303}
304
/* Return the current UNIX time, as reported by gettimeofday(), expressed
 * in microseconds. */
long long ustime(void) {
    struct timeval now;

    gettimeofday(&now, NULL);
    /* Widen the seconds before scaling so the product is a long long. */
    return ((long long)now.tv_sec)*1000000 + now.tv_usec;
}
315
/* Return the current UNIX time in milliseconds: ustime() with the
 * sub-millisecond part truncated. */
long long mstime(void) {
    long long usec = ustime();

    return usec/1000;
}
320
e2641e09 321/*====================== Hash table type implementation ==================== */
322
323/* This is a hash table type that uses the SDS dynamic strings library as
324 * keys and Redis objects as values (objects can hold SDS strings,
325 * lists, sets). */
326
/* Generic dict destructor callback: releases 'val' with zfree().
 * 'privdata' is ignored. */
void dictVanillaFree(void *privdata, void *val) {
    DICT_NOTUSED(privdata);

    zfree(val);
}
332
333void dictListDestructor(void *privdata, void *val)
334{
335 DICT_NOTUSED(privdata);
336 listRelease((list*)val);
337}
338
339int dictSdsKeyCompare(void *privdata, const void *key1,
340 const void *key2)
341{
342 int l1,l2;
343 DICT_NOTUSED(privdata);
344
345 l1 = sdslen((sds)key1);
346 l2 = sdslen((sds)key2);
347 if (l1 != l2) return 0;
348 return memcmp(key1, key2, l1) == 0;
349}
350
/* Case insensitive key comparison callback, used by the command lookup
 * table. Returns 1 when strcasecmp() reports the keys as equal, 0
 * otherwise. 'privdata' is ignored. */
int dictSdsKeyCaseCompare(void *privdata, const void *key1, const void *key2) {
    int differ;
    DICT_NOTUSED(privdata);

    differ = strcasecmp(key1, key2);
    return differ == 0;
}
359
/* Dict destructor callback for entries holding Redis objects: drops one
 * reference with decrRefCount(). NULL entries are accepted and ignored
 * (values of swapped out keys are set to NULL). 'privdata' is ignored. */
void dictRedisObjectDestructor(void *privdata, void *val) {
    DICT_NOTUSED(privdata);

    if (val != NULL) decrRefCount(val);
}
367
/* Dict destructor callback for sds strings: releases 'val' with sdsfree().
 * 'privdata' is ignored. */
void dictSdsDestructor(void *privdata, void *val) {
    DICT_NOTUSED(privdata);
    sdsfree(val);
}
374
375int dictObjKeyCompare(void *privdata, const void *key1,
376 const void *key2)
377{
378 const robj *o1 = key1, *o2 = key2;
379 return dictSdsKeyCompare(privdata,o1->ptr,o2->ptr);
380}
381
382unsigned int dictObjHash(const void *key) {
383 const robj *o = key;
384 return dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
385}
386
/* Dict hash callback for sds keys: hashes all the bytes of the string with
 * dictGenHashFunction(). */
unsigned int dictSdsHash(const void *key)
{
    unsigned char *bytes = (unsigned char*)key;

    return dictGenHashFunction(bytes, sdslen((char*)key));
}
390
/* Dict hash callback for sds keys that uses dictGenCaseHashFunction()
 * (the hash paired with dictSdsKeyCaseCompare() in the command table
 * dictionary type). */
unsigned int dictSdsCaseHash(const void *key)
{
    unsigned char *bytes = (unsigned char*)key;

    return dictGenCaseHashFunction(bytes, sdslen((char*)key));
}
394
e2641e09 395int dictEncObjKeyCompare(void *privdata, const void *key1,
396 const void *key2)
397{
398 robj *o1 = (robj*) key1, *o2 = (robj*) key2;
399 int cmp;
400
401 if (o1->encoding == REDIS_ENCODING_INT &&
402 o2->encoding == REDIS_ENCODING_INT)
403 return o1->ptr == o2->ptr;
404
405 o1 = getDecodedObject(o1);
406 o2 = getDecodedObject(o2);
407 cmp = dictSdsKeyCompare(privdata,o1->ptr,o2->ptr);
408 decrRefCount(o1);
409 decrRefCount(o2);
410 return cmp;
411}
412
413unsigned int dictEncObjHash(const void *key) {
414 robj *o = (robj*) key;
415
416 if (o->encoding == REDIS_ENCODING_RAW) {
417 return dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
418 } else {
419 if (o->encoding == REDIS_ENCODING_INT) {
420 char buf[32];
421 int len;
422
423 len = ll2string(buf,32,(long)o->ptr);
424 return dictGenHashFunction((unsigned char*)buf, len);
425 } else {
426 unsigned int hash;
427
428 o = getDecodedObject(o);
429 hash = dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
430 decrRefCount(o);
431 return hash;
432 }
433 }
434}
435
4dd444bb 436/* Sets type hash table */
e2641e09 437dictType setDictType = {
438 dictEncObjHash, /* hash function */
439 NULL, /* key dup */
440 NULL, /* val dup */
441 dictEncObjKeyCompare, /* key compare */
442 dictRedisObjectDestructor, /* key destructor */
443 NULL /* val destructor */
444};
445
446/* Sorted sets hash (note: a skiplist is used in addition to the hash table) */
447dictType zsetDictType = {
448 dictEncObjHash, /* hash function */
449 NULL, /* key dup */
450 NULL, /* val dup */
451 dictEncObjKeyCompare, /* key compare */
452 dictRedisObjectDestructor, /* key destructor */
69ef89f2 453 NULL /* val destructor */
e2641e09 454};
455
456/* Db->dict, keys are sds strings, vals are Redis objects. */
457dictType dbDictType = {
458 dictSdsHash, /* hash function */
459 NULL, /* key dup */
460 NULL, /* val dup */
461 dictSdsKeyCompare, /* key compare */
462 dictSdsDestructor, /* key destructor */
463 dictRedisObjectDestructor /* val destructor */
464};
465
466/* Db->expires */
467dictType keyptrDictType = {
468 dictSdsHash, /* hash function */
469 NULL, /* key dup */
470 NULL, /* val dup */
471 dictSdsKeyCompare, /* key compare */
472 NULL, /* key destructor */
473 NULL /* val destructor */
474};
475
1b1f47c9 476/* Command table. sds string -> command struct pointer. */
477dictType commandTableDictType = {
478 dictSdsCaseHash, /* hash function */
479 NULL, /* key dup */
480 NULL, /* val dup */
481 dictSdsKeyCaseCompare, /* key compare */
482 dictSdsDestructor, /* key destructor */
483 NULL /* val destructor */
484};
485
e2641e09 486/* Hash type hash table (note that small hashes are represented with zimpaps) */
487dictType hashDictType = {
488 dictEncObjHash, /* hash function */
489 NULL, /* key dup */
490 NULL, /* val dup */
491 dictEncObjKeyCompare, /* key compare */
492 dictRedisObjectDestructor, /* key destructor */
493 dictRedisObjectDestructor /* val destructor */
494};
495
496/* Keylist hash table type has unencoded redis objects as keys and
497 * lists as values. It's used for blocking operations (BLPOP) and to
498 * map swapped keys to a list of clients waiting for this keys to be loaded. */
499dictType keylistDictType = {
500 dictObjHash, /* hash function */
501 NULL, /* key dup */
502 NULL, /* val dup */
503 dictObjKeyCompare, /* key compare */
504 dictRedisObjectDestructor, /* key destructor */
505 dictListDestructor /* val destructor */
506};
507
508int htNeedsResize(dict *dict) {
509 long long size, used;
510
511 size = dictSlots(dict);
512 used = dictSize(dict);
513 return (size && used && size > DICT_HT_INITIAL_SIZE &&
514 (used*100/size < REDIS_HT_MINFILL));
515}
516
517/* If the percentage of used slots in the HT reaches REDIS_HT_MINFILL
518 * we resize the hash table to save memory */
519void tryResizeHashTables(void) {
520 int j;
521
522 for (j = 0; j < server.dbnum; j++) {
523 if (htNeedsResize(server.db[j].dict))
524 dictResize(server.db[j].dict);
525 if (htNeedsResize(server.db[j].expires))
526 dictResize(server.db[j].expires);
527 }
528}
529
530/* Our hash table implementation performs rehashing incrementally while
531 * we write/read from the hash table. Still if the server is idle, the hash
532 * table will use two tables for a long time. So we try to use 1 millisecond
533 * of CPU time at every serverCron() loop in order to rehash some key. */
534void incrementallyRehash(void) {
535 int j;
536
537 for (j = 0; j < server.dbnum; j++) {
538 if (dictIsRehashing(server.db[j].dict)) {
539 dictRehashMilliseconds(server.db[j].dict,1);
540 break; /* already used our millisecond for this loop... */
541 }
542 }
543}
544
545/* This function is called once a background process of some kind terminates,
546 * as we want to avoid resizing the hash tables when there is a child in order
547 * to play well with copy-on-write (otherwise when a resize happens lots of
548 * memory pages are copied). The goal of this function is to update the ability
549 * for dict.c to resize the hash tables accordingly to the fact we have o not
550 * running childs. */
551void updateDictResizePolicy(void) {
f48cd4b9 552 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1)
e2641e09 553 dictEnableResize();
554 else
555 dictDisableResize();
556}
557
558/* ======================= Cron: called every 100 ms ======================== */
559
bcf2995c 560/* Try to expire a few timed out keys. The algorithm used is adaptive and
561 * will use few CPU cycles if there are few expiring keys, otherwise
562 * it will get more aggressive to avoid that too much memory is used by
563 * keys that can be removed from the keyspace. */
564void activeExpireCycle(void) {
565 int j;
566
567 for (j = 0; j < server.dbnum; j++) {
568 int expired;
569 redisDb *db = server.db+j;
570
571 /* Continue to expire if at the end of the cycle more than 25%
572 * of the keys were expired. */
573 do {
574 long num = dictSize(db->expires);
4be855e7 575 long long now = mstime();
bcf2995c 576
577 expired = 0;
578 if (num > REDIS_EXPIRELOOKUPS_PER_CRON)
579 num = REDIS_EXPIRELOOKUPS_PER_CRON;
580 while (num--) {
581 dictEntry *de;
4be855e7 582 long long t;
bcf2995c 583
584 if ((de = dictGetRandomKey(db->expires)) == NULL) break;
4be855e7 585 t = dictGetSignedIntegerVal(de);
bcf2995c 586 if (now > t) {
c0ba9ebe 587 sds key = dictGetKey(de);
bcf2995c 588 robj *keyobj = createStringObject(key,sdslen(key));
589
590 propagateExpire(db,keyobj);
591 dbDelete(db,keyobj);
592 decrRefCount(keyobj);
593 expired++;
594 server.stat_expiredkeys++;
595 }
596 }
597 } while (expired > REDIS_EXPIRELOOKUPS_PER_CRON/4);
598 }
599}
600
165346ca 601void updateLRUClock(void) {
602 server.lruclock = (time(NULL)/REDIS_LRU_CLOCK_RESOLUTION) &
603 REDIS_LRU_CLOCK_MAX;
604}
bcf2995c 605
250e7f69 606
607/* Add a sample to the operations per second array of samples. */
608void trackOperationsPerSecond(void) {
609 long long t = mstime() - server.ops_sec_last_sample_time;
610 long long ops = server.stat_numcommands - server.ops_sec_last_sample_ops;
611 long long ops_sec;
612
613 ops_sec = t > 0 ? (ops*1000/t) : 0;
614
615 server.ops_sec_samples[server.ops_sec_idx] = ops_sec;
616 server.ops_sec_idx = (server.ops_sec_idx+1) % REDIS_OPS_SEC_SAMPLES;
617 server.ops_sec_last_sample_time = mstime();
618 server.ops_sec_last_sample_ops = server.stat_numcommands;
619}
620
621/* Return the mean of all the samples. */
622long long getOperationsPerSecond(void) {
623 int j;
624 long long sum = 0;
625
626 for (j = 0; j < REDIS_OPS_SEC_SAMPLES; j++)
627 sum += server.ops_sec_samples[j];
628 return sum / REDIS_OPS_SEC_SAMPLES;
629}
630
f1eaf572 631/* Check for timeouts. Returns non-zero if the client was terminated */
632int clientsCronHandleTimeout(redisClient *c) {
9fa9ccb0 633 time_t now = server.unixtime;
cfa4b57c 634
635 if (server.maxidletime &&
636 !(c->flags & REDIS_SLAVE) && /* no timeout for slaves */
637 !(c->flags & REDIS_MASTER) && /* no timeout for masters */
638 !(c->flags & REDIS_BLOCKED) && /* no timeout for BLPOP */
639 dictSize(c->pubsub_channels) == 0 && /* no timeout for pubsub */
640 listLength(c->pubsub_patterns) == 0 &&
641 (now - c->lastinteraction > server.maxidletime))
642 {
643 redisLog(REDIS_VERBOSE,"Closing idle client");
644 freeClient(c);
f1eaf572 645 return 1;
cfa4b57c 646 } else if (c->flags & REDIS_BLOCKED) {
647 if (c->bpop.timeout != 0 && c->bpop.timeout < now) {
648 addReply(c,shared.nullmultibulk);
649 unblockClientWaitingData(c);
650 }
651 }
f1eaf572 652 return 0;
cfa4b57c 653}
654
9fa9ccb0 655/* The client query buffer is an sds.c string that can end with a lot of
f1eaf572 656 * free space not used, this function reclaims space if needed.
657 *
658 * The funciton always returns 0 as it never terminates the client. */
659int clientsCronResizeQueryBuffer(redisClient *c) {
9fa9ccb0 660 size_t querybuf_size = sdsAllocSize(c->querybuf);
661 time_t idletime = server.unixtime - c->lastinteraction;
662
663 /* There are two conditions to resize the query buffer:
664 * 1) Query buffer is > BIG_ARG and too big for latest peak.
665 * 2) Client is inactive and the buffer is bigger than 1k. */
666 if (((querybuf_size > REDIS_MBULK_BIG_ARG) &&
667 (querybuf_size/(c->querybuf_peak+1)) > 2) ||
668 (querybuf_size > 1024 && idletime > 2))
669 {
670 /* Only resize the query buffer if it is actually wasting space. */
671 if (sdsavail(c->querybuf) > 1024) {
672 c->querybuf = sdsRemoveFreeSpace(c->querybuf);
673 }
674 }
675 /* Reset the peak again to capture the peak memory usage in the next
676 * cycle. */
677 c->querybuf_peak = 0;
f1eaf572 678 return 0;
9fa9ccb0 679}
680
cfa4b57c 681void clientsCron(void) {
682 /* Make sure to process at least 1/100 of clients per call.
683 * Since this function is called 10 times per second we are sure that
684 * in the worst case we process all the clients in 10 seconds.
685 * In normal conditions (a reasonable number of clients) we process
686 * all the clients in a shorter time. */
9fa9ccb0 687 int numclients = listLength(server.clients);
688 int iterations = numclients/100;
cfa4b57c 689
9fa9ccb0 690 if (iterations < 50)
691 iterations = (numclients < 50) ? numclients : 50;
cfa4b57c 692 while(listLength(server.clients) && iterations--) {
693 redisClient *c;
694 listNode *head;
695
696 /* Rotate the list, take the current head, process.
697 * This way if the client must be removed from the list it's the
698 * first element and we don't incur into O(N) computation. */
699 listRotate(server.clients);
700 head = listFirst(server.clients);
701 c = listNodeValue(head);
f1eaf572 702 /* The following functions do different service checks on the client.
703 * The protocol is that they return non-zero if the client was
704 * terminated. */
705 if (clientsCronHandleTimeout(c)) continue;
706 if (clientsCronResizeQueryBuffer(c)) continue;
cfa4b57c 707 }
708}
709
e2641e09 710int serverCron(struct aeEventLoop *eventLoop, long long id, void *clientData) {
89a1433e 711 int j, loops = server.cronloops;
e2641e09 712 REDIS_NOTUSED(eventLoop);
713 REDIS_NOTUSED(id);
714 REDIS_NOTUSED(clientData);
715
716 /* We take a cached value of the unix time in the global state because
717 * with virtual memory and aging there is to store the current time
718 * in objects at every object access, and accuracy is not needed.
719 * To access a global var is faster than calling time(NULL) */
720 server.unixtime = time(NULL);
4f06867a 721
250e7f69 722 trackOperationsPerSecond();
723
ef59a8bc 724 /* We have just 22 bits per object for LRU information.
165346ca 725 * So we use an (eventually wrapping) LRU clock with 10 seconds resolution.
726 * 2^22 bits with 10 seconds resoluton is more or less 1.5 years.
e2641e09 727 *
165346ca 728 * Note that even if this will wrap after 1.5 years it's not a problem,
ef59a8bc 729 * everything will still work but just some object will appear younger
165346ca 730 * to Redis. But for this to happen a given object should never be touched
731 * for 1.5 years.
732 *
733 * Note that you can change the resolution altering the
734 * REDIS_LRU_CLOCK_RESOLUTION define.
e2641e09 735 */
165346ca 736 updateLRUClock();
e2641e09 737
17b24ff3 738 /* Record the max memory used since the server was started. */
739 if (zmalloc_used_memory() > server.stat_peak_memory)
740 server.stat_peak_memory = zmalloc_used_memory();
741
e2641e09 742 /* We received a SIGTERM, shutting down here in a safe way, as it is
743 * not ok doing so inside the signal handler. */
744 if (server.shutdown_asap) {
4ab8695d 745 if (prepareForShutdown(0) == REDIS_OK) exit(0);
e2641e09 746 redisLog(REDIS_WARNING,"SIGTERM received but errors trying to shut down the server, check the logs for more information");
747 }
748
749 /* Show some info about non-empty databases */
750 for (j = 0; j < server.dbnum; j++) {
751 long long size, used, vkeys;
752
753 size = dictSlots(server.db[j].dict);
754 used = dictSize(server.db[j].dict);
755 vkeys = dictSize(server.db[j].expires);
756 if (!(loops % 50) && (used || vkeys)) {
757 redisLog(REDIS_VERBOSE,"DB %d: %lld keys (%lld volatile) in %lld slots HT.",j,used,vkeys,size);
758 /* dictPrintStats(server.dict); */
759 }
760 }
761
762 /* We don't want to resize the hash tables while a bacground saving
763 * is in progress: the saving child is created using fork() that is
764 * implemented with a copy-on-write semantic in most modern systems, so
765 * if we resize the HT while there is the saving child at work actually
766 * a lot of memory movements in the parent will cause a lot of pages
767 * copied. */
f48cd4b9 768 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1) {
e2641e09 769 if (!(loops % 10)) tryResizeHashTables();
770 if (server.activerehashing) incrementallyRehash();
771 }
772
773 /* Show information about connected clients */
774 if (!(loops % 50)) {
775 redisLog(REDIS_VERBOSE,"%d clients connected (%d slaves), %zu bytes in use",
776 listLength(server.clients)-listLength(server.slaves),
777 listLength(server.slaves),
ca734d17 778 zmalloc_used_memory());
e2641e09 779 }
780
cfa4b57c 781 /* We need to do a few operations on clients asynchronously. */
782 clientsCron();
e2641e09 783
b333e239 784 /* Start a scheduled AOF rewrite if this was requested by the user while
785 * a BGSAVE was in progress. */
f48cd4b9 786 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1 &&
2c915bcf 787 server.aof_rewrite_scheduled)
b333e239 788 {
789 rewriteAppendOnlyFileBackground();
790 }
791
f03fe802 792 /* Check if a background saving or AOF rewrite in progress terminated. */
f48cd4b9 793 if (server.rdb_child_pid != -1 || server.aof_child_pid != -1) {
e2641e09 794 int statloc;
795 pid_t pid;
796
797 if ((pid = wait3(&statloc,WNOHANG,NULL)) != 0) {
36c17a53 798 int exitcode = WEXITSTATUS(statloc);
799 int bysignal = 0;
800
801 if (WIFSIGNALED(statloc)) bysignal = WTERMSIG(statloc);
802
f48cd4b9 803 if (pid == server.rdb_child_pid) {
36c17a53 804 backgroundSaveDoneHandler(exitcode,bysignal);
e2641e09 805 } else {
36c17a53 806 backgroundRewriteDoneHandler(exitcode,bysignal);
e2641e09 807 }
808 updateDictResizePolicy();
809 }
c9d0c362 810 } else {
e2641e09 811 time_t now = time(NULL);
b333e239 812
813 /* If there is not a background saving/rewrite in progress check if
814 * we have to save/rewrite now */
e2641e09 815 for (j = 0; j < server.saveparamslen; j++) {
816 struct saveparam *sp = server.saveparams+j;
817
818 if (server.dirty >= sp->changes &&
819 now-server.lastsave > sp->seconds) {
820 redisLog(REDIS_NOTICE,"%d changes in %d seconds. Saving...",
821 sp->changes, sp->seconds);
f48cd4b9 822 rdbSaveBackground(server.rdb_filename);
e2641e09 823 break;
824 }
825 }
b333e239 826
827 /* Trigger an AOF rewrite if needed */
f48cd4b9 828 if (server.rdb_child_pid == -1 &&
ff2145ad 829 server.aof_child_pid == -1 &&
2c915bcf 830 server.aof_rewrite_perc &&
831 server.aof_current_size > server.aof_rewrite_min_size)
b333e239 832 {
2c915bcf 833 long long base = server.aof_rewrite_base_size ?
834 server.aof_rewrite_base_size : 1;
835 long long growth = (server.aof_current_size*100/base) - 100;
836 if (growth >= server.aof_rewrite_perc) {
19b46c9a 837 redisLog(REDIS_NOTICE,"Starting automatic rewriting of AOF on %lld%% growth",growth);
b333e239 838 rewriteAppendOnlyFileBackground();
839 }
840 }
e2641e09 841 }
842
db3c2a4f 843
844 /* If we postponed an AOF buffer flush, let's try to do it every time the
845 * cron function is called. */
846 if (server.aof_flush_postponed_start) flushAppendOnlyFile(0);
847
bcf2995c 848 /* Expire a few keys per cycle, only if this is a master.
849 * On slaves we wait for DEL operations synthesized by the master
850 * in order to guarantee a strict consistency. */
851 if (server.masterhost == NULL) activeExpireCycle();
e2641e09 852
8c43e663 853 /* Close clients that need to be closed asynchronous */
854 freeClientsInAsyncFreeQueue();
855
f4aa600b 856 /* Replication cron function -- used to reconnect to master and
857 * to detect transfer failures. */
62ec599c 858 if (!(loops % 10)) replicationCron();
f4aa600b 859
89a1433e 860 server.cronloops++;
e2641e09 861 return 100;
862}
863
864/* This function gets called every time Redis is entering the
865 * main loop of the event driven library, that is, before to sleep
866 * for ready file descriptors. */
867void beforeSleep(struct aeEventLoop *eventLoop) {
868 REDIS_NOTUSED(eventLoop);
a4ce7581
PN
869 listNode *ln;
870 redisClient *c;
e2641e09 871
a4ce7581
PN
872 /* Try to process pending commands for clients that were just unblocked. */
873 while (listLength(server.unblocked_clients)) {
874 ln = listFirst(server.unblocked_clients);
875 redisAssert(ln != NULL);
876 c = ln->value;
877 listDelNode(server.unblocked_clients,ln);
3bcffcbe 878 c->flags &= ~REDIS_UNBLOCKED;
a4ce7581
PN
879
880 /* Process remaining data in the input buffer. */
00010fa9 881 if (c->querybuf && sdslen(c->querybuf) > 0) {
882 server.current_client = c;
a4ce7581 883 processInputBuffer(c);
00010fa9 884 server.current_client = NULL;
885 }
a4ce7581
PN
886 }
887
e2641e09 888 /* Write the AOF buffer on disk */
db3c2a4f 889 flushAppendOnlyFile(0);
e2641e09 890}
891
892/* =========================== Server initialization ======================== */
893
894void createSharedObjects(void) {
895 int j;
896
897 shared.crlf = createObject(REDIS_STRING,sdsnew("\r\n"));
898 shared.ok = createObject(REDIS_STRING,sdsnew("+OK\r\n"));
899 shared.err = createObject(REDIS_STRING,sdsnew("-ERR\r\n"));
900 shared.emptybulk = createObject(REDIS_STRING,sdsnew("$0\r\n\r\n"));
901 shared.czero = createObject(REDIS_STRING,sdsnew(":0\r\n"));
902 shared.cone = createObject(REDIS_STRING,sdsnew(":1\r\n"));
903 shared.cnegone = createObject(REDIS_STRING,sdsnew(":-1\r\n"));
904 shared.nullbulk = createObject(REDIS_STRING,sdsnew("$-1\r\n"));
905 shared.nullmultibulk = createObject(REDIS_STRING,sdsnew("*-1\r\n"));
906 shared.emptymultibulk = createObject(REDIS_STRING,sdsnew("*0\r\n"));
907 shared.pong = createObject(REDIS_STRING,sdsnew("+PONG\r\n"));
908 shared.queued = createObject(REDIS_STRING,sdsnew("+QUEUED\r\n"));
909 shared.wrongtypeerr = createObject(REDIS_STRING,sdsnew(
910 "-ERR Operation against a key holding the wrong kind of value\r\n"));
911 shared.nokeyerr = createObject(REDIS_STRING,sdsnew(
912 "-ERR no such key\r\n"));
913 shared.syntaxerr = createObject(REDIS_STRING,sdsnew(
914 "-ERR syntax error\r\n"));
915 shared.sameobjecterr = createObject(REDIS_STRING,sdsnew(
916 "-ERR source and destination objects are the same\r\n"));
917 shared.outofrangeerr = createObject(REDIS_STRING,sdsnew(
918 "-ERR index out of range\r\n"));
7229d60d 919 shared.noscripterr = createObject(REDIS_STRING,sdsnew(
920 "-NOSCRIPT No matching script. Please use EVAL.\r\n"));
97e7f8ae 921 shared.loadingerr = createObject(REDIS_STRING,sdsnew(
922 "-LOADING Redis is loading the dataset in memory\r\n"));
115e3ff3 923 shared.slowscripterr = createObject(REDIS_STRING,sdsnew(
4ab8695d 924 "-BUSY Redis is busy running a script. You can only call SCRIPT KILL or SHUTDOWN NOSAVE.\r\n"));
c25e7eaf 925 shared.bgsaveerr = createObject(REDIS_STRING,sdsnew(
05406168 926 "-MISCONF Redis is configured to save RDB snapshots, but is currently not able to persist on disk. Commands that may modify the data set are disabled. Please check Redis logs for details about the error.\r\n"));
927 shared.roslaveerr = createObject(REDIS_STRING,sdsnew(
928 "-READONLY You can't write against a read only slave.\r\n"));
3f7ad833 929 shared.oomerr = createObject(REDIS_STRING,sdsnew(
930 "-OOM command not allowed when used memory > 'maxmemory'.\r\n"));
e2641e09 931 shared.space = createObject(REDIS_STRING,sdsnew(" "));
932 shared.colon = createObject(REDIS_STRING,sdsnew(":"));
933 shared.plus = createObject(REDIS_STRING,sdsnew("+"));
934 shared.select0 = createStringObject("select 0\r\n",10);
935 shared.select1 = createStringObject("select 1\r\n",10);
936 shared.select2 = createStringObject("select 2\r\n",10);
937 shared.select3 = createStringObject("select 3\r\n",10);
938 shared.select4 = createStringObject("select 4\r\n",10);
939 shared.select5 = createStringObject("select 5\r\n",10);
940 shared.select6 = createStringObject("select 6\r\n",10);
941 shared.select7 = createStringObject("select 7\r\n",10);
942 shared.select8 = createStringObject("select 8\r\n",10);
943 shared.select9 = createStringObject("select 9\r\n",10);
944 shared.messagebulk = createStringObject("$7\r\nmessage\r\n",13);
945 shared.pmessagebulk = createStringObject("$8\r\npmessage\r\n",14);
946 shared.subscribebulk = createStringObject("$9\r\nsubscribe\r\n",15);
947 shared.unsubscribebulk = createStringObject("$11\r\nunsubscribe\r\n",18);
948 shared.psubscribebulk = createStringObject("$10\r\npsubscribe\r\n",17);
949 shared.punsubscribebulk = createStringObject("$12\r\npunsubscribe\r\n",19);
355f8591 950 shared.del = createStringObject("DEL",3);
c1db214e 951 shared.rpop = createStringObject("RPOP",4);
952 shared.lpop = createStringObject("LPOP",4);
e2641e09 953 for (j = 0; j < REDIS_SHARED_INTEGERS; j++) {
954 shared.integers[j] = createObject(REDIS_STRING,(void*)(long)j);
955 shared.integers[j]->encoding = REDIS_ENCODING_INT;
956 }
355f8591 957 for (j = 0; j < REDIS_SHARED_BULKHDR_LEN; j++) {
958 shared.mbulkhdr[j] = createObject(REDIS_STRING,
959 sdscatprintf(sdsempty(),"*%d\r\n",j));
960 shared.bulkhdr[j] = createObject(REDIS_STRING,
961 sdscatprintf(sdsempty(),"$%d\r\n",j));
962 }
e2641e09 963}
964
965void initServerConfig() {
91d664d6 966 getRandomHexChars(server.runid,REDIS_RUN_ID_SIZE);
967 server.runid[REDIS_RUN_ID_SIZE] = '\0';
75eaac5c 968 server.arch_bits = (sizeof(long) == 8) ? 64 : 32;
e2641e09 969 server.port = REDIS_SERVERPORT;
a5639e7d 970 server.bindaddr = NULL;
5d10923f 971 server.unixsocket = NULL;
85238765 972 server.unixsocketperm = 0;
a5639e7d
PN
973 server.ipfd = -1;
974 server.sofd = -1;
975 server.dbnum = REDIS_DEFAULT_DBNUM;
c6f9ee88 976 server.verbosity = REDIS_NOTICE;
e2641e09 977 server.maxidletime = REDIS_MAXIDLETIME;
becf5fdb 978 server.client_max_querybuf_len = REDIS_MAX_QUERYBUF_LEN;
e2641e09 979 server.saveparams = NULL;
97e7f8ae 980 server.loading = 0;
e2641e09 981 server.logfile = NULL; /* NULL = log on standard output */
e1a586ee
JH
982 server.syslog_enabled = 0;
983 server.syslog_ident = zstrdup("redis");
984 server.syslog_facility = LOG_LOCAL0;
e2641e09 985 server.daemonize = 0;
e394114d 986 server.aof_state = REDIS_AOF_OFF;
2c915bcf 987 server.aof_fsync = AOF_FSYNC_EVERYSEC;
988 server.aof_no_fsync_on_rewrite = 0;
989 server.aof_rewrite_perc = REDIS_AOF_REWRITE_PERC;
990 server.aof_rewrite_min_size = REDIS_AOF_REWRITE_MIN_SIZE;
991 server.aof_rewrite_base_size = 0;
992 server.aof_rewrite_scheduled = 0;
ff2145ad 993 server.aof_last_fsync = time(NULL);
994 server.aof_fd = -1;
995 server.aof_selected_db = -1; /* Make sure the first time will not match */
db3c2a4f 996 server.aof_flush_postponed_start = 0;
e2641e09 997 server.pidfile = zstrdup("/var/run/redis.pid");
f48cd4b9 998 server.rdb_filename = zstrdup("dump.rdb");
2c915bcf 999 server.aof_filename = zstrdup("appendonly.aof");
e2641e09 1000 server.requirepass = NULL;
f48cd4b9 1001 server.rdb_compression = 1;
e2641e09 1002 server.activerehashing = 1;
58732c23 1003 server.maxclients = REDIS_MAX_CLIENTS;
5fa95ad7 1004 server.bpop_blocked_clients = 0;
e2641e09 1005 server.maxmemory = 0;
165346ca 1006 server.maxmemory_policy = REDIS_MAXMEMORY_VOLATILE_LRU;
1007 server.maxmemory_samples = 3;
ebd85e9a
PN
1008 server.hash_max_ziplist_entries = REDIS_HASH_MAX_ZIPLIST_ENTRIES;
1009 server.hash_max_ziplist_value = REDIS_HASH_MAX_ZIPLIST_VALUE;
e2641e09 1010 server.list_max_ziplist_entries = REDIS_LIST_MAX_ZIPLIST_ENTRIES;
1011 server.list_max_ziplist_value = REDIS_LIST_MAX_ZIPLIST_VALUE;
96ffb2fe 1012 server.set_max_intset_entries = REDIS_SET_MAX_INTSET_ENTRIES;
3ea204e1
PN
1013 server.zset_max_ziplist_entries = REDIS_ZSET_MAX_ZIPLIST_ENTRIES;
1014 server.zset_max_ziplist_value = REDIS_ZSET_MAX_ZIPLIST_VALUE;
e2641e09 1015 server.shutdown_asap = 0;
aeecbdfa 1016 server.repl_ping_slave_period = REDIS_REPL_PING_SLAVE_PERIOD;
1017 server.repl_timeout = REDIS_REPL_TIMEOUT;
4ab8695d 1018 server.lua_caller = NULL;
eeffcf38 1019 server.lua_time_limit = REDIS_LUA_TIME_LIMIT;
070e3945 1020 server.lua_client = NULL;
115e3ff3 1021 server.lua_timedout = 0;
e2641e09 1022
95506e46 1023 updateLRUClock();
e2641e09 1024 resetServerSaveParams();
1025
1026 appendServerSaveParams(60*60,1); /* save after 1 hour and 1 change */
1027 appendServerSaveParams(300,100); /* save after 5 minutes and 100 changes */
1028 appendServerSaveParams(60,10000); /* save after 1 minute and 10000 changes */
1029 /* Replication related */
e2641e09 1030 server.masterauth = NULL;
1031 server.masterhost = NULL;
1032 server.masterport = 6379;
1033 server.master = NULL;
1844f990 1034 server.repl_state = REDIS_REPL_NONE;
890a2ed9 1035 server.repl_syncio_timeout = REDIS_REPL_SYNCIO_TIMEOUT;
4ebfc455 1036 server.repl_serve_stale_data = 1;
05406168 1037 server.repl_slave_ro = 1;
07486df6 1038 server.repl_down_since = -1;
e2641e09 1039
7eac2a75 1040 /* Client output buffer limits */
1041 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].hard_limit_bytes = 0;
1042 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].soft_limit_bytes = 0;
1043 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].soft_limit_seconds = 0;
c8a607f2 1044 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].hard_limit_bytes = 1024*1024*256;
1045 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].soft_limit_bytes = 1024*1024*64;
7eac2a75 1046 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].soft_limit_seconds = 60;
c8a607f2 1047 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].hard_limit_bytes = 1024*1024*32;
1048 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].soft_limit_bytes = 1024*1024*8;
7eac2a75 1049 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].soft_limit_seconds = 60;
1050
e2641e09 1051 /* Double constants initialization */
1052 R_Zero = 0.0;
1053 R_PosInf = 1.0/R_Zero;
1054 R_NegInf = -1.0/R_Zero;
1055 R_Nan = R_Zero/R_Zero;
8d3e063a 1056
1057 /* Command table -- we intiialize it here as it is part of the
1058 * initial configuration, since command names may be changed via
1059 * redis.conf using the rename-command directive. */
1060 server.commands = dictCreate(&commandTableDictType,NULL);
1061 populateCommandTable();
1062 server.delCommand = lookupCommandByCString("del");
1063 server.multiCommand = lookupCommandByCString("multi");
eeb34eff 1064 server.lpushCommand = lookupCommandByCString("lpush");
daa70b17 1065
1066 /* Slow log */
1067 server.slowlog_log_slower_than = REDIS_SLOWLOG_LOG_SLOWER_THAN;
1068 server.slowlog_max_len = REDIS_SLOWLOG_MAX_LEN;
fa5af017 1069
1070 /* Assert */
1071 server.assert_failed = "<no assertion failed>";
1072 server.assert_file = "<no file>";
1073 server.assert_line = 0;
1074 server.bug_report_start = 0;
e2641e09 1075}
1076
e074416b 1077/* This function will try to raise the max number of open files accordingly to
1078 * the configured max number of clients. It will also account for 32 additional
1079 * file descriptors as we need a few more for persistence, listening
1080 * sockets, log files and so forth.
1081 *
1082 * If it will not be possible to set the limit accordingly to the configured
1083 * max number of clients, the function will do the reverse setting
1084 * server.maxclients to the value that we can actually handle. */
1085void adjustOpenFilesLimit(void) {
1086 rlim_t maxfiles = server.maxclients+32;
1087 struct rlimit limit;
1088
1089 if (maxfiles < 1024) maxfiles = 1024;
1090 if (getrlimit(RLIMIT_NOFILE,&limit) == -1) {
1091 redisLog(REDIS_WARNING,"Unable to obtain the current NOFILE limit (%s), assuming 1024 and setting the max clients configuration accordingly.",
1092 strerror(errno));
1093 server.maxclients = 1024-32;
1094 } else {
1095 rlim_t oldlimit = limit.rlim_cur;
1096
1097 /* Set the max number of files if the current limit is not enough
1098 * for our needs. */
1099 if (oldlimit < maxfiles) {
1100 limit.rlim_cur = maxfiles;
1101 limit.rlim_max = maxfiles;
1102 if (setrlimit(RLIMIT_NOFILE,&limit) == -1) {
1103 server.maxclients = oldlimit-32;
1104 redisLog(REDIS_WARNING,"Unable to set the max number of files limit to %d (%s), setting the max clients configuration to %d.",
1105 (int) maxfiles, strerror(errno), (int) server.maxclients);
1106 } else {
1107 redisLog(REDIS_NOTICE,"Max number of open files set to %d",
1108 (int) maxfiles);
1109 }
1110 }
1111 }
1112}
1113
e2641e09 1114void initServer() {
1115 int j;
1116
1117 signal(SIGHUP, SIG_IGN);
1118 signal(SIGPIPE, SIG_IGN);
633a9410 1119 setupSignalHandlers();
e2641e09 1120
e1a586ee
JH
1121 if (server.syslog_enabled) {
1122 openlog(server.syslog_ident, LOG_PID | LOG_NDELAY | LOG_NOWAIT,
1123 server.syslog_facility);
1124 }
1125
00010fa9 1126 server.current_client = NULL;
e2641e09 1127 server.clients = listCreate();
7eac2a75 1128 server.clients_to_close = listCreate();
e2641e09 1129 server.slaves = listCreate();
1130 server.monitors = listCreate();
a4ce7581 1131 server.unblocked_clients = listCreate();
cea8c5cd 1132
e2641e09 1133 createSharedObjects();
e074416b 1134 adjustOpenFilesLimit();
1135 server.el = aeCreateEventLoop(server.maxclients+1024);
e2641e09 1136 server.db = zmalloc(sizeof(redisDb)*server.dbnum);
68d6345d 1137
a53b4c24 1138 if (server.port != 0) {
68d6345d 1139 server.ipfd = anetTcpServer(server.neterr,server.port,server.bindaddr);
a53b4c24 1140 if (server.ipfd == ANET_ERR) {
eef17490 1141 redisLog(REDIS_WARNING, "Opening port %d: %s",
1142 server.port, server.neterr);
a53b4c24 1143 exit(1);
1144 }
a5639e7d 1145 }
5d10923f
PN
1146 if (server.unixsocket != NULL) {
1147 unlink(server.unixsocket); /* don't care if this fails */
85238765 1148 server.sofd = anetUnixServer(server.neterr,server.unixsocket,server.unixsocketperm);
a5639e7d
PN
1149 if (server.sofd == ANET_ERR) {
1150 redisLog(REDIS_WARNING, "Opening socket: %s", server.neterr);
1151 exit(1);
1152 }
c61e6925 1153 }
a5639e7d
PN
1154 if (server.ipfd < 0 && server.sofd < 0) {
1155 redisLog(REDIS_WARNING, "Configured to not listen anywhere, exiting.");
e2641e09 1156 exit(1);
1157 }
1158 for (j = 0; j < server.dbnum; j++) {
1159 server.db[j].dict = dictCreate(&dbDictType,NULL);
1160 server.db[j].expires = dictCreate(&keyptrDictType,NULL);
1161 server.db[j].blocking_keys = dictCreate(&keylistDictType,NULL);
1162 server.db[j].watched_keys = dictCreate(&keylistDictType,NULL);
e2641e09 1163 server.db[j].id = j;
1164 }
1165 server.pubsub_channels = dictCreate(&keylistDictType,NULL);
1166 server.pubsub_patterns = listCreate();
1167 listSetFreeMethod(server.pubsub_patterns,freePubsubPattern);
1168 listSetMatchMethod(server.pubsub_patterns,listMatchPubsubPattern);
1169 server.cronloops = 0;
f48cd4b9 1170 server.rdb_child_pid = -1;
ff2145ad 1171 server.aof_child_pid = -1;
1172 server.aof_rewrite_buf = sdsempty();
1173 server.aof_buf = sdsempty();
e2641e09 1174 server.lastsave = time(NULL);
1175 server.dirty = 0;
1176 server.stat_numcommands = 0;
1177 server.stat_numconnections = 0;
1178 server.stat_expiredkeys = 0;
f21779ff 1179 server.stat_evictedkeys = 0;
e2641e09 1180 server.stat_starttime = time(NULL);
53eeeaff 1181 server.stat_keyspace_misses = 0;
1182 server.stat_keyspace_hits = 0;
17b24ff3 1183 server.stat_peak_memory = 0;
615e414c 1184 server.stat_fork_time = 0;
3c95e721 1185 server.stat_rejected_conn = 0;
250e7f69 1186 memset(server.ops_sec_samples,0,sizeof(server.ops_sec_samples));
1187 server.ops_sec_idx = 0;
1188 server.ops_sec_last_sample_time = mstime();
1189 server.ops_sec_last_sample_ops = 0;
e2641e09 1190 server.unixtime = time(NULL);
c25e7eaf 1191 server.lastbgsave_status = REDIS_OK;
4d3bbf35 1192 server.stop_writes_on_bgsave_err = 1;
e2641e09 1193 aeCreateTimeEvent(server.el, 1, serverCron, NULL, NULL);
a5639e7d 1194 if (server.ipfd > 0 && aeCreateFileEvent(server.el,server.ipfd,AE_READABLE,
ab17b909 1195 acceptTcpHandler,NULL) == AE_ERR) oom("creating file event");
a5639e7d 1196 if (server.sofd > 0 && aeCreateFileEvent(server.el,server.sofd,AE_READABLE,
ab17b909 1197 acceptUnixHandler,NULL) == AE_ERR) oom("creating file event");
e2641e09 1198
e394114d 1199 if (server.aof_state == REDIS_AOF_ON) {
ff2145ad 1200 server.aof_fd = open(server.aof_filename,
e394114d 1201 O_WRONLY|O_APPEND|O_CREAT,0644);
ff2145ad 1202 if (server.aof_fd == -1) {
e2641e09 1203 redisLog(REDIS_WARNING, "Can't open the append-only file: %s",
1204 strerror(errno));
1205 exit(1);
1206 }
1207 }
1208
d876678b 1209 /* 32 bit instances are limited to 4GB of address space, so if there is
1210 * no explicit limit in the user provided configuration we set a limit
1211 * at 3.5GB using maxmemory with 'noeviction' policy'. This saves
1212 * useless crashes of the Redis instance. */
1213 if (server.arch_bits == 32 && server.maxmemory == 0) {
1214 redisLog(REDIS_WARNING,"Warning: 32 bit instance detected but no memory limit set. Setting 3.5 GB maxmemory limit with 'noeviction' policy now.");
1215 server.maxmemory = 3584LL*(1024*1024); /* 3584 MB = 3.5 GB */
1216 server.maxmemory_policy = REDIS_MAXMEMORY_NO_EVICTION;
1217 }
1218
7585836e 1219 scriptingInit();
daa70b17 1220 slowlogInit();
8f61a72f 1221 bioInit();
e2641e09 1222}
1223
1b1f47c9 1224/* Populates the Redis Command Table starting from the hard coded list
1225 * we have on top of redis.c file. */
1226void populateCommandTable(void) {
1227 int j;
d7ed7fd2 1228 int numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1b1f47c9 1229
1230 for (j = 0; j < numcommands; j++) {
d7ed7fd2 1231 struct redisCommand *c = redisCommandTable+j;
5d02b00f 1232 char *f = c->sflags;
1b1f47c9 1233 int retval;
e2641e09 1234
5d02b00f 1235 while(*f != '\0') {
1236 switch(*f) {
1237 case 'w': c->flags |= REDIS_CMD_WRITE; break;
1238 case 'r': c->flags |= REDIS_CMD_READONLY; break;
1239 case 'm': c->flags |= REDIS_CMD_DENYOOM; break;
1240 case 'a': c->flags |= REDIS_CMD_ADMIN; break;
1241 case 'p': c->flags |= REDIS_CMD_PUBSUB; break;
1242 case 'f': c->flags |= REDIS_CMD_FORCE_REPLICATION; break;
b60ed6e8 1243 case 's': c->flags |= REDIS_CMD_NOSCRIPT; break;
1244 case 'R': c->flags |= REDIS_CMD_RANDOM; break;
548efd91 1245 case 'S': c->flags |= REDIS_CMD_SORT_FOR_SCRIPT; break;
5d02b00f 1246 default: redisPanic("Unsupported command flag"); break;
1247 }
1248 f++;
1249 }
1250
1b1f47c9 1251 retval = dictAdd(server.commands, sdsnew(c->name), c);
1252 assert(retval == DICT_OK);
1253 }
e2641e09 1254}
1255
d7ed7fd2 1256void resetCommandTableStats(void) {
1257 int numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1258 int j;
1259
1260 for (j = 0; j < numcommands; j++) {
1261 struct redisCommand *c = redisCommandTable+j;
1262
1263 c->microseconds = 0;
1264 c->calls = 0;
1265 }
1266}
1267
78d6a22d 1268/* ========================== Redis OP Array API ============================ */
1269
1270void redisOpArrayInit(redisOpArray *oa) {
1271 oa->ops = NULL;
1272 oa->numops = 0;
1273}
1274
1275int redisOpArrayAppend(redisOpArray *oa, struct redisCommand *cmd, int dbid,
1276 robj **argv, int argc, int target)
1277{
1278 redisOp *op;
1279
1280 oa->ops = zrealloc(oa->ops,sizeof(redisOp)*(oa->numops+1));
1281 op = oa->ops+oa->numops;
1282 op->cmd = cmd;
1283 op->dbid = dbid;
1284 op->argv = argv;
1285 op->argc = argc;
1286 op->target = target;
1287 oa->numops++;
1288 return oa->numops;
1289}
1290
1291void redisOpArrayFree(redisOpArray *oa) {
1292 while(oa->numops) {
1293 int j;
1294 redisOp *op;
1295
1296 oa->numops--;
1297 op = oa->ops+oa->numops;
1298 for (j = 0; j < op->argc; j++)
1299 decrRefCount(op->argv[j]);
1300 zfree(op->argv);
1301 }
1302 zfree(oa->ops);
1303}
1304
e2641e09 1305/* ====================== Commands lookup and execution ===================== */
1306
1b1f47c9 1307struct redisCommand *lookupCommand(sds name) {
1308 return dictFetchValue(server.commands, name);
1309}
1310
1311struct redisCommand *lookupCommandByCString(char *s) {
1312 struct redisCommand *cmd;
1313 sds name = sdsnew(s);
1314
1315 cmd = dictFetchValue(server.commands, name);
1316 sdsfree(name);
1317 return cmd;
e2641e09 1318}
1319
ad08d059 1320/* Propagate the specified command (in the context of the specified database id)
1321 * to AOF, Slaves and Monitors.
1322 *
1323 * flags are an xor between:
1324 * + REDIS_PROPAGATE_NONE (no propagation of command at all)
1325 * + REDIS_PROPAGATE_AOF (propagate into the AOF file if is enabled)
1326 * + REDIS_PROPAGATE_REPL (propagate into the replication link)
1327 */
1328void propagate(struct redisCommand *cmd, int dbid, robj **argv, int argc,
1329 int flags)
1330{
1331 if (server.aof_state != REDIS_AOF_OFF && flags & REDIS_PROPAGATE_AOF)
1332 feedAppendOnlyFile(cmd,dbid,argv,argc);
1333 if (flags & REDIS_PROPAGATE_REPL && listLength(server.slaves))
1334 replicationFeedSlaves(server.slaves,dbid,argv,argc);
1335}
1336
78d6a22d 1337/* Used inside commands to schedule the propagation of additional commands
1338 * after the current command is propagated to AOF / Replication. */
eeb34eff 1339void alsoPropagate(struct redisCommand *cmd, int dbid, robj **argv, int argc,
1340 int target)
1341{
78d6a22d 1342 redisOpArrayAppend(&server.also_propagate,cmd,dbid,argv,argc,target);
eeb34eff 1343}
1344
e2641e09 1345/* Call() is the core of Redis execution of a command */
ce8b772b 1346void call(redisClient *c, int flags) {
daa70b17 1347 long long dirty, start = ustime(), duration;
e2641e09 1348
ad08d059 1349 /* Sent the command to clients in MONITOR mode, only if the commands are
1350 * not geneated from reading an AOF. */
1351 if (listLength(server.monitors) && !server.loading)
e31b615e 1352 replicationFeedMonitors(c,server.monitors,c->db->id,c->argv,c->argc);
ad08d059 1353
1354 /* Call the command. */
78d6a22d 1355 redisOpArrayInit(&server.also_propagate);
e2641e09 1356 dirty = server.dirty;
09e2d9ee 1357 c->cmd->proc(c);
e2641e09 1358 dirty = server.dirty-dirty;
daa70b17 1359 duration = ustime()-start;
ce8b772b 1360
1361 /* When EVAL is called loading the AOF we don't want commands called
1362 * from Lua to go into the slowlog or to populate statistics. */
1363 if (server.loading && c->flags & REDIS_LUA_CLIENT)
1364 flags &= ~(REDIS_CALL_SLOWLOG | REDIS_CALL_STATS);
1365
ad08d059 1366 /* Log the command into the Slow log if needed, and populate the
1367 * per-command statistics that we show in INFO commandstats. */
ce8b772b 1368 if (flags & REDIS_CALL_SLOWLOG)
1369 slowlogPushEntryIfNeeded(c->argv,c->argc,duration);
1370 if (flags & REDIS_CALL_STATS) {
1371 c->cmd->microseconds += duration;
1372 c->cmd->calls++;
1373 }
ad08d059 1374
1375 /* Propagate the command into the AOF and replication link */
ce8b772b 1376 if (flags & REDIS_CALL_PROPAGATE) {
ad08d059 1377 int flags = REDIS_PROPAGATE_NONE;
1378
1379 if (c->cmd->flags & REDIS_CMD_FORCE_REPLICATION)
1380 flags |= REDIS_PROPAGATE_REPL;
1381 if (dirty)
1382 flags |= (REDIS_PROPAGATE_REPL | REDIS_PROPAGATE_AOF);
1383 if (flags != REDIS_PROPAGATE_NONE)
1384 propagate(c->cmd,c->db->id,c->argv,c->argc,flags);
ce8b772b 1385 }
eeb34eff 1386 /* Commands such as LPUSH or BRPOPLPUSH may propagate an additional
1387 * PUSH command. */
78d6a22d 1388 if (server.also_propagate.numops) {
eeb34eff 1389 int j;
78d6a22d 1390 redisOp *rop;
eeb34eff 1391
78d6a22d 1392 for (j = 0; j < server.also_propagate.numops; j++) {
1393 rop = &server.also_propagate.ops[j];
1394 propagate(rop->cmd, rop->dbid, rop->argv, rop->argc, rop->target);
1395 }
1396 redisOpArrayFree(&server.also_propagate);
eeb34eff 1397 }
e2641e09 1398 server.stat_numcommands++;
1399}
1400
1401/* If this function gets called we already read a whole
1402 * command, argments are in the client argv/argc fields.
1403 * processCommand() execute the command or prepare the
1404 * server for a bulk read from the client.
1405 *
1406 * If 1 is returned the client is still alive and valid and
1407 * and other operations can be performed by the caller. Otherwise
1408 * if 0 is returned the client was destroied (i.e. after QUIT). */
1409int processCommand(redisClient *c) {
941c9fa2
PN
1410 /* The QUIT command is handled separately. Normal command procs will
1411 * go through checking for replication and QUIT will cause trouble
1412 * when FORCE_REPLICATION is enabled and would be implemented in
1413 * a regular command proc. */
e2641e09 1414 if (!strcasecmp(c->argv[0]->ptr,"quit")) {
941c9fa2 1415 addReply(c,shared.ok);
5e78edb3 1416 c->flags |= REDIS_CLOSE_AFTER_REPLY;
cd8788f2 1417 return REDIS_ERR;
e2641e09 1418 }
1419
1420 /* Now lookup the command and check ASAP about trivial error conditions
09e2d9ee 1421 * such as wrong arity, bad command name and so forth. */
2c74a9f9 1422 c->cmd = c->lastcmd = lookupCommand(c->argv[0]->ptr);
09e2d9ee 1423 if (!c->cmd) {
3ab20376
PN
1424 addReplyErrorFormat(c,"unknown command '%s'",
1425 (char*)c->argv[0]->ptr);
cd8788f2 1426 return REDIS_OK;
09e2d9ee 1427 } else if ((c->cmd->arity > 0 && c->cmd->arity != c->argc) ||
1428 (c->argc < -c->cmd->arity)) {
3ab20376 1429 addReplyErrorFormat(c,"wrong number of arguments for '%s' command",
09e2d9ee 1430 c->cmd->name);
cd8788f2 1431 return REDIS_OK;
e2641e09 1432 }
e2641e09 1433
1434 /* Check if the user is authenticated */
09e2d9ee 1435 if (server.requirepass && !c->authenticated && c->cmd->proc != authCommand)
1436 {
3ab20376 1437 addReplyError(c,"operation not permitted");
cd8788f2 1438 return REDIS_OK;
e2641e09 1439 }
1440
1dd10ca2 1441 /* Handle the maxmemory directive.
1442 *
1443 * First we try to free some memory if possible (if there are volatile
1444 * keys in the dataset). If there are not the only thing we can do
1445 * is returning an error. */
f6b32c14 1446 if (server.maxmemory) {
1447 int retval = freeMemoryIfNeeded();
1448 if ((c->cmd->flags & REDIS_CMD_DENYOOM) && retval == REDIS_ERR) {
05406168 1449 addReply(c, shared.oomerr);
f6b32c14 1450 return REDIS_OK;
1451 }
e2641e09 1452 }
1453
c25e7eaf 1454 /* Don't accept write commands if there are problems persisting on disk. */
4d3bbf35 1455 if (server.stop_writes_on_bgsave_err &&
1456 server.saveparamslen > 0
1457 && server.lastbgsave_status == REDIS_ERR &&
c25e7eaf 1458 c->cmd->flags & REDIS_CMD_WRITE)
1459 {
1460 addReply(c, shared.bgsaveerr);
1461 return REDIS_OK;
05406168 1462 }
1463
1464 /* Don't accept wirte commands if this is a read only slave. But
1465 * accept write commands if this is our master. */
1466 if (server.masterhost && server.repl_slave_ro &&
1467 !(c->flags & REDIS_MASTER) &&
1468 c->cmd->flags & REDIS_CMD_WRITE)
1469 {
1470 addReply(c, shared.roslaveerr);
1471 return REDIS_OK;
c25e7eaf 1472 }
1473
e2641e09 1474 /* Only allow SUBSCRIBE and UNSUBSCRIBE in the context of Pub/Sub */
1475 if ((dictSize(c->pubsub_channels) > 0 || listLength(c->pubsub_patterns) > 0)
1476 &&
09e2d9ee 1477 c->cmd->proc != subscribeCommand &&
1478 c->cmd->proc != unsubscribeCommand &&
1479 c->cmd->proc != psubscribeCommand &&
1480 c->cmd->proc != punsubscribeCommand) {
3ab20376 1481 addReplyError(c,"only (P)SUBSCRIBE / (P)UNSUBSCRIBE / QUIT allowed in this context");
cd8788f2 1482 return REDIS_OK;
e2641e09 1483 }
1484
4ebfc455 1485 /* Only allow INFO and SLAVEOF when slave-serve-stale-data is no and
1486 * we are a slave with a broken link with master. */
1844f990 1487 if (server.masterhost && server.repl_state != REDIS_REPL_CONNECTED &&
4ebfc455 1488 server.repl_serve_stale_data == 0 &&
09e2d9ee 1489 c->cmd->proc != infoCommand && c->cmd->proc != slaveofCommand)
4ebfc455 1490 {
1491 addReplyError(c,
1492 "link with MASTER is down and slave-serve-stale-data is set to no");
1493 return REDIS_OK;
1494 }
1495
97e7f8ae 1496 /* Loading DB? Return an error if the command is not INFO */
09e2d9ee 1497 if (server.loading && c->cmd->proc != infoCommand) {
97e7f8ae 1498 addReply(c, shared.loadingerr);
1499 return REDIS_OK;
1500 }
1501
4ab8695d 1502 /* Lua script too slow? Only allow SHUTDOWN NOSAVE and SCRIPT KILL. */
1503 if (server.lua_timedout &&
1504 !(c->cmd->proc != shutdownCommand &&
1505 c->argc == 2 &&
1506 tolower(((char*)c->argv[1]->ptr)[0]) == 'n') &&
1507 !(c->cmd->proc == scriptCommand &&
1508 c->argc == 2 &&
1509 tolower(((char*)c->argv[1]->ptr)[0]) == 'k'))
1510 {
115e3ff3 1511 addReply(c, shared.slowscripterr);
1512 return REDIS_OK;
1513 }
1514
e2641e09 1515 /* Exec the command */
1516 if (c->flags & REDIS_MULTI &&
09e2d9ee 1517 c->cmd->proc != execCommand && c->cmd->proc != discardCommand &&
1518 c->cmd->proc != multiCommand && c->cmd->proc != watchCommand)
e2641e09 1519 {
09e2d9ee 1520 queueMultiCommand(c);
e2641e09 1521 addReply(c,shared.queued);
1522 } else {
ce8b772b 1523 call(c,REDIS_CALL_FULL);
e2641e09 1524 }
cd8788f2 1525 return REDIS_OK;
e2641e09 1526}
1527
1528/*================================== Shutdown =============================== */
1529
4ab8695d 1530int prepareForShutdown(int flags) {
1531 int save = flags & REDIS_SHUTDOWN_SAVE;
1532 int nosave = flags & REDIS_SHUTDOWN_NOSAVE;
1533
adae85cd 1534 redisLog(REDIS_WARNING,"User requested shutdown...");
e2641e09 1535 /* Kill the saving child if there is a background saving in progress.
1536 We want to avoid race conditions, for instance our saving child may
1537 overwrite the synchronous saving did by SHUTDOWN. */
f48cd4b9 1538 if (server.rdb_child_pid != -1) {
adae85cd 1539 redisLog(REDIS_WARNING,"There is a child saving an .rdb. Killing it!");
f48cd4b9 1540 kill(server.rdb_child_pid,SIGKILL);
1541 rdbRemoveTempFile(server.rdb_child_pid);
e2641e09 1542 }
e394114d 1543 if (server.aof_state != REDIS_AOF_OFF) {
adae85cd 1544 /* Kill the AOF saving child as the AOF we already have may be longer
1545 * but contains the full dataset anyway. */
ff2145ad 1546 if (server.aof_child_pid != -1) {
adae85cd 1547 redisLog(REDIS_WARNING,
1548 "There is a child rewriting the AOF. Killing it!");
ff2145ad 1549 kill(server.aof_child_pid,SIGKILL);
adae85cd 1550 }
e2641e09 1551 /* Append only file: fsync() the AOF and exit */
adae85cd 1552 redisLog(REDIS_NOTICE,"Calling fsync() on the AOF file.");
ff2145ad 1553 aof_fsync(server.aof_fd);
adae85cd 1554 }
4ab8695d 1555 if ((server.saveparamslen > 0 && !nosave) || save) {
adae85cd 1556 redisLog(REDIS_NOTICE,"Saving the final RDB snapshot before exiting.");
e2641e09 1557 /* Snapshotting. Perform a SYNC SAVE and exit */
f48cd4b9 1558 if (rdbSave(server.rdb_filename) != REDIS_OK) {
e2641e09 1559 /* Ooops.. error saving! The best we can do is to continue
1560 * operating. Note that if there was a background saving process,
1561 * in the next cron() Redis will be notified that the background
1562 * saving aborted, handling special stuff like slaves pending for
1563 * synchronization... */
adae85cd 1564 redisLog(REDIS_WARNING,"Error trying to save the DB, can't exit.");
e2641e09 1565 return REDIS_ERR;
1566 }
1567 }
adae85cd 1568 if (server.daemonize) {
1569 redisLog(REDIS_NOTICE,"Removing the pid file.");
1570 unlink(server.pidfile);
1571 }
80e87a46 1572 /* Close the listening sockets. Apparently this allows faster restarts. */
1573 if (server.ipfd != -1) close(server.ipfd);
1574 if (server.sofd != -1) close(server.sofd);
56209f72
NF
1575 if (server.unixsocket) {
1576 redisLog(REDIS_NOTICE,"Removing the unix socket file.");
1577 unlink(server.unixsocket); /* don't care if this fails */
1578 }
80e87a46 1579
adae85cd 1580 redisLog(REDIS_WARNING,"Redis is now ready to exit, bye bye...");
e2641e09 1581 return REDIS_OK;
1582}
1583
1584/*================================== Commands =============================== */
1585
1586void authCommand(redisClient *c) {
ab52d1f4 1587 if (!server.requirepass) {
1588 addReplyError(c,"Client sent AUTH, but no password is set");
1589 } else if (!strcmp(c->argv[1]->ptr, server.requirepass)) {
e2641e09 1590 c->authenticated = 1;
1591 addReply(c,shared.ok);
1592 } else {
1593 c->authenticated = 0;
3ab20376 1594 addReplyError(c,"invalid password");
e2641e09 1595 }
1596}
1597
1598void pingCommand(redisClient *c) {
1599 addReply(c,shared.pong);
1600}
1601
1602void echoCommand(redisClient *c) {
1603 addReplyBulk(c,c->argv[1]);
1604}
1605
9494f1f1 1606void timeCommand(redisClient *c) {
1607 struct timeval tv;
1608
1609 /* gettimeofday() can only fail if &tv is a bad addresss so we
1610 * don't check for errors. */
1611 gettimeofday(&tv,NULL);
1612 addReplyMultiBulkLen(c,2);
1613 addReplyBulkLongLong(c,tv.tv_sec);
1614 addReplyBulkLongLong(c,tv.tv_usec);
1615}
1616
/* Convert an amount of bytes into a human readable string in the form
 * of 100B, 4.00K, 100.00M, 2.00G, and so forth.
 *
 * 's' must point to a buffer large enough for the result (the longest
 * output is a 20 digit number followed by "B" and the terminator).
 * 'n' is the amount of bytes to format.
 *
 * Values below 1024 are printed as an integer followed by "B". Larger
 * values are scaled by powers of 1024 and printed with two decimals and
 * one of the suffixes K, M, G, T, P. Anything too large for the P range
 * is printed as a plain byte count, so 's' is always written. */
void bytesToHuman(char *s, unsigned long long n) {
    static const char units[] = "KMGTP";
    unsigned long long divisor = 1024;
    int i;

    if (n < 1024) {
        /* Bytes */
        sprintf(s,"%lluB",n);
        return;
    }

    /* divisor*1024 peaks at 2^60 (for 'P'), so it never overflows. */
    for (i = 0; units[i] != '\0'; i++) {
        if (n < divisor*1024) {
            sprintf(s,"%.2f%c",(double)n/(double)divisor,units[i]);
            return;
        }
        divisor *= 1024;
    }

    /* Bigger than every unit we know about: fall back to raw bytes
     * instead of leaving the output buffer uninitialized. */
    sprintf(s,"%lluB",n);
}
1637
1638/* Create the string returned by the INFO command. This is decoupled
1639 * by the INFO command itself as we need to report the same information
1640 * on memory corruption problems. */
1b085c9f 1641sds genRedisInfoString(char *section) {
1642 sds info = sdsempty();
e2641e09 1643 time_t uptime = time(NULL)-server.stat_starttime;
d9cb288c 1644 int j, numcommands;
2b00385d 1645 struct rusage self_ru, c_ru;
7a1fd61e 1646 unsigned long lol, bib;
1b085c9f 1647 int allsections = 0, defsections = 0;
1648 int sections = 0;
1649
1650 if (section) {
1651 allsections = strcasecmp(section,"all") == 0;
0d808ef2 1652 defsections = strcasecmp(section,"default") == 0;
1b085c9f 1653 }
2b00385d 1654
1655 getrusage(RUSAGE_SELF, &self_ru);
1656 getrusage(RUSAGE_CHILDREN, &c_ru);
7a1fd61e 1657 getClientsMaxBuffers(&lol,&bib);
1b085c9f 1658
1659 /* Server */
1660 if (allsections || defsections || !strcasecmp(section,"server")) {
1661 if (sections++) info = sdscat(info,"\r\n");
e2641e09 1662 info = sdscatprintf(info,
1b085c9f 1663 "# Server\r\n"
1664 "redis_version:%s\r\n"
1665 "redis_git_sha1:%s\r\n"
1666 "redis_git_dirty:%d\r\n"
75eaac5c 1667 "arch_bits:%d\r\n"
1b085c9f 1668 "multiplexing_api:%s\r\n"
5db904bd 1669 "gcc_version:%d.%d.%d\r\n"
1b085c9f 1670 "process_id:%ld\r\n"
91d664d6 1671 "run_id:%s\r\n"
1b085c9f 1672 "tcp_port:%d\r\n"
1673 "uptime_in_seconds:%ld\r\n"
1674 "uptime_in_days:%ld\r\n"
1675 "lru_clock:%ld\r\n",
1676 REDIS_VERSION,
1677 redisGitSHA1(),
1678 strtol(redisGitDirty(),NULL,10) > 0,
75eaac5c 1679 server.arch_bits,
1b085c9f 1680 aeGetApiName(),
5db904bd 1681#ifdef __GNUC__
1682 __GNUC__,__GNUC_MINOR__,__GNUC_PATCHLEVEL__,
1683#else
1684 0,0,0,
1685#endif
1b085c9f 1686 (long) getpid(),
91d664d6 1687 server.runid,
1b085c9f 1688 server.port,
1689 uptime,
1690 uptime/(3600*24),
1691 (unsigned long) server.lruclock);
1692 }
1693
1694 /* Clients */
1695 if (allsections || defsections || !strcasecmp(section,"clients")) {
1696 if (sections++) info = sdscat(info,"\r\n");
1697 info = sdscatprintf(info,
1698 "# Clients\r\n"
3c08fdae 1699 "connected_clients:%lu\r\n"
1b085c9f 1700 "client_longest_output_list:%lu\r\n"
1701 "client_biggest_input_buf:%lu\r\n"
1702 "blocked_clients:%d\r\n",
1703 listLength(server.clients)-listLength(server.slaves),
1704 lol, bib,
1705 server.bpop_blocked_clients);
1706 }
1707
1708 /* Memory */
1709 if (allsections || defsections || !strcasecmp(section,"memory")) {
17b24ff3 1710 char hmem[64];
1711 char peak_hmem[64];
1712
1713 bytesToHuman(hmem,zmalloc_used_memory());
1714 bytesToHuman(peak_hmem,server.stat_peak_memory);
1b085c9f 1715 if (sections++) info = sdscat(info,"\r\n");
1716 info = sdscatprintf(info,
1717 "# Memory\r\n"
1718 "used_memory:%zu\r\n"
1719 "used_memory_human:%s\r\n"
1720 "used_memory_rss:%zu\r\n"
17b24ff3 1721 "used_memory_peak:%zu\r\n"
1722 "used_memory_peak_human:%s\r\n"
8c3402df 1723 "used_memory_lua:%lld\r\n"
1b085c9f 1724 "mem_fragmentation_ratio:%.2f\r\n"
32f99c51 1725 "mem_allocator:%s\r\n",
1b085c9f 1726 zmalloc_used_memory(),
1727 hmem,
1728 zmalloc_get_rss(),
17b24ff3 1729 server.stat_peak_memory,
1730 peak_hmem,
8c3402df 1731 ((long long)lua_gc(server.lua,LUA_GCCOUNT,0))*1024LL,
1b085c9f 1732 zmalloc_get_fragmentation_ratio(),
fec5a664 1733 ZMALLOC_LIB
12ebe2ac 1734 );
0d808ef2 1735 }
1736
1b085c9f 1737 /* Persistence */
1738 if (allsections || defsections || !strcasecmp(section,"persistence")) {
1739 if (sections++) info = sdscat(info,"\r\n");
e2641e09 1740 info = sdscatprintf(info,
1b085c9f 1741 "# Persistence\r\n"
1742 "loading:%d\r\n"
1743 "aof_enabled:%d\r\n"
1744 "changes_since_last_save:%lld\r\n"
1745 "bgsave_in_progress:%d\r\n"
1746 "last_save_time:%ld\r\n"
c25e7eaf 1747 "last_bgsave_status:%s\r\n"
1b085c9f 1748 "bgrewriteaof_in_progress:%d\r\n",
1749 server.loading,
e394114d 1750 server.aof_state != REDIS_AOF_OFF,
1b085c9f 1751 server.dirty,
f48cd4b9 1752 server.rdb_child_pid != -1,
1b085c9f 1753 server.lastsave,
c25e7eaf 1754 server.lastbgsave_status == REDIS_OK ? "ok" : "err",
ff2145ad 1755 server.aof_child_pid != -1);
1b085c9f 1756
e394114d 1757 if (server.aof_state != REDIS_AOF_OFF) {
d630abcd 1758 info = sdscatprintf(info,
1759 "aof_current_size:%lld\r\n"
1760 "aof_base_size:%lld\r\n"
e7ef418c 1761 "aof_pending_rewrite:%d\r\n"
1762 "aof_buffer_length:%zu\r\n"
1763 "aof_pending_bio_fsync:%llu\r\n",
2c915bcf 1764 (long long) server.aof_current_size,
1765 (long long) server.aof_rewrite_base_size,
1766 server.aof_rewrite_scheduled,
ff2145ad 1767 sdslen(server.aof_buf),
e7ef418c 1768 bioPendingJobsOfType(REDIS_BIO_AOF_FSYNC));
d630abcd 1769 }
1770
1b085c9f 1771 if (server.loading) {
1772 double perc;
1773 time_t eta, elapsed;
1774 off_t remaining_bytes = server.loading_total_bytes-
1775 server.loading_loaded_bytes;
1776
1777 perc = ((double)server.loading_loaded_bytes /
1778 server.loading_total_bytes) * 100;
1779
1780 elapsed = time(NULL)-server.loading_start_time;
1781 if (elapsed == 0) {
1782 eta = 1; /* A fake 1 second figure if we don't have
1783 enough info */
1784 } else {
1785 eta = (elapsed*remaining_bytes)/server.loading_loaded_bytes;
1786 }
1787
1788 info = sdscatprintf(info,
1789 "loading_start_time:%ld\r\n"
1790 "loading_total_bytes:%llu\r\n"
1791 "loading_loaded_bytes:%llu\r\n"
1792 "loading_loaded_perc:%.2f\r\n"
1793 "loading_eta_seconds:%ld\r\n"
1794 ,(unsigned long) server.loading_start_time,
1795 (unsigned long long) server.loading_total_bytes,
1796 (unsigned long long) server.loading_loaded_bytes,
1797 perc,
1798 eta
1799 );
1800 }
e2641e09 1801 }
1b085c9f 1802
1b085c9f 1803 /* Stats */
1804 if (allsections || defsections || !strcasecmp(section,"stats")) {
1805 if (sections++) info = sdscat(info,"\r\n");
97e7f8ae 1806 info = sdscatprintf(info,
1b085c9f 1807 "# Stats\r\n"
1808 "total_connections_received:%lld\r\n"
1809 "total_commands_processed:%lld\r\n"
250e7f69 1810 "instantaneous_ops_per_sec:%lld\r\n"
3c95e721 1811 "rejected_connections:%lld\r\n"
1b085c9f 1812 "expired_keys:%lld\r\n"
1813 "evicted_keys:%lld\r\n"
1814 "keyspace_hits:%lld\r\n"
1815 "keyspace_misses:%lld\r\n"
1816 "pubsub_channels:%ld\r\n"
3c08fdae 1817 "pubsub_patterns:%lu\r\n"
615e414c 1818 "latest_fork_usec:%lld\r\n",
1b085c9f 1819 server.stat_numconnections,
1820 server.stat_numcommands,
250e7f69 1821 getOperationsPerSecond(),
3c95e721 1822 server.stat_rejected_conn,
1b085c9f 1823 server.stat_expiredkeys,
1824 server.stat_evictedkeys,
1825 server.stat_keyspace_hits,
1826 server.stat_keyspace_misses,
1827 dictSize(server.pubsub_channels),
615e414c 1828 listLength(server.pubsub_patterns),
1829 server.stat_fork_time);
97e7f8ae 1830 }
67a1810b 1831
1b085c9f 1832 /* Replication */
1833 if (allsections || defsections || !strcasecmp(section,"replication")) {
1834 if (sections++) info = sdscat(info,"\r\n");
1835 info = sdscatprintf(info,
1836 "# Replication\r\n"
1837 "role:%s\r\n",
1838 server.masterhost == NULL ? "master" : "slave");
1839 if (server.masterhost) {
1840 info = sdscatprintf(info,
1841 "master_host:%s\r\n"
1842 "master_port:%d\r\n"
1843 "master_link_status:%s\r\n"
1844 "master_last_io_seconds_ago:%d\r\n"
1845 "master_sync_in_progress:%d\r\n"
1846 ,server.masterhost,
1847 server.masterport,
1844f990 1848 (server.repl_state == REDIS_REPL_CONNECTED) ?
1b085c9f 1849 "up" : "down",
1850 server.master ?
1851 ((int)(time(NULL)-server.master->lastinteraction)) : -1,
1844f990 1852 server.repl_state == REDIS_REPL_TRANSFER
1b085c9f 1853 );
1854
1844f990 1855 if (server.repl_state == REDIS_REPL_TRANSFER) {
1b085c9f 1856 info = sdscatprintf(info,
1857 "master_sync_left_bytes:%ld\r\n"
1858 "master_sync_last_io_seconds_ago:%d\r\n"
1859 ,(long)server.repl_transfer_left,
1860 (int)(time(NULL)-server.repl_transfer_lastio)
1861 );
1862 }
07486df6 1863
1844f990 1864 if (server.repl_state != REDIS_REPL_CONNECTED) {
07486df6 1865 info = sdscatprintf(info,
1866 "master_link_down_since_seconds:%ld\r\n",
1867 (long)time(NULL)-server.repl_down_since);
1868 }
67a1810b 1869 }
1b085c9f 1870 info = sdscatprintf(info,
3c08fdae 1871 "connected_slaves:%lu\r\n",
1b085c9f 1872 listLength(server.slaves));
503d87a8 1873 if (listLength(server.slaves)) {
1874 int slaveid = 0;
1875 listNode *ln;
1876 listIter li;
1877
1878 listRewind(server.slaves,&li);
1879 while((ln = listNext(&li))) {
1880 redisClient *slave = listNodeValue(ln);
1881 char *state = NULL;
1882 char ip[32];
1883 int port;
1884
1885 if (anetPeerToString(slave->fd,ip,&port) == -1) continue;
1886 switch(slave->replstate) {
1887 case REDIS_REPL_WAIT_BGSAVE_START:
1888 case REDIS_REPL_WAIT_BGSAVE_END:
1889 state = "wait_bgsave";
1890 break;
1891 case REDIS_REPL_SEND_BULK:
1892 state = "send_bulk";
1893 break;
1894 case REDIS_REPL_ONLINE:
1895 state = "online";
1896 break;
1897 }
1898 if (state == NULL) continue;
1899 info = sdscatprintf(info,"slave%d:%s,%d,%s\r\n",
1900 slaveid,ip,port,state);
1901 slaveid++;
1902 }
1903 }
67a1810b 1904 }
67a1810b 1905
0d808ef2 1906 /* CPU */
1907 if (allsections || defsections || !strcasecmp(section,"cpu")) {
1b085c9f 1908 if (sections++) info = sdscat(info,"\r\n");
1909 info = sdscatprintf(info,
0d808ef2 1910 "# CPU\r\n"
1b085c9f 1911 "used_cpu_sys:%.2f\r\n"
1912 "used_cpu_user:%.2f\r\n"
5a9dd97c 1913 "used_cpu_sys_children:%.2f\r\n"
1914 "used_cpu_user_children:%.2f\r\n",
1b085c9f 1915 (float)self_ru.ru_stime.tv_sec+(float)self_ru.ru_stime.tv_usec/1000000,
d83eda48 1916 (float)self_ru.ru_utime.tv_sec+(float)self_ru.ru_utime.tv_usec/1000000,
1917 (float)c_ru.ru_stime.tv_sec+(float)c_ru.ru_stime.tv_usec/1000000,
1918 (float)c_ru.ru_utime.tv_sec+(float)c_ru.ru_utime.tv_usec/1000000);
0d808ef2 1919 }
1b085c9f 1920
0d808ef2 1921 /* cmdtime */
1922 if (allsections || !strcasecmp(section,"commandstats")) {
1923 if (sections++) info = sdscat(info,"\r\n");
1924 info = sdscatprintf(info, "# Commandstats\r\n");
d7ed7fd2 1925 numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1b085c9f 1926 for (j = 0; j < numcommands; j++) {
d7ed7fd2 1927 struct redisCommand *c = redisCommandTable+j;
0d808ef2 1928
d7ed7fd2 1929 if (!c->calls) continue;
1930 info = sdscatprintf(info,
1931 "cmdstat_%s:calls=%lld,usec=%lld,usec_per_call=%.2f\r\n",
1932 c->name, c->calls, c->microseconds,
1933 (c->calls == 0) ? 0 : ((float)c->microseconds/c->calls));
1b085c9f 1934 }
d9cb288c 1935 }
1936
1b085c9f 1937 /* Key space */
1938 if (allsections || defsections || !strcasecmp(section,"keyspace")) {
1939 if (sections++) info = sdscat(info,"\r\n");
1940 info = sdscatprintf(info, "# Keyspace\r\n");
1941 for (j = 0; j < server.dbnum; j++) {
1942 long long keys, vkeys;
e2641e09 1943
1b085c9f 1944 keys = dictSize(server.db[j].dict);
1945 vkeys = dictSize(server.db[j].expires);
1946 if (keys || vkeys) {
1947 info = sdscatprintf(info, "db%d:keys=%lld,expires=%lld\r\n",
1948 j, keys, vkeys);
1949 }
e2641e09 1950 }
1951 }
1952 return info;
1953}
1954
1955void infoCommand(redisClient *c) {
1b085c9f 1956 char *section = c->argc == 2 ? c->argv[1]->ptr : "default";
1957
1958 if (c->argc > 2) {
1959 addReply(c,shared.syntaxerr);
1960 return;
1961 }
1962 sds info = genRedisInfoString(section);
e2641e09 1963 addReplySds(c,sdscatprintf(sdsempty(),"$%lu\r\n",
1964 (unsigned long)sdslen(info)));
1965 addReplySds(c,info);
1966 addReply(c,shared.crlf);
1967}
1968
1969void monitorCommand(redisClient *c) {
1970 /* ignore MONITOR if aleady slave or in monitor mode */
1971 if (c->flags & REDIS_SLAVE) return;
1972
1973 c->flags |= (REDIS_SLAVE|REDIS_MONITOR);
1974 c->slaveseldb = 0;
1975 listAddNodeTail(server.monitors,c);
1976 addReply(c,shared.ok);
1977}
1978
1979/* ============================ Maxmemory directive ======================== */
1980
e2641e09 1981/* This function gets called when 'maxmemory' is set on the config file to limit
f6b32c14 1982 * the max memory used by the server, before processing a command.
e2641e09 1983 *
f6b32c14 1984 * The goal of the function is to free enough memory to keep Redis under the
1985 * configured memory limit.
e2641e09 1986 *
f6b32c14 1987 * The function starts calculating how many bytes should be freed to keep
1988 * Redis under the limit, and enters a loop selecting the best keys to
1989 * evict accordingly to the configured policy.
1990 *
1991 * If all the bytes needed to return back under the limit were freed the
1992 * function returns REDIS_OK, otherwise REDIS_ERR is returned, and the caller
1993 * should block the execution of commands that will result in more memory
1994 * used by the server.
e2641e09 1995 */
f6b32c14 1996int freeMemoryIfNeeded(void) {
1997 size_t mem_used, mem_tofree, mem_freed;
1998 int slaves = listLength(server.slaves);
1999
c1ef6ffe 2000 /* Remove the size of slaves output buffers and AOF buffer from the
2001 * count of used memory. */
f6b32c14 2002 mem_used = zmalloc_used_memory();
2003 if (slaves) {
2004 listIter li;
2005 listNode *ln;
2006
2007 listRewind(server.slaves,&li);
2008 while((ln = listNext(&li))) {
2009 redisClient *slave = listNodeValue(ln);
2010 unsigned long obuf_bytes = getClientOutputBufferMemoryUsage(slave);
2011 if (obuf_bytes > mem_used)
2012 mem_used = 0;
2013 else
2014 mem_used -= obuf_bytes;
2015 }
2016 }
c1ef6ffe 2017 if (server.aof_state != REDIS_AOF_OFF) {
2018 mem_used -= sdslen(server.aof_buf);
2019 mem_used -= sdslen(server.aof_rewrite_buf);
2020 }
5402c426 2021
f6b32c14 2022 /* Check if we are over the memory limit. */
2023 if (mem_used <= server.maxmemory) return REDIS_OK;
2024
2025 if (server.maxmemory_policy == REDIS_MAXMEMORY_NO_EVICTION)
2026 return REDIS_ERR; /* We need to free memory, but policy forbids. */
2027
2028 /* Compute how much memory we need to free. */
2029 mem_tofree = mem_used - server.maxmemory;
f6b32c14 2030 mem_freed = 0;
2031 while (mem_freed < mem_tofree) {
2032 int j, k, keys_freed = 0;
e2641e09 2033
165346ca 2034 for (j = 0; j < server.dbnum; j++) {
10c12171 2035 long bestval = 0; /* just to prevent warning */
165346ca 2036 sds bestkey = NULL;
2037 struct dictEntry *de;
2038 redisDb *db = server.db+j;
2039 dict *dict;
2040
2041 if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_LRU ||
2042 server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_RANDOM)
2043 {
2044 dict = server.db[j].dict;
2045 } else {
2046 dict = server.db[j].expires;
2047 }
2048 if (dictSize(dict) == 0) continue;
2049
2050 /* volatile-random and allkeys-random policy */
2051 if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_RANDOM ||
2052 server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_RANDOM)
2053 {
2054 de = dictGetRandomKey(dict);
c0ba9ebe 2055 bestkey = dictGetKey(de);
165346ca 2056 }
2057
2058 /* volatile-lru and allkeys-lru policy */
2059 else if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_LRU ||
2060 server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_LRU)
2061 {
2062 for (k = 0; k < server.maxmemory_samples; k++) {
2063 sds thiskey;
2064 long thisval;
2065 robj *o;
2066
2067 de = dictGetRandomKey(dict);
c0ba9ebe 2068 thiskey = dictGetKey(de);
0c2f75c6 2069 /* When policy is volatile-lru we need an additonal lookup
2070 * to locate the real key, as dict is set to db->expires. */
2071 if (server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_LRU)
2072 de = dictFind(db->dict, thiskey);
c0ba9ebe 2073 o = dictGetVal(de);
165346ca 2074 thisval = estimateObjectIdleTime(o);
2075
2076 /* Higher idle time is better candidate for deletion */
2077 if (bestkey == NULL || thisval > bestval) {
2078 bestkey = thiskey;
2079 bestval = thisval;
2080 }
2081 }
2082 }
2083
2084 /* volatile-ttl */
2085 else if (server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_TTL) {
2086 for (k = 0; k < server.maxmemory_samples; k++) {
2087 sds thiskey;
2088 long thisval;
2089
2090 de = dictGetRandomKey(dict);
c0ba9ebe 2091 thiskey = dictGetKey(de);
2092 thisval = (long) dictGetVal(de);
165346ca 2093
2094 /* Expire sooner (minor expire unix timestamp) is better
2095 * candidate for deletion */
2096 if (bestkey == NULL || thisval < bestval) {
2097 bestkey = thiskey;
2098 bestval = thisval;
2099 }
2100 }
2101 }
2102
2103 /* Finally remove the selected key. */
2104 if (bestkey) {
f6b32c14 2105 long long delta;
2106
165346ca 2107 robj *keyobj = createStringObject(bestkey,sdslen(bestkey));
452229b6 2108 propagateExpire(db,keyobj);
f6b32c14 2109 /* We compute the amount of memory freed by dbDelete() alone.
2110 * It is possible that actually the memory needed to propagate
2111 * the DEL in AOF and replication link is greater than the one
2112 * we are freeing removing the key, but we can't account for
2113 * that otherwise we would never exit the loop.
2114 *
2115 * AOF and Output buffer memory will be freed eventually so
2116 * we only care about memory used by the key space. */
2117 delta = (long long) zmalloc_used_memory();
165346ca 2118 dbDelete(db,keyobj);
f6b32c14 2119 delta -= (long long) zmalloc_used_memory();
f6b32c14 2120 mem_freed += delta;
f21779ff 2121 server.stat_evictedkeys++;
165346ca 2122 decrRefCount(keyobj);
f6b32c14 2123 keys_freed++;
2124
2125 /* When the memory to free starts to be big enough, we may
2126 * start spending so much time here that is impossible to
2127 * deliver data to the slaves fast enough, so we force the
2128 * transmission here inside the loop. */
8b7c3455 2129 if (slaves) flushSlavesOutputBuffers();
165346ca 2130 }
2131 }
b129c6df 2132 if (!keys_freed) return REDIS_ERR; /* nothing to free... */
165346ca 2133 }
f6b32c14 2134 return REDIS_OK;
e2641e09 2135}
2136
2137/* =================================== Main! ================================ */
2138
2139#ifdef __linux__
/* Read /proc/sys/vm/overcommit_memory and return its content converted
 * with atoi(). Returns -1 when the file can't be opened or read. */
int linuxOvercommitMemoryValue(void) {
    char line[64];
    char *got;
    FILE *procfile = fopen("/proc/sys/vm/overcommit_memory","r");

    if (procfile == NULL) return -1;

    /* Read first, close unconditionally, then look at the outcome. */
    got = fgets(line,sizeof(line),procfile);
    fclose(procfile);
    if (got == NULL) return -1;

    return atoi(line);
}
2153
2154void linuxOvercommitMemoryWarning(void) {
2155 if (linuxOvercommitMemoryValue() == 0) {
2156 redisLog(REDIS_WARNING,"WARNING overcommit_memory is set to 0! Background save may fail under low memory condition. To fix this issue add 'vm.overcommit_memory = 1' to /etc/sysctl.conf and then reboot or run the command 'sysctl vm.overcommit_memory=1' for this to take effect.");
2157 }
2158}
2159#endif /* __linux__ */
2160
695fe874 2161void createPidFile(void) {
2162 /* Try to write the pid file in a best-effort way. */
2163 FILE *fp = fopen(server.pidfile,"w");
2164 if (fp) {
8ce39260 2165 fprintf(fp,"%d\n",(int)getpid());
695fe874 2166 fclose(fp);
2167 }
2168}
2169
/* Detach the process from the terminal: fork (the parent exits with
 * status 0 and the child continues), create a new session, and redirect
 * standard input, output and error to /dev/null.
 *
 * If fork() fails an error is printed on stderr and the process exits
 * with status 1, so that a failed daemonization is not mistaken for a
 * successful start. */
void daemonize(void) {
    int fd;
    pid_t pid = fork();

    if (pid < 0) {
        /* fork() failed: there is no child that will run the server. */
        fprintf(stderr,"Can't daemonize, fork() failed: %s\n",
            strerror(errno));
        exit(1);
    }
    if (pid != 0) exit(0); /* parent exits */
    setsid(); /* create a new session */

    /* Every output goes to /dev/null. If Redis is daemonized but
     * the 'logfile' is set to 'stdout' in the configuration file
     * it will not log at all. */
    if ((fd = open("/dev/null", O_RDWR, 0)) != -1) {
        dup2(fd, STDIN_FILENO);
        dup2(fd, STDOUT_FILENO);
        dup2(fd, STDERR_FILENO);
        /* Don't close fd if it is one of the standard descriptors we
         * have just set up. */
        if (fd > STDERR_FILENO) close(fd);
    }
}
2186
2187void version() {
2188 printf("Redis server version %s (%s:%d)\n", REDIS_VERSION,
2189 redisGitSHA1(), atoi(redisGitDirty()) > 0);
2190 exit(0);
2191}
2192
/* Print the command line help on standard error, then terminate the
 * process with status 1. */
void usage() {
    static const char *lines[] = {
        "Usage: ./redis-server [/path/to/redis.conf] [options]\n",
        " ./redis-server - (read config from stdin)\n",
        " ./redis-server -v or --version\n",
        " ./redis-server -h or --help\n",
        " ./redis-server --test-memory <megabytes>\n\n",
        "Examples:\n",
        " ./redis-server (run the server with default conf)\n",
        " ./redis-server /etc/redis/6379.conf\n",
        " ./redis-server --port 7777\n",
        " ./redis-server --port 7777 --slaveof 127.0.0.1 8888\n",
        " ./redis-server /etc/myredis.conf --loglevel verbose\n",
        NULL
    };
    const char **line;

    /* None of the lines contains a conversion, so fputs() emits exactly
     * what a printf-style call would. */
    for (line = lines; *line != NULL; line++)
        fputs(*line,stderr);
    exit(1);
}
2207
996d503d 2208void redisAsciiArt(void) {
2209#include "asciilogo.h"
2210 char *buf = zmalloc(1024*16);
2211
2212 snprintf(buf,1024*16,ascii_logo,
2213 REDIS_VERSION,
2214 redisGitSHA1(),
2215 strtol(redisGitDirty(),NULL,10) > 0,
2216 (sizeof(long) == 8) ? "64" : "32",
571e257d 2217 "stand alone",
996d503d 2218 server.port,
2219 (long) getpid()
2220 );
2221 redisLogRaw(REDIS_NOTICE|REDIS_LOG_RAW,buf);
2222 zfree(buf);
2223}
2224
633a9410 2225static void sigtermHandler(int sig) {
e2641e09 2226 REDIS_NOTUSED(sig);
2227
633a9410 2228 redisLog(REDIS_WARNING,"Received SIGTERM, scheduling shutdown...");
e2641e09 2229 server.shutdown_asap = 1;
2230}
2231
633a9410 2232void setupSignalHandlers(void) {
e2641e09 2233 struct sigaction act;
2234
633a9410
PN
2235 /* When the SA_SIGINFO flag is set in sa_flags then sa_sigaction is used.
2236 * Otherwise, sa_handler is used. */
2237 sigemptyset(&act.sa_mask);
e2641e09 2238 act.sa_flags = SA_NODEFER | SA_ONSTACK | SA_RESETHAND;
2239 act.sa_handler = sigtermHandler;
633a9410 2240 sigaction(SIGTERM, &act, NULL);
e2641e09 2241
633a9410
PN
2242#ifdef HAVE_BACKTRACE
2243 sigemptyset(&act.sa_mask);
2244 act.sa_flags = SA_NODEFER | SA_ONSTACK | SA_RESETHAND | SA_SIGINFO;
2245 act.sa_sigaction = sigsegvHandler;
2246 sigaction(SIGSEGV, &act, NULL);
2247 sigaction(SIGBUS, &act, NULL);
2248 sigaction(SIGFPE, &act, NULL);
2249 sigaction(SIGILL, &act, NULL);
2250#endif
2251 return;
e2641e09 2252}
e2641e09 2253
78d6a02b 2254void memtest(size_t megabytes, int passes);
2255
39ca1713 2256int main(int argc, char **argv) {
2257 long long start;
a48c8d87 2258 struct timeval tv;
39ca1713 2259
06c5523a 2260 /* We need to initialize our libraries, and the server configuration. */
39ca1713 2261 zmalloc_enable_thread_safeness();
a48c8d87 2262 srand(time(NULL)^getpid());
2263 gettimeofday(&tv,NULL);
2264 dictSetHashFunctionSeed(tv.tv_sec^tv.tv_usec^getpid());
39ca1713 2265 initServerConfig();
a48c8d87 2266
67c6f0f6 2267 if (argc >= 2) {
2268 int j = 1; /* First option to parse in argv[] */
2269 sds options = sdsempty();
2270 char *configfile = NULL;
2271
2272 /* Handle special options --help and --version */
39ca1713 2273 if (strcmp(argv[1], "-v") == 0 ||
2274 strcmp(argv[1], "--version") == 0) version();
4c8bd905 2275 if (strcmp(argv[1], "--help") == 0 ||
2276 strcmp(argv[1], "-h") == 0) usage();
78d6a02b 2277 if (strcmp(argv[1], "--test-memory") == 0) {
2278 if (argc == 3) {
ea693f02 2279 memtest(atoi(argv[2]),50);
78d6a02b 2280 exit(0);
2281 } else {
2282 fprintf(stderr,"Please specify the amount of memory to test in megabytes.\n");
2283 fprintf(stderr,"Example: ./redis-server --test-memory 4096\n\n");
2284 exit(1);
2285 }
2286 }
2287
67c6f0f6 2288 /* First argument is the config file name? */
2289 if (argv[j][0] != '-' || argv[j][1] != '-')
2290 configfile = argv[j++];
2291 /* All the other options are parsed and conceptually appended to the
2292 * configuration file. For instance --port 6380 will generate the
2293 * string "port 6380\n" to be parsed after the actual file name
2294 * is parsed, if any. */
2295 while(j != argc) {
2296 if (argv[j][0] == '-' && argv[j][1] == '-') {
2297 /* Option name */
2298 if (sdslen(options)) options = sdscat(options,"\n");
2299 options = sdscat(options,argv[j]+2);
2300 options = sdscat(options," ");
2301 } else {
2302 /* Option argument */
2303 options = sdscatrepr(options,argv[j],strlen(argv[j]));
2304 options = sdscat(options," ");
2305 }
2306 j++;
2307 }
39ca1713 2308 resetServerSaveParams();
67c6f0f6 2309 loadServerConfig(configfile,options);
2310 sdsfree(options);
39ca1713 2311 } else {
2312 redisLog(REDIS_WARNING,"Warning: no config file specified, using the default config. In order to specify a config file use 'redis-server /path/to/redis.conf'");
2313 }
2314 if (server.daemonize) daemonize();
2315 initServer();
2316 if (server.daemonize) createPidFile();
2317 redisAsciiArt();
27ccb94a 2318 redisLog(REDIS_WARNING,"Server started, Redis version " REDIS_VERSION);
39ca1713 2319#ifdef __linux__
2320 linuxOvercommitMemoryWarning();
2321#endif
2322 start = ustime();
e394114d 2323 if (server.aof_state == REDIS_AOF_ON) {
2c915bcf 2324 if (loadAppendOnlyFile(server.aof_filename) == REDIS_OK)
39ca1713 2325 redisLog(REDIS_NOTICE,"DB loaded from append only file: %.3f seconds",(float)(ustime()-start)/1000000);
2326 } else {
f48cd4b9 2327 if (rdbLoad(server.rdb_filename) == REDIS_OK) {
39ca1713 2328 redisLog(REDIS_NOTICE,"DB loaded from disk: %.3f seconds",
2329 (float)(ustime()-start)/1000000);
2330 } else if (errno != ENOENT) {
2331 redisLog(REDIS_WARNING,"Fatal error loading the DB. Exiting.");
2332 exit(1);
2333 }
2334 }
2335 if (server.ipfd > 0)
2336 redisLog(REDIS_NOTICE,"The server is now ready to accept connections on port %d", server.port);
2337 if (server.sofd > 0)
2338 redisLog(REDIS_NOTICE,"The server is now ready to accept connections at %s", server.unixsocket);
2339 aeSetBeforeSleepProc(server.el,beforeSleep);
2340 aeMain(server.el);
2341 aeDeleteEventLoop(server.el);
2342 return 0;
2343}
2344
e2641e09 2345/* The End */