]> git.saurik.com Git - redis.git/blame - src/redis.c
Redis software watchdog.
[redis.git] / src / redis.c
CommitLineData
e2641e09 1/*
2 * Copyright (c) 2009-2010, Salvatore Sanfilippo <antirez at gmail dot com>
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are met:
7 *
8 * * Redistributions of source code must retain the above copyright notice,
9 * this list of conditions and the following disclaimer.
10 * * Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
13 * * Neither the name of Redis nor the names of its contributors may be used
14 * to endorse or promote products derived from this software without
15 * specific prior written permission.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
18 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
21 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
22 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
23 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
24 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
25 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
26 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
27 * POSSIBILITY OF SUCH DAMAGE.
28 */
29
30#include "redis.h"
daa70b17 31#include "slowlog.h"
8f61a72f 32#include "bio.h"
e2641e09 33
e2641e09 34#include <time.h>
35#include <signal.h>
36#include <sys/wait.h>
37#include <errno.h>
38#include <assert.h>
39#include <ctype.h>
40#include <stdarg.h>
e2641e09 41#include <arpa/inet.h>
42#include <sys/stat.h>
43#include <fcntl.h>
44#include <sys/time.h>
45#include <sys/resource.h>
46#include <sys/uio.h>
47#include <limits.h>
48#include <float.h>
49#include <math.h>
2b00385d 50#include <sys/resource.h>
e2641e09 51
52/* Our shared "common" objects */
53
54struct sharedObjectsStruct shared;
55
c74b7c77 56/* Global vars that are actually used as constants. The following double
e2641e09 57 * values are used for double on-disk serialization, and are initialized
58 * at runtime to avoid strange compiler optimizations. */
59
60double R_Zero, R_PosInf, R_NegInf, R_Nan;
61
62/*================================= Globals ================================= */
63
64/* Global vars */
65struct redisServer server; /* server global state */
66struct redisCommand *commandTable;
5d02b00f 67
7501c66f 68/* Our command table.
69 *
70 * Every entry is composed of the following fields:
71 *
72 * name: a string representing the command name.
73 * function: pointer to the C function implementing the command.
74 * arity: number of arguments, it is possible to use -N to say >= N
75 * sflags: command flags as string. See below for a table of flags.
76 * flags: flags as bitmask. Computed by Redis using the 'sflags' field.
77 * get_keys_proc: an optional function to get key arguments from a command.
78 * This is only used when the following three fields are not
79 * enough to specify what arguments are keys.
80 * first_key_index: first argument that is a key
81 * last_key_index: last argument that is a key
82 * key_step: step to get all the keys from first to last argument. For instance
83 * in MSET the step is two since arguments are key,val,key,val,...
84 * microseconds: microseconds of total execution time for this command.
85 * calls: total number of calls of this command.
86 *
87 * The flags, microseconds and calls fields are computed by Redis and should
88 * always be set to zero.
89 *
90 * Command flags are expressed using strings where every character represents
91 * a flag. Later the populateCommandTable() function will take care of
92 * populating the real 'flags' field using these characters.
5d02b00f 93 *
94 * This is the meaning of the flags:
95 *
96 * w: write command (may modify the key space).
97 * r: read command (will never modify the key space).
98 * m: may increase memory usage once called. Don't allow if out of memory.
99 * a: admin command, like SAVE or SHUTDOWN.
100 * p: Pub/Sub related command.
b60ed6e8 101 * f: force replication of this command, regardless of server.dirty.
102 * s: command not allowed in scripts.
7e14a208 103 * R: random command. Command is not deterministic, that is, the same command
b60ed6e8 104 * with the same arguments, with the same key space, may have different
548efd91 105 * results. For instance SPOP and RANDOMKEY are two random commands.
106 * S: Sort command output array if called from script, so that the output
107 * is deterministic.
108 */
d7ed7fd2 109struct redisCommand redisCommandTable[] = {
5d02b00f 110 {"get",getCommand,2,"r",0,NULL,1,1,1,0,0},
111 {"set",setCommand,3,"wm",0,noPreloadGetKeys,1,1,1,0,0},
112 {"setnx",setnxCommand,3,"wm",0,noPreloadGetKeys,1,1,1,0,0},
39da5d1f 113 {"setex",setexCommand,4,"wm",0,noPreloadGetKeys,1,1,1,0,0},
114 {"psetex",psetexCommand,4,"wm",0,noPreloadGetKeys,1,1,1,0,0},
5d02b00f 115 {"append",appendCommand,3,"wm",0,NULL,1,1,1,0,0},
116 {"strlen",strlenCommand,2,"r",0,NULL,1,1,1,0,0},
117 {"del",delCommand,-2,"w",0,noPreloadGetKeys,1,-1,1,0,0},
118 {"exists",existsCommand,2,"r",0,NULL,1,1,1,0,0},
119 {"setbit",setbitCommand,4,"wm",0,NULL,1,1,1,0,0},
120 {"getbit",getbitCommand,3,"r",0,NULL,1,1,1,0,0},
121 {"setrange",setrangeCommand,4,"wm",0,NULL,1,1,1,0,0},
122 {"getrange",getrangeCommand,4,"r",0,NULL,1,1,1,0,0},
123 {"substr",getrangeCommand,4,"r",0,NULL,1,1,1,0,0},
124 {"incr",incrCommand,2,"wm",0,NULL,1,1,1,0,0},
125 {"decr",decrCommand,2,"wm",0,NULL,1,1,1,0,0},
126 {"mget",mgetCommand,-2,"r",0,NULL,1,-1,1,0,0},
127 {"rpush",rpushCommand,-3,"wm",0,NULL,1,1,1,0,0},
128 {"lpush",lpushCommand,-3,"wm",0,NULL,1,1,1,0,0},
129 {"rpushx",rpushxCommand,3,"wm",0,NULL,1,1,1,0,0},
130 {"lpushx",lpushxCommand,3,"wm",0,NULL,1,1,1,0,0},
131 {"linsert",linsertCommand,5,"wm",0,NULL,1,1,1,0,0},
132 {"rpop",rpopCommand,2,"w",0,NULL,1,1,1,0,0},
133 {"lpop",lpopCommand,2,"w",0,NULL,1,1,1,0,0},
e41677b4 134 {"brpop",brpopCommand,-3,"ws",0,NULL,1,1,1,0,0},
135 {"brpoplpush",brpoplpushCommand,4,"wms",0,NULL,1,2,1,0,0},
136 {"blpop",blpopCommand,-3,"ws",0,NULL,1,-2,1,0,0},
5d02b00f 137 {"llen",llenCommand,2,"r",0,NULL,1,1,1,0,0},
138 {"lindex",lindexCommand,3,"r",0,NULL,1,1,1,0,0},
139 {"lset",lsetCommand,4,"wm",0,NULL,1,1,1,0,0},
140 {"lrange",lrangeCommand,4,"r",0,NULL,1,1,1,0,0},
141 {"ltrim",ltrimCommand,4,"w",0,NULL,1,1,1,0,0},
142 {"lrem",lremCommand,4,"w",0,NULL,1,1,1,0,0},
143 {"rpoplpush",rpoplpushCommand,3,"wm",0,NULL,1,2,1,0,0},
144 {"sadd",saddCommand,-3,"wm",0,NULL,1,1,1,0,0},
145 {"srem",sremCommand,-3,"w",0,NULL,1,1,1,0,0},
146 {"smove",smoveCommand,4,"w",0,NULL,1,2,1,0,0},
147 {"sismember",sismemberCommand,3,"r",0,NULL,1,1,1,0,0},
148 {"scard",scardCommand,2,"r",0,NULL,1,1,1,0,0},
15ef6053 149 {"spop",spopCommand,2,"wRs",0,NULL,1,1,1,0,0},
b60ed6e8 150 {"srandmember",srandmemberCommand,2,"rR",0,NULL,1,1,1,0,0},
548efd91 151 {"sinter",sinterCommand,-2,"rS",0,NULL,1,-1,1,0,0},
1bcfa0f6 152 {"sinterstore",sinterstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
548efd91 153 {"sunion",sunionCommand,-2,"rS",0,NULL,1,-1,1,0,0},
1bcfa0f6 154 {"sunionstore",sunionstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
548efd91 155 {"sdiff",sdiffCommand,-2,"rS",0,NULL,1,-1,1,0,0},
1bcfa0f6 156 {"sdiffstore",sdiffstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
548efd91 157 {"smembers",sinterCommand,2,"rS",0,NULL,1,1,1,0,0},
5d02b00f 158 {"zadd",zaddCommand,-4,"wm",0,NULL,1,1,1,0,0},
159 {"zincrby",zincrbyCommand,4,"wm",0,NULL,1,1,1,0,0},
160 {"zrem",zremCommand,-3,"w",0,NULL,1,1,1,0,0},
161 {"zremrangebyscore",zremrangebyscoreCommand,4,"w",0,NULL,1,1,1,0,0},
162 {"zremrangebyrank",zremrangebyrankCommand,4,"w",0,NULL,1,1,1,0,0},
163 {"zunionstore",zunionstoreCommand,-4,"wm",0,zunionInterGetKeys,0,0,0,0,0},
164 {"zinterstore",zinterstoreCommand,-4,"wm",0,zunionInterGetKeys,0,0,0,0,0},
165 {"zrange",zrangeCommand,-4,"r",0,NULL,1,1,1,0,0},
166 {"zrangebyscore",zrangebyscoreCommand,-4,"r",0,NULL,1,1,1,0,0},
167 {"zrevrangebyscore",zrevrangebyscoreCommand,-4,"r",0,NULL,1,1,1,0,0},
168 {"zcount",zcountCommand,4,"r",0,NULL,1,1,1,0,0},
169 {"zrevrange",zrevrangeCommand,-4,"r",0,NULL,1,1,1,0,0},
170 {"zcard",zcardCommand,2,"r",0,NULL,1,1,1,0,0},
171 {"zscore",zscoreCommand,3,"r",0,NULL,1,1,1,0,0},
172 {"zrank",zrankCommand,3,"r",0,NULL,1,1,1,0,0},
173 {"zrevrank",zrevrankCommand,3,"r",0,NULL,1,1,1,0,0},
174 {"hset",hsetCommand,4,"wm",0,NULL,1,1,1,0,0},
175 {"hsetnx",hsetnxCommand,4,"wm",0,NULL,1,1,1,0,0},
176 {"hget",hgetCommand,3,"r",0,NULL,1,1,1,0,0},
177 {"hmset",hmsetCommand,-4,"wm",0,NULL,1,1,1,0,0},
178 {"hmget",hmgetCommand,-3,"r",0,NULL,1,1,1,0,0},
179 {"hincrby",hincrbyCommand,4,"wm",0,NULL,1,1,1,0,0},
68bfe993 180 {"hincrbyfloat",hincrbyfloatCommand,4,"wm",0,NULL,1,1,1,0,0},
5d02b00f 181 {"hdel",hdelCommand,-3,"w",0,NULL,1,1,1,0,0},
182 {"hlen",hlenCommand,2,"r",0,NULL,1,1,1,0,0},
548efd91 183 {"hkeys",hkeysCommand,2,"rS",0,NULL,1,1,1,0,0},
184 {"hvals",hvalsCommand,2,"rS",0,NULL,1,1,1,0,0},
5d02b00f 185 {"hgetall",hgetallCommand,2,"r",0,NULL,1,1,1,0,0},
186 {"hexists",hexistsCommand,3,"r",0,NULL,1,1,1,0,0},
187 {"incrby",incrbyCommand,3,"wm",0,NULL,1,1,1,0,0},
188 {"decrby",decrbyCommand,3,"wm",0,NULL,1,1,1,0,0},
5574b53e 189 {"incrbyfloat",incrbyfloatCommand,3,"wm",0,NULL,1,1,1,0,0},
5d02b00f 190 {"getset",getsetCommand,3,"wm",0,NULL,1,1,1,0,0},
191 {"mset",msetCommand,-3,"wm",0,NULL,1,-1,2,0,0},
192 {"msetnx",msetnxCommand,-3,"wm",0,NULL,1,-1,2,0,0},
b60ed6e8 193 {"randomkey",randomkeyCommand,1,"rR",0,NULL,0,0,0,0,0},
5d02b00f 194 {"select",selectCommand,2,"r",0,NULL,0,0,0,0,0},
195 {"move",moveCommand,3,"w",0,NULL,1,1,1,0,0},
196 {"rename",renameCommand,3,"w",0,renameGetKeys,1,2,1,0,0},
197 {"renamenx",renamenxCommand,3,"w",0,renameGetKeys,1,2,1,0,0},
12d293ca 198 {"expire",expireCommand,3,"w",0,NULL,1,1,1,0,0},
199 {"expireat",expireatCommand,3,"w",0,NULL,1,1,1,0,0},
200 {"pexpire",pexpireCommand,3,"w",0,NULL,1,1,1,0,0},
201 {"pexpireat",pexpireatCommand,3,"w",0,NULL,1,1,1,0,0},
548efd91 202 {"keys",keysCommand,2,"rS",0,NULL,0,0,0,0,0},
5d02b00f 203 {"dbsize",dbsizeCommand,1,"r",0,NULL,0,0,0,0,0},
e41677b4 204 {"auth",authCommand,2,"rs",0,NULL,0,0,0,0,0},
5d02b00f 205 {"ping",pingCommand,1,"r",0,NULL,0,0,0,0,0},
206 {"echo",echoCommand,2,"r",0,NULL,0,0,0,0,0},
e41677b4 207 {"save",saveCommand,1,"ars",0,NULL,0,0,0,0,0},
5d02b00f 208 {"bgsave",bgsaveCommand,1,"ar",0,NULL,0,0,0,0,0},
209 {"bgrewriteaof",bgrewriteaofCommand,1,"ar",0,NULL,0,0,0,0,0},
4ab8695d 210 {"shutdown",shutdownCommand,-1,"ar",0,NULL,0,0,0,0,0},
5d02b00f 211 {"lastsave",lastsaveCommand,1,"r",0,NULL,0,0,0,0,0},
212 {"type",typeCommand,2,"r",0,NULL,1,1,1,0,0},
b60ed6e8 213 {"multi",multiCommand,1,"rs",0,NULL,0,0,0,0,0},
05406168 214 {"exec",execCommand,1,"s",0,NULL,0,0,0,0,0},
b60ed6e8 215 {"discard",discardCommand,1,"rs",0,NULL,0,0,0,0,0},
216 {"sync",syncCommand,1,"ars",0,NULL,0,0,0,0,0},
5d02b00f 217 {"flushdb",flushdbCommand,1,"w",0,NULL,0,0,0,0,0},
218 {"flushall",flushallCommand,1,"w",0,NULL,0,0,0,0,0},
2c861050 219 {"sort",sortCommand,-2,"wmS",0,NULL,1,1,1,0,0},
5d02b00f 220 {"info",infoCommand,-1,"r",0,NULL,0,0,0,0,0},
b60ed6e8 221 {"monitor",monitorCommand,1,"ars",0,NULL,0,0,0,0,0},
12d293ca 222 {"ttl",ttlCommand,2,"r",0,NULL,1,1,1,0,0},
223 {"pttl",pttlCommand,2,"r",0,NULL,1,1,1,0,0},
5d02b00f 224 {"persist",persistCommand,2,"w",0,NULL,1,1,1,0,0},
b60ed6e8 225 {"slaveof",slaveofCommand,3,"aws",0,NULL,0,0,0,0,0},
38bb4522 226 {"debug",debugCommand,-2,"as",0,NULL,0,0,0,0,0},
5d02b00f 227 {"config",configCommand,-2,"ar",0,NULL,0,0,0,0,0},
b60ed6e8 228 {"subscribe",subscribeCommand,-2,"rps",0,NULL,0,0,0,0,0},
229 {"unsubscribe",unsubscribeCommand,-1,"rps",0,NULL,0,0,0,0,0},
230 {"psubscribe",psubscribeCommand,-2,"rps",0,NULL,0,0,0,0,0},
231 {"punsubscribe",punsubscribeCommand,-1,"rps",0,NULL,0,0,0,0,0},
6e6bbac7 232 {"publish",publishCommand,3,"pf",0,NULL,0,0,0,0,0},
b60ed6e8 233 {"watch",watchCommand,-2,"rs",0,noPreloadGetKeys,1,-1,1,0,0},
234 {"unwatch",unwatchCommand,1,"rs",0,NULL,0,0,0,0,0},
7afc3a96 235 {"restore",restoreCommand,4,"awm",0,NULL,1,1,1,0,0},
5d02b00f 236 {"migrate",migrateCommand,6,"aw",0,NULL,0,0,0,0,0},
1bcfa0f6 237 {"dump",dumpCommand,2,"ar",0,NULL,1,1,1,0,0},
238 {"object",objectCommand,-2,"r",0,NULL,2,2,2,0,0},
5d02b00f 239 {"client",clientCommand,-2,"ar",0,NULL,0,0,0,0,0},
05406168 240 {"eval",evalCommand,-3,"s",0,zunionInterGetKeys,0,0,0,0,0},
241 {"evalsha",evalShaCommand,-3,"s",0,zunionInterGetKeys,0,0,0,0,0},
070e3945 242 {"slowlog",slowlogCommand,-2,"r",0,NULL,0,0,0,0,0},
9494f1f1 243 {"script",scriptCommand,-2,"ras",0,NULL,0,0,0,0,0},
244 {"time",timeCommand,1,"rR",0,NULL,0,0,0,0,0}
e2641e09 245};
246
247/*============================ Utility functions ============================ */
248
9c104c68 249/* Low level logging. To use only for very big messages, otherwise
250 * redisLog() is to prefer. */
251void redisLogRaw(int level, const char *msg) {
e1a586ee
JH
252 const int syslogLevelMap[] = { LOG_DEBUG, LOG_INFO, LOG_NOTICE, LOG_WARNING };
253 const char *c = ".-*#";
254 time_t now = time(NULL);
e2641e09 255 FILE *fp;
23072961 256 char buf[64];
996d503d 257 int rawmode = (level & REDIS_LOG_RAW);
23072961 258
996d503d 259 level &= 0xff; /* clear flags */
23072961 260 if (level < server.verbosity) return;
e2641e09 261
262 fp = (server.logfile == NULL) ? stdout : fopen(server.logfile,"a");
263 if (!fp) return;
264
996d503d 265 if (rawmode) {
266 fprintf(fp,"%s",msg);
267 } else {
268 strftime(buf,sizeof(buf),"%d %b %H:%M:%S",localtime(&now));
269 fprintf(fp,"[%d] %s %c %s\n",(int)getpid(),buf,c[level],msg);
270 }
e1a586ee
JH
271 fflush(fp);
272
e2641e09 273 if (server.logfile) fclose(fp);
e1a586ee
JH
274
275 if (server.syslog_enabled) syslog(syslogLevelMap[level], "%s", msg);
e2641e09 276}
277
9c104c68 278/* Like redisLogRaw() but with printf-alike support. This is the funciton that
279 * is used across the code. The raw version is only used in order to dump
280 * the INFO output on crash. */
281void redisLog(int level, const char *fmt, ...) {
282 va_list ap;
283 char msg[REDIS_MAX_LOGMSG_LEN];
284
996d503d 285 if ((level&0xff) < server.verbosity) return;
9c104c68 286
287 va_start(ap, fmt);
288 vsnprintf(msg, sizeof(msg), fmt, ap);
289 va_end(ap);
290
291 redisLogRaw(level,msg);
292}
293
e2641e09 294/* Redis generally does not try to recover from out of memory conditions
295 * when allocating objects or strings, it is not clear if it will be possible
296 * to report this condition to the client since the networking layer itself
297 * is based on heap allocation for send buffers, so we simply abort.
298 * At least the code will be simpler to read... */
299void oom(const char *msg) {
300 redisLog(REDIS_WARNING, "%s: Out of memory\n",msg);
301 sleep(1);
302 abort();
303}
304
/* Return the current UNIX time in microseconds, as reported by
 * gettimeofday(). The seconds are widened to long long before scaling so
 * the multiplication cannot overflow a narrower time_t. */
long long ustime(void) {
    struct timeval now;

    gettimeofday(&now, NULL);
    return ((long long)now.tv_sec) * 1000000 + now.tv_usec;
}
315
/* Return the current UNIX time in milliseconds: ustime() divided by 1000
 * (integer division). */
long long mstime(void) {
    long long usec = ustime();

    return usec / 1000;
}
320
e2641e09 321/*====================== Hash table type implementation ==================== */
322
323/* This is a hash table type that uses the SDS dynamic strings library as
324 * keys and redis objects as values (objects can hold SDS strings,
325 * lists, sets). */
326
/* Dict destructor callback that releases 'val' with zfree().
 * 'privdata' is ignored. */
void dictVanillaFree(void *privdata, void *val) {
    DICT_NOTUSED(privdata);

    zfree(val);
}
332
333void dictListDestructor(void *privdata, void *val)
334{
335 DICT_NOTUSED(privdata);
336 listRelease((list*)val);
337}
338
339int dictSdsKeyCompare(void *privdata, const void *key1,
340 const void *key2)
341{
342 int l1,l2;
343 DICT_NOTUSED(privdata);
344
345 l1 = sdslen((sds)key1);
346 l2 = sdslen((sds)key2);
347 if (l1 != l2) return 0;
348 return memcmp(key1, key2, l1) == 0;
349}
350
/* Case insensitive key comparison, used for the command lookup table.
 * Returns 1 when strcasecmp() reports the keys as equal, 0 otherwise.
 * Unlike dictSdsKeyCompare() the keys are treated as C strings.
 * 'privdata' is ignored. */
int dictSdsKeyCaseCompare(void *privdata, const void *key1,
        const void *key2)
{
    int differ;

    DICT_NOTUSED(privdata);
    differ = strcasecmp(key1, key2);
    return differ == 0;
}
359
/* Dict destructor callback for Redis objects: drops one reference with
 * decrRefCount(). A NULL value is ignored (per the original note, values
 * of swapped out keys are set to NULL). 'privdata' is ignored. */
void dictRedisObjectDestructor(void *privdata, void *val) {
    DICT_NOTUSED(privdata);

    if (val != NULL) decrRefCount(val);
}
367
/* Dict destructor callback for sds strings: frees 'val' with sdsfree().
 * 'privdata' is ignored. */
void dictSdsDestructor(void *privdata, void *val) {
    DICT_NOTUSED(privdata);
    sdsfree(val);
}
374
375int dictObjKeyCompare(void *privdata, const void *key1,
376 const void *key2)
377{
378 const robj *o1 = key1, *o2 = key2;
379 return dictSdsKeyCompare(privdata,o1->ptr,o2->ptr);
380}
381
382unsigned int dictObjHash(const void *key) {
383 const robj *o = key;
384 return dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
385}
386
/* Dict hash callback for sds keys: hashes the whole string, using its sds
 * length, with dictGenHashFunction(). */
unsigned int dictSdsHash(const void *key) {
    return dictGenHashFunction((unsigned char*)key,
                               sdslen((char*)key));
}
390
/* Dict hash callback for sds keys that hashes with
 * dictGenCaseHashFunction(); it is paired with dictSdsKeyCaseCompare() in
 * the command table dict type. */
unsigned int dictSdsCaseHash(const void *key) {
    return dictGenCaseHashFunction((unsigned char*)key,
                                   sdslen((char*)key));
}
394
e2641e09 395int dictEncObjKeyCompare(void *privdata, const void *key1,
396 const void *key2)
397{
398 robj *o1 = (robj*) key1, *o2 = (robj*) key2;
399 int cmp;
400
401 if (o1->encoding == REDIS_ENCODING_INT &&
402 o2->encoding == REDIS_ENCODING_INT)
403 return o1->ptr == o2->ptr;
404
405 o1 = getDecodedObject(o1);
406 o2 = getDecodedObject(o2);
407 cmp = dictSdsKeyCompare(privdata,o1->ptr,o2->ptr);
408 decrRefCount(o1);
409 decrRefCount(o2);
410 return cmp;
411}
412
413unsigned int dictEncObjHash(const void *key) {
414 robj *o = (robj*) key;
415
416 if (o->encoding == REDIS_ENCODING_RAW) {
417 return dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
418 } else {
419 if (o->encoding == REDIS_ENCODING_INT) {
420 char buf[32];
421 int len;
422
423 len = ll2string(buf,32,(long)o->ptr);
424 return dictGenHashFunction((unsigned char*)buf, len);
425 } else {
426 unsigned int hash;
427
428 o = getDecodedObject(o);
429 hash = dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
430 decrRefCount(o);
431 return hash;
432 }
433 }
434}
435
4dd444bb 436/* Sets type hash table */
e2641e09 437dictType setDictType = {
438 dictEncObjHash, /* hash function */
439 NULL, /* key dup */
440 NULL, /* val dup */
441 dictEncObjKeyCompare, /* key compare */
442 dictRedisObjectDestructor, /* key destructor */
443 NULL /* val destructor */
444};
445
446/* Sorted sets hash (note: a skiplist is used in addition to the hash table) */
447dictType zsetDictType = {
448 dictEncObjHash, /* hash function */
449 NULL, /* key dup */
450 NULL, /* val dup */
451 dictEncObjKeyCompare, /* key compare */
452 dictRedisObjectDestructor, /* key destructor */
69ef89f2 453 NULL /* val destructor */
e2641e09 454};
455
456/* Db->dict, keys are sds strings, vals are Redis objects. */
457dictType dbDictType = {
458 dictSdsHash, /* hash function */
459 NULL, /* key dup */
460 NULL, /* val dup */
461 dictSdsKeyCompare, /* key compare */
462 dictSdsDestructor, /* key destructor */
463 dictRedisObjectDestructor /* val destructor */
464};
465
466/* Db->expires */
467dictType keyptrDictType = {
468 dictSdsHash, /* hash function */
469 NULL, /* key dup */
470 NULL, /* val dup */
471 dictSdsKeyCompare, /* key compare */
472 NULL, /* key destructor */
473 NULL /* val destructor */
474};
475
1b1f47c9 476/* Command table. sds string -> command struct pointer. */
477dictType commandTableDictType = {
478 dictSdsCaseHash, /* hash function */
479 NULL, /* key dup */
480 NULL, /* val dup */
481 dictSdsKeyCaseCompare, /* key compare */
482 dictSdsDestructor, /* key destructor */
483 NULL /* val destructor */
484};
485
e2641e09 486/* Hash type hash table (note that small hashes are represented with zimpaps) */
487dictType hashDictType = {
488 dictEncObjHash, /* hash function */
489 NULL, /* key dup */
490 NULL, /* val dup */
491 dictEncObjKeyCompare, /* key compare */
492 dictRedisObjectDestructor, /* key destructor */
493 dictRedisObjectDestructor /* val destructor */
494};
495
496/* Keylist hash table type has unencoded redis objects as keys and
497 * lists as values. It's used for blocking operations (BLPOP) and to
498 * map swapped keys to a list of clients waiting for this keys to be loaded. */
499dictType keylistDictType = {
500 dictObjHash, /* hash function */
501 NULL, /* key dup */
502 NULL, /* val dup */
503 dictObjKeyCompare, /* key compare */
504 dictRedisObjectDestructor, /* key destructor */
505 dictListDestructor /* val destructor */
506};
507
508int htNeedsResize(dict *dict) {
509 long long size, used;
510
511 size = dictSlots(dict);
512 used = dictSize(dict);
513 return (size && used && size > DICT_HT_INITIAL_SIZE &&
514 (used*100/size < REDIS_HT_MINFILL));
515}
516
517/* If the percentage of used slots in the HT reaches REDIS_HT_MINFILL
518 * we resize the hash table to save memory */
519void tryResizeHashTables(void) {
520 int j;
521
522 for (j = 0; j < server.dbnum; j++) {
523 if (htNeedsResize(server.db[j].dict))
524 dictResize(server.db[j].dict);
525 if (htNeedsResize(server.db[j].expires))
526 dictResize(server.db[j].expires);
527 }
528}
529
530/* Our hash table implementation performs rehashing incrementally while
531 * we write/read from the hash table. Still if the server is idle, the hash
532 * table will use two tables for a long time. So we try to use 1 millisecond
533 * of CPU time at every serverCron() loop in order to rehash some key. */
534void incrementallyRehash(void) {
535 int j;
536
537 for (j = 0; j < server.dbnum; j++) {
538 if (dictIsRehashing(server.db[j].dict)) {
539 dictRehashMilliseconds(server.db[j].dict,1);
540 break; /* already used our millisecond for this loop... */
541 }
542 }
543}
544
545/* This function is called once a background process of some kind terminates,
546 * as we want to avoid resizing the hash tables when there is a child in order
547 * to play well with copy-on-write (otherwise when a resize happens lots of
548 * memory pages are copied). The goal of this function is to update the ability
549 * for dict.c to resize the hash tables accordingly to the fact we have o not
550 * running childs. */
551void updateDictResizePolicy(void) {
f48cd4b9 552 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1)
e2641e09 553 dictEnableResize();
554 else
555 dictDisableResize();
556}
557
558/* ======================= Cron: called every 100 ms ======================== */
559
bcf2995c 560/* Try to expire a few timed out keys. The algorithm used is adaptive and
561 * will use few CPU cycles if there are few expiring keys, otherwise
562 * it will get more aggressive to avoid that too much memory is used by
563 * keys that can be removed from the keyspace. */
564void activeExpireCycle(void) {
565 int j;
566
567 for (j = 0; j < server.dbnum; j++) {
568 int expired;
569 redisDb *db = server.db+j;
570
571 /* Continue to expire if at the end of the cycle more than 25%
572 * of the keys were expired. */
573 do {
574 long num = dictSize(db->expires);
4be855e7 575 long long now = mstime();
bcf2995c 576
577 expired = 0;
578 if (num > REDIS_EXPIRELOOKUPS_PER_CRON)
579 num = REDIS_EXPIRELOOKUPS_PER_CRON;
580 while (num--) {
581 dictEntry *de;
4be855e7 582 long long t;
bcf2995c 583
584 if ((de = dictGetRandomKey(db->expires)) == NULL) break;
4be855e7 585 t = dictGetSignedIntegerVal(de);
bcf2995c 586 if (now > t) {
c0ba9ebe 587 sds key = dictGetKey(de);
bcf2995c 588 robj *keyobj = createStringObject(key,sdslen(key));
589
590 propagateExpire(db,keyobj);
591 dbDelete(db,keyobj);
592 decrRefCount(keyobj);
593 expired++;
594 server.stat_expiredkeys++;
595 }
596 }
597 } while (expired > REDIS_EXPIRELOOKUPS_PER_CRON/4);
598 }
599}
600
165346ca 601void updateLRUClock(void) {
56ff70f8 602 server.lruclock = (server.unixtime/REDIS_LRU_CLOCK_RESOLUTION) &
165346ca 603 REDIS_LRU_CLOCK_MAX;
604}
bcf2995c 605
250e7f69 606
607/* Add a sample to the operations per second array of samples. */
608void trackOperationsPerSecond(void) {
609 long long t = mstime() - server.ops_sec_last_sample_time;
610 long long ops = server.stat_numcommands - server.ops_sec_last_sample_ops;
611 long long ops_sec;
612
613 ops_sec = t > 0 ? (ops*1000/t) : 0;
614
615 server.ops_sec_samples[server.ops_sec_idx] = ops_sec;
616 server.ops_sec_idx = (server.ops_sec_idx+1) % REDIS_OPS_SEC_SAMPLES;
617 server.ops_sec_last_sample_time = mstime();
618 server.ops_sec_last_sample_ops = server.stat_numcommands;
619}
620
621/* Return the mean of all the samples. */
622long long getOperationsPerSecond(void) {
623 int j;
624 long long sum = 0;
625
626 for (j = 0; j < REDIS_OPS_SEC_SAMPLES; j++)
627 sum += server.ops_sec_samples[j];
628 return sum / REDIS_OPS_SEC_SAMPLES;
629}
630
f1eaf572 631/* Check for timeouts. Returns non-zero if the client was terminated */
632int clientsCronHandleTimeout(redisClient *c) {
9fa9ccb0 633 time_t now = server.unixtime;
cfa4b57c 634
635 if (server.maxidletime &&
636 !(c->flags & REDIS_SLAVE) && /* no timeout for slaves */
637 !(c->flags & REDIS_MASTER) && /* no timeout for masters */
638 !(c->flags & REDIS_BLOCKED) && /* no timeout for BLPOP */
639 dictSize(c->pubsub_channels) == 0 && /* no timeout for pubsub */
640 listLength(c->pubsub_patterns) == 0 &&
641 (now - c->lastinteraction > server.maxidletime))
642 {
643 redisLog(REDIS_VERBOSE,"Closing idle client");
644 freeClient(c);
f1eaf572 645 return 1;
cfa4b57c 646 } else if (c->flags & REDIS_BLOCKED) {
647 if (c->bpop.timeout != 0 && c->bpop.timeout < now) {
648 addReply(c,shared.nullmultibulk);
649 unblockClientWaitingData(c);
650 }
651 }
f1eaf572 652 return 0;
cfa4b57c 653}
654
9fa9ccb0 655/* The client query buffer is an sds.c string that can end with a lot of
f1eaf572 656 * free space not used, this function reclaims space if needed.
657 *
658 * The funciton always returns 0 as it never terminates the client. */
659int clientsCronResizeQueryBuffer(redisClient *c) {
9fa9ccb0 660 size_t querybuf_size = sdsAllocSize(c->querybuf);
661 time_t idletime = server.unixtime - c->lastinteraction;
662
663 /* There are two conditions to resize the query buffer:
664 * 1) Query buffer is > BIG_ARG and too big for latest peak.
665 * 2) Client is inactive and the buffer is bigger than 1k. */
666 if (((querybuf_size > REDIS_MBULK_BIG_ARG) &&
667 (querybuf_size/(c->querybuf_peak+1)) > 2) ||
668 (querybuf_size > 1024 && idletime > 2))
669 {
670 /* Only resize the query buffer if it is actually wasting space. */
671 if (sdsavail(c->querybuf) > 1024) {
672 c->querybuf = sdsRemoveFreeSpace(c->querybuf);
673 }
674 }
675 /* Reset the peak again to capture the peak memory usage in the next
676 * cycle. */
677 c->querybuf_peak = 0;
f1eaf572 678 return 0;
9fa9ccb0 679}
680
cfa4b57c 681void clientsCron(void) {
682 /* Make sure to process at least 1/100 of clients per call.
683 * Since this function is called 10 times per second we are sure that
684 * in the worst case we process all the clients in 10 seconds.
685 * In normal conditions (a reasonable number of clients) we process
686 * all the clients in a shorter time. */
9fa9ccb0 687 int numclients = listLength(server.clients);
688 int iterations = numclients/100;
cfa4b57c 689
9fa9ccb0 690 if (iterations < 50)
691 iterations = (numclients < 50) ? numclients : 50;
cfa4b57c 692 while(listLength(server.clients) && iterations--) {
693 redisClient *c;
694 listNode *head;
695
696 /* Rotate the list, take the current head, process.
697 * This way if the client must be removed from the list it's the
698 * first element and we don't incur into O(N) computation. */
699 listRotate(server.clients);
700 head = listFirst(server.clients);
701 c = listNodeValue(head);
f1eaf572 702 /* The following functions do different service checks on the client.
703 * The protocol is that they return non-zero if the client was
704 * terminated. */
705 if (clientsCronHandleTimeout(c)) continue;
706 if (clientsCronResizeQueryBuffer(c)) continue;
cfa4b57c 707 }
708}
709
e2641e09 710int serverCron(struct aeEventLoop *eventLoop, long long id, void *clientData) {
89a1433e 711 int j, loops = server.cronloops;
e2641e09 712 REDIS_NOTUSED(eventLoop);
713 REDIS_NOTUSED(id);
714 REDIS_NOTUSED(clientData);
715
fc030ac7 716 /* Software watchdog: deliver the SIGALRM that will reach the signal
717 * handler if we don't return here fast enough. */
718 if (server.watchdog_period) watchdogScheduleSignal(server.watchdog_period);
719
e2641e09 720 /* We take a cached value of the unix time in the global state because
721 * with virtual memory and aging there is to store the current time
722 * in objects at every object access, and accuracy is not needed.
723 * To access a global var is faster than calling time(NULL) */
724 server.unixtime = time(NULL);
4f06867a 725
250e7f69 726 trackOperationsPerSecond();
727
ef59a8bc 728 /* We have just 22 bits per object for LRU information.
165346ca 729 * So we use an (eventually wrapping) LRU clock with 10 seconds resolution.
730 * 2^22 bits with 10 seconds resoluton is more or less 1.5 years.
e2641e09 731 *
165346ca 732 * Note that even if this will wrap after 1.5 years it's not a problem,
ef59a8bc 733 * everything will still work but just some object will appear younger
165346ca 734 * to Redis. But for this to happen a given object should never be touched
735 * for 1.5 years.
736 *
737 * Note that you can change the resolution altering the
738 * REDIS_LRU_CLOCK_RESOLUTION define.
e2641e09 739 */
165346ca 740 updateLRUClock();
e2641e09 741
17b24ff3 742 /* Record the max memory used since the server was started. */
743 if (zmalloc_used_memory() > server.stat_peak_memory)
744 server.stat_peak_memory = zmalloc_used_memory();
745
e2641e09 746 /* We received a SIGTERM, shutting down here in a safe way, as it is
747 * not ok doing so inside the signal handler. */
748 if (server.shutdown_asap) {
4ab8695d 749 if (prepareForShutdown(0) == REDIS_OK) exit(0);
e2641e09 750 redisLog(REDIS_WARNING,"SIGTERM received but errors trying to shut down the server, check the logs for more information");
751 }
752
753 /* Show some info about non-empty databases */
754 for (j = 0; j < server.dbnum; j++) {
755 long long size, used, vkeys;
756
757 size = dictSlots(server.db[j].dict);
758 used = dictSize(server.db[j].dict);
759 vkeys = dictSize(server.db[j].expires);
760 if (!(loops % 50) && (used || vkeys)) {
761 redisLog(REDIS_VERBOSE,"DB %d: %lld keys (%lld volatile) in %lld slots HT.",j,used,vkeys,size);
762 /* dictPrintStats(server.dict); */
763 }
764 }
765
766 /* We don't want to resize the hash tables while a bacground saving
767 * is in progress: the saving child is created using fork() that is
768 * implemented with a copy-on-write semantic in most modern systems, so
769 * if we resize the HT while there is the saving child at work actually
770 * a lot of memory movements in the parent will cause a lot of pages
771 * copied. */
f48cd4b9 772 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1) {
e2641e09 773 if (!(loops % 10)) tryResizeHashTables();
774 if (server.activerehashing) incrementallyRehash();
775 }
776
777 /* Show information about connected clients */
778 if (!(loops % 50)) {
779 redisLog(REDIS_VERBOSE,"%d clients connected (%d slaves), %zu bytes in use",
780 listLength(server.clients)-listLength(server.slaves),
781 listLength(server.slaves),
ca734d17 782 zmalloc_used_memory());
e2641e09 783 }
784
cfa4b57c 785 /* We need to do a few operations on clients asynchronously. */
786 clientsCron();
e2641e09 787
b333e239 788 /* Start a scheduled AOF rewrite if this was requested by the user while
789 * a BGSAVE was in progress. */
f48cd4b9 790 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1 &&
2c915bcf 791 server.aof_rewrite_scheduled)
b333e239 792 {
793 rewriteAppendOnlyFileBackground();
794 }
795
f03fe802 796 /* Check if a background saving or AOF rewrite in progress terminated. */
f48cd4b9 797 if (server.rdb_child_pid != -1 || server.aof_child_pid != -1) {
e2641e09 798 int statloc;
799 pid_t pid;
800
801 if ((pid = wait3(&statloc,WNOHANG,NULL)) != 0) {
36c17a53 802 int exitcode = WEXITSTATUS(statloc);
803 int bysignal = 0;
804
805 if (WIFSIGNALED(statloc)) bysignal = WTERMSIG(statloc);
806
f48cd4b9 807 if (pid == server.rdb_child_pid) {
36c17a53 808 backgroundSaveDoneHandler(exitcode,bysignal);
e2641e09 809 } else {
36c17a53 810 backgroundRewriteDoneHandler(exitcode,bysignal);
e2641e09 811 }
812 updateDictResizePolicy();
813 }
c9d0c362 814 } else {
b333e239 815 /* If there is not a background saving/rewrite in progress check if
816 * we have to save/rewrite now */
e2641e09 817 for (j = 0; j < server.saveparamslen; j++) {
818 struct saveparam *sp = server.saveparams+j;
819
820 if (server.dirty >= sp->changes &&
56ff70f8 821 server.unixtime-server.lastsave > sp->seconds) {
e2641e09 822 redisLog(REDIS_NOTICE,"%d changes in %d seconds. Saving...",
823 sp->changes, sp->seconds);
f48cd4b9 824 rdbSaveBackground(server.rdb_filename);
e2641e09 825 break;
826 }
827 }
b333e239 828
829 /* Trigger an AOF rewrite if needed */
f48cd4b9 830 if (server.rdb_child_pid == -1 &&
ff2145ad 831 server.aof_child_pid == -1 &&
2c915bcf 832 server.aof_rewrite_perc &&
833 server.aof_current_size > server.aof_rewrite_min_size)
b333e239 834 {
2c915bcf 835 long long base = server.aof_rewrite_base_size ?
836 server.aof_rewrite_base_size : 1;
837 long long growth = (server.aof_current_size*100/base) - 100;
838 if (growth >= server.aof_rewrite_perc) {
19b46c9a 839 redisLog(REDIS_NOTICE,"Starting automatic rewriting of AOF on %lld%% growth",growth);
b333e239 840 rewriteAppendOnlyFileBackground();
841 }
842 }
e2641e09 843 }
844
db3c2a4f 845
846 /* If we postponed an AOF buffer flush, let's try to do it every time the
847 * cron function is called. */
848 if (server.aof_flush_postponed_start) flushAppendOnlyFile(0);
849
bcf2995c 850 /* Expire a few keys per cycle, only if this is a master.
851 * On slaves we wait for DEL operations synthesized by the master
852 * in order to guarantee a strict consistency. */
853 if (server.masterhost == NULL) activeExpireCycle();
e2641e09 854
8c43e663 855 /* Close clients that need to be closed asynchronously */
856 freeClientsInAsyncFreeQueue();
857
f4aa600b 858 /* Replication cron function -- used to reconnect to master and
859 * to detect transfer failures. */
62ec599c 860 if (!(loops % 10)) replicationCron();
f4aa600b 861
89a1433e 862 server.cronloops++;
e2641e09 863 return 100;
864}
865
866/* This function gets called every time Redis is entering the
867 * main loop of the event driven library, that is, before to sleep
868 * for ready file descriptors. */
869void beforeSleep(struct aeEventLoop *eventLoop) {
870 REDIS_NOTUSED(eventLoop);
a4ce7581
PN
871 listNode *ln;
872 redisClient *c;
e2641e09 873
a4ce7581
PN
874 /* Try to process pending commands for clients that were just unblocked. */
875 while (listLength(server.unblocked_clients)) {
876 ln = listFirst(server.unblocked_clients);
877 redisAssert(ln != NULL);
878 c = ln->value;
879 listDelNode(server.unblocked_clients,ln);
3bcffcbe 880 c->flags &= ~REDIS_UNBLOCKED;
a4ce7581
PN
881
882 /* Process remaining data in the input buffer. */
00010fa9 883 if (c->querybuf && sdslen(c->querybuf) > 0) {
884 server.current_client = c;
a4ce7581 885 processInputBuffer(c);
00010fa9 886 server.current_client = NULL;
887 }
a4ce7581
PN
888 }
889
e2641e09 890 /* Write the AOF buffer on disk */
db3c2a4f 891 flushAppendOnlyFile(0);
e2641e09 892}
893
894/* =========================== Server initialization ======================== */
895
896void createSharedObjects(void) {
897 int j;
898
899 shared.crlf = createObject(REDIS_STRING,sdsnew("\r\n"));
900 shared.ok = createObject(REDIS_STRING,sdsnew("+OK\r\n"));
901 shared.err = createObject(REDIS_STRING,sdsnew("-ERR\r\n"));
902 shared.emptybulk = createObject(REDIS_STRING,sdsnew("$0\r\n\r\n"));
903 shared.czero = createObject(REDIS_STRING,sdsnew(":0\r\n"));
904 shared.cone = createObject(REDIS_STRING,sdsnew(":1\r\n"));
905 shared.cnegone = createObject(REDIS_STRING,sdsnew(":-1\r\n"));
906 shared.nullbulk = createObject(REDIS_STRING,sdsnew("$-1\r\n"));
907 shared.nullmultibulk = createObject(REDIS_STRING,sdsnew("*-1\r\n"));
908 shared.emptymultibulk = createObject(REDIS_STRING,sdsnew("*0\r\n"));
909 shared.pong = createObject(REDIS_STRING,sdsnew("+PONG\r\n"));
910 shared.queued = createObject(REDIS_STRING,sdsnew("+QUEUED\r\n"));
911 shared.wrongtypeerr = createObject(REDIS_STRING,sdsnew(
912 "-ERR Operation against a key holding the wrong kind of value\r\n"));
913 shared.nokeyerr = createObject(REDIS_STRING,sdsnew(
914 "-ERR no such key\r\n"));
915 shared.syntaxerr = createObject(REDIS_STRING,sdsnew(
916 "-ERR syntax error\r\n"));
917 shared.sameobjecterr = createObject(REDIS_STRING,sdsnew(
918 "-ERR source and destination objects are the same\r\n"));
919 shared.outofrangeerr = createObject(REDIS_STRING,sdsnew(
920 "-ERR index out of range\r\n"));
7229d60d 921 shared.noscripterr = createObject(REDIS_STRING,sdsnew(
922 "-NOSCRIPT No matching script. Please use EVAL.\r\n"));
97e7f8ae 923 shared.loadingerr = createObject(REDIS_STRING,sdsnew(
924 "-LOADING Redis is loading the dataset in memory\r\n"));
115e3ff3 925 shared.slowscripterr = createObject(REDIS_STRING,sdsnew(
4ab8695d 926 "-BUSY Redis is busy running a script. You can only call SCRIPT KILL or SHUTDOWN NOSAVE.\r\n"));
c25e7eaf 927 shared.bgsaveerr = createObject(REDIS_STRING,sdsnew(
05406168 928 "-MISCONF Redis is configured to save RDB snapshots, but is currently not able to persist on disk. Commands that may modify the data set are disabled. Please check Redis logs for details about the error.\r\n"));
929 shared.roslaveerr = createObject(REDIS_STRING,sdsnew(
930 "-READONLY You can't write against a read only slave.\r\n"));
3f7ad833 931 shared.oomerr = createObject(REDIS_STRING,sdsnew(
932 "-OOM command not allowed when used memory > 'maxmemory'.\r\n"));
e2641e09 933 shared.space = createObject(REDIS_STRING,sdsnew(" "));
934 shared.colon = createObject(REDIS_STRING,sdsnew(":"));
935 shared.plus = createObject(REDIS_STRING,sdsnew("+"));
936 shared.select0 = createStringObject("select 0\r\n",10);
937 shared.select1 = createStringObject("select 1\r\n",10);
938 shared.select2 = createStringObject("select 2\r\n",10);
939 shared.select3 = createStringObject("select 3\r\n",10);
940 shared.select4 = createStringObject("select 4\r\n",10);
941 shared.select5 = createStringObject("select 5\r\n",10);
942 shared.select6 = createStringObject("select 6\r\n",10);
943 shared.select7 = createStringObject("select 7\r\n",10);
944 shared.select8 = createStringObject("select 8\r\n",10);
945 shared.select9 = createStringObject("select 9\r\n",10);
946 shared.messagebulk = createStringObject("$7\r\nmessage\r\n",13);
947 shared.pmessagebulk = createStringObject("$8\r\npmessage\r\n",14);
948 shared.subscribebulk = createStringObject("$9\r\nsubscribe\r\n",15);
949 shared.unsubscribebulk = createStringObject("$11\r\nunsubscribe\r\n",18);
950 shared.psubscribebulk = createStringObject("$10\r\npsubscribe\r\n",17);
951 shared.punsubscribebulk = createStringObject("$12\r\npunsubscribe\r\n",19);
355f8591 952 shared.del = createStringObject("DEL",3);
c1db214e 953 shared.rpop = createStringObject("RPOP",4);
954 shared.lpop = createStringObject("LPOP",4);
e2641e09 955 for (j = 0; j < REDIS_SHARED_INTEGERS; j++) {
956 shared.integers[j] = createObject(REDIS_STRING,(void*)(long)j);
957 shared.integers[j]->encoding = REDIS_ENCODING_INT;
958 }
355f8591 959 for (j = 0; j < REDIS_SHARED_BULKHDR_LEN; j++) {
960 shared.mbulkhdr[j] = createObject(REDIS_STRING,
961 sdscatprintf(sdsempty(),"*%d\r\n",j));
962 shared.bulkhdr[j] = createObject(REDIS_STRING,
963 sdscatprintf(sdsempty(),"$%d\r\n",j));
964 }
e2641e09 965}
966
967void initServerConfig() {
91d664d6 968 getRandomHexChars(server.runid,REDIS_RUN_ID_SIZE);
969 server.runid[REDIS_RUN_ID_SIZE] = '\0';
75eaac5c 970 server.arch_bits = (sizeof(long) == 8) ? 64 : 32;
e2641e09 971 server.port = REDIS_SERVERPORT;
a5639e7d 972 server.bindaddr = NULL;
5d10923f 973 server.unixsocket = NULL;
85238765 974 server.unixsocketperm = 0;
a5639e7d
PN
975 server.ipfd = -1;
976 server.sofd = -1;
977 server.dbnum = REDIS_DEFAULT_DBNUM;
c6f9ee88 978 server.verbosity = REDIS_NOTICE;
e2641e09 979 server.maxidletime = REDIS_MAXIDLETIME;
becf5fdb 980 server.client_max_querybuf_len = REDIS_MAX_QUERYBUF_LEN;
e2641e09 981 server.saveparams = NULL;
97e7f8ae 982 server.loading = 0;
e2641e09 983 server.logfile = NULL; /* NULL = log on standard output */
e1a586ee
JH
984 server.syslog_enabled = 0;
985 server.syslog_ident = zstrdup("redis");
986 server.syslog_facility = LOG_LOCAL0;
e2641e09 987 server.daemonize = 0;
e394114d 988 server.aof_state = REDIS_AOF_OFF;
2c915bcf 989 server.aof_fsync = AOF_FSYNC_EVERYSEC;
990 server.aof_no_fsync_on_rewrite = 0;
991 server.aof_rewrite_perc = REDIS_AOF_REWRITE_PERC;
992 server.aof_rewrite_min_size = REDIS_AOF_REWRITE_MIN_SIZE;
993 server.aof_rewrite_base_size = 0;
994 server.aof_rewrite_scheduled = 0;
ff2145ad 995 server.aof_last_fsync = time(NULL);
81f32c7b 996 server.aof_delayed_fsync = 0;
ff2145ad 997 server.aof_fd = -1;
998 server.aof_selected_db = -1; /* Make sure the first time will not match */
db3c2a4f 999 server.aof_flush_postponed_start = 0;
e2641e09 1000 server.pidfile = zstrdup("/var/run/redis.pid");
f48cd4b9 1001 server.rdb_filename = zstrdup("dump.rdb");
2c915bcf 1002 server.aof_filename = zstrdup("appendonly.aof");
e2641e09 1003 server.requirepass = NULL;
f48cd4b9 1004 server.rdb_compression = 1;
e2641e09 1005 server.activerehashing = 1;
58732c23 1006 server.maxclients = REDIS_MAX_CLIENTS;
5fa95ad7 1007 server.bpop_blocked_clients = 0;
e2641e09 1008 server.maxmemory = 0;
165346ca 1009 server.maxmemory_policy = REDIS_MAXMEMORY_VOLATILE_LRU;
1010 server.maxmemory_samples = 3;
ebd85e9a
PN
1011 server.hash_max_ziplist_entries = REDIS_HASH_MAX_ZIPLIST_ENTRIES;
1012 server.hash_max_ziplist_value = REDIS_HASH_MAX_ZIPLIST_VALUE;
e2641e09 1013 server.list_max_ziplist_entries = REDIS_LIST_MAX_ZIPLIST_ENTRIES;
1014 server.list_max_ziplist_value = REDIS_LIST_MAX_ZIPLIST_VALUE;
96ffb2fe 1015 server.set_max_intset_entries = REDIS_SET_MAX_INTSET_ENTRIES;
3ea204e1
PN
1016 server.zset_max_ziplist_entries = REDIS_ZSET_MAX_ZIPLIST_ENTRIES;
1017 server.zset_max_ziplist_value = REDIS_ZSET_MAX_ZIPLIST_VALUE;
e2641e09 1018 server.shutdown_asap = 0;
aeecbdfa 1019 server.repl_ping_slave_period = REDIS_REPL_PING_SLAVE_PERIOD;
1020 server.repl_timeout = REDIS_REPL_TIMEOUT;
4ab8695d 1021 server.lua_caller = NULL;
eeffcf38 1022 server.lua_time_limit = REDIS_LUA_TIME_LIMIT;
070e3945 1023 server.lua_client = NULL;
115e3ff3 1024 server.lua_timedout = 0;
e2641e09 1025
95506e46 1026 updateLRUClock();
e2641e09 1027 resetServerSaveParams();
1028
1029 appendServerSaveParams(60*60,1); /* save after 1 hour and 1 change */
1030 appendServerSaveParams(300,100); /* save after 5 minutes and 100 changes */
1031 appendServerSaveParams(60,10000); /* save after 1 minute and 10000 changes */
1032 /* Replication related */
e2641e09 1033 server.masterauth = NULL;
1034 server.masterhost = NULL;
1035 server.masterport = 6379;
1036 server.master = NULL;
1844f990 1037 server.repl_state = REDIS_REPL_NONE;
890a2ed9 1038 server.repl_syncio_timeout = REDIS_REPL_SYNCIO_TIMEOUT;
4ebfc455 1039 server.repl_serve_stale_data = 1;
05406168 1040 server.repl_slave_ro = 1;
07486df6 1041 server.repl_down_since = -1;
e2641e09 1042
7eac2a75 1043 /* Client output buffer limits */
1044 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].hard_limit_bytes = 0;
1045 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].soft_limit_bytes = 0;
1046 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].soft_limit_seconds = 0;
c8a607f2 1047 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].hard_limit_bytes = 1024*1024*256;
1048 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].soft_limit_bytes = 1024*1024*64;
7eac2a75 1049 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].soft_limit_seconds = 60;
c8a607f2 1050 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].hard_limit_bytes = 1024*1024*32;
1051 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].soft_limit_bytes = 1024*1024*8;
7eac2a75 1052 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].soft_limit_seconds = 60;
1053
e2641e09 1054 /* Double constants initialization */
1055 R_Zero = 0.0;
1056 R_PosInf = 1.0/R_Zero;
1057 R_NegInf = -1.0/R_Zero;
1058 R_Nan = R_Zero/R_Zero;
8d3e063a 1059
1060 /* Command table -- we intiialize it here as it is part of the
1061 * initial configuration, since command names may be changed via
1062 * redis.conf using the rename-command directive. */
1063 server.commands = dictCreate(&commandTableDictType,NULL);
1064 populateCommandTable();
1065 server.delCommand = lookupCommandByCString("del");
1066 server.multiCommand = lookupCommandByCString("multi");
eeb34eff 1067 server.lpushCommand = lookupCommandByCString("lpush");
daa70b17 1068
1069 /* Slow log */
1070 server.slowlog_log_slower_than = REDIS_SLOWLOG_LOG_SLOWER_THAN;
1071 server.slowlog_max_len = REDIS_SLOWLOG_MAX_LEN;
fa5af017 1072
fc030ac7 1073 /* Debugging */
fa5af017 1074 server.assert_failed = "<no assertion failed>";
1075 server.assert_file = "<no file>";
1076 server.assert_line = 0;
1077 server.bug_report_start = 0;
fc030ac7 1078 server.watchdog_period = 0;
e2641e09 1079}
1080
e074416b 1081/* This function will try to raise the max number of open files accordingly to
1082 * the configured max number of clients. It will also account for 32 additional
1083 * file descriptors as we need a few more for persistence, listening
1084 * sockets, log files and so forth.
1085 *
1086 * If it will not be possible to set the limit accordingly to the configured
1087 * max number of clients, the function will do the reverse setting
1088 * server.maxclients to the value that we can actually handle. */
1089void adjustOpenFilesLimit(void) {
1090 rlim_t maxfiles = server.maxclients+32;
1091 struct rlimit limit;
1092
1093 if (maxfiles < 1024) maxfiles = 1024;
1094 if (getrlimit(RLIMIT_NOFILE,&limit) == -1) {
1095 redisLog(REDIS_WARNING,"Unable to obtain the current NOFILE limit (%s), assuming 1024 and setting the max clients configuration accordingly.",
1096 strerror(errno));
1097 server.maxclients = 1024-32;
1098 } else {
1099 rlim_t oldlimit = limit.rlim_cur;
1100
1101 /* Set the max number of files if the current limit is not enough
1102 * for our needs. */
1103 if (oldlimit < maxfiles) {
1104 limit.rlim_cur = maxfiles;
1105 limit.rlim_max = maxfiles;
1106 if (setrlimit(RLIMIT_NOFILE,&limit) == -1) {
1107 server.maxclients = oldlimit-32;
1108 redisLog(REDIS_WARNING,"Unable to set the max number of files limit to %d (%s), setting the max clients configuration to %d.",
1109 (int) maxfiles, strerror(errno), (int) server.maxclients);
1110 } else {
1111 redisLog(REDIS_NOTICE,"Max number of open files set to %d",
1112 (int) maxfiles);
1113 }
1114 }
1115 }
1116}
1117
e2641e09 1118void initServer() {
1119 int j;
1120
1121 signal(SIGHUP, SIG_IGN);
1122 signal(SIGPIPE, SIG_IGN);
633a9410 1123 setupSignalHandlers();
e2641e09 1124
e1a586ee
JH
1125 if (server.syslog_enabled) {
1126 openlog(server.syslog_ident, LOG_PID | LOG_NDELAY | LOG_NOWAIT,
1127 server.syslog_facility);
1128 }
1129
00010fa9 1130 server.current_client = NULL;
e2641e09 1131 server.clients = listCreate();
7eac2a75 1132 server.clients_to_close = listCreate();
e2641e09 1133 server.slaves = listCreate();
1134 server.monitors = listCreate();
a4ce7581 1135 server.unblocked_clients = listCreate();
cea8c5cd 1136
e2641e09 1137 createSharedObjects();
e074416b 1138 adjustOpenFilesLimit();
1139 server.el = aeCreateEventLoop(server.maxclients+1024);
e2641e09 1140 server.db = zmalloc(sizeof(redisDb)*server.dbnum);
68d6345d 1141
a53b4c24 1142 if (server.port != 0) {
68d6345d 1143 server.ipfd = anetTcpServer(server.neterr,server.port,server.bindaddr);
a53b4c24 1144 if (server.ipfd == ANET_ERR) {
eef17490 1145 redisLog(REDIS_WARNING, "Opening port %d: %s",
1146 server.port, server.neterr);
a53b4c24 1147 exit(1);
1148 }
a5639e7d 1149 }
5d10923f
PN
1150 if (server.unixsocket != NULL) {
1151 unlink(server.unixsocket); /* don't care if this fails */
85238765 1152 server.sofd = anetUnixServer(server.neterr,server.unixsocket,server.unixsocketperm);
a5639e7d
PN
1153 if (server.sofd == ANET_ERR) {
1154 redisLog(REDIS_WARNING, "Opening socket: %s", server.neterr);
1155 exit(1);
1156 }
c61e6925 1157 }
a5639e7d
PN
1158 if (server.ipfd < 0 && server.sofd < 0) {
1159 redisLog(REDIS_WARNING, "Configured to not listen anywhere, exiting.");
e2641e09 1160 exit(1);
1161 }
1162 for (j = 0; j < server.dbnum; j++) {
1163 server.db[j].dict = dictCreate(&dbDictType,NULL);
1164 server.db[j].expires = dictCreate(&keyptrDictType,NULL);
1165 server.db[j].blocking_keys = dictCreate(&keylistDictType,NULL);
1166 server.db[j].watched_keys = dictCreate(&keylistDictType,NULL);
e2641e09 1167 server.db[j].id = j;
1168 }
1169 server.pubsub_channels = dictCreate(&keylistDictType,NULL);
1170 server.pubsub_patterns = listCreate();
1171 listSetFreeMethod(server.pubsub_patterns,freePubsubPattern);
1172 listSetMatchMethod(server.pubsub_patterns,listMatchPubsubPattern);
1173 server.cronloops = 0;
f48cd4b9 1174 server.rdb_child_pid = -1;
ff2145ad 1175 server.aof_child_pid = -1;
1176 server.aof_rewrite_buf = sdsempty();
1177 server.aof_buf = sdsempty();
e2641e09 1178 server.lastsave = time(NULL);
1179 server.dirty = 0;
1180 server.stat_numcommands = 0;
1181 server.stat_numconnections = 0;
1182 server.stat_expiredkeys = 0;
f21779ff 1183 server.stat_evictedkeys = 0;
e2641e09 1184 server.stat_starttime = time(NULL);
53eeeaff 1185 server.stat_keyspace_misses = 0;
1186 server.stat_keyspace_hits = 0;
17b24ff3 1187 server.stat_peak_memory = 0;
615e414c 1188 server.stat_fork_time = 0;
3c95e721 1189 server.stat_rejected_conn = 0;
250e7f69 1190 memset(server.ops_sec_samples,0,sizeof(server.ops_sec_samples));
1191 server.ops_sec_idx = 0;
1192 server.ops_sec_last_sample_time = mstime();
1193 server.ops_sec_last_sample_ops = 0;
e2641e09 1194 server.unixtime = time(NULL);
c25e7eaf 1195 server.lastbgsave_status = REDIS_OK;
4d3bbf35 1196 server.stop_writes_on_bgsave_err = 1;
e2641e09 1197 aeCreateTimeEvent(server.el, 1, serverCron, NULL, NULL);
a5639e7d 1198 if (server.ipfd > 0 && aeCreateFileEvent(server.el,server.ipfd,AE_READABLE,
ab17b909 1199 acceptTcpHandler,NULL) == AE_ERR) oom("creating file event");
a5639e7d 1200 if (server.sofd > 0 && aeCreateFileEvent(server.el,server.sofd,AE_READABLE,
ab17b909 1201 acceptUnixHandler,NULL) == AE_ERR) oom("creating file event");
e2641e09 1202
e394114d 1203 if (server.aof_state == REDIS_AOF_ON) {
ff2145ad 1204 server.aof_fd = open(server.aof_filename,
e394114d 1205 O_WRONLY|O_APPEND|O_CREAT,0644);
ff2145ad 1206 if (server.aof_fd == -1) {
e2641e09 1207 redisLog(REDIS_WARNING, "Can't open the append-only file: %s",
1208 strerror(errno));
1209 exit(1);
1210 }
1211 }
1212
d876678b 1213 /* 32 bit instances are limited to 4GB of address space, so if there is
1214 * no explicit limit in the user provided configuration we set a limit
1215 * at 3.5GB using maxmemory with 'noeviction' policy'. This saves
1216 * useless crashes of the Redis instance. */
1217 if (server.arch_bits == 32 && server.maxmemory == 0) {
1218 redisLog(REDIS_WARNING,"Warning: 32 bit instance detected but no memory limit set. Setting 3.5 GB maxmemory limit with 'noeviction' policy now.");
1219 server.maxmemory = 3584LL*(1024*1024); /* 3584 MB = 3.5 GB */
1220 server.maxmemory_policy = REDIS_MAXMEMORY_NO_EVICTION;
1221 }
1222
7585836e 1223 scriptingInit();
daa70b17 1224 slowlogInit();
8f61a72f 1225 bioInit();
e2641e09 1226}
1227
1b1f47c9 1228/* Populates the Redis Command Table starting from the hard coded list
1229 * we have on top of redis.c file. */
1230void populateCommandTable(void) {
1231 int j;
d7ed7fd2 1232 int numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1b1f47c9 1233
1234 for (j = 0; j < numcommands; j++) {
d7ed7fd2 1235 struct redisCommand *c = redisCommandTable+j;
5d02b00f 1236 char *f = c->sflags;
1b1f47c9 1237 int retval;
e2641e09 1238
5d02b00f 1239 while(*f != '\0') {
1240 switch(*f) {
1241 case 'w': c->flags |= REDIS_CMD_WRITE; break;
1242 case 'r': c->flags |= REDIS_CMD_READONLY; break;
1243 case 'm': c->flags |= REDIS_CMD_DENYOOM; break;
1244 case 'a': c->flags |= REDIS_CMD_ADMIN; break;
1245 case 'p': c->flags |= REDIS_CMD_PUBSUB; break;
1246 case 'f': c->flags |= REDIS_CMD_FORCE_REPLICATION; break;
b60ed6e8 1247 case 's': c->flags |= REDIS_CMD_NOSCRIPT; break;
1248 case 'R': c->flags |= REDIS_CMD_RANDOM; break;
548efd91 1249 case 'S': c->flags |= REDIS_CMD_SORT_FOR_SCRIPT; break;
5d02b00f 1250 default: redisPanic("Unsupported command flag"); break;
1251 }
1252 f++;
1253 }
1254
1b1f47c9 1255 retval = dictAdd(server.commands, sdsnew(c->name), c);
1256 assert(retval == DICT_OK);
1257 }
e2641e09 1258}
1259
d7ed7fd2 1260void resetCommandTableStats(void) {
1261 int numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1262 int j;
1263
1264 for (j = 0; j < numcommands; j++) {
1265 struct redisCommand *c = redisCommandTable+j;
1266
1267 c->microseconds = 0;
1268 c->calls = 0;
1269 }
1270}
1271
78d6a22d 1272/* ========================== Redis OP Array API ============================ */
1273
1274void redisOpArrayInit(redisOpArray *oa) {
1275 oa->ops = NULL;
1276 oa->numops = 0;
1277}
1278
1279int redisOpArrayAppend(redisOpArray *oa, struct redisCommand *cmd, int dbid,
1280 robj **argv, int argc, int target)
1281{
1282 redisOp *op;
1283
1284 oa->ops = zrealloc(oa->ops,sizeof(redisOp)*(oa->numops+1));
1285 op = oa->ops+oa->numops;
1286 op->cmd = cmd;
1287 op->dbid = dbid;
1288 op->argv = argv;
1289 op->argc = argc;
1290 op->target = target;
1291 oa->numops++;
1292 return oa->numops;
1293}
1294
1295void redisOpArrayFree(redisOpArray *oa) {
1296 while(oa->numops) {
1297 int j;
1298 redisOp *op;
1299
1300 oa->numops--;
1301 op = oa->ops+oa->numops;
1302 for (j = 0; j < op->argc; j++)
1303 decrRefCount(op->argv[j]);
1304 zfree(op->argv);
1305 }
1306 zfree(oa->ops);
1307}
1308
e2641e09 1309/* ====================== Commands lookup and execution ===================== */
1310
1b1f47c9 1311struct redisCommand *lookupCommand(sds name) {
1312 return dictFetchValue(server.commands, name);
1313}
1314
1315struct redisCommand *lookupCommandByCString(char *s) {
1316 struct redisCommand *cmd;
1317 sds name = sdsnew(s);
1318
1319 cmd = dictFetchValue(server.commands, name);
1320 sdsfree(name);
1321 return cmd;
e2641e09 1322}
1323
ad08d059 1324/* Propagate the specified command (in the context of the specified database id)
1325 * to AOF, Slaves and Monitors.
1326 *
1327 * flags are an xor between:
1328 * + REDIS_PROPAGATE_NONE (no propagation of command at all)
1329 * + REDIS_PROPAGATE_AOF (propagate into the AOF file if is enabled)
1330 * + REDIS_PROPAGATE_REPL (propagate into the replication link)
1331 */
1332void propagate(struct redisCommand *cmd, int dbid, robj **argv, int argc,
1333 int flags)
1334{
1335 if (server.aof_state != REDIS_AOF_OFF && flags & REDIS_PROPAGATE_AOF)
1336 feedAppendOnlyFile(cmd,dbid,argv,argc);
1337 if (flags & REDIS_PROPAGATE_REPL && listLength(server.slaves))
1338 replicationFeedSlaves(server.slaves,dbid,argv,argc);
1339}
1340
78d6a22d 1341/* Used inside commands to schedule the propagation of additional commands
1342 * after the current command is propagated to AOF / Replication. */
eeb34eff 1343void alsoPropagate(struct redisCommand *cmd, int dbid, robj **argv, int argc,
1344 int target)
1345{
78d6a22d 1346 redisOpArrayAppend(&server.also_propagate,cmd,dbid,argv,argc,target);
eeb34eff 1347}
1348
e2641e09 1349/* Call() is the core of Redis execution of a command */
ce8b772b 1350void call(redisClient *c, int flags) {
daa70b17 1351 long long dirty, start = ustime(), duration;
e2641e09 1352
ad08d059 1353 /* Sent the command to clients in MONITOR mode, only if the commands are
1354 * not geneated from reading an AOF. */
1355 if (listLength(server.monitors) && !server.loading)
e31b615e 1356 replicationFeedMonitors(c,server.monitors,c->db->id,c->argv,c->argc);
ad08d059 1357
1358 /* Call the command. */
78d6a22d 1359 redisOpArrayInit(&server.also_propagate);
e2641e09 1360 dirty = server.dirty;
09e2d9ee 1361 c->cmd->proc(c);
e2641e09 1362 dirty = server.dirty-dirty;
daa70b17 1363 duration = ustime()-start;
ce8b772b 1364
1365 /* When EVAL is called loading the AOF we don't want commands called
1366 * from Lua to go into the slowlog or to populate statistics. */
1367 if (server.loading && c->flags & REDIS_LUA_CLIENT)
1368 flags &= ~(REDIS_CALL_SLOWLOG | REDIS_CALL_STATS);
1369
ad08d059 1370 /* Log the command into the Slow log if needed, and populate the
1371 * per-command statistics that we show in INFO commandstats. */
ce8b772b 1372 if (flags & REDIS_CALL_SLOWLOG)
1373 slowlogPushEntryIfNeeded(c->argv,c->argc,duration);
1374 if (flags & REDIS_CALL_STATS) {
1375 c->cmd->microseconds += duration;
1376 c->cmd->calls++;
1377 }
ad08d059 1378
1379 /* Propagate the command into the AOF and replication link */
ce8b772b 1380 if (flags & REDIS_CALL_PROPAGATE) {
ad08d059 1381 int flags = REDIS_PROPAGATE_NONE;
1382
1383 if (c->cmd->flags & REDIS_CMD_FORCE_REPLICATION)
1384 flags |= REDIS_PROPAGATE_REPL;
1385 if (dirty)
1386 flags |= (REDIS_PROPAGATE_REPL | REDIS_PROPAGATE_AOF);
1387 if (flags != REDIS_PROPAGATE_NONE)
1388 propagate(c->cmd,c->db->id,c->argv,c->argc,flags);
ce8b772b 1389 }
eeb34eff 1390 /* Commands such as LPUSH or BRPOPLPUSH may propagate an additional
1391 * PUSH command. */
78d6a22d 1392 if (server.also_propagate.numops) {
eeb34eff 1393 int j;
78d6a22d 1394 redisOp *rop;
eeb34eff 1395
78d6a22d 1396 for (j = 0; j < server.also_propagate.numops; j++) {
1397 rop = &server.also_propagate.ops[j];
1398 propagate(rop->cmd, rop->dbid, rop->argv, rop->argc, rop->target);
1399 }
1400 redisOpArrayFree(&server.also_propagate);
eeb34eff 1401 }
e2641e09 1402 server.stat_numcommands++;
1403}
1404
1405/* If this function gets called we already read a whole
1406 * command, argments are in the client argv/argc fields.
1407 * processCommand() execute the command or prepare the
1408 * server for a bulk read from the client.
1409 *
1410 * If 1 is returned the client is still alive and valid and
1411 * and other operations can be performed by the caller. Otherwise
1412 * if 0 is returned the client was destroied (i.e. after QUIT). */
1413int processCommand(redisClient *c) {
941c9fa2
PN
1414 /* The QUIT command is handled separately. Normal command procs will
1415 * go through checking for replication and QUIT will cause trouble
1416 * when FORCE_REPLICATION is enabled and would be implemented in
1417 * a regular command proc. */
e2641e09 1418 if (!strcasecmp(c->argv[0]->ptr,"quit")) {
941c9fa2 1419 addReply(c,shared.ok);
5e78edb3 1420 c->flags |= REDIS_CLOSE_AFTER_REPLY;
cd8788f2 1421 return REDIS_ERR;
e2641e09 1422 }
1423
1424 /* Now lookup the command and check ASAP about trivial error conditions
09e2d9ee 1425 * such as wrong arity, bad command name and so forth. */
2c74a9f9 1426 c->cmd = c->lastcmd = lookupCommand(c->argv[0]->ptr);
09e2d9ee 1427 if (!c->cmd) {
3ab20376
PN
1428 addReplyErrorFormat(c,"unknown command '%s'",
1429 (char*)c->argv[0]->ptr);
cd8788f2 1430 return REDIS_OK;
09e2d9ee 1431 } else if ((c->cmd->arity > 0 && c->cmd->arity != c->argc) ||
1432 (c->argc < -c->cmd->arity)) {
3ab20376 1433 addReplyErrorFormat(c,"wrong number of arguments for '%s' command",
09e2d9ee 1434 c->cmd->name);
cd8788f2 1435 return REDIS_OK;
e2641e09 1436 }
e2641e09 1437
1438 /* Check if the user is authenticated */
09e2d9ee 1439 if (server.requirepass && !c->authenticated && c->cmd->proc != authCommand)
1440 {
3ab20376 1441 addReplyError(c,"operation not permitted");
cd8788f2 1442 return REDIS_OK;
e2641e09 1443 }
1444
1dd10ca2 1445 /* Handle the maxmemory directive.
1446 *
1447 * First we try to free some memory if possible (if there are volatile
1448 * keys in the dataset). If there are not the only thing we can do
1449 * is returning an error. */
f6b32c14 1450 if (server.maxmemory) {
1451 int retval = freeMemoryIfNeeded();
1452 if ((c->cmd->flags & REDIS_CMD_DENYOOM) && retval == REDIS_ERR) {
05406168 1453 addReply(c, shared.oomerr);
f6b32c14 1454 return REDIS_OK;
1455 }
e2641e09 1456 }
1457
c25e7eaf 1458 /* Don't accept write commands if there are problems persisting on disk. */
4d3bbf35 1459 if (server.stop_writes_on_bgsave_err &&
1460 server.saveparamslen > 0
1461 && server.lastbgsave_status == REDIS_ERR &&
c25e7eaf 1462 c->cmd->flags & REDIS_CMD_WRITE)
1463 {
1464 addReply(c, shared.bgsaveerr);
1465 return REDIS_OK;
05406168 1466 }
1467
1468 /* Don't accept wirte commands if this is a read only slave. But
1469 * accept write commands if this is our master. */
1470 if (server.masterhost && server.repl_slave_ro &&
1471 !(c->flags & REDIS_MASTER) &&
1472 c->cmd->flags & REDIS_CMD_WRITE)
1473 {
1474 addReply(c, shared.roslaveerr);
1475 return REDIS_OK;
c25e7eaf 1476 }
1477
e2641e09 1478 /* Only allow SUBSCRIBE and UNSUBSCRIBE in the context of Pub/Sub */
1479 if ((dictSize(c->pubsub_channels) > 0 || listLength(c->pubsub_patterns) > 0)
1480 &&
09e2d9ee 1481 c->cmd->proc != subscribeCommand &&
1482 c->cmd->proc != unsubscribeCommand &&
1483 c->cmd->proc != psubscribeCommand &&
1484 c->cmd->proc != punsubscribeCommand) {
3ab20376 1485 addReplyError(c,"only (P)SUBSCRIBE / (P)UNSUBSCRIBE / QUIT allowed in this context");
cd8788f2 1486 return REDIS_OK;
e2641e09 1487 }
1488
4ebfc455 1489 /* Only allow INFO and SLAVEOF when slave-serve-stale-data is no and
1490 * we are a slave with a broken link with master. */
1844f990 1491 if (server.masterhost && server.repl_state != REDIS_REPL_CONNECTED &&
4ebfc455 1492 server.repl_serve_stale_data == 0 &&
09e2d9ee 1493 c->cmd->proc != infoCommand && c->cmd->proc != slaveofCommand)
4ebfc455 1494 {
1495 addReplyError(c,
1496 "link with MASTER is down and slave-serve-stale-data is set to no");
1497 return REDIS_OK;
1498 }
1499
97e7f8ae 1500 /* Loading DB? Return an error if the command is not INFO */
09e2d9ee 1501 if (server.loading && c->cmd->proc != infoCommand) {
97e7f8ae 1502 addReply(c, shared.loadingerr);
1503 return REDIS_OK;
1504 }
1505
4ab8695d 1506 /* Lua script too slow? Only allow SHUTDOWN NOSAVE and SCRIPT KILL. */
1507 if (server.lua_timedout &&
1508 !(c->cmd->proc != shutdownCommand &&
1509 c->argc == 2 &&
1510 tolower(((char*)c->argv[1]->ptr)[0]) == 'n') &&
1511 !(c->cmd->proc == scriptCommand &&
1512 c->argc == 2 &&
1513 tolower(((char*)c->argv[1]->ptr)[0]) == 'k'))
1514 {
115e3ff3 1515 addReply(c, shared.slowscripterr);
1516 return REDIS_OK;
1517 }
1518
e2641e09 1519 /* Exec the command */
1520 if (c->flags & REDIS_MULTI &&
09e2d9ee 1521 c->cmd->proc != execCommand && c->cmd->proc != discardCommand &&
1522 c->cmd->proc != multiCommand && c->cmd->proc != watchCommand)
e2641e09 1523 {
09e2d9ee 1524 queueMultiCommand(c);
e2641e09 1525 addReply(c,shared.queued);
1526 } else {
ce8b772b 1527 call(c,REDIS_CALL_FULL);
e2641e09 1528 }
cd8788f2 1529 return REDIS_OK;
e2641e09 1530}
1531
1532/*================================== Shutdown =============================== */
1533
4ab8695d 1534int prepareForShutdown(int flags) {
1535 int save = flags & REDIS_SHUTDOWN_SAVE;
1536 int nosave = flags & REDIS_SHUTDOWN_NOSAVE;
1537
adae85cd 1538 redisLog(REDIS_WARNING,"User requested shutdown...");
e2641e09 1539 /* Kill the saving child if there is a background saving in progress.
1540 We want to avoid race conditions, for instance our saving child may
1541 overwrite the synchronous saving did by SHUTDOWN. */
f48cd4b9 1542 if (server.rdb_child_pid != -1) {
adae85cd 1543 redisLog(REDIS_WARNING,"There is a child saving an .rdb. Killing it!");
f48cd4b9 1544 kill(server.rdb_child_pid,SIGKILL);
1545 rdbRemoveTempFile(server.rdb_child_pid);
e2641e09 1546 }
e394114d 1547 if (server.aof_state != REDIS_AOF_OFF) {
adae85cd 1548 /* Kill the AOF saving child as the AOF we already have may be longer
1549 * but contains the full dataset anyway. */
ff2145ad 1550 if (server.aof_child_pid != -1) {
adae85cd 1551 redisLog(REDIS_WARNING,
1552 "There is a child rewriting the AOF. Killing it!");
ff2145ad 1553 kill(server.aof_child_pid,SIGKILL);
adae85cd 1554 }
e2641e09 1555 /* Append only file: fsync() the AOF and exit */
adae85cd 1556 redisLog(REDIS_NOTICE,"Calling fsync() on the AOF file.");
ff2145ad 1557 aof_fsync(server.aof_fd);
adae85cd 1558 }
4ab8695d 1559 if ((server.saveparamslen > 0 && !nosave) || save) {
adae85cd 1560 redisLog(REDIS_NOTICE,"Saving the final RDB snapshot before exiting.");
e2641e09 1561 /* Snapshotting. Perform a SYNC SAVE and exit */
f48cd4b9 1562 if (rdbSave(server.rdb_filename) != REDIS_OK) {
e2641e09 1563 /* Ooops.. error saving! The best we can do is to continue
1564 * operating. Note that if there was a background saving process,
1565 * in the next cron() Redis will be notified that the background
1566 * saving aborted, handling special stuff like slaves pending for
1567 * synchronization... */
adae85cd 1568 redisLog(REDIS_WARNING,"Error trying to save the DB, can't exit.");
e2641e09 1569 return REDIS_ERR;
1570 }
1571 }
adae85cd 1572 if (server.daemonize) {
1573 redisLog(REDIS_NOTICE,"Removing the pid file.");
1574 unlink(server.pidfile);
1575 }
80e87a46 1576 /* Close the listening sockets. Apparently this allows faster restarts. */
1577 if (server.ipfd != -1) close(server.ipfd);
1578 if (server.sofd != -1) close(server.sofd);
56209f72
NF
1579 if (server.unixsocket) {
1580 redisLog(REDIS_NOTICE,"Removing the unix socket file.");
1581 unlink(server.unixsocket); /* don't care if this fails */
1582 }
80e87a46 1583
adae85cd 1584 redisLog(REDIS_WARNING,"Redis is now ready to exit, bye bye...");
e2641e09 1585 return REDIS_OK;
1586}
1587
1588/*================================== Commands =============================== */
1589
1590void authCommand(redisClient *c) {
ab52d1f4 1591 if (!server.requirepass) {
1592 addReplyError(c,"Client sent AUTH, but no password is set");
1593 } else if (!strcmp(c->argv[1]->ptr, server.requirepass)) {
e2641e09 1594 c->authenticated = 1;
1595 addReply(c,shared.ok);
1596 } else {
1597 c->authenticated = 0;
3ab20376 1598 addReplyError(c,"invalid password");
e2641e09 1599 }
1600}
1601
1602void pingCommand(redisClient *c) {
1603 addReply(c,shared.pong);
1604}
1605
1606void echoCommand(redisClient *c) {
1607 addReplyBulk(c,c->argv[1]);
1608}
1609
9494f1f1 1610void timeCommand(redisClient *c) {
1611 struct timeval tv;
1612
1613 /* gettimeofday() can only fail if &tv is a bad addresss so we
1614 * don't check for errors. */
1615 gettimeofday(&tv,NULL);
1616 addReplyMultiBulkLen(c,2);
1617 addReplyBulkLongLong(c,tv.tv_sec);
1618 addReplyBulkLongLong(c,tv.tv_usec);
1619}
1620
/* Convert an amount of bytes into a human readable string in the form
 * of 100B, 2G, 100M, 4K, and so forth.
 *
 * 's' is the destination buffer and is always written, NUL terminated.
 * The longest possible output is a 20 digits number followed by 'B', so
 * the buffer must have room for at least 22 bytes.
 * 'n' is the number of bytes to format.
 *
 * Values below 1024 are printed as an integer followed by 'B'. Larger
 * values are scaled by powers of 1024 and printed with two decimals and
 * the K, M, G, T or P suffix. Values too big for the P suffix are printed
 * as a plain number of bytes. */
void bytesToHuman(char *s, unsigned long long n) {
    double d;

    if (n < 1024) {
        /* Bytes */
        sprintf(s,"%lluB",n);
    } else if (n < (1024ULL*1024)) {
        d = (double)n/(1024);
        sprintf(s,"%.2fK",d);
    } else if (n < (1024ULL*1024*1024)) {
        d = (double)n/(1024ULL*1024);
        sprintf(s,"%.2fM",d);
    } else if (n < (1024ULL*1024*1024*1024)) {
        d = (double)n/(1024ULL*1024*1024);
        sprintf(s,"%.2fG",d);
    } else if (n < (1024ULL*1024*1024*1024*1024)) {
        d = (double)n/(1024ULL*1024*1024*1024);
        sprintf(s,"%.2fT",d);
    } else if (n < (1024ULL*1024*1024*1024*1024*1024)) {
        d = (double)n/(1024ULL*1024*1024*1024*1024);
        sprintf(s,"%.2fP",d);
    } else {
        /* Never leave the buffer untouched: callers print it with %s
         * without initializing it first. */
        sprintf(s,"%lluB",n);
    }
}
1641
1642/* Create the string returned by the INFO command. This is decoupled
1643 * by the INFO command itself as we need to report the same information
1644 * on memory corruption problems. */
1b085c9f 1645sds genRedisInfoString(char *section) {
1646 sds info = sdsempty();
56ff70f8 1647 time_t uptime = server.unixtime-server.stat_starttime;
d9cb288c 1648 int j, numcommands;
2b00385d 1649 struct rusage self_ru, c_ru;
7a1fd61e 1650 unsigned long lol, bib;
1b085c9f 1651 int allsections = 0, defsections = 0;
1652 int sections = 0;
1653
1654 if (section) {
1655 allsections = strcasecmp(section,"all") == 0;
0d808ef2 1656 defsections = strcasecmp(section,"default") == 0;
1b085c9f 1657 }
2b00385d 1658
1659 getrusage(RUSAGE_SELF, &self_ru);
1660 getrusage(RUSAGE_CHILDREN, &c_ru);
7a1fd61e 1661 getClientsMaxBuffers(&lol,&bib);
1b085c9f 1662
1663 /* Server */
1664 if (allsections || defsections || !strcasecmp(section,"server")) {
1665 if (sections++) info = sdscat(info,"\r\n");
e2641e09 1666 info = sdscatprintf(info,
1b085c9f 1667 "# Server\r\n"
1668 "redis_version:%s\r\n"
1669 "redis_git_sha1:%s\r\n"
1670 "redis_git_dirty:%d\r\n"
75eaac5c 1671 "arch_bits:%d\r\n"
1b085c9f 1672 "multiplexing_api:%s\r\n"
5db904bd 1673 "gcc_version:%d.%d.%d\r\n"
1b085c9f 1674 "process_id:%ld\r\n"
91d664d6 1675 "run_id:%s\r\n"
1b085c9f 1676 "tcp_port:%d\r\n"
1677 "uptime_in_seconds:%ld\r\n"
1678 "uptime_in_days:%ld\r\n"
1679 "lru_clock:%ld\r\n",
1680 REDIS_VERSION,
1681 redisGitSHA1(),
1682 strtol(redisGitDirty(),NULL,10) > 0,
75eaac5c 1683 server.arch_bits,
1b085c9f 1684 aeGetApiName(),
5db904bd 1685#ifdef __GNUC__
1686 __GNUC__,__GNUC_MINOR__,__GNUC_PATCHLEVEL__,
1687#else
1688 0,0,0,
1689#endif
1b085c9f 1690 (long) getpid(),
91d664d6 1691 server.runid,
1b085c9f 1692 server.port,
1693 uptime,
1694 uptime/(3600*24),
1695 (unsigned long) server.lruclock);
1696 }
1697
1698 /* Clients */
1699 if (allsections || defsections || !strcasecmp(section,"clients")) {
1700 if (sections++) info = sdscat(info,"\r\n");
1701 info = sdscatprintf(info,
1702 "# Clients\r\n"
3c08fdae 1703 "connected_clients:%lu\r\n"
1b085c9f 1704 "client_longest_output_list:%lu\r\n"
1705 "client_biggest_input_buf:%lu\r\n"
1706 "blocked_clients:%d\r\n",
1707 listLength(server.clients)-listLength(server.slaves),
1708 lol, bib,
1709 server.bpop_blocked_clients);
1710 }
1711
1712 /* Memory */
1713 if (allsections || defsections || !strcasecmp(section,"memory")) {
17b24ff3 1714 char hmem[64];
1715 char peak_hmem[64];
1716
1717 bytesToHuman(hmem,zmalloc_used_memory());
1718 bytesToHuman(peak_hmem,server.stat_peak_memory);
1b085c9f 1719 if (sections++) info = sdscat(info,"\r\n");
1720 info = sdscatprintf(info,
1721 "# Memory\r\n"
1722 "used_memory:%zu\r\n"
1723 "used_memory_human:%s\r\n"
1724 "used_memory_rss:%zu\r\n"
17b24ff3 1725 "used_memory_peak:%zu\r\n"
1726 "used_memory_peak_human:%s\r\n"
8c3402df 1727 "used_memory_lua:%lld\r\n"
1b085c9f 1728 "mem_fragmentation_ratio:%.2f\r\n"
32f99c51 1729 "mem_allocator:%s\r\n",
1b085c9f 1730 zmalloc_used_memory(),
1731 hmem,
1732 zmalloc_get_rss(),
17b24ff3 1733 server.stat_peak_memory,
1734 peak_hmem,
8c3402df 1735 ((long long)lua_gc(server.lua,LUA_GCCOUNT,0))*1024LL,
1b085c9f 1736 zmalloc_get_fragmentation_ratio(),
fec5a664 1737 ZMALLOC_LIB
12ebe2ac 1738 );
0d808ef2 1739 }
1740
1b085c9f 1741 /* Persistence */
1742 if (allsections || defsections || !strcasecmp(section,"persistence")) {
1743 if (sections++) info = sdscat(info,"\r\n");
e2641e09 1744 info = sdscatprintf(info,
1b085c9f 1745 "# Persistence\r\n"
1746 "loading:%d\r\n"
1747 "aof_enabled:%d\r\n"
1748 "changes_since_last_save:%lld\r\n"
1749 "bgsave_in_progress:%d\r\n"
1750 "last_save_time:%ld\r\n"
c25e7eaf 1751 "last_bgsave_status:%s\r\n"
1b085c9f 1752 "bgrewriteaof_in_progress:%d\r\n",
1753 server.loading,
e394114d 1754 server.aof_state != REDIS_AOF_OFF,
1b085c9f 1755 server.dirty,
f48cd4b9 1756 server.rdb_child_pid != -1,
1b085c9f 1757 server.lastsave,
c25e7eaf 1758 server.lastbgsave_status == REDIS_OK ? "ok" : "err",
ff2145ad 1759 server.aof_child_pid != -1);
1b085c9f 1760
e394114d 1761 if (server.aof_state != REDIS_AOF_OFF) {
d630abcd 1762 info = sdscatprintf(info,
1763 "aof_current_size:%lld\r\n"
1764 "aof_base_size:%lld\r\n"
e7ef418c 1765 "aof_pending_rewrite:%d\r\n"
1766 "aof_buffer_length:%zu\r\n"
81f32c7b 1767 "aof_pending_bio_fsync:%llu\r\n"
1768 "aof_delayed_fsync:%lu\r\n",
2c915bcf 1769 (long long) server.aof_current_size,
1770 (long long) server.aof_rewrite_base_size,
1771 server.aof_rewrite_scheduled,
ff2145ad 1772 sdslen(server.aof_buf),
81f32c7b 1773 bioPendingJobsOfType(REDIS_BIO_AOF_FSYNC),
1774 server.aof_delayed_fsync);
d630abcd 1775 }
1776
1b085c9f 1777 if (server.loading) {
1778 double perc;
1779 time_t eta, elapsed;
1780 off_t remaining_bytes = server.loading_total_bytes-
1781 server.loading_loaded_bytes;
1782
1783 perc = ((double)server.loading_loaded_bytes /
1784 server.loading_total_bytes) * 100;
1785
56ff70f8 1786 elapsed = server.unixtime-server.loading_start_time;
1b085c9f 1787 if (elapsed == 0) {
1788 eta = 1; /* A fake 1 second figure if we don't have
1789 enough info */
1790 } else {
1791 eta = (elapsed*remaining_bytes)/server.loading_loaded_bytes;
1792 }
1793
1794 info = sdscatprintf(info,
1795 "loading_start_time:%ld\r\n"
1796 "loading_total_bytes:%llu\r\n"
1797 "loading_loaded_bytes:%llu\r\n"
1798 "loading_loaded_perc:%.2f\r\n"
1799 "loading_eta_seconds:%ld\r\n"
1800 ,(unsigned long) server.loading_start_time,
1801 (unsigned long long) server.loading_total_bytes,
1802 (unsigned long long) server.loading_loaded_bytes,
1803 perc,
1804 eta
1805 );
1806 }
e2641e09 1807 }
1b085c9f 1808
1b085c9f 1809 /* Stats */
1810 if (allsections || defsections || !strcasecmp(section,"stats")) {
1811 if (sections++) info = sdscat(info,"\r\n");
97e7f8ae 1812 info = sdscatprintf(info,
1b085c9f 1813 "# Stats\r\n"
1814 "total_connections_received:%lld\r\n"
1815 "total_commands_processed:%lld\r\n"
250e7f69 1816 "instantaneous_ops_per_sec:%lld\r\n"
3c95e721 1817 "rejected_connections:%lld\r\n"
1b085c9f 1818 "expired_keys:%lld\r\n"
1819 "evicted_keys:%lld\r\n"
1820 "keyspace_hits:%lld\r\n"
1821 "keyspace_misses:%lld\r\n"
1822 "pubsub_channels:%ld\r\n"
3c08fdae 1823 "pubsub_patterns:%lu\r\n"
615e414c 1824 "latest_fork_usec:%lld\r\n",
1b085c9f 1825 server.stat_numconnections,
1826 server.stat_numcommands,
250e7f69 1827 getOperationsPerSecond(),
3c95e721 1828 server.stat_rejected_conn,
1b085c9f 1829 server.stat_expiredkeys,
1830 server.stat_evictedkeys,
1831 server.stat_keyspace_hits,
1832 server.stat_keyspace_misses,
1833 dictSize(server.pubsub_channels),
615e414c 1834 listLength(server.pubsub_patterns),
1835 server.stat_fork_time);
97e7f8ae 1836 }
67a1810b 1837
1b085c9f 1838 /* Replication */
1839 if (allsections || defsections || !strcasecmp(section,"replication")) {
1840 if (sections++) info = sdscat(info,"\r\n");
1841 info = sdscatprintf(info,
1842 "# Replication\r\n"
1843 "role:%s\r\n",
1844 server.masterhost == NULL ? "master" : "slave");
1845 if (server.masterhost) {
1846 info = sdscatprintf(info,
1847 "master_host:%s\r\n"
1848 "master_port:%d\r\n"
1849 "master_link_status:%s\r\n"
1850 "master_last_io_seconds_ago:%d\r\n"
1851 "master_sync_in_progress:%d\r\n"
1852 ,server.masterhost,
1853 server.masterport,
1844f990 1854 (server.repl_state == REDIS_REPL_CONNECTED) ?
1b085c9f 1855 "up" : "down",
1856 server.master ?
56ff70f8 1857 ((int)(server.unixtime-server.master->lastinteraction)) : -1,
1844f990 1858 server.repl_state == REDIS_REPL_TRANSFER
1b085c9f 1859 );
1860
1844f990 1861 if (server.repl_state == REDIS_REPL_TRANSFER) {
1b085c9f 1862 info = sdscatprintf(info,
1863 "master_sync_left_bytes:%ld\r\n"
1864 "master_sync_last_io_seconds_ago:%d\r\n"
1865 ,(long)server.repl_transfer_left,
56ff70f8 1866 (int)(server.unixtime-server.repl_transfer_lastio)
1b085c9f 1867 );
1868 }
07486df6 1869
1844f990 1870 if (server.repl_state != REDIS_REPL_CONNECTED) {
07486df6 1871 info = sdscatprintf(info,
1872 "master_link_down_since_seconds:%ld\r\n",
56ff70f8 1873 (long)server.unixtime-server.repl_down_since);
07486df6 1874 }
67a1810b 1875 }
1b085c9f 1876 info = sdscatprintf(info,
3c08fdae 1877 "connected_slaves:%lu\r\n",
1b085c9f 1878 listLength(server.slaves));
503d87a8 1879 if (listLength(server.slaves)) {
1880 int slaveid = 0;
1881 listNode *ln;
1882 listIter li;
1883
1884 listRewind(server.slaves,&li);
1885 while((ln = listNext(&li))) {
1886 redisClient *slave = listNodeValue(ln);
1887 char *state = NULL;
1888 char ip[32];
1889 int port;
1890
1891 if (anetPeerToString(slave->fd,ip,&port) == -1) continue;
1892 switch(slave->replstate) {
1893 case REDIS_REPL_WAIT_BGSAVE_START:
1894 case REDIS_REPL_WAIT_BGSAVE_END:
1895 state = "wait_bgsave";
1896 break;
1897 case REDIS_REPL_SEND_BULK:
1898 state = "send_bulk";
1899 break;
1900 case REDIS_REPL_ONLINE:
1901 state = "online";
1902 break;
1903 }
1904 if (state == NULL) continue;
1905 info = sdscatprintf(info,"slave%d:%s,%d,%s\r\n",
1906 slaveid,ip,port,state);
1907 slaveid++;
1908 }
1909 }
67a1810b 1910 }
67a1810b 1911
0d808ef2 1912 /* CPU */
1913 if (allsections || defsections || !strcasecmp(section,"cpu")) {
1b085c9f 1914 if (sections++) info = sdscat(info,"\r\n");
1915 info = sdscatprintf(info,
0d808ef2 1916 "# CPU\r\n"
1b085c9f 1917 "used_cpu_sys:%.2f\r\n"
1918 "used_cpu_user:%.2f\r\n"
5a9dd97c 1919 "used_cpu_sys_children:%.2f\r\n"
1920 "used_cpu_user_children:%.2f\r\n",
1b085c9f 1921 (float)self_ru.ru_stime.tv_sec+(float)self_ru.ru_stime.tv_usec/1000000,
d83eda48 1922 (float)self_ru.ru_utime.tv_sec+(float)self_ru.ru_utime.tv_usec/1000000,
1923 (float)c_ru.ru_stime.tv_sec+(float)c_ru.ru_stime.tv_usec/1000000,
1924 (float)c_ru.ru_utime.tv_sec+(float)c_ru.ru_utime.tv_usec/1000000);
0d808ef2 1925 }
1b085c9f 1926
0d808ef2 1927 /* cmdtime */
1928 if (allsections || !strcasecmp(section,"commandstats")) {
1929 if (sections++) info = sdscat(info,"\r\n");
1930 info = sdscatprintf(info, "# Commandstats\r\n");
d7ed7fd2 1931 numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1b085c9f 1932 for (j = 0; j < numcommands; j++) {
d7ed7fd2 1933 struct redisCommand *c = redisCommandTable+j;
0d808ef2 1934
d7ed7fd2 1935 if (!c->calls) continue;
1936 info = sdscatprintf(info,
1937 "cmdstat_%s:calls=%lld,usec=%lld,usec_per_call=%.2f\r\n",
1938 c->name, c->calls, c->microseconds,
1939 (c->calls == 0) ? 0 : ((float)c->microseconds/c->calls));
1b085c9f 1940 }
d9cb288c 1941 }
1942
1b085c9f 1943 /* Key space */
1944 if (allsections || defsections || !strcasecmp(section,"keyspace")) {
1945 if (sections++) info = sdscat(info,"\r\n");
1946 info = sdscatprintf(info, "# Keyspace\r\n");
1947 for (j = 0; j < server.dbnum; j++) {
1948 long long keys, vkeys;
e2641e09 1949
1b085c9f 1950 keys = dictSize(server.db[j].dict);
1951 vkeys = dictSize(server.db[j].expires);
1952 if (keys || vkeys) {
1953 info = sdscatprintf(info, "db%d:keys=%lld,expires=%lld\r\n",
1954 j, keys, vkeys);
1955 }
e2641e09 1956 }
1957 }
1958 return info;
1959}
1960
1961void infoCommand(redisClient *c) {
1b085c9f 1962 char *section = c->argc == 2 ? c->argv[1]->ptr : "default";
1963
1964 if (c->argc > 2) {
1965 addReply(c,shared.syntaxerr);
1966 return;
1967 }
1968 sds info = genRedisInfoString(section);
e2641e09 1969 addReplySds(c,sdscatprintf(sdsempty(),"$%lu\r\n",
1970 (unsigned long)sdslen(info)));
1971 addReplySds(c,info);
1972 addReply(c,shared.crlf);
1973}
1974
1975void monitorCommand(redisClient *c) {
1976 /* ignore MONITOR if aleady slave or in monitor mode */
1977 if (c->flags & REDIS_SLAVE) return;
1978
1979 c->flags |= (REDIS_SLAVE|REDIS_MONITOR);
1980 c->slaveseldb = 0;
1981 listAddNodeTail(server.monitors,c);
1982 addReply(c,shared.ok);
1983}
1984
1985/* ============================ Maxmemory directive ======================== */
1986
e2641e09 1987/* This function gets called when 'maxmemory' is set on the config file to limit
f6b32c14 1988 * the max memory used by the server, before processing a command.
e2641e09 1989 *
f6b32c14 1990 * The goal of the function is to free enough memory to keep Redis under the
1991 * configured memory limit.
e2641e09 1992 *
f6b32c14 1993 * The function starts calculating how many bytes should be freed to keep
1994 * Redis under the limit, and enters a loop selecting the best keys to
1995 * evict accordingly to the configured policy.
1996 *
1997 * If all the bytes needed to return back under the limit were freed the
1998 * function returns REDIS_OK, otherwise REDIS_ERR is returned, and the caller
1999 * should block the execution of commands that will result in more memory
2000 * used by the server.
e2641e09 2001 */
f6b32c14 2002int freeMemoryIfNeeded(void) {
2003 size_t mem_used, mem_tofree, mem_freed;
2004 int slaves = listLength(server.slaves);
2005
c1ef6ffe 2006 /* Remove the size of slaves output buffers and AOF buffer from the
2007 * count of used memory. */
f6b32c14 2008 mem_used = zmalloc_used_memory();
2009 if (slaves) {
2010 listIter li;
2011 listNode *ln;
2012
2013 listRewind(server.slaves,&li);
2014 while((ln = listNext(&li))) {
2015 redisClient *slave = listNodeValue(ln);
2016 unsigned long obuf_bytes = getClientOutputBufferMemoryUsage(slave);
2017 if (obuf_bytes > mem_used)
2018 mem_used = 0;
2019 else
2020 mem_used -= obuf_bytes;
2021 }
2022 }
c1ef6ffe 2023 if (server.aof_state != REDIS_AOF_OFF) {
2024 mem_used -= sdslen(server.aof_buf);
2025 mem_used -= sdslen(server.aof_rewrite_buf);
2026 }
5402c426 2027
f6b32c14 2028 /* Check if we are over the memory limit. */
2029 if (mem_used <= server.maxmemory) return REDIS_OK;
2030
2031 if (server.maxmemory_policy == REDIS_MAXMEMORY_NO_EVICTION)
2032 return REDIS_ERR; /* We need to free memory, but policy forbids. */
2033
2034 /* Compute how much memory we need to free. */
2035 mem_tofree = mem_used - server.maxmemory;
f6b32c14 2036 mem_freed = 0;
2037 while (mem_freed < mem_tofree) {
2038 int j, k, keys_freed = 0;
e2641e09 2039
165346ca 2040 for (j = 0; j < server.dbnum; j++) {
10c12171 2041 long bestval = 0; /* just to prevent warning */
165346ca 2042 sds bestkey = NULL;
2043 struct dictEntry *de;
2044 redisDb *db = server.db+j;
2045 dict *dict;
2046
2047 if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_LRU ||
2048 server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_RANDOM)
2049 {
2050 dict = server.db[j].dict;
2051 } else {
2052 dict = server.db[j].expires;
2053 }
2054 if (dictSize(dict) == 0) continue;
2055
2056 /* volatile-random and allkeys-random policy */
2057 if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_RANDOM ||
2058 server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_RANDOM)
2059 {
2060 de = dictGetRandomKey(dict);
c0ba9ebe 2061 bestkey = dictGetKey(de);
165346ca 2062 }
2063
2064 /* volatile-lru and allkeys-lru policy */
2065 else if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_LRU ||
2066 server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_LRU)
2067 {
2068 for (k = 0; k < server.maxmemory_samples; k++) {
2069 sds thiskey;
2070 long thisval;
2071 robj *o;
2072
2073 de = dictGetRandomKey(dict);
c0ba9ebe 2074 thiskey = dictGetKey(de);
0c2f75c6 2075 /* When policy is volatile-lru we need an additonal lookup
2076 * to locate the real key, as dict is set to db->expires. */
2077 if (server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_LRU)
2078 de = dictFind(db->dict, thiskey);
c0ba9ebe 2079 o = dictGetVal(de);
165346ca 2080 thisval = estimateObjectIdleTime(o);
2081
2082 /* Higher idle time is better candidate for deletion */
2083 if (bestkey == NULL || thisval > bestval) {
2084 bestkey = thiskey;
2085 bestval = thisval;
2086 }
2087 }
2088 }
2089
2090 /* volatile-ttl */
2091 else if (server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_TTL) {
2092 for (k = 0; k < server.maxmemory_samples; k++) {
2093 sds thiskey;
2094 long thisval;
2095
2096 de = dictGetRandomKey(dict);
c0ba9ebe 2097 thiskey = dictGetKey(de);
2098 thisval = (long) dictGetVal(de);
165346ca 2099
2100 /* Expire sooner (minor expire unix timestamp) is better
2101 * candidate for deletion */
2102 if (bestkey == NULL || thisval < bestval) {
2103 bestkey = thiskey;
2104 bestval = thisval;
2105 }
2106 }
2107 }
2108
2109 /* Finally remove the selected key. */
2110 if (bestkey) {
f6b32c14 2111 long long delta;
2112
165346ca 2113 robj *keyobj = createStringObject(bestkey,sdslen(bestkey));
452229b6 2114 propagateExpire(db,keyobj);
f6b32c14 2115 /* We compute the amount of memory freed by dbDelete() alone.
2116 * It is possible that actually the memory needed to propagate
2117 * the DEL in AOF and replication link is greater than the one
2118 * we are freeing removing the key, but we can't account for
2119 * that otherwise we would never exit the loop.
2120 *
2121 * AOF and Output buffer memory will be freed eventually so
2122 * we only care about memory used by the key space. */
2123 delta = (long long) zmalloc_used_memory();
165346ca 2124 dbDelete(db,keyobj);
f6b32c14 2125 delta -= (long long) zmalloc_used_memory();
f6b32c14 2126 mem_freed += delta;
f21779ff 2127 server.stat_evictedkeys++;
165346ca 2128 decrRefCount(keyobj);
f6b32c14 2129 keys_freed++;
2130
2131 /* When the memory to free starts to be big enough, we may
2132 * start spending so much time here that is impossible to
2133 * deliver data to the slaves fast enough, so we force the
2134 * transmission here inside the loop. */
8b7c3455 2135 if (slaves) flushSlavesOutputBuffers();
165346ca 2136 }
2137 }
b129c6df 2138 if (!keys_freed) return REDIS_ERR; /* nothing to free... */
165346ca 2139 }
f6b32c14 2140 return REDIS_OK;
e2641e09 2141}
2142
2143/* =================================== Main! ================================ */
2144
2145#ifdef __linux__
/* Read the first line of /proc/sys/vm/overcommit_memory and return it
 * converted with atoi(). Returns -1 when the file can't be opened or
 * nothing can be read from it. */
int linuxOvercommitMemoryValue(void) {
    char line[64];
    int value = -1;
    FILE *procfile = fopen("/proc/sys/vm/overcommit_memory","r");

    if (procfile == NULL) return -1;
    if (fgets(line,sizeof(line),procfile) != NULL) value = atoi(line);
    fclose(procfile);
    return value;
}
2159
2160void linuxOvercommitMemoryWarning(void) {
2161 if (linuxOvercommitMemoryValue() == 0) {
2162 redisLog(REDIS_WARNING,"WARNING overcommit_memory is set to 0! Background save may fail under low memory condition. To fix this issue add 'vm.overcommit_memory = 1' to /etc/sysctl.conf and then reboot or run the command 'sysctl vm.overcommit_memory=1' for this to take effect.");
2163 }
2164}
2165#endif /* __linux__ */
2166
695fe874 2167void createPidFile(void) {
2168 /* Try to write the pid file in a best-effort way. */
2169 FILE *fp = fopen(server.pidfile,"w");
2170 if (fp) {
8ce39260 2171 fprintf(fp,"%d\n",(int)getpid());
695fe874 2172 fclose(fp);
2173 }
2174}
2175
/* Detach from the caller: fork, let every process for which fork() did
 * not return 0 exit, start a new session and point the three standard
 * descriptors to /dev/null. */
void daemonize(void) {
    int devnull;

    if (fork() != 0) exit(0); /* parent exits */
    setsid(); /* create a new session */

    /* Every output goes to /dev/null. If Redis is daemonized but
     * the 'logfile' is set to 'stdout' in the configuration file
     * it will not log at all. */
    devnull = open("/dev/null", O_RDWR, 0);
    if (devnull == -1) return;

    dup2(devnull, STDIN_FILENO);
    dup2(devnull, STDOUT_FILENO);
    dup2(devnull, STDERR_FILENO);
    /* Close the extra descriptor unless it is one of the standard ones. */
    if (devnull > STDERR_FILENO) close(devnull);
}
2192
2193void version() {
188a17ed 2194 printf("Redis server v=%s sha=%s:%d malloc=%s\n", REDIS_VERSION,
2195 redisGitSHA1(), atoi(redisGitDirty()) > 0, ZMALLOC_LIB);
e2641e09 2196 exit(0);
2197}
2198
/* Print the command line help on stderr, then terminate the process with
 * exit code 1. */
void usage() {
    static const char *help[] = {
        "Usage: ./redis-server [/path/to/redis.conf] [options]\n",
        " ./redis-server - (read config from stdin)\n",
        " ./redis-server -v or --version\n",
        " ./redis-server -h or --help\n",
        " ./redis-server --test-memory <megabytes>\n\n",
        "Examples:\n",
        " ./redis-server (run the server with default conf)\n",
        " ./redis-server /etc/redis/6379.conf\n",
        " ./redis-server --port 7777\n",
        " ./redis-server --port 7777 --slaveof 127.0.0.1 8888\n",
        " ./redis-server /etc/myredis.conf --loglevel verbose\n"
    };
    size_t i;

    for (i = 0; i < sizeof(help)/sizeof(help[0]); i++)
        fputs(help[i],stderr);
    exit(1);
}
2213
996d503d 2214void redisAsciiArt(void) {
2215#include "asciilogo.h"
2216 char *buf = zmalloc(1024*16);
2217
2218 snprintf(buf,1024*16,ascii_logo,
2219 REDIS_VERSION,
2220 redisGitSHA1(),
2221 strtol(redisGitDirty(),NULL,10) > 0,
2222 (sizeof(long) == 8) ? "64" : "32",
571e257d 2223 "stand alone",
996d503d 2224 server.port,
2225 (long) getpid()
2226 );
2227 redisLogRaw(REDIS_NOTICE|REDIS_LOG_RAW,buf);
2228 zfree(buf);
2229}
2230
633a9410 2231static void sigtermHandler(int sig) {
e2641e09 2232 REDIS_NOTUSED(sig);
2233
633a9410 2234 redisLog(REDIS_WARNING,"Received SIGTERM, scheduling shutdown...");
e2641e09 2235 server.shutdown_asap = 1;
2236}
2237
633a9410 2238void setupSignalHandlers(void) {
e2641e09 2239 struct sigaction act;
2240
633a9410
PN
2241 /* When the SA_SIGINFO flag is set in sa_flags then sa_sigaction is used.
2242 * Otherwise, sa_handler is used. */
2243 sigemptyset(&act.sa_mask);
e2641e09 2244 act.sa_flags = SA_NODEFER | SA_ONSTACK | SA_RESETHAND;
2245 act.sa_handler = sigtermHandler;
633a9410 2246 sigaction(SIGTERM, &act, NULL);
e2641e09 2247
633a9410
PN
2248#ifdef HAVE_BACKTRACE
2249 sigemptyset(&act.sa_mask);
2250 act.sa_flags = SA_NODEFER | SA_ONSTACK | SA_RESETHAND | SA_SIGINFO;
2251 act.sa_sigaction = sigsegvHandler;
2252 sigaction(SIGSEGV, &act, NULL);
2253 sigaction(SIGBUS, &act, NULL);
2254 sigaction(SIGFPE, &act, NULL);
2255 sigaction(SIGILL, &act, NULL);
2256#endif
2257 return;
e2641e09 2258}
e2641e09 2259
78d6a02b 2260void memtest(size_t megabytes, int passes);
2261
39ca1713 2262int main(int argc, char **argv) {
2263 long long start;
a48c8d87 2264 struct timeval tv;
39ca1713 2265
06c5523a 2266 /* We need to initialize our libraries, and the server configuration. */
39ca1713 2267 zmalloc_enable_thread_safeness();
a48c8d87 2268 srand(time(NULL)^getpid());
2269 gettimeofday(&tv,NULL);
2270 dictSetHashFunctionSeed(tv.tv_sec^tv.tv_usec^getpid());
39ca1713 2271 initServerConfig();
a48c8d87 2272
67c6f0f6 2273 if (argc >= 2) {
2274 int j = 1; /* First option to parse in argv[] */
2275 sds options = sdsempty();
2276 char *configfile = NULL;
2277
2278 /* Handle special options --help and --version */
39ca1713 2279 if (strcmp(argv[1], "-v") == 0 ||
2280 strcmp(argv[1], "--version") == 0) version();
4c8bd905 2281 if (strcmp(argv[1], "--help") == 0 ||
2282 strcmp(argv[1], "-h") == 0) usage();
78d6a02b 2283 if (strcmp(argv[1], "--test-memory") == 0) {
2284 if (argc == 3) {
ea693f02 2285 memtest(atoi(argv[2]),50);
78d6a02b 2286 exit(0);
2287 } else {
2288 fprintf(stderr,"Please specify the amount of memory to test in megabytes.\n");
2289 fprintf(stderr,"Example: ./redis-server --test-memory 4096\n\n");
2290 exit(1);
2291 }
2292 }
2293
67c6f0f6 2294 /* First argument is the config file name? */
2295 if (argv[j][0] != '-' || argv[j][1] != '-')
2296 configfile = argv[j++];
2297 /* All the other options are parsed and conceptually appended to the
2298 * configuration file. For instance --port 6380 will generate the
2299 * string "port 6380\n" to be parsed after the actual file name
2300 * is parsed, if any. */
2301 while(j != argc) {
2302 if (argv[j][0] == '-' && argv[j][1] == '-') {
2303 /* Option name */
2304 if (sdslen(options)) options = sdscat(options,"\n");
2305 options = sdscat(options,argv[j]+2);
2306 options = sdscat(options," ");
2307 } else {
2308 /* Option argument */
2309 options = sdscatrepr(options,argv[j],strlen(argv[j]));
2310 options = sdscat(options," ");
2311 }
2312 j++;
2313 }
39ca1713 2314 resetServerSaveParams();
67c6f0f6 2315 loadServerConfig(configfile,options);
2316 sdsfree(options);
39ca1713 2317 } else {
2318 redisLog(REDIS_WARNING,"Warning: no config file specified, using the default config. In order to specify a config file use 'redis-server /path/to/redis.conf'");
2319 }
2320 if (server.daemonize) daemonize();
2321 initServer();
2322 if (server.daemonize) createPidFile();
2323 redisAsciiArt();
27ccb94a 2324 redisLog(REDIS_WARNING,"Server started, Redis version " REDIS_VERSION);
39ca1713 2325#ifdef __linux__
2326 linuxOvercommitMemoryWarning();
2327#endif
2328 start = ustime();
e394114d 2329 if (server.aof_state == REDIS_AOF_ON) {
2c915bcf 2330 if (loadAppendOnlyFile(server.aof_filename) == REDIS_OK)
39ca1713 2331 redisLog(REDIS_NOTICE,"DB loaded from append only file: %.3f seconds",(float)(ustime()-start)/1000000);
2332 } else {
f48cd4b9 2333 if (rdbLoad(server.rdb_filename) == REDIS_OK) {
39ca1713 2334 redisLog(REDIS_NOTICE,"DB loaded from disk: %.3f seconds",
2335 (float)(ustime()-start)/1000000);
2336 } else if (errno != ENOENT) {
2337 redisLog(REDIS_WARNING,"Fatal error loading the DB. Exiting.");
2338 exit(1);
2339 }
2340 }
2341 if (server.ipfd > 0)
2342 redisLog(REDIS_NOTICE,"The server is now ready to accept connections on port %d", server.port);
2343 if (server.sofd > 0)
2344 redisLog(REDIS_NOTICE,"The server is now ready to accept connections at %s", server.unixsocket);
2345 aeSetBeforeSleepProc(server.el,beforeSleep);
2346 aeMain(server.el);
2347 aeDeleteEventLoop(server.el);
2348 return 0;
2349}
2350
e2641e09 2351/* The End */