]> git.saurik.com Git - redis.git/blame - src/redis.c
Fixes for redisLogFromHandler().
[redis.git] / src / redis.c
CommitLineData
e2641e09 1/*
2 * Copyright (c) 2009-2010, Salvatore Sanfilippo <antirez at gmail dot com>
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are met:
7 *
8 * * Redistributions of source code must retain the above copyright notice,
9 * this list of conditions and the following disclaimer.
10 * * Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
13 * * Neither the name of Redis nor the names of its contributors may be used
14 * to endorse or promote products derived from this software without
15 * specific prior written permission.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
18 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
21 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
22 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
23 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
24 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
25 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
26 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
27 * POSSIBILITY OF SUCH DAMAGE.
28 */
29
30#include "redis.h"
daa70b17 31#include "slowlog.h"
8f61a72f 32#include "bio.h"
e2641e09 33
e2641e09 34#include <time.h>
35#include <signal.h>
36#include <sys/wait.h>
37#include <errno.h>
38#include <assert.h>
39#include <ctype.h>
40#include <stdarg.h>
e2641e09 41#include <arpa/inet.h>
42#include <sys/stat.h>
43#include <fcntl.h>
44#include <sys/time.h>
45#include <sys/resource.h>
46#include <sys/uio.h>
47#include <limits.h>
48#include <float.h>
49#include <math.h>
2b00385d 50#include <sys/resource.h>
e2641e09 51
52/* Our shared "common" objects */
53
54struct sharedObjectsStruct shared;
55
c74b7c77 56/* Global vars that are actually used as constants. The following double
e2641e09 57 * values are used for double on-disk serialization, and are initialized
58 * at runtime to avoid strange compiler optimizations. */
59
60double R_Zero, R_PosInf, R_NegInf, R_Nan;
61
62/*================================= Globals ================================= */
63
64/* Global vars */
65struct redisServer server; /* server global state */
66struct redisCommand *commandTable;
5d02b00f 67
7501c66f 68/* Our command table.
69 *
70 * Every entry is composed of the following fields:
71 *
72 * name: a string representing the command name.
73 * function: pointer to the C function implementing the command.
74 * arity: number of arguments, it is possible to use -N to say >= N
75 * sflags: command flags as string. See below for a table of flags.
76 * flags: flags as bitmask. Computed by Redis using the 'sflags' field.
77 * get_keys_proc: an optional function to get key arguments from a command.
78 * This is only used when the following three fields are not
79 * enough to specify what arguments are keys.
80 * first_key_index: first argument that is a key
81 * last_key_index: last argument that is a key
82 * key_step: step to get all the keys from first to last argument. For instance
83 * in MSET the step is two since arguments are key,val,key,val,...
84 * microseconds: microseconds of total execution time for this command.
85 * calls: total number of calls of this command.
86 *
87 * The flags, microseconds and calls fields are computed by Redis and should
88 * always be set to zero.
89 *
90 * Command flags are expressed using strings where every character represents
91 * a flag. Later the populateCommandTable() function will take care of
92 * populating the real 'flags' field using this characters.
5d02b00f 93 *
94 * This is the meaning of the flags:
95 *
96 * w: write command (may modify the key space).
97 * r: read command (will never modify the key space).
98 * m: may increase memory usage once called. Don't allow if out of memory.
99 * a: admin command, like SAVE or SHUTDOWN.
100 * p: Pub/Sub related command.
 * f: force replication of this command, regardless of server.dirty.
102 * s: command not allowed in scripts.
7e14a208 103 * R: random command. Command is not deterministic, that is, the same command
b60ed6e8 104 * with the same arguments, with the same key space, may have different
548efd91 105 * results. For instance SPOP and RANDOMKEY are two random commands.
106 * S: Sort command output array if called from script, so that the output
107 * is deterministic.
108 */
d7ed7fd2 109struct redisCommand redisCommandTable[] = {
5d02b00f 110 {"get",getCommand,2,"r",0,NULL,1,1,1,0,0},
111 {"set",setCommand,3,"wm",0,noPreloadGetKeys,1,1,1,0,0},
112 {"setnx",setnxCommand,3,"wm",0,noPreloadGetKeys,1,1,1,0,0},
39da5d1f 113 {"setex",setexCommand,4,"wm",0,noPreloadGetKeys,1,1,1,0,0},
114 {"psetex",psetexCommand,4,"wm",0,noPreloadGetKeys,1,1,1,0,0},
5d02b00f 115 {"append",appendCommand,3,"wm",0,NULL,1,1,1,0,0},
116 {"strlen",strlenCommand,2,"r",0,NULL,1,1,1,0,0},
117 {"del",delCommand,-2,"w",0,noPreloadGetKeys,1,-1,1,0,0},
118 {"exists",existsCommand,2,"r",0,NULL,1,1,1,0,0},
119 {"setbit",setbitCommand,4,"wm",0,NULL,1,1,1,0,0},
120 {"getbit",getbitCommand,3,"r",0,NULL,1,1,1,0,0},
121 {"setrange",setrangeCommand,4,"wm",0,NULL,1,1,1,0,0},
122 {"getrange",getrangeCommand,4,"r",0,NULL,1,1,1,0,0},
123 {"substr",getrangeCommand,4,"r",0,NULL,1,1,1,0,0},
124 {"incr",incrCommand,2,"wm",0,NULL,1,1,1,0,0},
125 {"decr",decrCommand,2,"wm",0,NULL,1,1,1,0,0},
126 {"mget",mgetCommand,-2,"r",0,NULL,1,-1,1,0,0},
127 {"rpush",rpushCommand,-3,"wm",0,NULL,1,1,1,0,0},
128 {"lpush",lpushCommand,-3,"wm",0,NULL,1,1,1,0,0},
129 {"rpushx",rpushxCommand,3,"wm",0,NULL,1,1,1,0,0},
130 {"lpushx",lpushxCommand,3,"wm",0,NULL,1,1,1,0,0},
131 {"linsert",linsertCommand,5,"wm",0,NULL,1,1,1,0,0},
132 {"rpop",rpopCommand,2,"w",0,NULL,1,1,1,0,0},
133 {"lpop",lpopCommand,2,"w",0,NULL,1,1,1,0,0},
e41677b4 134 {"brpop",brpopCommand,-3,"ws",0,NULL,1,1,1,0,0},
135 {"brpoplpush",brpoplpushCommand,4,"wms",0,NULL,1,2,1,0,0},
136 {"blpop",blpopCommand,-3,"ws",0,NULL,1,-2,1,0,0},
5d02b00f 137 {"llen",llenCommand,2,"r",0,NULL,1,1,1,0,0},
138 {"lindex",lindexCommand,3,"r",0,NULL,1,1,1,0,0},
139 {"lset",lsetCommand,4,"wm",0,NULL,1,1,1,0,0},
140 {"lrange",lrangeCommand,4,"r",0,NULL,1,1,1,0,0},
141 {"ltrim",ltrimCommand,4,"w",0,NULL,1,1,1,0,0},
142 {"lrem",lremCommand,4,"w",0,NULL,1,1,1,0,0},
143 {"rpoplpush",rpoplpushCommand,3,"wm",0,NULL,1,2,1,0,0},
144 {"sadd",saddCommand,-3,"wm",0,NULL,1,1,1,0,0},
145 {"srem",sremCommand,-3,"w",0,NULL,1,1,1,0,0},
146 {"smove",smoveCommand,4,"w",0,NULL,1,2,1,0,0},
147 {"sismember",sismemberCommand,3,"r",0,NULL,1,1,1,0,0},
148 {"scard",scardCommand,2,"r",0,NULL,1,1,1,0,0},
15ef6053 149 {"spop",spopCommand,2,"wRs",0,NULL,1,1,1,0,0},
b60ed6e8 150 {"srandmember",srandmemberCommand,2,"rR",0,NULL,1,1,1,0,0},
548efd91 151 {"sinter",sinterCommand,-2,"rS",0,NULL,1,-1,1,0,0},
1bcfa0f6 152 {"sinterstore",sinterstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
548efd91 153 {"sunion",sunionCommand,-2,"rS",0,NULL,1,-1,1,0,0},
1bcfa0f6 154 {"sunionstore",sunionstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
548efd91 155 {"sdiff",sdiffCommand,-2,"rS",0,NULL,1,-1,1,0,0},
1bcfa0f6 156 {"sdiffstore",sdiffstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
548efd91 157 {"smembers",sinterCommand,2,"rS",0,NULL,1,1,1,0,0},
5d02b00f 158 {"zadd",zaddCommand,-4,"wm",0,NULL,1,1,1,0,0},
159 {"zincrby",zincrbyCommand,4,"wm",0,NULL,1,1,1,0,0},
160 {"zrem",zremCommand,-3,"w",0,NULL,1,1,1,0,0},
161 {"zremrangebyscore",zremrangebyscoreCommand,4,"w",0,NULL,1,1,1,0,0},
162 {"zremrangebyrank",zremrangebyrankCommand,4,"w",0,NULL,1,1,1,0,0},
163 {"zunionstore",zunionstoreCommand,-4,"wm",0,zunionInterGetKeys,0,0,0,0,0},
164 {"zinterstore",zinterstoreCommand,-4,"wm",0,zunionInterGetKeys,0,0,0,0,0},
165 {"zrange",zrangeCommand,-4,"r",0,NULL,1,1,1,0,0},
166 {"zrangebyscore",zrangebyscoreCommand,-4,"r",0,NULL,1,1,1,0,0},
167 {"zrevrangebyscore",zrevrangebyscoreCommand,-4,"r",0,NULL,1,1,1,0,0},
168 {"zcount",zcountCommand,4,"r",0,NULL,1,1,1,0,0},
169 {"zrevrange",zrevrangeCommand,-4,"r",0,NULL,1,1,1,0,0},
170 {"zcard",zcardCommand,2,"r",0,NULL,1,1,1,0,0},
171 {"zscore",zscoreCommand,3,"r",0,NULL,1,1,1,0,0},
172 {"zrank",zrankCommand,3,"r",0,NULL,1,1,1,0,0},
173 {"zrevrank",zrevrankCommand,3,"r",0,NULL,1,1,1,0,0},
174 {"hset",hsetCommand,4,"wm",0,NULL,1,1,1,0,0},
175 {"hsetnx",hsetnxCommand,4,"wm",0,NULL,1,1,1,0,0},
176 {"hget",hgetCommand,3,"r",0,NULL,1,1,1,0,0},
177 {"hmset",hmsetCommand,-4,"wm",0,NULL,1,1,1,0,0},
178 {"hmget",hmgetCommand,-3,"r",0,NULL,1,1,1,0,0},
179 {"hincrby",hincrbyCommand,4,"wm",0,NULL,1,1,1,0,0},
68bfe993 180 {"hincrbyfloat",hincrbyfloatCommand,4,"wm",0,NULL,1,1,1,0,0},
5d02b00f 181 {"hdel",hdelCommand,-3,"w",0,NULL,1,1,1,0,0},
182 {"hlen",hlenCommand,2,"r",0,NULL,1,1,1,0,0},
548efd91 183 {"hkeys",hkeysCommand,2,"rS",0,NULL,1,1,1,0,0},
184 {"hvals",hvalsCommand,2,"rS",0,NULL,1,1,1,0,0},
5d02b00f 185 {"hgetall",hgetallCommand,2,"r",0,NULL,1,1,1,0,0},
186 {"hexists",hexistsCommand,3,"r",0,NULL,1,1,1,0,0},
187 {"incrby",incrbyCommand,3,"wm",0,NULL,1,1,1,0,0},
188 {"decrby",decrbyCommand,3,"wm",0,NULL,1,1,1,0,0},
5574b53e 189 {"incrbyfloat",incrbyfloatCommand,3,"wm",0,NULL,1,1,1,0,0},
5d02b00f 190 {"getset",getsetCommand,3,"wm",0,NULL,1,1,1,0,0},
191 {"mset",msetCommand,-3,"wm",0,NULL,1,-1,2,0,0},
192 {"msetnx",msetnxCommand,-3,"wm",0,NULL,1,-1,2,0,0},
b60ed6e8 193 {"randomkey",randomkeyCommand,1,"rR",0,NULL,0,0,0,0,0},
5d02b00f 194 {"select",selectCommand,2,"r",0,NULL,0,0,0,0,0},
195 {"move",moveCommand,3,"w",0,NULL,1,1,1,0,0},
196 {"rename",renameCommand,3,"w",0,renameGetKeys,1,2,1,0,0},
197 {"renamenx",renamenxCommand,3,"w",0,renameGetKeys,1,2,1,0,0},
12d293ca 198 {"expire",expireCommand,3,"w",0,NULL,1,1,1,0,0},
199 {"expireat",expireatCommand,3,"w",0,NULL,1,1,1,0,0},
200 {"pexpire",pexpireCommand,3,"w",0,NULL,1,1,1,0,0},
201 {"pexpireat",pexpireatCommand,3,"w",0,NULL,1,1,1,0,0},
548efd91 202 {"keys",keysCommand,2,"rS",0,NULL,0,0,0,0,0},
5d02b00f 203 {"dbsize",dbsizeCommand,1,"r",0,NULL,0,0,0,0,0},
e41677b4 204 {"auth",authCommand,2,"rs",0,NULL,0,0,0,0,0},
5d02b00f 205 {"ping",pingCommand,1,"r",0,NULL,0,0,0,0,0},
206 {"echo",echoCommand,2,"r",0,NULL,0,0,0,0,0},
e41677b4 207 {"save",saveCommand,1,"ars",0,NULL,0,0,0,0,0},
5d02b00f 208 {"bgsave",bgsaveCommand,1,"ar",0,NULL,0,0,0,0,0},
209 {"bgrewriteaof",bgrewriteaofCommand,1,"ar",0,NULL,0,0,0,0,0},
4ab8695d 210 {"shutdown",shutdownCommand,-1,"ar",0,NULL,0,0,0,0,0},
5d02b00f 211 {"lastsave",lastsaveCommand,1,"r",0,NULL,0,0,0,0,0},
212 {"type",typeCommand,2,"r",0,NULL,1,1,1,0,0},
b60ed6e8 213 {"multi",multiCommand,1,"rs",0,NULL,0,0,0,0,0},
05406168 214 {"exec",execCommand,1,"s",0,NULL,0,0,0,0,0},
b60ed6e8 215 {"discard",discardCommand,1,"rs",0,NULL,0,0,0,0,0},
216 {"sync",syncCommand,1,"ars",0,NULL,0,0,0,0,0},
5d02b00f 217 {"flushdb",flushdbCommand,1,"w",0,NULL,0,0,0,0,0},
218 {"flushall",flushallCommand,1,"w",0,NULL,0,0,0,0,0},
2c861050 219 {"sort",sortCommand,-2,"wmS",0,NULL,1,1,1,0,0},
5d02b00f 220 {"info",infoCommand,-1,"r",0,NULL,0,0,0,0,0},
b60ed6e8 221 {"monitor",monitorCommand,1,"ars",0,NULL,0,0,0,0,0},
12d293ca 222 {"ttl",ttlCommand,2,"r",0,NULL,1,1,1,0,0},
223 {"pttl",pttlCommand,2,"r",0,NULL,1,1,1,0,0},
5d02b00f 224 {"persist",persistCommand,2,"w",0,NULL,1,1,1,0,0},
b60ed6e8 225 {"slaveof",slaveofCommand,3,"aws",0,NULL,0,0,0,0,0},
38bb4522 226 {"debug",debugCommand,-2,"as",0,NULL,0,0,0,0,0},
5d02b00f 227 {"config",configCommand,-2,"ar",0,NULL,0,0,0,0,0},
b60ed6e8 228 {"subscribe",subscribeCommand,-2,"rps",0,NULL,0,0,0,0,0},
229 {"unsubscribe",unsubscribeCommand,-1,"rps",0,NULL,0,0,0,0,0},
230 {"psubscribe",psubscribeCommand,-2,"rps",0,NULL,0,0,0,0,0},
231 {"punsubscribe",punsubscribeCommand,-1,"rps",0,NULL,0,0,0,0,0},
6e6bbac7 232 {"publish",publishCommand,3,"pf",0,NULL,0,0,0,0,0},
b60ed6e8 233 {"watch",watchCommand,-2,"rs",0,noPreloadGetKeys,1,-1,1,0,0},
234 {"unwatch",unwatchCommand,1,"rs",0,NULL,0,0,0,0,0},
7afc3a96 235 {"restore",restoreCommand,4,"awm",0,NULL,1,1,1,0,0},
5d02b00f 236 {"migrate",migrateCommand,6,"aw",0,NULL,0,0,0,0,0},
1bcfa0f6 237 {"dump",dumpCommand,2,"ar",0,NULL,1,1,1,0,0},
238 {"object",objectCommand,-2,"r",0,NULL,2,2,2,0,0},
5d02b00f 239 {"client",clientCommand,-2,"ar",0,NULL,0,0,0,0,0},
05406168 240 {"eval",evalCommand,-3,"s",0,zunionInterGetKeys,0,0,0,0,0},
241 {"evalsha",evalShaCommand,-3,"s",0,zunionInterGetKeys,0,0,0,0,0},
070e3945 242 {"slowlog",slowlogCommand,-2,"r",0,NULL,0,0,0,0,0},
9494f1f1 243 {"script",scriptCommand,-2,"ras",0,NULL,0,0,0,0,0},
244 {"time",timeCommand,1,"rR",0,NULL,0,0,0,0,0}
e2641e09 245};
246
247/*============================ Utility functions ============================ */
248
9c104c68 249/* Low level logging. To use only for very big messages, otherwise
250 * redisLog() is to prefer. */
251void redisLogRaw(int level, const char *msg) {
e1a586ee
JH
252 const int syslogLevelMap[] = { LOG_DEBUG, LOG_INFO, LOG_NOTICE, LOG_WARNING };
253 const char *c = ".-*#";
254 time_t now = time(NULL);
e2641e09 255 FILE *fp;
23072961 256 char buf[64];
996d503d 257 int rawmode = (level & REDIS_LOG_RAW);
23072961 258
996d503d 259 level &= 0xff; /* clear flags */
23072961 260 if (level < server.verbosity) return;
e2641e09 261
262 fp = (server.logfile == NULL) ? stdout : fopen(server.logfile,"a");
263 if (!fp) return;
264
996d503d 265 if (rawmode) {
266 fprintf(fp,"%s",msg);
267 } else {
268 strftime(buf,sizeof(buf),"%d %b %H:%M:%S",localtime(&now));
269 fprintf(fp,"[%d] %s %c %s\n",(int)getpid(),buf,c[level],msg);
270 }
e1a586ee
JH
271 fflush(fp);
272
e2641e09 273 if (server.logfile) fclose(fp);
e1a586ee
JH
274
275 if (server.syslog_enabled) syslog(syslogLevelMap[level], "%s", msg);
e2641e09 276}
277
9c104c68 278/* Like redisLogRaw() but with printf-alike support. This is the funciton that
279 * is used across the code. The raw version is only used in order to dump
280 * the INFO output on crash. */
281void redisLog(int level, const char *fmt, ...) {
282 va_list ap;
283 char msg[REDIS_MAX_LOGMSG_LEN];
284
996d503d 285 if ((level&0xff) < server.verbosity) return;
9c104c68 286
287 va_start(ap, fmt);
288 vsnprintf(msg, sizeof(msg), fmt, ap);
289 va_end(ap);
290
291 redisLogRaw(level,msg);
292}
293
be4f8ccc 294/* Log a fixed message without printf-alike capabilities, in a way that is
295 * safe to call from a signal handler.
296 *
297 * We actually use this only for signals that are not fatal from the point
298 * of view of Redis. Signals that are going to kill the server anyway and
299 * where we need printf-alike features are served by redisLog(). */
300void redisLogFromHandler(int level, const char *msg) {
301 int fd;
302 char buf[64];
303
304 if ((level&0xff) < server.verbosity ||
305 (server.logfile == NULL && server.daemonize)) return;
306 fd = server.logfile ?
307 open(server.logfile, O_APPEND|O_CREAT|O_WRONLY, 0644) :
e51f7d2c 308 STDOUT_FILENO;
be4f8ccc 309 if (fd == -1) return;
310 ll2string(buf,sizeof(buf),getpid());
311 write(fd,"[",1);
312 write(fd,buf,strlen(buf));
313 write(fd," | signal handler] (",20);
314 ll2string(buf,sizeof(buf),time(NULL));
315 write(fd,buf,strlen(buf));
316 write(fd,") ",2);
317 write(fd,msg,strlen(msg));
318 write(fd,"\n",1);
e51f7d2c 319 if (server.logfile) close(fd);
be4f8ccc 320}
321
e2641e09 322/* Redis generally does not try to recover from out of memory conditions
323 * when allocating objects or strings, it is not clear if it will be possible
324 * to report this condition to the client since the networking layer itself
325 * is based on heap allocation for send buffers, so we simply abort.
326 * At least the code will be simpler to read... */
327void oom(const char *msg) {
328 redisLog(REDIS_WARNING, "%s: Out of memory\n",msg);
329 sleep(1);
330 abort();
331}
332
/* Current UNIX time expressed in microseconds, as reported by
 * gettimeofday(): whole seconds scaled to microseconds plus the
 * sub-second microsecond part. */
long long ustime(void) {
    struct timeval now;

    gettimeofday(&now, NULL);
    return ((long long)now.tv_sec)*1000000 + now.tv_usec;
}
343
/* Current UNIX time in milliseconds: ustime() with the sub-millisecond
 * part discarded by integer division. */
long long mstime(void) {
    long long microseconds = ustime();

    return microseconds/1000;
}
348
e2641e09 349/*====================== Hash table type implementation ==================== */
350
/* This is a hash table type that uses the SDS dynamic strings library as
 * keys and redis objects as values (objects can hold SDS strings,
 * lists, sets). */
354
/* Destructor callback that releases 'val' with zfree().
 * 'privdata' is ignored. */
void dictVanillaFree(void *privdata, void *val) {
    DICT_NOTUSED(privdata);
    zfree(val);
}
360
361void dictListDestructor(void *privdata, void *val)
362{
363 DICT_NOTUSED(privdata);
364 listRelease((list*)val);
365}
366
367int dictSdsKeyCompare(void *privdata, const void *key1,
368 const void *key2)
369{
370 int l1,l2;
371 DICT_NOTUSED(privdata);
372
373 l1 = sdslen((sds)key1);
374 l2 = sdslen((sds)key2);
375 if (l1 != l2) return 0;
376 return memcmp(key1, key2, l1) == 0;
377}
378
/* Case insensitive key comparison, used for the command lookup table.
 * Returns 1 when strcasecmp() reports the two keys as equal, 0 otherwise.
 * 'privdata' is ignored. */
int dictSdsKeyCaseCompare(void *privdata, const void *key1, const void *key2) {
    int differ;

    DICT_NOTUSED(privdata);

    differ = strcasecmp(key1, key2);
    return differ == 0;
}
387
/* Destructor callback for Redis objects: drops one reference from 'val'
 * via decrRefCount(). NULL values are tolerated and ignored (values of
 * swapped out keys are set to NULL). 'privdata' is ignored. */
void dictRedisObjectDestructor(void *privdata, void *val) {
    DICT_NOTUSED(privdata);

    if (val != NULL) decrRefCount(val);
}
395
/* Destructor callback for sds strings: 'val' is released with sdsfree().
 * 'privdata' is ignored. */
void dictSdsDestructor(void *privdata, void *val) {
    DICT_NOTUSED(privdata);

    sdsfree(val);
}
402
403int dictObjKeyCompare(void *privdata, const void *key1,
404 const void *key2)
405{
406 const robj *o1 = key1, *o2 = key2;
407 return dictSdsKeyCompare(privdata,o1->ptr,o2->ptr);
408}
409
410unsigned int dictObjHash(const void *key) {
411 const robj *o = key;
412 return dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
413}
414
/* Hash callback for sds keys: hashes all sdslen() bytes of the string. */
unsigned int dictSdsHash(const void *key) {
    int len = sdslen((char*)key);

    return dictGenHashFunction((unsigned char*)key, len);
}
418
/* Hash callback for sds keys, using dictGenCaseHashFunction() over all
 * sdslen() bytes of the string. Used by the command table dict type
 * together with the case insensitive key comparison. */
unsigned int dictSdsCaseHash(const void *key) {
    int len = sdslen((char*)key);

    return dictGenCaseHashFunction((unsigned char*)key, len);
}
422
e2641e09 423int dictEncObjKeyCompare(void *privdata, const void *key1,
424 const void *key2)
425{
426 robj *o1 = (robj*) key1, *o2 = (robj*) key2;
427 int cmp;
428
429 if (o1->encoding == REDIS_ENCODING_INT &&
430 o2->encoding == REDIS_ENCODING_INT)
431 return o1->ptr == o2->ptr;
432
433 o1 = getDecodedObject(o1);
434 o2 = getDecodedObject(o2);
435 cmp = dictSdsKeyCompare(privdata,o1->ptr,o2->ptr);
436 decrRefCount(o1);
437 decrRefCount(o2);
438 return cmp;
439}
440
441unsigned int dictEncObjHash(const void *key) {
442 robj *o = (robj*) key;
443
444 if (o->encoding == REDIS_ENCODING_RAW) {
445 return dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
446 } else {
447 if (o->encoding == REDIS_ENCODING_INT) {
448 char buf[32];
449 int len;
450
451 len = ll2string(buf,32,(long)o->ptr);
452 return dictGenHashFunction((unsigned char*)buf, len);
453 } else {
454 unsigned int hash;
455
456 o = getDecodedObject(o);
457 hash = dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
458 decrRefCount(o);
459 return hash;
460 }
461 }
462}
463
4dd444bb 464/* Sets type hash table */
e2641e09 465dictType setDictType = {
466 dictEncObjHash, /* hash function */
467 NULL, /* key dup */
468 NULL, /* val dup */
469 dictEncObjKeyCompare, /* key compare */
470 dictRedisObjectDestructor, /* key destructor */
471 NULL /* val destructor */
472};
473
474/* Sorted sets hash (note: a skiplist is used in addition to the hash table) */
475dictType zsetDictType = {
476 dictEncObjHash, /* hash function */
477 NULL, /* key dup */
478 NULL, /* val dup */
479 dictEncObjKeyCompare, /* key compare */
480 dictRedisObjectDestructor, /* key destructor */
69ef89f2 481 NULL /* val destructor */
e2641e09 482};
483
484/* Db->dict, keys are sds strings, vals are Redis objects. */
485dictType dbDictType = {
486 dictSdsHash, /* hash function */
487 NULL, /* key dup */
488 NULL, /* val dup */
489 dictSdsKeyCompare, /* key compare */
490 dictSdsDestructor, /* key destructor */
491 dictRedisObjectDestructor /* val destructor */
492};
493
494/* Db->expires */
495dictType keyptrDictType = {
496 dictSdsHash, /* hash function */
497 NULL, /* key dup */
498 NULL, /* val dup */
499 dictSdsKeyCompare, /* key compare */
500 NULL, /* key destructor */
501 NULL /* val destructor */
502};
503
1b1f47c9 504/* Command table. sds string -> command struct pointer. */
505dictType commandTableDictType = {
506 dictSdsCaseHash, /* hash function */
507 NULL, /* key dup */
508 NULL, /* val dup */
509 dictSdsKeyCaseCompare, /* key compare */
510 dictSdsDestructor, /* key destructor */
511 NULL /* val destructor */
512};
513
e2641e09 514/* Hash type hash table (note that small hashes are represented with zimpaps) */
515dictType hashDictType = {
516 dictEncObjHash, /* hash function */
517 NULL, /* key dup */
518 NULL, /* val dup */
519 dictEncObjKeyCompare, /* key compare */
520 dictRedisObjectDestructor, /* key destructor */
521 dictRedisObjectDestructor /* val destructor */
522};
523
524/* Keylist hash table type has unencoded redis objects as keys and
525 * lists as values. It's used for blocking operations (BLPOP) and to
526 * map swapped keys to a list of clients waiting for this keys to be loaded. */
527dictType keylistDictType = {
528 dictObjHash, /* hash function */
529 NULL, /* key dup */
530 NULL, /* val dup */
531 dictObjKeyCompare, /* key compare */
532 dictRedisObjectDestructor, /* key destructor */
533 dictListDestructor /* val destructor */
534};
535
536int htNeedsResize(dict *dict) {
537 long long size, used;
538
539 size = dictSlots(dict);
540 used = dictSize(dict);
541 return (size && used && size > DICT_HT_INITIAL_SIZE &&
542 (used*100/size < REDIS_HT_MINFILL));
543}
544
545/* If the percentage of used slots in the HT reaches REDIS_HT_MINFILL
546 * we resize the hash table to save memory */
547void tryResizeHashTables(void) {
548 int j;
549
550 for (j = 0; j < server.dbnum; j++) {
551 if (htNeedsResize(server.db[j].dict))
552 dictResize(server.db[j].dict);
553 if (htNeedsResize(server.db[j].expires))
554 dictResize(server.db[j].expires);
555 }
556}
557
558/* Our hash table implementation performs rehashing incrementally while
559 * we write/read from the hash table. Still if the server is idle, the hash
560 * table will use two tables for a long time. So we try to use 1 millisecond
561 * of CPU time at every serverCron() loop in order to rehash some key. */
562void incrementallyRehash(void) {
563 int j;
564
565 for (j = 0; j < server.dbnum; j++) {
566 if (dictIsRehashing(server.db[j].dict)) {
567 dictRehashMilliseconds(server.db[j].dict,1);
568 break; /* already used our millisecond for this loop... */
569 }
570 }
571}
572
573/* This function is called once a background process of some kind terminates,
574 * as we want to avoid resizing the hash tables when there is a child in order
575 * to play well with copy-on-write (otherwise when a resize happens lots of
576 * memory pages are copied). The goal of this function is to update the ability
577 * for dict.c to resize the hash tables accordingly to the fact we have o not
578 * running childs. */
579void updateDictResizePolicy(void) {
f48cd4b9 580 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1)
e2641e09 581 dictEnableResize();
582 else
583 dictDisableResize();
584}
585
586/* ======================= Cron: called every 100 ms ======================== */
587
bcf2995c 588/* Try to expire a few timed out keys. The algorithm used is adaptive and
589 * will use few CPU cycles if there are few expiring keys, otherwise
590 * it will get more aggressive to avoid that too much memory is used by
591 * keys that can be removed from the keyspace. */
592void activeExpireCycle(void) {
593 int j;
594
595 for (j = 0; j < server.dbnum; j++) {
596 int expired;
597 redisDb *db = server.db+j;
598
599 /* Continue to expire if at the end of the cycle more than 25%
600 * of the keys were expired. */
601 do {
602 long num = dictSize(db->expires);
4be855e7 603 long long now = mstime();
bcf2995c 604
605 expired = 0;
606 if (num > REDIS_EXPIRELOOKUPS_PER_CRON)
607 num = REDIS_EXPIRELOOKUPS_PER_CRON;
608 while (num--) {
609 dictEntry *de;
4be855e7 610 long long t;
bcf2995c 611
612 if ((de = dictGetRandomKey(db->expires)) == NULL) break;
4be855e7 613 t = dictGetSignedIntegerVal(de);
bcf2995c 614 if (now > t) {
c0ba9ebe 615 sds key = dictGetKey(de);
bcf2995c 616 robj *keyobj = createStringObject(key,sdslen(key));
617
618 propagateExpire(db,keyobj);
619 dbDelete(db,keyobj);
620 decrRefCount(keyobj);
621 expired++;
622 server.stat_expiredkeys++;
623 }
624 }
625 } while (expired > REDIS_EXPIRELOOKUPS_PER_CRON/4);
626 }
627}
628
165346ca 629void updateLRUClock(void) {
56ff70f8 630 server.lruclock = (server.unixtime/REDIS_LRU_CLOCK_RESOLUTION) &
165346ca 631 REDIS_LRU_CLOCK_MAX;
632}
bcf2995c 633
250e7f69 634
635/* Add a sample to the operations per second array of samples. */
636void trackOperationsPerSecond(void) {
637 long long t = mstime() - server.ops_sec_last_sample_time;
638 long long ops = server.stat_numcommands - server.ops_sec_last_sample_ops;
639 long long ops_sec;
640
641 ops_sec = t > 0 ? (ops*1000/t) : 0;
642
643 server.ops_sec_samples[server.ops_sec_idx] = ops_sec;
644 server.ops_sec_idx = (server.ops_sec_idx+1) % REDIS_OPS_SEC_SAMPLES;
645 server.ops_sec_last_sample_time = mstime();
646 server.ops_sec_last_sample_ops = server.stat_numcommands;
647}
648
649/* Return the mean of all the samples. */
650long long getOperationsPerSecond(void) {
651 int j;
652 long long sum = 0;
653
654 for (j = 0; j < REDIS_OPS_SEC_SAMPLES; j++)
655 sum += server.ops_sec_samples[j];
656 return sum / REDIS_OPS_SEC_SAMPLES;
657}
658
f1eaf572 659/* Check for timeouts. Returns non-zero if the client was terminated */
660int clientsCronHandleTimeout(redisClient *c) {
9fa9ccb0 661 time_t now = server.unixtime;
cfa4b57c 662
663 if (server.maxidletime &&
664 !(c->flags & REDIS_SLAVE) && /* no timeout for slaves */
665 !(c->flags & REDIS_MASTER) && /* no timeout for masters */
666 !(c->flags & REDIS_BLOCKED) && /* no timeout for BLPOP */
667 dictSize(c->pubsub_channels) == 0 && /* no timeout for pubsub */
668 listLength(c->pubsub_patterns) == 0 &&
669 (now - c->lastinteraction > server.maxidletime))
670 {
671 redisLog(REDIS_VERBOSE,"Closing idle client");
672 freeClient(c);
f1eaf572 673 return 1;
cfa4b57c 674 } else if (c->flags & REDIS_BLOCKED) {
675 if (c->bpop.timeout != 0 && c->bpop.timeout < now) {
676 addReply(c,shared.nullmultibulk);
677 unblockClientWaitingData(c);
678 }
679 }
f1eaf572 680 return 0;
cfa4b57c 681}
682
9fa9ccb0 683/* The client query buffer is an sds.c string that can end with a lot of
f1eaf572 684 * free space not used, this function reclaims space if needed.
685 *
686 * The funciton always returns 0 as it never terminates the client. */
687int clientsCronResizeQueryBuffer(redisClient *c) {
9fa9ccb0 688 size_t querybuf_size = sdsAllocSize(c->querybuf);
689 time_t idletime = server.unixtime - c->lastinteraction;
690
691 /* There are two conditions to resize the query buffer:
692 * 1) Query buffer is > BIG_ARG and too big for latest peak.
693 * 2) Client is inactive and the buffer is bigger than 1k. */
694 if (((querybuf_size > REDIS_MBULK_BIG_ARG) &&
695 (querybuf_size/(c->querybuf_peak+1)) > 2) ||
696 (querybuf_size > 1024 && idletime > 2))
697 {
698 /* Only resize the query buffer if it is actually wasting space. */
699 if (sdsavail(c->querybuf) > 1024) {
700 c->querybuf = sdsRemoveFreeSpace(c->querybuf);
701 }
702 }
703 /* Reset the peak again to capture the peak memory usage in the next
704 * cycle. */
705 c->querybuf_peak = 0;
f1eaf572 706 return 0;
9fa9ccb0 707}
708
cfa4b57c 709void clientsCron(void) {
710 /* Make sure to process at least 1/100 of clients per call.
711 * Since this function is called 10 times per second we are sure that
712 * in the worst case we process all the clients in 10 seconds.
713 * In normal conditions (a reasonable number of clients) we process
714 * all the clients in a shorter time. */
9fa9ccb0 715 int numclients = listLength(server.clients);
716 int iterations = numclients/100;
cfa4b57c 717
9fa9ccb0 718 if (iterations < 50)
719 iterations = (numclients < 50) ? numclients : 50;
cfa4b57c 720 while(listLength(server.clients) && iterations--) {
721 redisClient *c;
722 listNode *head;
723
724 /* Rotate the list, take the current head, process.
725 * This way if the client must be removed from the list it's the
726 * first element and we don't incur into O(N) computation. */
727 listRotate(server.clients);
728 head = listFirst(server.clients);
729 c = listNodeValue(head);
f1eaf572 730 /* The following functions do different service checks on the client.
731 * The protocol is that they return non-zero if the client was
732 * terminated. */
733 if (clientsCronHandleTimeout(c)) continue;
734 if (clientsCronResizeQueryBuffer(c)) continue;
cfa4b57c 735 }
736}
737
e2641e09 738int serverCron(struct aeEventLoop *eventLoop, long long id, void *clientData) {
89a1433e 739 int j, loops = server.cronloops;
e2641e09 740 REDIS_NOTUSED(eventLoop);
741 REDIS_NOTUSED(id);
742 REDIS_NOTUSED(clientData);
743
fc030ac7 744 /* Software watchdog: deliver the SIGALRM that will reach the signal
745 * handler if we don't return here fast enough. */
746 if (server.watchdog_period) watchdogScheduleSignal(server.watchdog_period);
747
e2641e09 748 /* We take a cached value of the unix time in the global state because
749 * with virtual memory and aging there is to store the current time
750 * in objects at every object access, and accuracy is not needed.
751 * To access a global var is faster than calling time(NULL) */
752 server.unixtime = time(NULL);
4f06867a 753
250e7f69 754 trackOperationsPerSecond();
755
ef59a8bc 756 /* We have just 22 bits per object for LRU information.
165346ca 757 * So we use an (eventually wrapping) LRU clock with 10 seconds resolution.
758 * 2^22 bits with 10 seconds resoluton is more or less 1.5 years.
e2641e09 759 *
165346ca 760 * Note that even if this will wrap after 1.5 years it's not a problem,
ef59a8bc 761 * everything will still work but just some object will appear younger
165346ca 762 * to Redis. But for this to happen a given object should never be touched
763 * for 1.5 years.
764 *
765 * Note that you can change the resolution altering the
766 * REDIS_LRU_CLOCK_RESOLUTION define.
e2641e09 767 */
165346ca 768 updateLRUClock();
e2641e09 769
17b24ff3 770 /* Record the max memory used since the server was started. */
771 if (zmalloc_used_memory() > server.stat_peak_memory)
772 server.stat_peak_memory = zmalloc_used_memory();
773
e2641e09 774 /* We received a SIGTERM, shutting down here in a safe way, as it is
775 * not ok doing so inside the signal handler. */
776 if (server.shutdown_asap) {
4ab8695d 777 if (prepareForShutdown(0) == REDIS_OK) exit(0);
e2641e09 778 redisLog(REDIS_WARNING,"SIGTERM received but errors trying to shut down the server, check the logs for more information");
779 }
780
781 /* Show some info about non-empty databases */
782 for (j = 0; j < server.dbnum; j++) {
783 long long size, used, vkeys;
784
785 size = dictSlots(server.db[j].dict);
786 used = dictSize(server.db[j].dict);
787 vkeys = dictSize(server.db[j].expires);
788 if (!(loops % 50) && (used || vkeys)) {
789 redisLog(REDIS_VERBOSE,"DB %d: %lld keys (%lld volatile) in %lld slots HT.",j,used,vkeys,size);
790 /* dictPrintStats(server.dict); */
791 }
792 }
793
794 /* We don't want to resize the hash tables while a bacground saving
795 * is in progress: the saving child is created using fork() that is
796 * implemented with a copy-on-write semantic in most modern systems, so
797 * if we resize the HT while there is the saving child at work actually
798 * a lot of memory movements in the parent will cause a lot of pages
799 * copied. */
f48cd4b9 800 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1) {
e2641e09 801 if (!(loops % 10)) tryResizeHashTables();
802 if (server.activerehashing) incrementallyRehash();
803 }
804
805 /* Show information about connected clients */
806 if (!(loops % 50)) {
807 redisLog(REDIS_VERBOSE,"%d clients connected (%d slaves), %zu bytes in use",
808 listLength(server.clients)-listLength(server.slaves),
809 listLength(server.slaves),
ca734d17 810 zmalloc_used_memory());
e2641e09 811 }
812
cfa4b57c 813 /* We need to do a few operations on clients asynchronously. */
814 clientsCron();
e2641e09 815
b333e239 816 /* Start a scheduled AOF rewrite if this was requested by the user while
817 * a BGSAVE was in progress. */
f48cd4b9 818 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1 &&
2c915bcf 819 server.aof_rewrite_scheduled)
b333e239 820 {
821 rewriteAppendOnlyFileBackground();
822 }
823
f03fe802 824 /* Check if a background saving or AOF rewrite in progress terminated. */
f48cd4b9 825 if (server.rdb_child_pid != -1 || server.aof_child_pid != -1) {
e2641e09 826 int statloc;
827 pid_t pid;
828
829 if ((pid = wait3(&statloc,WNOHANG,NULL)) != 0) {
36c17a53 830 int exitcode = WEXITSTATUS(statloc);
831 int bysignal = 0;
832
833 if (WIFSIGNALED(statloc)) bysignal = WTERMSIG(statloc);
834
f48cd4b9 835 if (pid == server.rdb_child_pid) {
36c17a53 836 backgroundSaveDoneHandler(exitcode,bysignal);
e2641e09 837 } else {
36c17a53 838 backgroundRewriteDoneHandler(exitcode,bysignal);
e2641e09 839 }
840 updateDictResizePolicy();
841 }
c9d0c362 842 } else {
b333e239 843 /* If there is not a background saving/rewrite in progress check if
844 * we have to save/rewrite now */
e2641e09 845 for (j = 0; j < server.saveparamslen; j++) {
846 struct saveparam *sp = server.saveparams+j;
847
848 if (server.dirty >= sp->changes &&
56ff70f8 849 server.unixtime-server.lastsave > sp->seconds) {
e2641e09 850 redisLog(REDIS_NOTICE,"%d changes in %d seconds. Saving...",
851 sp->changes, sp->seconds);
f48cd4b9 852 rdbSaveBackground(server.rdb_filename);
e2641e09 853 break;
854 }
855 }
b333e239 856
857 /* Trigger an AOF rewrite if needed */
f48cd4b9 858 if (server.rdb_child_pid == -1 &&
ff2145ad 859 server.aof_child_pid == -1 &&
2c915bcf 860 server.aof_rewrite_perc &&
861 server.aof_current_size > server.aof_rewrite_min_size)
b333e239 862 {
2c915bcf 863 long long base = server.aof_rewrite_base_size ?
864 server.aof_rewrite_base_size : 1;
865 long long growth = (server.aof_current_size*100/base) - 100;
866 if (growth >= server.aof_rewrite_perc) {
19b46c9a 867 redisLog(REDIS_NOTICE,"Starting automatic rewriting of AOF on %lld%% growth",growth);
b333e239 868 rewriteAppendOnlyFileBackground();
869 }
870 }
e2641e09 871 }
872
db3c2a4f 873
874 /* If we postponed an AOF buffer flush, let's try to do it every time the
875 * cron function is called. */
876 if (server.aof_flush_postponed_start) flushAppendOnlyFile(0);
877
bcf2995c 878 /* Expire a few keys per cycle, only if this is a master.
879 * On slaves we wait for DEL operations synthesized by the master
880 * in order to guarantee a strict consistency. */
881 if (server.masterhost == NULL) activeExpireCycle();
e2641e09 882
8c43e663 883 /* Close clients that need to be closed asynchronous */
884 freeClientsInAsyncFreeQueue();
885
f4aa600b 886 /* Replication cron function -- used to reconnect to master and
887 * to detect transfer failures. */
62ec599c 888 if (!(loops % 10)) replicationCron();
f4aa600b 889
89a1433e 890 server.cronloops++;
e2641e09 891 return 100;
892}
893
894/* This function gets called every time Redis is entering the
895 * main loop of the event driven library, that is, before to sleep
896 * for ready file descriptors. */
897void beforeSleep(struct aeEventLoop *eventLoop) {
898 REDIS_NOTUSED(eventLoop);
a4ce7581
PN
899 listNode *ln;
900 redisClient *c;
e2641e09 901
a4ce7581
PN
902 /* Try to process pending commands for clients that were just unblocked. */
903 while (listLength(server.unblocked_clients)) {
904 ln = listFirst(server.unblocked_clients);
905 redisAssert(ln != NULL);
906 c = ln->value;
907 listDelNode(server.unblocked_clients,ln);
3bcffcbe 908 c->flags &= ~REDIS_UNBLOCKED;
a4ce7581
PN
909
910 /* Process remaining data in the input buffer. */
00010fa9 911 if (c->querybuf && sdslen(c->querybuf) > 0) {
912 server.current_client = c;
a4ce7581 913 processInputBuffer(c);
00010fa9 914 server.current_client = NULL;
915 }
a4ce7581
PN
916 }
917
e2641e09 918 /* Write the AOF buffer on disk */
db3c2a4f 919 flushAppendOnlyFile(0);
e2641e09 920}
921
922/* =========================== Server initialization ======================== */
923
924void createSharedObjects(void) {
925 int j;
926
927 shared.crlf = createObject(REDIS_STRING,sdsnew("\r\n"));
928 shared.ok = createObject(REDIS_STRING,sdsnew("+OK\r\n"));
929 shared.err = createObject(REDIS_STRING,sdsnew("-ERR\r\n"));
930 shared.emptybulk = createObject(REDIS_STRING,sdsnew("$0\r\n\r\n"));
931 shared.czero = createObject(REDIS_STRING,sdsnew(":0\r\n"));
932 shared.cone = createObject(REDIS_STRING,sdsnew(":1\r\n"));
933 shared.cnegone = createObject(REDIS_STRING,sdsnew(":-1\r\n"));
934 shared.nullbulk = createObject(REDIS_STRING,sdsnew("$-1\r\n"));
935 shared.nullmultibulk = createObject(REDIS_STRING,sdsnew("*-1\r\n"));
936 shared.emptymultibulk = createObject(REDIS_STRING,sdsnew("*0\r\n"));
937 shared.pong = createObject(REDIS_STRING,sdsnew("+PONG\r\n"));
938 shared.queued = createObject(REDIS_STRING,sdsnew("+QUEUED\r\n"));
939 shared.wrongtypeerr = createObject(REDIS_STRING,sdsnew(
940 "-ERR Operation against a key holding the wrong kind of value\r\n"));
941 shared.nokeyerr = createObject(REDIS_STRING,sdsnew(
942 "-ERR no such key\r\n"));
943 shared.syntaxerr = createObject(REDIS_STRING,sdsnew(
944 "-ERR syntax error\r\n"));
945 shared.sameobjecterr = createObject(REDIS_STRING,sdsnew(
946 "-ERR source and destination objects are the same\r\n"));
947 shared.outofrangeerr = createObject(REDIS_STRING,sdsnew(
948 "-ERR index out of range\r\n"));
7229d60d 949 shared.noscripterr = createObject(REDIS_STRING,sdsnew(
950 "-NOSCRIPT No matching script. Please use EVAL.\r\n"));
97e7f8ae 951 shared.loadingerr = createObject(REDIS_STRING,sdsnew(
952 "-LOADING Redis is loading the dataset in memory\r\n"));
115e3ff3 953 shared.slowscripterr = createObject(REDIS_STRING,sdsnew(
4ab8695d 954 "-BUSY Redis is busy running a script. You can only call SCRIPT KILL or SHUTDOWN NOSAVE.\r\n"));
c25e7eaf 955 shared.bgsaveerr = createObject(REDIS_STRING,sdsnew(
05406168 956 "-MISCONF Redis is configured to save RDB snapshots, but is currently not able to persist on disk. Commands that may modify the data set are disabled. Please check Redis logs for details about the error.\r\n"));
957 shared.roslaveerr = createObject(REDIS_STRING,sdsnew(
958 "-READONLY You can't write against a read only slave.\r\n"));
3f7ad833 959 shared.oomerr = createObject(REDIS_STRING,sdsnew(
960 "-OOM command not allowed when used memory > 'maxmemory'.\r\n"));
e2641e09 961 shared.space = createObject(REDIS_STRING,sdsnew(" "));
962 shared.colon = createObject(REDIS_STRING,sdsnew(":"));
963 shared.plus = createObject(REDIS_STRING,sdsnew("+"));
964 shared.select0 = createStringObject("select 0\r\n",10);
965 shared.select1 = createStringObject("select 1\r\n",10);
966 shared.select2 = createStringObject("select 2\r\n",10);
967 shared.select3 = createStringObject("select 3\r\n",10);
968 shared.select4 = createStringObject("select 4\r\n",10);
969 shared.select5 = createStringObject("select 5\r\n",10);
970 shared.select6 = createStringObject("select 6\r\n",10);
971 shared.select7 = createStringObject("select 7\r\n",10);
972 shared.select8 = createStringObject("select 8\r\n",10);
973 shared.select9 = createStringObject("select 9\r\n",10);
974 shared.messagebulk = createStringObject("$7\r\nmessage\r\n",13);
975 shared.pmessagebulk = createStringObject("$8\r\npmessage\r\n",14);
976 shared.subscribebulk = createStringObject("$9\r\nsubscribe\r\n",15);
977 shared.unsubscribebulk = createStringObject("$11\r\nunsubscribe\r\n",18);
978 shared.psubscribebulk = createStringObject("$10\r\npsubscribe\r\n",17);
979 shared.punsubscribebulk = createStringObject("$12\r\npunsubscribe\r\n",19);
355f8591 980 shared.del = createStringObject("DEL",3);
c1db214e 981 shared.rpop = createStringObject("RPOP",4);
982 shared.lpop = createStringObject("LPOP",4);
e2641e09 983 for (j = 0; j < REDIS_SHARED_INTEGERS; j++) {
984 shared.integers[j] = createObject(REDIS_STRING,(void*)(long)j);
985 shared.integers[j]->encoding = REDIS_ENCODING_INT;
986 }
355f8591 987 for (j = 0; j < REDIS_SHARED_BULKHDR_LEN; j++) {
988 shared.mbulkhdr[j] = createObject(REDIS_STRING,
989 sdscatprintf(sdsempty(),"*%d\r\n",j));
990 shared.bulkhdr[j] = createObject(REDIS_STRING,
991 sdscatprintf(sdsempty(),"$%d\r\n",j));
992 }
e2641e09 993}
994
995void initServerConfig() {
91d664d6 996 getRandomHexChars(server.runid,REDIS_RUN_ID_SIZE);
997 server.runid[REDIS_RUN_ID_SIZE] = '\0';
75eaac5c 998 server.arch_bits = (sizeof(long) == 8) ? 64 : 32;
e2641e09 999 server.port = REDIS_SERVERPORT;
a5639e7d 1000 server.bindaddr = NULL;
5d10923f 1001 server.unixsocket = NULL;
85238765 1002 server.unixsocketperm = 0;
a5639e7d
PN
1003 server.ipfd = -1;
1004 server.sofd = -1;
1005 server.dbnum = REDIS_DEFAULT_DBNUM;
c6f9ee88 1006 server.verbosity = REDIS_NOTICE;
e2641e09 1007 server.maxidletime = REDIS_MAXIDLETIME;
becf5fdb 1008 server.client_max_querybuf_len = REDIS_MAX_QUERYBUF_LEN;
e2641e09 1009 server.saveparams = NULL;
97e7f8ae 1010 server.loading = 0;
e2641e09 1011 server.logfile = NULL; /* NULL = log on standard output */
e1a586ee
JH
1012 server.syslog_enabled = 0;
1013 server.syslog_ident = zstrdup("redis");
1014 server.syslog_facility = LOG_LOCAL0;
e2641e09 1015 server.daemonize = 0;
e394114d 1016 server.aof_state = REDIS_AOF_OFF;
2c915bcf 1017 server.aof_fsync = AOF_FSYNC_EVERYSEC;
1018 server.aof_no_fsync_on_rewrite = 0;
1019 server.aof_rewrite_perc = REDIS_AOF_REWRITE_PERC;
1020 server.aof_rewrite_min_size = REDIS_AOF_REWRITE_MIN_SIZE;
1021 server.aof_rewrite_base_size = 0;
1022 server.aof_rewrite_scheduled = 0;
ff2145ad 1023 server.aof_last_fsync = time(NULL);
81f32c7b 1024 server.aof_delayed_fsync = 0;
ff2145ad 1025 server.aof_fd = -1;
1026 server.aof_selected_db = -1; /* Make sure the first time will not match */
db3c2a4f 1027 server.aof_flush_postponed_start = 0;
e2641e09 1028 server.pidfile = zstrdup("/var/run/redis.pid");
f48cd4b9 1029 server.rdb_filename = zstrdup("dump.rdb");
2c915bcf 1030 server.aof_filename = zstrdup("appendonly.aof");
e2641e09 1031 server.requirepass = NULL;
f48cd4b9 1032 server.rdb_compression = 1;
e2641e09 1033 server.activerehashing = 1;
58732c23 1034 server.maxclients = REDIS_MAX_CLIENTS;
5fa95ad7 1035 server.bpop_blocked_clients = 0;
e2641e09 1036 server.maxmemory = 0;
165346ca 1037 server.maxmemory_policy = REDIS_MAXMEMORY_VOLATILE_LRU;
1038 server.maxmemory_samples = 3;
ebd85e9a
PN
1039 server.hash_max_ziplist_entries = REDIS_HASH_MAX_ZIPLIST_ENTRIES;
1040 server.hash_max_ziplist_value = REDIS_HASH_MAX_ZIPLIST_VALUE;
e2641e09 1041 server.list_max_ziplist_entries = REDIS_LIST_MAX_ZIPLIST_ENTRIES;
1042 server.list_max_ziplist_value = REDIS_LIST_MAX_ZIPLIST_VALUE;
96ffb2fe 1043 server.set_max_intset_entries = REDIS_SET_MAX_INTSET_ENTRIES;
3ea204e1
PN
1044 server.zset_max_ziplist_entries = REDIS_ZSET_MAX_ZIPLIST_ENTRIES;
1045 server.zset_max_ziplist_value = REDIS_ZSET_MAX_ZIPLIST_VALUE;
e2641e09 1046 server.shutdown_asap = 0;
aeecbdfa 1047 server.repl_ping_slave_period = REDIS_REPL_PING_SLAVE_PERIOD;
1048 server.repl_timeout = REDIS_REPL_TIMEOUT;
4ab8695d 1049 server.lua_caller = NULL;
eeffcf38 1050 server.lua_time_limit = REDIS_LUA_TIME_LIMIT;
070e3945 1051 server.lua_client = NULL;
115e3ff3 1052 server.lua_timedout = 0;
e2641e09 1053
95506e46 1054 updateLRUClock();
e2641e09 1055 resetServerSaveParams();
1056
1057 appendServerSaveParams(60*60,1); /* save after 1 hour and 1 change */
1058 appendServerSaveParams(300,100); /* save after 5 minutes and 100 changes */
1059 appendServerSaveParams(60,10000); /* save after 1 minute and 10000 changes */
1060 /* Replication related */
e2641e09 1061 server.masterauth = NULL;
1062 server.masterhost = NULL;
1063 server.masterport = 6379;
1064 server.master = NULL;
1844f990 1065 server.repl_state = REDIS_REPL_NONE;
890a2ed9 1066 server.repl_syncio_timeout = REDIS_REPL_SYNCIO_TIMEOUT;
4ebfc455 1067 server.repl_serve_stale_data = 1;
05406168 1068 server.repl_slave_ro = 1;
07486df6 1069 server.repl_down_since = -1;
e2641e09 1070
7eac2a75 1071 /* Client output buffer limits */
1072 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].hard_limit_bytes = 0;
1073 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].soft_limit_bytes = 0;
1074 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].soft_limit_seconds = 0;
c8a607f2 1075 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].hard_limit_bytes = 1024*1024*256;
1076 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].soft_limit_bytes = 1024*1024*64;
7eac2a75 1077 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].soft_limit_seconds = 60;
c8a607f2 1078 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].hard_limit_bytes = 1024*1024*32;
1079 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].soft_limit_bytes = 1024*1024*8;
7eac2a75 1080 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].soft_limit_seconds = 60;
1081
e2641e09 1082 /* Double constants initialization */
1083 R_Zero = 0.0;
1084 R_PosInf = 1.0/R_Zero;
1085 R_NegInf = -1.0/R_Zero;
1086 R_Nan = R_Zero/R_Zero;
8d3e063a 1087
1088 /* Command table -- we intiialize it here as it is part of the
1089 * initial configuration, since command names may be changed via
1090 * redis.conf using the rename-command directive. */
1091 server.commands = dictCreate(&commandTableDictType,NULL);
1092 populateCommandTable();
1093 server.delCommand = lookupCommandByCString("del");
1094 server.multiCommand = lookupCommandByCString("multi");
eeb34eff 1095 server.lpushCommand = lookupCommandByCString("lpush");
daa70b17 1096
1097 /* Slow log */
1098 server.slowlog_log_slower_than = REDIS_SLOWLOG_LOG_SLOWER_THAN;
1099 server.slowlog_max_len = REDIS_SLOWLOG_MAX_LEN;
fa5af017 1100
fc030ac7 1101 /* Debugging */
fa5af017 1102 server.assert_failed = "<no assertion failed>";
1103 server.assert_file = "<no file>";
1104 server.assert_line = 0;
1105 server.bug_report_start = 0;
fc030ac7 1106 server.watchdog_period = 0;
e2641e09 1107}
1108
e074416b 1109/* This function will try to raise the max number of open files accordingly to
1110 * the configured max number of clients. It will also account for 32 additional
1111 * file descriptors as we need a few more for persistence, listening
1112 * sockets, log files and so forth.
1113 *
1114 * If it will not be possible to set the limit accordingly to the configured
1115 * max number of clients, the function will do the reverse setting
1116 * server.maxclients to the value that we can actually handle. */
1117void adjustOpenFilesLimit(void) {
1118 rlim_t maxfiles = server.maxclients+32;
1119 struct rlimit limit;
1120
1121 if (maxfiles < 1024) maxfiles = 1024;
1122 if (getrlimit(RLIMIT_NOFILE,&limit) == -1) {
1123 redisLog(REDIS_WARNING,"Unable to obtain the current NOFILE limit (%s), assuming 1024 and setting the max clients configuration accordingly.",
1124 strerror(errno));
1125 server.maxclients = 1024-32;
1126 } else {
1127 rlim_t oldlimit = limit.rlim_cur;
1128
1129 /* Set the max number of files if the current limit is not enough
1130 * for our needs. */
1131 if (oldlimit < maxfiles) {
1132 limit.rlim_cur = maxfiles;
1133 limit.rlim_max = maxfiles;
1134 if (setrlimit(RLIMIT_NOFILE,&limit) == -1) {
1135 server.maxclients = oldlimit-32;
1136 redisLog(REDIS_WARNING,"Unable to set the max number of files limit to %d (%s), setting the max clients configuration to %d.",
1137 (int) maxfiles, strerror(errno), (int) server.maxclients);
1138 } else {
1139 redisLog(REDIS_NOTICE,"Max number of open files set to %d",
1140 (int) maxfiles);
1141 }
1142 }
1143 }
1144}
1145
e2641e09 1146void initServer() {
1147 int j;
1148
1149 signal(SIGHUP, SIG_IGN);
1150 signal(SIGPIPE, SIG_IGN);
633a9410 1151 setupSignalHandlers();
e2641e09 1152
e1a586ee
JH
1153 if (server.syslog_enabled) {
1154 openlog(server.syslog_ident, LOG_PID | LOG_NDELAY | LOG_NOWAIT,
1155 server.syslog_facility);
1156 }
1157
00010fa9 1158 server.current_client = NULL;
e2641e09 1159 server.clients = listCreate();
7eac2a75 1160 server.clients_to_close = listCreate();
e2641e09 1161 server.slaves = listCreate();
1162 server.monitors = listCreate();
a4ce7581 1163 server.unblocked_clients = listCreate();
cea8c5cd 1164
e2641e09 1165 createSharedObjects();
e074416b 1166 adjustOpenFilesLimit();
1167 server.el = aeCreateEventLoop(server.maxclients+1024);
e2641e09 1168 server.db = zmalloc(sizeof(redisDb)*server.dbnum);
68d6345d 1169
a53b4c24 1170 if (server.port != 0) {
68d6345d 1171 server.ipfd = anetTcpServer(server.neterr,server.port,server.bindaddr);
a53b4c24 1172 if (server.ipfd == ANET_ERR) {
eef17490 1173 redisLog(REDIS_WARNING, "Opening port %d: %s",
1174 server.port, server.neterr);
a53b4c24 1175 exit(1);
1176 }
a5639e7d 1177 }
5d10923f
PN
1178 if (server.unixsocket != NULL) {
1179 unlink(server.unixsocket); /* don't care if this fails */
85238765 1180 server.sofd = anetUnixServer(server.neterr,server.unixsocket,server.unixsocketperm);
a5639e7d
PN
1181 if (server.sofd == ANET_ERR) {
1182 redisLog(REDIS_WARNING, "Opening socket: %s", server.neterr);
1183 exit(1);
1184 }
c61e6925 1185 }
a5639e7d
PN
1186 if (server.ipfd < 0 && server.sofd < 0) {
1187 redisLog(REDIS_WARNING, "Configured to not listen anywhere, exiting.");
e2641e09 1188 exit(1);
1189 }
1190 for (j = 0; j < server.dbnum; j++) {
1191 server.db[j].dict = dictCreate(&dbDictType,NULL);
1192 server.db[j].expires = dictCreate(&keyptrDictType,NULL);
1193 server.db[j].blocking_keys = dictCreate(&keylistDictType,NULL);
1194 server.db[j].watched_keys = dictCreate(&keylistDictType,NULL);
e2641e09 1195 server.db[j].id = j;
1196 }
1197 server.pubsub_channels = dictCreate(&keylistDictType,NULL);
1198 server.pubsub_patterns = listCreate();
1199 listSetFreeMethod(server.pubsub_patterns,freePubsubPattern);
1200 listSetMatchMethod(server.pubsub_patterns,listMatchPubsubPattern);
1201 server.cronloops = 0;
f48cd4b9 1202 server.rdb_child_pid = -1;
ff2145ad 1203 server.aof_child_pid = -1;
1204 server.aof_rewrite_buf = sdsempty();
1205 server.aof_buf = sdsempty();
e2641e09 1206 server.lastsave = time(NULL);
1207 server.dirty = 0;
1208 server.stat_numcommands = 0;
1209 server.stat_numconnections = 0;
1210 server.stat_expiredkeys = 0;
f21779ff 1211 server.stat_evictedkeys = 0;
e2641e09 1212 server.stat_starttime = time(NULL);
53eeeaff 1213 server.stat_keyspace_misses = 0;
1214 server.stat_keyspace_hits = 0;
17b24ff3 1215 server.stat_peak_memory = 0;
615e414c 1216 server.stat_fork_time = 0;
3c95e721 1217 server.stat_rejected_conn = 0;
250e7f69 1218 memset(server.ops_sec_samples,0,sizeof(server.ops_sec_samples));
1219 server.ops_sec_idx = 0;
1220 server.ops_sec_last_sample_time = mstime();
1221 server.ops_sec_last_sample_ops = 0;
e2641e09 1222 server.unixtime = time(NULL);
c25e7eaf 1223 server.lastbgsave_status = REDIS_OK;
4d3bbf35 1224 server.stop_writes_on_bgsave_err = 1;
e2641e09 1225 aeCreateTimeEvent(server.el, 1, serverCron, NULL, NULL);
a5639e7d 1226 if (server.ipfd > 0 && aeCreateFileEvent(server.el,server.ipfd,AE_READABLE,
ab17b909 1227 acceptTcpHandler,NULL) == AE_ERR) oom("creating file event");
a5639e7d 1228 if (server.sofd > 0 && aeCreateFileEvent(server.el,server.sofd,AE_READABLE,
ab17b909 1229 acceptUnixHandler,NULL) == AE_ERR) oom("creating file event");
e2641e09 1230
e394114d 1231 if (server.aof_state == REDIS_AOF_ON) {
ff2145ad 1232 server.aof_fd = open(server.aof_filename,
e394114d 1233 O_WRONLY|O_APPEND|O_CREAT,0644);
ff2145ad 1234 if (server.aof_fd == -1) {
e2641e09 1235 redisLog(REDIS_WARNING, "Can't open the append-only file: %s",
1236 strerror(errno));
1237 exit(1);
1238 }
1239 }
1240
d876678b 1241 /* 32 bit instances are limited to 4GB of address space, so if there is
1242 * no explicit limit in the user provided configuration we set a limit
1243 * at 3.5GB using maxmemory with 'noeviction' policy'. This saves
1244 * useless crashes of the Redis instance. */
1245 if (server.arch_bits == 32 && server.maxmemory == 0) {
1246 redisLog(REDIS_WARNING,"Warning: 32 bit instance detected but no memory limit set. Setting 3.5 GB maxmemory limit with 'noeviction' policy now.");
1247 server.maxmemory = 3584LL*(1024*1024); /* 3584 MB = 3.5 GB */
1248 server.maxmemory_policy = REDIS_MAXMEMORY_NO_EVICTION;
1249 }
1250
7585836e 1251 scriptingInit();
daa70b17 1252 slowlogInit();
8f61a72f 1253 bioInit();
e2641e09 1254}
1255
1b1f47c9 1256/* Populates the Redis Command Table starting from the hard coded list
1257 * we have on top of redis.c file. */
1258void populateCommandTable(void) {
1259 int j;
d7ed7fd2 1260 int numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1b1f47c9 1261
1262 for (j = 0; j < numcommands; j++) {
d7ed7fd2 1263 struct redisCommand *c = redisCommandTable+j;
5d02b00f 1264 char *f = c->sflags;
1b1f47c9 1265 int retval;
e2641e09 1266
5d02b00f 1267 while(*f != '\0') {
1268 switch(*f) {
1269 case 'w': c->flags |= REDIS_CMD_WRITE; break;
1270 case 'r': c->flags |= REDIS_CMD_READONLY; break;
1271 case 'm': c->flags |= REDIS_CMD_DENYOOM; break;
1272 case 'a': c->flags |= REDIS_CMD_ADMIN; break;
1273 case 'p': c->flags |= REDIS_CMD_PUBSUB; break;
1274 case 'f': c->flags |= REDIS_CMD_FORCE_REPLICATION; break;
b60ed6e8 1275 case 's': c->flags |= REDIS_CMD_NOSCRIPT; break;
1276 case 'R': c->flags |= REDIS_CMD_RANDOM; break;
548efd91 1277 case 'S': c->flags |= REDIS_CMD_SORT_FOR_SCRIPT; break;
5d02b00f 1278 default: redisPanic("Unsupported command flag"); break;
1279 }
1280 f++;
1281 }
1282
1b1f47c9 1283 retval = dictAdd(server.commands, sdsnew(c->name), c);
1284 assert(retval == DICT_OK);
1285 }
e2641e09 1286}
1287
d7ed7fd2 1288void resetCommandTableStats(void) {
1289 int numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1290 int j;
1291
1292 for (j = 0; j < numcommands; j++) {
1293 struct redisCommand *c = redisCommandTable+j;
1294
1295 c->microseconds = 0;
1296 c->calls = 0;
1297 }
1298}
1299
78d6a22d 1300/* ========================== Redis OP Array API ============================ */
1301
1302void redisOpArrayInit(redisOpArray *oa) {
1303 oa->ops = NULL;
1304 oa->numops = 0;
1305}
1306
1307int redisOpArrayAppend(redisOpArray *oa, struct redisCommand *cmd, int dbid,
1308 robj **argv, int argc, int target)
1309{
1310 redisOp *op;
1311
1312 oa->ops = zrealloc(oa->ops,sizeof(redisOp)*(oa->numops+1));
1313 op = oa->ops+oa->numops;
1314 op->cmd = cmd;
1315 op->dbid = dbid;
1316 op->argv = argv;
1317 op->argc = argc;
1318 op->target = target;
1319 oa->numops++;
1320 return oa->numops;
1321}
1322
1323void redisOpArrayFree(redisOpArray *oa) {
1324 while(oa->numops) {
1325 int j;
1326 redisOp *op;
1327
1328 oa->numops--;
1329 op = oa->ops+oa->numops;
1330 for (j = 0; j < op->argc; j++)
1331 decrRefCount(op->argv[j]);
1332 zfree(op->argv);
1333 }
1334 zfree(oa->ops);
1335}
1336
e2641e09 1337/* ====================== Commands lookup and execution ===================== */
1338
1b1f47c9 1339struct redisCommand *lookupCommand(sds name) {
1340 return dictFetchValue(server.commands, name);
1341}
1342
1343struct redisCommand *lookupCommandByCString(char *s) {
1344 struct redisCommand *cmd;
1345 sds name = sdsnew(s);
1346
1347 cmd = dictFetchValue(server.commands, name);
1348 sdsfree(name);
1349 return cmd;
e2641e09 1350}
1351
ad08d059 1352/* Propagate the specified command (in the context of the specified database id)
1353 * to AOF, Slaves and Monitors.
1354 *
1355 * flags are an xor between:
1356 * + REDIS_PROPAGATE_NONE (no propagation of command at all)
1357 * + REDIS_PROPAGATE_AOF (propagate into the AOF file if is enabled)
1358 * + REDIS_PROPAGATE_REPL (propagate into the replication link)
1359 */
1360void propagate(struct redisCommand *cmd, int dbid, robj **argv, int argc,
1361 int flags)
1362{
1363 if (server.aof_state != REDIS_AOF_OFF && flags & REDIS_PROPAGATE_AOF)
1364 feedAppendOnlyFile(cmd,dbid,argv,argc);
1365 if (flags & REDIS_PROPAGATE_REPL && listLength(server.slaves))
1366 replicationFeedSlaves(server.slaves,dbid,argv,argc);
1367}
1368
78d6a22d 1369/* Used inside commands to schedule the propagation of additional commands
1370 * after the current command is propagated to AOF / Replication. */
eeb34eff 1371void alsoPropagate(struct redisCommand *cmd, int dbid, robj **argv, int argc,
1372 int target)
1373{
78d6a22d 1374 redisOpArrayAppend(&server.also_propagate,cmd,dbid,argv,argc,target);
eeb34eff 1375}
1376
e2641e09 1377/* Call() is the core of Redis execution of a command */
ce8b772b 1378void call(redisClient *c, int flags) {
daa70b17 1379 long long dirty, start = ustime(), duration;
e2641e09 1380
ad08d059 1381 /* Sent the command to clients in MONITOR mode, only if the commands are
1382 * not geneated from reading an AOF. */
1383 if (listLength(server.monitors) && !server.loading)
e31b615e 1384 replicationFeedMonitors(c,server.monitors,c->db->id,c->argv,c->argc);
ad08d059 1385
1386 /* Call the command. */
78d6a22d 1387 redisOpArrayInit(&server.also_propagate);
e2641e09 1388 dirty = server.dirty;
09e2d9ee 1389 c->cmd->proc(c);
e2641e09 1390 dirty = server.dirty-dirty;
daa70b17 1391 duration = ustime()-start;
ce8b772b 1392
1393 /* When EVAL is called loading the AOF we don't want commands called
1394 * from Lua to go into the slowlog or to populate statistics. */
1395 if (server.loading && c->flags & REDIS_LUA_CLIENT)
1396 flags &= ~(REDIS_CALL_SLOWLOG | REDIS_CALL_STATS);
1397
ad08d059 1398 /* Log the command into the Slow log if needed, and populate the
1399 * per-command statistics that we show in INFO commandstats. */
ce8b772b 1400 if (flags & REDIS_CALL_SLOWLOG)
1401 slowlogPushEntryIfNeeded(c->argv,c->argc,duration);
1402 if (flags & REDIS_CALL_STATS) {
1403 c->cmd->microseconds += duration;
1404 c->cmd->calls++;
1405 }
ad08d059 1406
1407 /* Propagate the command into the AOF and replication link */
ce8b772b 1408 if (flags & REDIS_CALL_PROPAGATE) {
ad08d059 1409 int flags = REDIS_PROPAGATE_NONE;
1410
1411 if (c->cmd->flags & REDIS_CMD_FORCE_REPLICATION)
1412 flags |= REDIS_PROPAGATE_REPL;
1413 if (dirty)
1414 flags |= (REDIS_PROPAGATE_REPL | REDIS_PROPAGATE_AOF);
1415 if (flags != REDIS_PROPAGATE_NONE)
1416 propagate(c->cmd,c->db->id,c->argv,c->argc,flags);
ce8b772b 1417 }
eeb34eff 1418 /* Commands such as LPUSH or BRPOPLPUSH may propagate an additional
1419 * PUSH command. */
78d6a22d 1420 if (server.also_propagate.numops) {
eeb34eff 1421 int j;
78d6a22d 1422 redisOp *rop;
eeb34eff 1423
78d6a22d 1424 for (j = 0; j < server.also_propagate.numops; j++) {
1425 rop = &server.also_propagate.ops[j];
1426 propagate(rop->cmd, rop->dbid, rop->argv, rop->argc, rop->target);
1427 }
1428 redisOpArrayFree(&server.also_propagate);
eeb34eff 1429 }
e2641e09 1430 server.stat_numcommands++;
1431}
1432
1433/* If this function gets called we already read a whole
1434 * command, argments are in the client argv/argc fields.
1435 * processCommand() execute the command or prepare the
1436 * server for a bulk read from the client.
1437 *
1438 * If 1 is returned the client is still alive and valid and
1439 * and other operations can be performed by the caller. Otherwise
1440 * if 0 is returned the client was destroied (i.e. after QUIT). */
1441int processCommand(redisClient *c) {
941c9fa2
PN
1442 /* The QUIT command is handled separately. Normal command procs will
1443 * go through checking for replication and QUIT will cause trouble
1444 * when FORCE_REPLICATION is enabled and would be implemented in
1445 * a regular command proc. */
e2641e09 1446 if (!strcasecmp(c->argv[0]->ptr,"quit")) {
941c9fa2 1447 addReply(c,shared.ok);
5e78edb3 1448 c->flags |= REDIS_CLOSE_AFTER_REPLY;
cd8788f2 1449 return REDIS_ERR;
e2641e09 1450 }
1451
1452 /* Now lookup the command and check ASAP about trivial error conditions
09e2d9ee 1453 * such as wrong arity, bad command name and so forth. */
2c74a9f9 1454 c->cmd = c->lastcmd = lookupCommand(c->argv[0]->ptr);
09e2d9ee 1455 if (!c->cmd) {
3ab20376
PN
1456 addReplyErrorFormat(c,"unknown command '%s'",
1457 (char*)c->argv[0]->ptr);
cd8788f2 1458 return REDIS_OK;
09e2d9ee 1459 } else if ((c->cmd->arity > 0 && c->cmd->arity != c->argc) ||
1460 (c->argc < -c->cmd->arity)) {
3ab20376 1461 addReplyErrorFormat(c,"wrong number of arguments for '%s' command",
09e2d9ee 1462 c->cmd->name);
cd8788f2 1463 return REDIS_OK;
e2641e09 1464 }
e2641e09 1465
1466 /* Check if the user is authenticated */
09e2d9ee 1467 if (server.requirepass && !c->authenticated && c->cmd->proc != authCommand)
1468 {
3ab20376 1469 addReplyError(c,"operation not permitted");
cd8788f2 1470 return REDIS_OK;
e2641e09 1471 }
1472
1dd10ca2 1473 /* Handle the maxmemory directive.
1474 *
1475 * First we try to free some memory if possible (if there are volatile
1476 * keys in the dataset). If there are not the only thing we can do
1477 * is returning an error. */
f6b32c14 1478 if (server.maxmemory) {
1479 int retval = freeMemoryIfNeeded();
1480 if ((c->cmd->flags & REDIS_CMD_DENYOOM) && retval == REDIS_ERR) {
05406168 1481 addReply(c, shared.oomerr);
f6b32c14 1482 return REDIS_OK;
1483 }
e2641e09 1484 }
1485
c25e7eaf 1486 /* Don't accept write commands if there are problems persisting on disk. */
4d3bbf35 1487 if (server.stop_writes_on_bgsave_err &&
1488 server.saveparamslen > 0
1489 && server.lastbgsave_status == REDIS_ERR &&
c25e7eaf 1490 c->cmd->flags & REDIS_CMD_WRITE)
1491 {
1492 addReply(c, shared.bgsaveerr);
1493 return REDIS_OK;
05406168 1494 }
1495
1496 /* Don't accept wirte commands if this is a read only slave. But
1497 * accept write commands if this is our master. */
1498 if (server.masterhost && server.repl_slave_ro &&
1499 !(c->flags & REDIS_MASTER) &&
1500 c->cmd->flags & REDIS_CMD_WRITE)
1501 {
1502 addReply(c, shared.roslaveerr);
1503 return REDIS_OK;
c25e7eaf 1504 }
1505
e2641e09 1506 /* Only allow SUBSCRIBE and UNSUBSCRIBE in the context of Pub/Sub */
1507 if ((dictSize(c->pubsub_channels) > 0 || listLength(c->pubsub_patterns) > 0)
1508 &&
09e2d9ee 1509 c->cmd->proc != subscribeCommand &&
1510 c->cmd->proc != unsubscribeCommand &&
1511 c->cmd->proc != psubscribeCommand &&
1512 c->cmd->proc != punsubscribeCommand) {
3ab20376 1513 addReplyError(c,"only (P)SUBSCRIBE / (P)UNSUBSCRIBE / QUIT allowed in this context");
cd8788f2 1514 return REDIS_OK;
e2641e09 1515 }
1516
4ebfc455 1517 /* Only allow INFO and SLAVEOF when slave-serve-stale-data is no and
1518 * we are a slave with a broken link with master. */
1844f990 1519 if (server.masterhost && server.repl_state != REDIS_REPL_CONNECTED &&
4ebfc455 1520 server.repl_serve_stale_data == 0 &&
09e2d9ee 1521 c->cmd->proc != infoCommand && c->cmd->proc != slaveofCommand)
4ebfc455 1522 {
1523 addReplyError(c,
1524 "link with MASTER is down and slave-serve-stale-data is set to no");
1525 return REDIS_OK;
1526 }
1527
97e7f8ae 1528 /* Loading DB? Return an error if the command is not INFO */
09e2d9ee 1529 if (server.loading && c->cmd->proc != infoCommand) {
97e7f8ae 1530 addReply(c, shared.loadingerr);
1531 return REDIS_OK;
1532 }
1533
4ab8695d 1534 /* Lua script too slow? Only allow SHUTDOWN NOSAVE and SCRIPT KILL. */
1535 if (server.lua_timedout &&
1536 !(c->cmd->proc != shutdownCommand &&
1537 c->argc == 2 &&
1538 tolower(((char*)c->argv[1]->ptr)[0]) == 'n') &&
1539 !(c->cmd->proc == scriptCommand &&
1540 c->argc == 2 &&
1541 tolower(((char*)c->argv[1]->ptr)[0]) == 'k'))
1542 {
115e3ff3 1543 addReply(c, shared.slowscripterr);
1544 return REDIS_OK;
1545 }
1546
e2641e09 1547 /* Exec the command */
1548 if (c->flags & REDIS_MULTI &&
09e2d9ee 1549 c->cmd->proc != execCommand && c->cmd->proc != discardCommand &&
1550 c->cmd->proc != multiCommand && c->cmd->proc != watchCommand)
e2641e09 1551 {
09e2d9ee 1552 queueMultiCommand(c);
e2641e09 1553 addReply(c,shared.queued);
1554 } else {
ce8b772b 1555 call(c,REDIS_CALL_FULL);
e2641e09 1556 }
cd8788f2 1557 return REDIS_OK;
e2641e09 1558}
1559
1560/*================================== Shutdown =============================== */
1561
4ab8695d 1562int prepareForShutdown(int flags) {
1563 int save = flags & REDIS_SHUTDOWN_SAVE;
1564 int nosave = flags & REDIS_SHUTDOWN_NOSAVE;
1565
adae85cd 1566 redisLog(REDIS_WARNING,"User requested shutdown...");
e2641e09 1567 /* Kill the saving child if there is a background saving in progress.
1568 We want to avoid race conditions, for instance our saving child may
1569 overwrite the synchronous saving did by SHUTDOWN. */
f48cd4b9 1570 if (server.rdb_child_pid != -1) {
adae85cd 1571 redisLog(REDIS_WARNING,"There is a child saving an .rdb. Killing it!");
f48cd4b9 1572 kill(server.rdb_child_pid,SIGKILL);
1573 rdbRemoveTempFile(server.rdb_child_pid);
e2641e09 1574 }
e394114d 1575 if (server.aof_state != REDIS_AOF_OFF) {
adae85cd 1576 /* Kill the AOF saving child as the AOF we already have may be longer
1577 * but contains the full dataset anyway. */
ff2145ad 1578 if (server.aof_child_pid != -1) {
adae85cd 1579 redisLog(REDIS_WARNING,
1580 "There is a child rewriting the AOF. Killing it!");
ff2145ad 1581 kill(server.aof_child_pid,SIGKILL);
adae85cd 1582 }
e2641e09 1583 /* Append only file: fsync() the AOF and exit */
adae85cd 1584 redisLog(REDIS_NOTICE,"Calling fsync() on the AOF file.");
ff2145ad 1585 aof_fsync(server.aof_fd);
adae85cd 1586 }
4ab8695d 1587 if ((server.saveparamslen > 0 && !nosave) || save) {
adae85cd 1588 redisLog(REDIS_NOTICE,"Saving the final RDB snapshot before exiting.");
e2641e09 1589 /* Snapshotting. Perform a SYNC SAVE and exit */
f48cd4b9 1590 if (rdbSave(server.rdb_filename) != REDIS_OK) {
e2641e09 1591 /* Ooops.. error saving! The best we can do is to continue
1592 * operating. Note that if there was a background saving process,
1593 * in the next cron() Redis will be notified that the background
1594 * saving aborted, handling special stuff like slaves pending for
1595 * synchronization... */
adae85cd 1596 redisLog(REDIS_WARNING,"Error trying to save the DB, can't exit.");
e2641e09 1597 return REDIS_ERR;
1598 }
1599 }
adae85cd 1600 if (server.daemonize) {
1601 redisLog(REDIS_NOTICE,"Removing the pid file.");
1602 unlink(server.pidfile);
1603 }
80e87a46 1604 /* Close the listening sockets. Apparently this allows faster restarts. */
1605 if (server.ipfd != -1) close(server.ipfd);
1606 if (server.sofd != -1) close(server.sofd);
56209f72
NF
1607 if (server.unixsocket) {
1608 redisLog(REDIS_NOTICE,"Removing the unix socket file.");
1609 unlink(server.unixsocket); /* don't care if this fails */
1610 }
80e87a46 1611
adae85cd 1612 redisLog(REDIS_WARNING,"Redis is now ready to exit, bye bye...");
e2641e09 1613 return REDIS_OK;
1614}
1615
1616/*================================== Commands =============================== */
1617
1618void authCommand(redisClient *c) {
ab52d1f4 1619 if (!server.requirepass) {
1620 addReplyError(c,"Client sent AUTH, but no password is set");
1621 } else if (!strcmp(c->argv[1]->ptr, server.requirepass)) {
e2641e09 1622 c->authenticated = 1;
1623 addReply(c,shared.ok);
1624 } else {
1625 c->authenticated = 0;
3ab20376 1626 addReplyError(c,"invalid password");
e2641e09 1627 }
1628}
1629
1630void pingCommand(redisClient *c) {
1631 addReply(c,shared.pong);
1632}
1633
1634void echoCommand(redisClient *c) {
1635 addReplyBulk(c,c->argv[1]);
1636}
1637
9494f1f1 1638void timeCommand(redisClient *c) {
1639 struct timeval tv;
1640
1641 /* gettimeofday() can only fail if &tv is a bad addresss so we
1642 * don't check for errors. */
1643 gettimeofday(&tv,NULL);
1644 addReplyMultiBulkLen(c,2);
1645 addReplyBulkLongLong(c,tv.tv_sec);
1646 addReplyBulkLongLong(c,tv.tv_usec);
1647}
1648
/* Convert an amount of bytes into a human readable string in the form
 * of 100B, 4.00K, 100.00M, 2.00G, and so forth.
 *
 * 's' is the destination buffer and is always written. The function has
 * no way to know its size, so the caller must provide room for the longest
 * possible output (a 20 digit number plus the unit and the terminator).
 * 'n' is the number of bytes to format.
 *
 * Values below 1024 are printed as an integer followed by "B". Larger
 * values are scaled by powers of 1024 and printed with two decimals and a
 * K, M, G, T or P suffix. Values too large for the biggest unit fall back
 * to the plain byte count, so the buffer is never left uninitialized. */
void bytesToHuman(char *s, unsigned long long n) {
    double d;

    if (n < 1024) {
        /* Bytes */
        sprintf(s,"%lluB",n);
    } else if (n < (1024ULL*1024)) {
        d = (double)n/(1024);
        sprintf(s,"%.2fK",d);
    } else if (n < (1024ULL*1024*1024)) {
        d = (double)n/(1024*1024);
        sprintf(s,"%.2fM",d);
    } else if (n < (1024ULL*1024*1024*1024)) {
        d = (double)n/(1024ULL*1024*1024);
        sprintf(s,"%.2fG",d);
    } else if (n < (1024ULL*1024*1024*1024*1024)) {
        d = (double)n/(1024ULL*1024*1024*1024);
        sprintf(s,"%.2fT",d);
    } else if (n < (1024ULL*1024*1024*1024*1024*1024)) {
        d = (double)n/(1024ULL*1024*1024*1024*1024);
        sprintf(s,"%.2fP",d);
    } else {
        /* Bigger than every unit we know: report the raw byte count. */
        sprintf(s,"%lluB",n);
    }
}
1669
1670/* Create the string returned by the INFO command. This is decoupled
1671 * by the INFO command itself as we need to report the same information
1672 * on memory corruption problems. */
1b085c9f 1673sds genRedisInfoString(char *section) {
1674 sds info = sdsempty();
56ff70f8 1675 time_t uptime = server.unixtime-server.stat_starttime;
d9cb288c 1676 int j, numcommands;
2b00385d 1677 struct rusage self_ru, c_ru;
7a1fd61e 1678 unsigned long lol, bib;
1b085c9f 1679 int allsections = 0, defsections = 0;
1680 int sections = 0;
1681
1682 if (section) {
1683 allsections = strcasecmp(section,"all") == 0;
0d808ef2 1684 defsections = strcasecmp(section,"default") == 0;
1b085c9f 1685 }
2b00385d 1686
1687 getrusage(RUSAGE_SELF, &self_ru);
1688 getrusage(RUSAGE_CHILDREN, &c_ru);
7a1fd61e 1689 getClientsMaxBuffers(&lol,&bib);
1b085c9f 1690
1691 /* Server */
1692 if (allsections || defsections || !strcasecmp(section,"server")) {
1693 if (sections++) info = sdscat(info,"\r\n");
e2641e09 1694 info = sdscatprintf(info,
1b085c9f 1695 "# Server\r\n"
1696 "redis_version:%s\r\n"
1697 "redis_git_sha1:%s\r\n"
1698 "redis_git_dirty:%d\r\n"
75eaac5c 1699 "arch_bits:%d\r\n"
1b085c9f 1700 "multiplexing_api:%s\r\n"
5db904bd 1701 "gcc_version:%d.%d.%d\r\n"
1b085c9f 1702 "process_id:%ld\r\n"
91d664d6 1703 "run_id:%s\r\n"
1b085c9f 1704 "tcp_port:%d\r\n"
1705 "uptime_in_seconds:%ld\r\n"
1706 "uptime_in_days:%ld\r\n"
1707 "lru_clock:%ld\r\n",
1708 REDIS_VERSION,
1709 redisGitSHA1(),
1710 strtol(redisGitDirty(),NULL,10) > 0,
75eaac5c 1711 server.arch_bits,
1b085c9f 1712 aeGetApiName(),
5db904bd 1713#ifdef __GNUC__
1714 __GNUC__,__GNUC_MINOR__,__GNUC_PATCHLEVEL__,
1715#else
1716 0,0,0,
1717#endif
1b085c9f 1718 (long) getpid(),
91d664d6 1719 server.runid,
1b085c9f 1720 server.port,
1721 uptime,
1722 uptime/(3600*24),
1723 (unsigned long) server.lruclock);
1724 }
1725
1726 /* Clients */
1727 if (allsections || defsections || !strcasecmp(section,"clients")) {
1728 if (sections++) info = sdscat(info,"\r\n");
1729 info = sdscatprintf(info,
1730 "# Clients\r\n"
3c08fdae 1731 "connected_clients:%lu\r\n"
1b085c9f 1732 "client_longest_output_list:%lu\r\n"
1733 "client_biggest_input_buf:%lu\r\n"
1734 "blocked_clients:%d\r\n",
1735 listLength(server.clients)-listLength(server.slaves),
1736 lol, bib,
1737 server.bpop_blocked_clients);
1738 }
1739
1740 /* Memory */
1741 if (allsections || defsections || !strcasecmp(section,"memory")) {
17b24ff3 1742 char hmem[64];
1743 char peak_hmem[64];
1744
1745 bytesToHuman(hmem,zmalloc_used_memory());
1746 bytesToHuman(peak_hmem,server.stat_peak_memory);
1b085c9f 1747 if (sections++) info = sdscat(info,"\r\n");
1748 info = sdscatprintf(info,
1749 "# Memory\r\n"
1750 "used_memory:%zu\r\n"
1751 "used_memory_human:%s\r\n"
1752 "used_memory_rss:%zu\r\n"
17b24ff3 1753 "used_memory_peak:%zu\r\n"
1754 "used_memory_peak_human:%s\r\n"
8c3402df 1755 "used_memory_lua:%lld\r\n"
1b085c9f 1756 "mem_fragmentation_ratio:%.2f\r\n"
32f99c51 1757 "mem_allocator:%s\r\n",
1b085c9f 1758 zmalloc_used_memory(),
1759 hmem,
1760 zmalloc_get_rss(),
17b24ff3 1761 server.stat_peak_memory,
1762 peak_hmem,
8c3402df 1763 ((long long)lua_gc(server.lua,LUA_GCCOUNT,0))*1024LL,
1b085c9f 1764 zmalloc_get_fragmentation_ratio(),
fec5a664 1765 ZMALLOC_LIB
12ebe2ac 1766 );
0d808ef2 1767 }
1768
1b085c9f 1769 /* Persistence */
1770 if (allsections || defsections || !strcasecmp(section,"persistence")) {
1771 if (sections++) info = sdscat(info,"\r\n");
e2641e09 1772 info = sdscatprintf(info,
1b085c9f 1773 "# Persistence\r\n"
1774 "loading:%d\r\n"
1775 "aof_enabled:%d\r\n"
1776 "changes_since_last_save:%lld\r\n"
1777 "bgsave_in_progress:%d\r\n"
1778 "last_save_time:%ld\r\n"
c25e7eaf 1779 "last_bgsave_status:%s\r\n"
1b085c9f 1780 "bgrewriteaof_in_progress:%d\r\n",
1781 server.loading,
e394114d 1782 server.aof_state != REDIS_AOF_OFF,
1b085c9f 1783 server.dirty,
f48cd4b9 1784 server.rdb_child_pid != -1,
1b085c9f 1785 server.lastsave,
c25e7eaf 1786 server.lastbgsave_status == REDIS_OK ? "ok" : "err",
ff2145ad 1787 server.aof_child_pid != -1);
1b085c9f 1788
e394114d 1789 if (server.aof_state != REDIS_AOF_OFF) {
d630abcd 1790 info = sdscatprintf(info,
1791 "aof_current_size:%lld\r\n"
1792 "aof_base_size:%lld\r\n"
e7ef418c 1793 "aof_pending_rewrite:%d\r\n"
1794 "aof_buffer_length:%zu\r\n"
81f32c7b 1795 "aof_pending_bio_fsync:%llu\r\n"
1796 "aof_delayed_fsync:%lu\r\n",
2c915bcf 1797 (long long) server.aof_current_size,
1798 (long long) server.aof_rewrite_base_size,
1799 server.aof_rewrite_scheduled,
ff2145ad 1800 sdslen(server.aof_buf),
81f32c7b 1801 bioPendingJobsOfType(REDIS_BIO_AOF_FSYNC),
1802 server.aof_delayed_fsync);
d630abcd 1803 }
1804
1b085c9f 1805 if (server.loading) {
1806 double perc;
1807 time_t eta, elapsed;
1808 off_t remaining_bytes = server.loading_total_bytes-
1809 server.loading_loaded_bytes;
1810
1811 perc = ((double)server.loading_loaded_bytes /
1812 server.loading_total_bytes) * 100;
1813
56ff70f8 1814 elapsed = server.unixtime-server.loading_start_time;
1b085c9f 1815 if (elapsed == 0) {
1816 eta = 1; /* A fake 1 second figure if we don't have
1817 enough info */
1818 } else {
1819 eta = (elapsed*remaining_bytes)/server.loading_loaded_bytes;
1820 }
1821
1822 info = sdscatprintf(info,
1823 "loading_start_time:%ld\r\n"
1824 "loading_total_bytes:%llu\r\n"
1825 "loading_loaded_bytes:%llu\r\n"
1826 "loading_loaded_perc:%.2f\r\n"
1827 "loading_eta_seconds:%ld\r\n"
1828 ,(unsigned long) server.loading_start_time,
1829 (unsigned long long) server.loading_total_bytes,
1830 (unsigned long long) server.loading_loaded_bytes,
1831 perc,
1832 eta
1833 );
1834 }
e2641e09 1835 }
1b085c9f 1836
1b085c9f 1837 /* Stats */
1838 if (allsections || defsections || !strcasecmp(section,"stats")) {
1839 if (sections++) info = sdscat(info,"\r\n");
97e7f8ae 1840 info = sdscatprintf(info,
1b085c9f 1841 "# Stats\r\n"
1842 "total_connections_received:%lld\r\n"
1843 "total_commands_processed:%lld\r\n"
250e7f69 1844 "instantaneous_ops_per_sec:%lld\r\n"
3c95e721 1845 "rejected_connections:%lld\r\n"
1b085c9f 1846 "expired_keys:%lld\r\n"
1847 "evicted_keys:%lld\r\n"
1848 "keyspace_hits:%lld\r\n"
1849 "keyspace_misses:%lld\r\n"
1850 "pubsub_channels:%ld\r\n"
3c08fdae 1851 "pubsub_patterns:%lu\r\n"
615e414c 1852 "latest_fork_usec:%lld\r\n",
1b085c9f 1853 server.stat_numconnections,
1854 server.stat_numcommands,
250e7f69 1855 getOperationsPerSecond(),
3c95e721 1856 server.stat_rejected_conn,
1b085c9f 1857 server.stat_expiredkeys,
1858 server.stat_evictedkeys,
1859 server.stat_keyspace_hits,
1860 server.stat_keyspace_misses,
1861 dictSize(server.pubsub_channels),
615e414c 1862 listLength(server.pubsub_patterns),
1863 server.stat_fork_time);
97e7f8ae 1864 }
67a1810b 1865
1b085c9f 1866 /* Replication */
1867 if (allsections || defsections || !strcasecmp(section,"replication")) {
1868 if (sections++) info = sdscat(info,"\r\n");
1869 info = sdscatprintf(info,
1870 "# Replication\r\n"
1871 "role:%s\r\n",
1872 server.masterhost == NULL ? "master" : "slave");
1873 if (server.masterhost) {
1874 info = sdscatprintf(info,
1875 "master_host:%s\r\n"
1876 "master_port:%d\r\n"
1877 "master_link_status:%s\r\n"
1878 "master_last_io_seconds_ago:%d\r\n"
1879 "master_sync_in_progress:%d\r\n"
1880 ,server.masterhost,
1881 server.masterport,
1844f990 1882 (server.repl_state == REDIS_REPL_CONNECTED) ?
1b085c9f 1883 "up" : "down",
1884 server.master ?
56ff70f8 1885 ((int)(server.unixtime-server.master->lastinteraction)) : -1,
1844f990 1886 server.repl_state == REDIS_REPL_TRANSFER
1b085c9f 1887 );
1888
1844f990 1889 if (server.repl_state == REDIS_REPL_TRANSFER) {
1b085c9f 1890 info = sdscatprintf(info,
1891 "master_sync_left_bytes:%ld\r\n"
1892 "master_sync_last_io_seconds_ago:%d\r\n"
1893 ,(long)server.repl_transfer_left,
56ff70f8 1894 (int)(server.unixtime-server.repl_transfer_lastio)
1b085c9f 1895 );
1896 }
07486df6 1897
1844f990 1898 if (server.repl_state != REDIS_REPL_CONNECTED) {
07486df6 1899 info = sdscatprintf(info,
1900 "master_link_down_since_seconds:%ld\r\n",
56ff70f8 1901 (long)server.unixtime-server.repl_down_since);
07486df6 1902 }
67a1810b 1903 }
1b085c9f 1904 info = sdscatprintf(info,
3c08fdae 1905 "connected_slaves:%lu\r\n",
1b085c9f 1906 listLength(server.slaves));
503d87a8 1907 if (listLength(server.slaves)) {
1908 int slaveid = 0;
1909 listNode *ln;
1910 listIter li;
1911
1912 listRewind(server.slaves,&li);
1913 while((ln = listNext(&li))) {
1914 redisClient *slave = listNodeValue(ln);
1915 char *state = NULL;
1916 char ip[32];
1917 int port;
1918
1919 if (anetPeerToString(slave->fd,ip,&port) == -1) continue;
1920 switch(slave->replstate) {
1921 case REDIS_REPL_WAIT_BGSAVE_START:
1922 case REDIS_REPL_WAIT_BGSAVE_END:
1923 state = "wait_bgsave";
1924 break;
1925 case REDIS_REPL_SEND_BULK:
1926 state = "send_bulk";
1927 break;
1928 case REDIS_REPL_ONLINE:
1929 state = "online";
1930 break;
1931 }
1932 if (state == NULL) continue;
1933 info = sdscatprintf(info,"slave%d:%s,%d,%s\r\n",
1934 slaveid,ip,port,state);
1935 slaveid++;
1936 }
1937 }
67a1810b 1938 }
67a1810b 1939
0d808ef2 1940 /* CPU */
1941 if (allsections || defsections || !strcasecmp(section,"cpu")) {
1b085c9f 1942 if (sections++) info = sdscat(info,"\r\n");
1943 info = sdscatprintf(info,
0d808ef2 1944 "# CPU\r\n"
1b085c9f 1945 "used_cpu_sys:%.2f\r\n"
1946 "used_cpu_user:%.2f\r\n"
5a9dd97c 1947 "used_cpu_sys_children:%.2f\r\n"
1948 "used_cpu_user_children:%.2f\r\n",
1b085c9f 1949 (float)self_ru.ru_stime.tv_sec+(float)self_ru.ru_stime.tv_usec/1000000,
d83eda48 1950 (float)self_ru.ru_utime.tv_sec+(float)self_ru.ru_utime.tv_usec/1000000,
1951 (float)c_ru.ru_stime.tv_sec+(float)c_ru.ru_stime.tv_usec/1000000,
1952 (float)c_ru.ru_utime.tv_sec+(float)c_ru.ru_utime.tv_usec/1000000);
0d808ef2 1953 }
1b085c9f 1954
0d808ef2 1955 /* cmdtime */
1956 if (allsections || !strcasecmp(section,"commandstats")) {
1957 if (sections++) info = sdscat(info,"\r\n");
1958 info = sdscatprintf(info, "# Commandstats\r\n");
d7ed7fd2 1959 numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1b085c9f 1960 for (j = 0; j < numcommands; j++) {
d7ed7fd2 1961 struct redisCommand *c = redisCommandTable+j;
0d808ef2 1962
d7ed7fd2 1963 if (!c->calls) continue;
1964 info = sdscatprintf(info,
1965 "cmdstat_%s:calls=%lld,usec=%lld,usec_per_call=%.2f\r\n",
1966 c->name, c->calls, c->microseconds,
1967 (c->calls == 0) ? 0 : ((float)c->microseconds/c->calls));
1b085c9f 1968 }
d9cb288c 1969 }
1970
1b085c9f 1971 /* Key space */
1972 if (allsections || defsections || !strcasecmp(section,"keyspace")) {
1973 if (sections++) info = sdscat(info,"\r\n");
1974 info = sdscatprintf(info, "# Keyspace\r\n");
1975 for (j = 0; j < server.dbnum; j++) {
1976 long long keys, vkeys;
e2641e09 1977
1b085c9f 1978 keys = dictSize(server.db[j].dict);
1979 vkeys = dictSize(server.db[j].expires);
1980 if (keys || vkeys) {
1981 info = sdscatprintf(info, "db%d:keys=%lld,expires=%lld\r\n",
1982 j, keys, vkeys);
1983 }
e2641e09 1984 }
1985 }
1986 return info;
1987}
1988
1989void infoCommand(redisClient *c) {
1b085c9f 1990 char *section = c->argc == 2 ? c->argv[1]->ptr : "default";
1991
1992 if (c->argc > 2) {
1993 addReply(c,shared.syntaxerr);
1994 return;
1995 }
1996 sds info = genRedisInfoString(section);
e2641e09 1997 addReplySds(c,sdscatprintf(sdsempty(),"$%lu\r\n",
1998 (unsigned long)sdslen(info)));
1999 addReplySds(c,info);
2000 addReply(c,shared.crlf);
2001}
2002
2003void monitorCommand(redisClient *c) {
2004 /* ignore MONITOR if aleady slave or in monitor mode */
2005 if (c->flags & REDIS_SLAVE) return;
2006
2007 c->flags |= (REDIS_SLAVE|REDIS_MONITOR);
2008 c->slaveseldb = 0;
2009 listAddNodeTail(server.monitors,c);
2010 addReply(c,shared.ok);
2011}
2012
2013/* ============================ Maxmemory directive ======================== */
2014
e2641e09 2015/* This function gets called when 'maxmemory' is set on the config file to limit
f6b32c14 2016 * the max memory used by the server, before processing a command.
e2641e09 2017 *
f6b32c14 2018 * The goal of the function is to free enough memory to keep Redis under the
2019 * configured memory limit.
e2641e09 2020 *
f6b32c14 2021 * The function starts calculating how many bytes should be freed to keep
2022 * Redis under the limit, and enters a loop selecting the best keys to
2023 * evict accordingly to the configured policy.
2024 *
2025 * If all the bytes needed to return back under the limit were freed the
2026 * function returns REDIS_OK, otherwise REDIS_ERR is returned, and the caller
2027 * should block the execution of commands that will result in more memory
2028 * used by the server.
e2641e09 2029 */
f6b32c14 2030int freeMemoryIfNeeded(void) {
2031 size_t mem_used, mem_tofree, mem_freed;
2032 int slaves = listLength(server.slaves);
2033
c1ef6ffe 2034 /* Remove the size of slaves output buffers and AOF buffer from the
2035 * count of used memory. */
f6b32c14 2036 mem_used = zmalloc_used_memory();
2037 if (slaves) {
2038 listIter li;
2039 listNode *ln;
2040
2041 listRewind(server.slaves,&li);
2042 while((ln = listNext(&li))) {
2043 redisClient *slave = listNodeValue(ln);
2044 unsigned long obuf_bytes = getClientOutputBufferMemoryUsage(slave);
2045 if (obuf_bytes > mem_used)
2046 mem_used = 0;
2047 else
2048 mem_used -= obuf_bytes;
2049 }
2050 }
c1ef6ffe 2051 if (server.aof_state != REDIS_AOF_OFF) {
2052 mem_used -= sdslen(server.aof_buf);
2053 mem_used -= sdslen(server.aof_rewrite_buf);
2054 }
5402c426 2055
f6b32c14 2056 /* Check if we are over the memory limit. */
2057 if (mem_used <= server.maxmemory) return REDIS_OK;
2058
2059 if (server.maxmemory_policy == REDIS_MAXMEMORY_NO_EVICTION)
2060 return REDIS_ERR; /* We need to free memory, but policy forbids. */
2061
2062 /* Compute how much memory we need to free. */
2063 mem_tofree = mem_used - server.maxmemory;
f6b32c14 2064 mem_freed = 0;
2065 while (mem_freed < mem_tofree) {
2066 int j, k, keys_freed = 0;
e2641e09 2067
165346ca 2068 for (j = 0; j < server.dbnum; j++) {
10c12171 2069 long bestval = 0; /* just to prevent warning */
165346ca 2070 sds bestkey = NULL;
2071 struct dictEntry *de;
2072 redisDb *db = server.db+j;
2073 dict *dict;
2074
2075 if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_LRU ||
2076 server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_RANDOM)
2077 {
2078 dict = server.db[j].dict;
2079 } else {
2080 dict = server.db[j].expires;
2081 }
2082 if (dictSize(dict) == 0) continue;
2083
2084 /* volatile-random and allkeys-random policy */
2085 if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_RANDOM ||
2086 server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_RANDOM)
2087 {
2088 de = dictGetRandomKey(dict);
c0ba9ebe 2089 bestkey = dictGetKey(de);
165346ca 2090 }
2091
2092 /* volatile-lru and allkeys-lru policy */
2093 else if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_LRU ||
2094 server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_LRU)
2095 {
2096 for (k = 0; k < server.maxmemory_samples; k++) {
2097 sds thiskey;
2098 long thisval;
2099 robj *o;
2100
2101 de = dictGetRandomKey(dict);
c0ba9ebe 2102 thiskey = dictGetKey(de);
0c2f75c6 2103 /* When policy is volatile-lru we need an additonal lookup
2104 * to locate the real key, as dict is set to db->expires. */
2105 if (server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_LRU)
2106 de = dictFind(db->dict, thiskey);
c0ba9ebe 2107 o = dictGetVal(de);
165346ca 2108 thisval = estimateObjectIdleTime(o);
2109
2110 /* Higher idle time is better candidate for deletion */
2111 if (bestkey == NULL || thisval > bestval) {
2112 bestkey = thiskey;
2113 bestval = thisval;
2114 }
2115 }
2116 }
2117
2118 /* volatile-ttl */
2119 else if (server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_TTL) {
2120 for (k = 0; k < server.maxmemory_samples; k++) {
2121 sds thiskey;
2122 long thisval;
2123
2124 de = dictGetRandomKey(dict);
c0ba9ebe 2125 thiskey = dictGetKey(de);
2126 thisval = (long) dictGetVal(de);
165346ca 2127
2128 /* Expire sooner (minor expire unix timestamp) is better
2129 * candidate for deletion */
2130 if (bestkey == NULL || thisval < bestval) {
2131 bestkey = thiskey;
2132 bestval = thisval;
2133 }
2134 }
2135 }
2136
2137 /* Finally remove the selected key. */
2138 if (bestkey) {
f6b32c14 2139 long long delta;
2140
165346ca 2141 robj *keyobj = createStringObject(bestkey,sdslen(bestkey));
452229b6 2142 propagateExpire(db,keyobj);
f6b32c14 2143 /* We compute the amount of memory freed by dbDelete() alone.
2144 * It is possible that actually the memory needed to propagate
2145 * the DEL in AOF and replication link is greater than the one
2146 * we are freeing removing the key, but we can't account for
2147 * that otherwise we would never exit the loop.
2148 *
2149 * AOF and Output buffer memory will be freed eventually so
2150 * we only care about memory used by the key space. */
2151 delta = (long long) zmalloc_used_memory();
165346ca 2152 dbDelete(db,keyobj);
f6b32c14 2153 delta -= (long long) zmalloc_used_memory();
f6b32c14 2154 mem_freed += delta;
f21779ff 2155 server.stat_evictedkeys++;
165346ca 2156 decrRefCount(keyobj);
f6b32c14 2157 keys_freed++;
2158
2159 /* When the memory to free starts to be big enough, we may
2160 * start spending so much time here that is impossible to
2161 * deliver data to the slaves fast enough, so we force the
2162 * transmission here inside the loop. */
8b7c3455 2163 if (slaves) flushSlavesOutputBuffers();
165346ca 2164 }
2165 }
b129c6df 2166 if (!keys_freed) return REDIS_ERR; /* nothing to free... */
165346ca 2167 }
f6b32c14 2168 return REDIS_OK;
e2641e09 2169}
2170
2171/* =================================== Main! ================================ */
2172
2173#ifdef __linux__
/* Read /proc/sys/vm/overcommit_memory and return its content converted
 * with atoi(). Returns -1 if the file can't be opened or read. */
int linuxOvercommitMemoryValue(void) {
    char line[64];
    char *got;
    FILE *procfile = fopen("/proc/sys/vm/overcommit_memory","r");

    if (procfile == NULL) return -1;

    got = fgets(line,64,procfile);
    fclose(procfile);

    return (got != NULL) ? atoi(line) : -1;
}
2187
2188void linuxOvercommitMemoryWarning(void) {
2189 if (linuxOvercommitMemoryValue() == 0) {
2190 redisLog(REDIS_WARNING,"WARNING overcommit_memory is set to 0! Background save may fail under low memory condition. To fix this issue add 'vm.overcommit_memory = 1' to /etc/sysctl.conf and then reboot or run the command 'sysctl vm.overcommit_memory=1' for this to take effect.");
2191 }
2192}
2193#endif /* __linux__ */
2194
695fe874 2195void createPidFile(void) {
2196 /* Try to write the pid file in a best-effort way. */
2197 FILE *fp = fopen(server.pidfile,"w");
2198 if (fp) {
8ce39260 2199 fprintf(fp,"%d\n",(int)getpid());
695fe874 2200 fclose(fp);
2201 }
2202}
2203
/* Detach from the caller: fork, let the parent exit, start a new session
 * in the child and point the standard descriptors to /dev/null. */
void daemonize(void) {
    int devnull;

    if (fork() != 0) exit(0); /* parent exits */
    setsid(); /* create a new session */

    /* Every output goes to /dev/null. If Redis is daemonized but
     * the 'logfile' is set to 'stdout' in the configuration file
     * it will not log at all. */
    devnull = open("/dev/null", O_RDWR, 0);
    if (devnull == -1) return;

    dup2(devnull, STDIN_FILENO);
    dup2(devnull, STDOUT_FILENO);
    dup2(devnull, STDERR_FILENO);
    /* Don't close the descriptor if it is one of the standard three. */
    if (devnull > STDERR_FILENO) close(devnull);
}
2220
2221void version() {
188a17ed 2222 printf("Redis server v=%s sha=%s:%d malloc=%s\n", REDIS_VERSION,
2223 redisGitSHA1(), atoi(redisGitDirty()) > 0, ZMALLOC_LIB);
e2641e09 2224 exit(0);
2225}
2226
/* Print the command line help on stderr, then terminate the process
 * with exit code 1. */
void usage() {
    static const char *help_lines[] = {
        "Usage: ./redis-server [/path/to/redis.conf] [options]\n",
        " ./redis-server - (read config from stdin)\n",
        " ./redis-server -v or --version\n",
        " ./redis-server -h or --help\n",
        " ./redis-server --test-memory <megabytes>\n\n",
        "Examples:\n",
        " ./redis-server (run the server with default conf)\n",
        " ./redis-server /etc/redis/6379.conf\n",
        " ./redis-server --port 7777\n",
        " ./redis-server --port 7777 --slaveof 127.0.0.1 8888\n",
        " ./redis-server /etc/myredis.conf --loglevel verbose\n",
        NULL
    };
    const char **line;

    /* None of the lines contains a conversion specifier, so writing them
     * verbatim produces the same output as formatting them. */
    for (line = help_lines; *line != NULL; line++)
        fputs(*line,stderr);
    exit(1);
}
2241
996d503d 2242void redisAsciiArt(void) {
2243#include "asciilogo.h"
2244 char *buf = zmalloc(1024*16);
2245
2246 snprintf(buf,1024*16,ascii_logo,
2247 REDIS_VERSION,
2248 redisGitSHA1(),
2249 strtol(redisGitDirty(),NULL,10) > 0,
2250 (sizeof(long) == 8) ? "64" : "32",
571e257d 2251 "stand alone",
996d503d 2252 server.port,
2253 (long) getpid()
2254 );
2255 redisLogRaw(REDIS_NOTICE|REDIS_LOG_RAW,buf);
2256 zfree(buf);
2257}
2258
633a9410 2259static void sigtermHandler(int sig) {
e2641e09 2260 REDIS_NOTUSED(sig);
2261
be4f8ccc 2262 redisLogFromHandler(REDIS_WARNING,"Received SIGTERM, scheduling shutdown...");
e2641e09 2263 server.shutdown_asap = 1;
2264}
2265
633a9410 2266void setupSignalHandlers(void) {
e2641e09 2267 struct sigaction act;
2268
633a9410
PN
2269 /* When the SA_SIGINFO flag is set in sa_flags then sa_sigaction is used.
2270 * Otherwise, sa_handler is used. */
2271 sigemptyset(&act.sa_mask);
e2641e09 2272 act.sa_flags = SA_NODEFER | SA_ONSTACK | SA_RESETHAND;
2273 act.sa_handler = sigtermHandler;
633a9410 2274 sigaction(SIGTERM, &act, NULL);
e2641e09 2275
633a9410
PN
2276#ifdef HAVE_BACKTRACE
2277 sigemptyset(&act.sa_mask);
2278 act.sa_flags = SA_NODEFER | SA_ONSTACK | SA_RESETHAND | SA_SIGINFO;
2279 act.sa_sigaction = sigsegvHandler;
2280 sigaction(SIGSEGV, &act, NULL);
2281 sigaction(SIGBUS, &act, NULL);
2282 sigaction(SIGFPE, &act, NULL);
2283 sigaction(SIGILL, &act, NULL);
2284#endif
2285 return;
e2641e09 2286}
e2641e09 2287
78d6a02b 2288void memtest(size_t megabytes, int passes);
2289
39ca1713 2290int main(int argc, char **argv) {
2291 long long start;
a48c8d87 2292 struct timeval tv;
39ca1713 2293
06c5523a 2294 /* We need to initialize our libraries, and the server configuration. */
39ca1713 2295 zmalloc_enable_thread_safeness();
a48c8d87 2296 srand(time(NULL)^getpid());
2297 gettimeofday(&tv,NULL);
2298 dictSetHashFunctionSeed(tv.tv_sec^tv.tv_usec^getpid());
39ca1713 2299 initServerConfig();
a48c8d87 2300
67c6f0f6 2301 if (argc >= 2) {
2302 int j = 1; /* First option to parse in argv[] */
2303 sds options = sdsempty();
2304 char *configfile = NULL;
2305
2306 /* Handle special options --help and --version */
39ca1713 2307 if (strcmp(argv[1], "-v") == 0 ||
2308 strcmp(argv[1], "--version") == 0) version();
4c8bd905 2309 if (strcmp(argv[1], "--help") == 0 ||
2310 strcmp(argv[1], "-h") == 0) usage();
78d6a02b 2311 if (strcmp(argv[1], "--test-memory") == 0) {
2312 if (argc == 3) {
ea693f02 2313 memtest(atoi(argv[2]),50);
78d6a02b 2314 exit(0);
2315 } else {
2316 fprintf(stderr,"Please specify the amount of memory to test in megabytes.\n");
2317 fprintf(stderr,"Example: ./redis-server --test-memory 4096\n\n");
2318 exit(1);
2319 }
2320 }
2321
67c6f0f6 2322 /* First argument is the config file name? */
2323 if (argv[j][0] != '-' || argv[j][1] != '-')
2324 configfile = argv[j++];
2325 /* All the other options are parsed and conceptually appended to the
2326 * configuration file. For instance --port 6380 will generate the
2327 * string "port 6380\n" to be parsed after the actual file name
2328 * is parsed, if any. */
2329 while(j != argc) {
2330 if (argv[j][0] == '-' && argv[j][1] == '-') {
2331 /* Option name */
2332 if (sdslen(options)) options = sdscat(options,"\n");
2333 options = sdscat(options,argv[j]+2);
2334 options = sdscat(options," ");
2335 } else {
2336 /* Option argument */
2337 options = sdscatrepr(options,argv[j],strlen(argv[j]));
2338 options = sdscat(options," ");
2339 }
2340 j++;
2341 }
39ca1713 2342 resetServerSaveParams();
67c6f0f6 2343 loadServerConfig(configfile,options);
2344 sdsfree(options);
39ca1713 2345 } else {
2346 redisLog(REDIS_WARNING,"Warning: no config file specified, using the default config. In order to specify a config file use 'redis-server /path/to/redis.conf'");
2347 }
2348 if (server.daemonize) daemonize();
2349 initServer();
2350 if (server.daemonize) createPidFile();
2351 redisAsciiArt();
27ccb94a 2352 redisLog(REDIS_WARNING,"Server started, Redis version " REDIS_VERSION);
39ca1713 2353#ifdef __linux__
2354 linuxOvercommitMemoryWarning();
2355#endif
2356 start = ustime();
e394114d 2357 if (server.aof_state == REDIS_AOF_ON) {
2c915bcf 2358 if (loadAppendOnlyFile(server.aof_filename) == REDIS_OK)
39ca1713 2359 redisLog(REDIS_NOTICE,"DB loaded from append only file: %.3f seconds",(float)(ustime()-start)/1000000);
2360 } else {
f48cd4b9 2361 if (rdbLoad(server.rdb_filename) == REDIS_OK) {
39ca1713 2362 redisLog(REDIS_NOTICE,"DB loaded from disk: %.3f seconds",
2363 (float)(ustime()-start)/1000000);
2364 } else if (errno != ENOENT) {
2365 redisLog(REDIS_WARNING,"Fatal error loading the DB. Exiting.");
2366 exit(1);
2367 }
2368 }
2369 if (server.ipfd > 0)
2370 redisLog(REDIS_NOTICE,"The server is now ready to accept connections on port %d", server.port);
2371 if (server.sofd > 0)
2372 redisLog(REDIS_NOTICE,"The server is now ready to accept connections at %s", server.unixsocket);
2373 aeSetBeforeSleepProc(server.el,beforeSleep);
2374 aeMain(server.el);
2375 aeDeleteEventLoop(server.el);
2376 return 0;
2377}
2378
e2641e09 2379/* The End */