]> git.saurik.com Git - redis.git/blame - src/redis.c
allocate alternate signal stack, change of sigaction flags for sigterm
[redis.git] / src / redis.c
CommitLineData
e2641e09 1/*
2 * Copyright (c) 2009-2010, Salvatore Sanfilippo <antirez at gmail dot com>
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are met:
7 *
8 * * Redistributions of source code must retain the above copyright notice,
9 * this list of conditions and the following disclaimer.
10 * * Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
13 * * Neither the name of Redis nor the names of its contributors may be used
14 * to endorse or promote products derived from this software without
15 * specific prior written permission.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
18 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
21 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
22 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
23 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
24 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
25 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
26 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
27 * POSSIBILITY OF SUCH DAMAGE.
28 */
29
30#include "redis.h"
daa70b17 31#include "slowlog.h"
8f61a72f 32#include "bio.h"
e2641e09 33
e2641e09 34#include <time.h>
35#include <signal.h>
36#include <sys/wait.h>
37#include <errno.h>
38#include <assert.h>
39#include <ctype.h>
40#include <stdarg.h>
e2641e09 41#include <arpa/inet.h>
42#include <sys/stat.h>
43#include <fcntl.h>
44#include <sys/time.h>
45#include <sys/resource.h>
46#include <sys/uio.h>
47#include <limits.h>
48#include <float.h>
49#include <math.h>
2b00385d 50#include <sys/resource.h>
e2641e09 51
52/* Our shared "common" objects */
53
54struct sharedObjectsStruct shared;
55
c74b7c77 56/* Global vars that are actually used as constants. The following double
e2641e09 57 * values are used for double on-disk serialization, and are initialized
58 * at runtime to avoid strange compiler optimizations. */
59
60double R_Zero, R_PosInf, R_NegInf, R_Nan;
61
62/*================================= Globals ================================= */
63
c5757662
PH
64/* Alternate stack for SIGSEGV/etc handlers */
65char altstack[SIGSTKSZ];
66
e2641e09 67/* Global vars */
68struct redisServer server; /* server global state */
69struct redisCommand *commandTable;
5d02b00f 70
7501c66f 71/* Our command table.
72 *
73 * Every entry is composed of the following fields:
74 *
75 * name: a string representing the command name.
76 * function: pointer to the C function implementing the command.
77 * arity: number of arguments, it is possible to use -N to say >= N
78 * sflags: command flags as string. See below for a table of flags.
79 * flags: flags as bitmask. Computed by Redis using the 'sflags' field.
80 * get_keys_proc: an optional function to get key arguments from a command.
81 * This is only used when the following three fields are not
82 * enough to specify what arguments are keys.
83 * first_key_index: first argument that is a key
84 * last_key_index: last argument that is a key
85 * key_step: step to get all the keys from first to last argument. For instance
86 * in MSET the step is two since arguments are key,val,key,val,...
87 * microseconds: microseconds of total execution time for this command.
88 * calls: total number of calls of this command.
89 *
90 * The flags, microseconds and calls fields are computed by Redis and should
91 * always be set to zero.
92 *
93 * Command flags are expressed using strings where every character represents
94 * a flag. Later the populateCommandTable() function will take care of
95 * populating the real 'flags' field using this characters.
5d02b00f 96 *
97 * This is the meaning of the flags:
98 *
99 * w: write command (may modify the key space).
100 * r: read command (will never modify the key space).
101 * m: may increase memory usage once called. Don't allow if out of memory.
102 * a: admin command, like SAVE or SHUTDOWN.
103 * p: Pub/Sub related command.
b60ed6e8 104 * f: force replication of this command, regarless of server.dirty.
105 * s: command not allowed in scripts.
7e14a208 106 * R: random command. Command is not deterministic, that is, the same command
b60ed6e8 107 * with the same arguments, with the same key space, may have different
548efd91 108 * results. For instance SPOP and RANDOMKEY are two random commands.
109 * S: Sort command output array if called from script, so that the output
110 * is deterministic.
111 */
d7ed7fd2 112struct redisCommand redisCommandTable[] = {
5d02b00f 113 {"get",getCommand,2,"r",0,NULL,1,1,1,0,0},
114 {"set",setCommand,3,"wm",0,noPreloadGetKeys,1,1,1,0,0},
115 {"setnx",setnxCommand,3,"wm",0,noPreloadGetKeys,1,1,1,0,0},
39da5d1f 116 {"setex",setexCommand,4,"wm",0,noPreloadGetKeys,1,1,1,0,0},
117 {"psetex",psetexCommand,4,"wm",0,noPreloadGetKeys,1,1,1,0,0},
5d02b00f 118 {"append",appendCommand,3,"wm",0,NULL,1,1,1,0,0},
119 {"strlen",strlenCommand,2,"r",0,NULL,1,1,1,0,0},
120 {"del",delCommand,-2,"w",0,noPreloadGetKeys,1,-1,1,0,0},
121 {"exists",existsCommand,2,"r",0,NULL,1,1,1,0,0},
122 {"setbit",setbitCommand,4,"wm",0,NULL,1,1,1,0,0},
123 {"getbit",getbitCommand,3,"r",0,NULL,1,1,1,0,0},
124 {"setrange",setrangeCommand,4,"wm",0,NULL,1,1,1,0,0},
125 {"getrange",getrangeCommand,4,"r",0,NULL,1,1,1,0,0},
126 {"substr",getrangeCommand,4,"r",0,NULL,1,1,1,0,0},
127 {"incr",incrCommand,2,"wm",0,NULL,1,1,1,0,0},
128 {"decr",decrCommand,2,"wm",0,NULL,1,1,1,0,0},
129 {"mget",mgetCommand,-2,"r",0,NULL,1,-1,1,0,0},
130 {"rpush",rpushCommand,-3,"wm",0,NULL,1,1,1,0,0},
131 {"lpush",lpushCommand,-3,"wm",0,NULL,1,1,1,0,0},
132 {"rpushx",rpushxCommand,3,"wm",0,NULL,1,1,1,0,0},
133 {"lpushx",lpushxCommand,3,"wm",0,NULL,1,1,1,0,0},
134 {"linsert",linsertCommand,5,"wm",0,NULL,1,1,1,0,0},
135 {"rpop",rpopCommand,2,"w",0,NULL,1,1,1,0,0},
136 {"lpop",lpopCommand,2,"w",0,NULL,1,1,1,0,0},
e41677b4 137 {"brpop",brpopCommand,-3,"ws",0,NULL,1,1,1,0,0},
138 {"brpoplpush",brpoplpushCommand,4,"wms",0,NULL,1,2,1,0,0},
139 {"blpop",blpopCommand,-3,"ws",0,NULL,1,-2,1,0,0},
5d02b00f 140 {"llen",llenCommand,2,"r",0,NULL,1,1,1,0,0},
141 {"lindex",lindexCommand,3,"r",0,NULL,1,1,1,0,0},
142 {"lset",lsetCommand,4,"wm",0,NULL,1,1,1,0,0},
143 {"lrange",lrangeCommand,4,"r",0,NULL,1,1,1,0,0},
144 {"ltrim",ltrimCommand,4,"w",0,NULL,1,1,1,0,0},
145 {"lrem",lremCommand,4,"w",0,NULL,1,1,1,0,0},
146 {"rpoplpush",rpoplpushCommand,3,"wm",0,NULL,1,2,1,0,0},
147 {"sadd",saddCommand,-3,"wm",0,NULL,1,1,1,0,0},
148 {"srem",sremCommand,-3,"w",0,NULL,1,1,1,0,0},
149 {"smove",smoveCommand,4,"w",0,NULL,1,2,1,0,0},
150 {"sismember",sismemberCommand,3,"r",0,NULL,1,1,1,0,0},
151 {"scard",scardCommand,2,"r",0,NULL,1,1,1,0,0},
15ef6053 152 {"spop",spopCommand,2,"wRs",0,NULL,1,1,1,0,0},
b60ed6e8 153 {"srandmember",srandmemberCommand,2,"rR",0,NULL,1,1,1,0,0},
548efd91 154 {"sinter",sinterCommand,-2,"rS",0,NULL,1,-1,1,0,0},
1bcfa0f6 155 {"sinterstore",sinterstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
548efd91 156 {"sunion",sunionCommand,-2,"rS",0,NULL,1,-1,1,0,0},
1bcfa0f6 157 {"sunionstore",sunionstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
548efd91 158 {"sdiff",sdiffCommand,-2,"rS",0,NULL,1,-1,1,0,0},
1bcfa0f6 159 {"sdiffstore",sdiffstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
548efd91 160 {"smembers",sinterCommand,2,"rS",0,NULL,1,1,1,0,0},
5d02b00f 161 {"zadd",zaddCommand,-4,"wm",0,NULL,1,1,1,0,0},
162 {"zincrby",zincrbyCommand,4,"wm",0,NULL,1,1,1,0,0},
163 {"zrem",zremCommand,-3,"w",0,NULL,1,1,1,0,0},
164 {"zremrangebyscore",zremrangebyscoreCommand,4,"w",0,NULL,1,1,1,0,0},
165 {"zremrangebyrank",zremrangebyrankCommand,4,"w",0,NULL,1,1,1,0,0},
166 {"zunionstore",zunionstoreCommand,-4,"wm",0,zunionInterGetKeys,0,0,0,0,0},
167 {"zinterstore",zinterstoreCommand,-4,"wm",0,zunionInterGetKeys,0,0,0,0,0},
168 {"zrange",zrangeCommand,-4,"r",0,NULL,1,1,1,0,0},
169 {"zrangebyscore",zrangebyscoreCommand,-4,"r",0,NULL,1,1,1,0,0},
170 {"zrevrangebyscore",zrevrangebyscoreCommand,-4,"r",0,NULL,1,1,1,0,0},
171 {"zcount",zcountCommand,4,"r",0,NULL,1,1,1,0,0},
172 {"zrevrange",zrevrangeCommand,-4,"r",0,NULL,1,1,1,0,0},
173 {"zcard",zcardCommand,2,"r",0,NULL,1,1,1,0,0},
174 {"zscore",zscoreCommand,3,"r",0,NULL,1,1,1,0,0},
175 {"zrank",zrankCommand,3,"r",0,NULL,1,1,1,0,0},
176 {"zrevrank",zrevrankCommand,3,"r",0,NULL,1,1,1,0,0},
177 {"hset",hsetCommand,4,"wm",0,NULL,1,1,1,0,0},
178 {"hsetnx",hsetnxCommand,4,"wm",0,NULL,1,1,1,0,0},
179 {"hget",hgetCommand,3,"r",0,NULL,1,1,1,0,0},
180 {"hmset",hmsetCommand,-4,"wm",0,NULL,1,1,1,0,0},
181 {"hmget",hmgetCommand,-3,"r",0,NULL,1,1,1,0,0},
182 {"hincrby",hincrbyCommand,4,"wm",0,NULL,1,1,1,0,0},
68bfe993 183 {"hincrbyfloat",hincrbyfloatCommand,4,"wm",0,NULL,1,1,1,0,0},
5d02b00f 184 {"hdel",hdelCommand,-3,"w",0,NULL,1,1,1,0,0},
185 {"hlen",hlenCommand,2,"r",0,NULL,1,1,1,0,0},
548efd91 186 {"hkeys",hkeysCommand,2,"rS",0,NULL,1,1,1,0,0},
187 {"hvals",hvalsCommand,2,"rS",0,NULL,1,1,1,0,0},
5d02b00f 188 {"hgetall",hgetallCommand,2,"r",0,NULL,1,1,1,0,0},
189 {"hexists",hexistsCommand,3,"r",0,NULL,1,1,1,0,0},
190 {"incrby",incrbyCommand,3,"wm",0,NULL,1,1,1,0,0},
191 {"decrby",decrbyCommand,3,"wm",0,NULL,1,1,1,0,0},
5574b53e 192 {"incrbyfloat",incrbyfloatCommand,3,"wm",0,NULL,1,1,1,0,0},
5d02b00f 193 {"getset",getsetCommand,3,"wm",0,NULL,1,1,1,0,0},
194 {"mset",msetCommand,-3,"wm",0,NULL,1,-1,2,0,0},
195 {"msetnx",msetnxCommand,-3,"wm",0,NULL,1,-1,2,0,0},
b60ed6e8 196 {"randomkey",randomkeyCommand,1,"rR",0,NULL,0,0,0,0,0},
5d02b00f 197 {"select",selectCommand,2,"r",0,NULL,0,0,0,0,0},
198 {"move",moveCommand,3,"w",0,NULL,1,1,1,0,0},
199 {"rename",renameCommand,3,"w",0,renameGetKeys,1,2,1,0,0},
200 {"renamenx",renamenxCommand,3,"w",0,renameGetKeys,1,2,1,0,0},
12d293ca 201 {"expire",expireCommand,3,"w",0,NULL,1,1,1,0,0},
202 {"expireat",expireatCommand,3,"w",0,NULL,1,1,1,0,0},
203 {"pexpire",pexpireCommand,3,"w",0,NULL,1,1,1,0,0},
204 {"pexpireat",pexpireatCommand,3,"w",0,NULL,1,1,1,0,0},
548efd91 205 {"keys",keysCommand,2,"rS",0,NULL,0,0,0,0,0},
5d02b00f 206 {"dbsize",dbsizeCommand,1,"r",0,NULL,0,0,0,0,0},
e41677b4 207 {"auth",authCommand,2,"rs",0,NULL,0,0,0,0,0},
5d02b00f 208 {"ping",pingCommand,1,"r",0,NULL,0,0,0,0,0},
209 {"echo",echoCommand,2,"r",0,NULL,0,0,0,0,0},
e41677b4 210 {"save",saveCommand,1,"ars",0,NULL,0,0,0,0,0},
5d02b00f 211 {"bgsave",bgsaveCommand,1,"ar",0,NULL,0,0,0,0,0},
212 {"bgrewriteaof",bgrewriteaofCommand,1,"ar",0,NULL,0,0,0,0,0},
4ab8695d 213 {"shutdown",shutdownCommand,-1,"ar",0,NULL,0,0,0,0,0},
5d02b00f 214 {"lastsave",lastsaveCommand,1,"r",0,NULL,0,0,0,0,0},
215 {"type",typeCommand,2,"r",0,NULL,1,1,1,0,0},
b60ed6e8 216 {"multi",multiCommand,1,"rs",0,NULL,0,0,0,0,0},
f3fd419f 217 {"exec",execCommand,1,"s",0,NULL,0,0,0,0,0},
b60ed6e8 218 {"discard",discardCommand,1,"rs",0,NULL,0,0,0,0,0},
219 {"sync",syncCommand,1,"ars",0,NULL,0,0,0,0,0},
5d02b00f 220 {"flushdb",flushdbCommand,1,"w",0,NULL,0,0,0,0,0},
221 {"flushall",flushallCommand,1,"w",0,NULL,0,0,0,0,0},
2c861050 222 {"sort",sortCommand,-2,"wmS",0,NULL,1,1,1,0,0},
5d02b00f 223 {"info",infoCommand,-1,"r",0,NULL,0,0,0,0,0},
b60ed6e8 224 {"monitor",monitorCommand,1,"ars",0,NULL,0,0,0,0,0},
12d293ca 225 {"ttl",ttlCommand,2,"r",0,NULL,1,1,1,0,0},
226 {"pttl",pttlCommand,2,"r",0,NULL,1,1,1,0,0},
5d02b00f 227 {"persist",persistCommand,2,"w",0,NULL,1,1,1,0,0},
b60ed6e8 228 {"slaveof",slaveofCommand,3,"aws",0,NULL,0,0,0,0,0},
7dcdd281 229 {"debug",debugCommand,-2,"as",0,NULL,0,0,0,0,0},
5d02b00f 230 {"config",configCommand,-2,"ar",0,NULL,0,0,0,0,0},
b60ed6e8 231 {"subscribe",subscribeCommand,-2,"rps",0,NULL,0,0,0,0,0},
232 {"unsubscribe",unsubscribeCommand,-1,"rps",0,NULL,0,0,0,0,0},
233 {"psubscribe",psubscribeCommand,-2,"rps",0,NULL,0,0,0,0,0},
234 {"punsubscribe",punsubscribeCommand,-1,"rps",0,NULL,0,0,0,0,0},
bb0aadbe 235 {"publish",publishCommand,3,"pf",0,NULL,0,0,0,0,0},
b60ed6e8 236 {"watch",watchCommand,-2,"rs",0,noPreloadGetKeys,1,-1,1,0,0},
237 {"unwatch",unwatchCommand,1,"rs",0,NULL,0,0,0,0,0},
5d02b00f 238 {"cluster",clusterCommand,-2,"ar",0,NULL,0,0,0,0,0},
7afc3a96 239 {"restore",restoreCommand,4,"awm",0,NULL,1,1,1,0,0},
5d02b00f 240 {"migrate",migrateCommand,6,"aw",0,NULL,0,0,0,0,0},
6856c7b4 241 {"asking",askingCommand,1,"r",0,NULL,0,0,0,0,0},
1bcfa0f6 242 {"dump",dumpCommand,2,"ar",0,NULL,1,1,1,0,0},
243 {"object",objectCommand,-2,"r",0,NULL,2,2,2,0,0},
5d02b00f 244 {"client",clientCommand,-2,"ar",0,NULL,0,0,0,0,0},
f3fd419f 245 {"eval",evalCommand,-3,"s",0,zunionInterGetKeys,0,0,0,0,0},
246 {"evalsha",evalShaCommand,-3,"s",0,zunionInterGetKeys,0,0,0,0,0},
070e3945 247 {"slowlog",slowlogCommand,-2,"r",0,NULL,0,0,0,0,0},
9494f1f1 248 {"script",scriptCommand,-2,"ras",0,NULL,0,0,0,0,0},
249 {"time",timeCommand,1,"rR",0,NULL,0,0,0,0,0}
e2641e09 250};
251
252/*============================ Utility functions ============================ */
253
9c104c68 254/* Low level logging. To use only for very big messages, otherwise
255 * redisLog() is to prefer. */
256void redisLogRaw(int level, const char *msg) {
e1a586ee
JH
257 const int syslogLevelMap[] = { LOG_DEBUG, LOG_INFO, LOG_NOTICE, LOG_WARNING };
258 const char *c = ".-*#";
259 time_t now = time(NULL);
e2641e09 260 FILE *fp;
23072961 261 char buf[64];
996d503d 262 int rawmode = (level & REDIS_LOG_RAW);
23072961 263
996d503d 264 level &= 0xff; /* clear flags */
23072961 265 if (level < server.verbosity) return;
e2641e09 266
267 fp = (server.logfile == NULL) ? stdout : fopen(server.logfile,"a");
268 if (!fp) return;
269
996d503d 270 if (rawmode) {
271 fprintf(fp,"%s",msg);
272 } else {
273 strftime(buf,sizeof(buf),"%d %b %H:%M:%S",localtime(&now));
274 fprintf(fp,"[%d] %s %c %s\n",(int)getpid(),buf,c[level],msg);
275 }
e1a586ee
JH
276 fflush(fp);
277
e2641e09 278 if (server.logfile) fclose(fp);
e1a586ee
JH
279
280 if (server.syslog_enabled) syslog(syslogLevelMap[level], "%s", msg);
e2641e09 281}
282
9c104c68 283/* Like redisLogRaw() but with printf-alike support. This is the funciton that
284 * is used across the code. The raw version is only used in order to dump
285 * the INFO output on crash. */
286void redisLog(int level, const char *fmt, ...) {
287 va_list ap;
288 char msg[REDIS_MAX_LOGMSG_LEN];
289
996d503d 290 if ((level&0xff) < server.verbosity) return;
9c104c68 291
292 va_start(ap, fmt);
293 vsnprintf(msg, sizeof(msg), fmt, ap);
294 va_end(ap);
295
296 redisLogRaw(level,msg);
297}
298
a7d12cba 299/* Log a fixed message without printf-alike capabilities, in a way that is
300 * safe to call from a signal handler.
301 *
302 * We actually use this only for signals that are not fatal from the point
303 * of view of Redis. Signals that are going to kill the server anyway and
304 * where we need printf-alike features are served by redisLog(). */
305void redisLogFromHandler(int level, const char *msg) {
306 int fd;
307 char buf[64];
308
309 if ((level&0xff) < server.verbosity ||
310 (server.logfile == NULL && server.daemonize)) return;
311 fd = server.logfile ?
312 open(server.logfile, O_APPEND|O_CREAT|O_WRONLY, 0644) :
5471b8ba 313 STDOUT_FILENO;
a7d12cba 314 if (fd == -1) return;
315 ll2string(buf,sizeof(buf),getpid());
316 write(fd,"[",1);
317 write(fd,buf,strlen(buf));
318 write(fd," | signal handler] (",20);
319 ll2string(buf,sizeof(buf),time(NULL));
320 write(fd,buf,strlen(buf));
321 write(fd,") ",2);
322 write(fd,msg,strlen(msg));
323 write(fd,"\n",1);
5471b8ba 324 if (server.logfile) close(fd);
a7d12cba 325}
326
e2641e09 327/* Redis generally does not try to recover from out of memory conditions
328 * when allocating objects or strings, it is not clear if it will be possible
329 * to report this condition to the client since the networking layer itself
330 * is based on heap allocation for send buffers, so we simply abort.
331 * At least the code will be simpler to read... */
332void oom(const char *msg) {
333 redisLog(REDIS_WARNING, "%s: Out of memory\n",msg);
334 sleep(1);
335 abort();
336}
337
/* Return the UNIX time in microseconds, as reported by gettimeofday(). */
long long ustime(void) {
    struct timeval now;

    gettimeofday(&now, NULL);
    /* Widen the seconds before scaling so the product is computed in
     * long long. */
    return ((long long)now.tv_sec)*1000000 + now.tv_usec;
}
348
/* Return the UNIX time in milliseconds (ustime() with the sub-millisecond
 * part truncated). */
long long mstime(void) {
    long long usec = ustime();

    return usec/1000;
}
353
e2641e09 354/*====================== Hash table type implementation ==================== */
355
/* This is a hash table type that uses the SDS dynamic strings library as
 * keys and Redis objects as values (objects can hold SDS strings,
 * lists, sets). */
359
/* Dict destructor callback that releases 'val' with zfree().
 * 'privdata' is unused. */
void dictVanillaFree(void *privdata, void *val) {
    DICT_NOTUSED(privdata);
    zfree(val);
}
365
366void dictListDestructor(void *privdata, void *val)
367{
368 DICT_NOTUSED(privdata);
369 listRelease((list*)val);
370}
371
372int dictSdsKeyCompare(void *privdata, const void *key1,
373 const void *key2)
374{
375 int l1,l2;
376 DICT_NOTUSED(privdata);
377
378 l1 = sdslen((sds)key1);
379 l2 = sdslen((sds)key2);
380 if (l1 != l2) return 0;
381 return memcmp(key1, key2, l1) == 0;
382}
383
/* Case insensitive key comparison, used for the command lookup table.
 * Returns 1 when strcasecmp() reports the two keys as equal, 0 otherwise.
 * 'privdata' is unused. */
int dictSdsKeyCaseCompare(void *privdata, const void *key1,
        const void *key2)
{
    int differ;

    DICT_NOTUSED(privdata);
    differ = strcasecmp(key1, key2);
    return differ == 0;
}
392
/* Dict destructor callback for Redis objects: drops one reference from
 * 'val'. A NULL value is accepted and ignored (values of swapped out keys
 * are set to NULL). 'privdata' is unused. */
void dictRedisObjectDestructor(void *privdata, void *val) {
    DICT_NOTUSED(privdata);

    if (val != NULL) decrRefCount(val);
}
400
/* Dict destructor callback for sds strings: releases 'val' with sdsfree().
 * 'privdata' is unused. */
void dictSdsDestructor(void *privdata, void *val) {
    DICT_NOTUSED(privdata);
    sdsfree(val);
}
407
408int dictObjKeyCompare(void *privdata, const void *key1,
409 const void *key2)
410{
411 const robj *o1 = key1, *o2 = key2;
412 return dictSdsKeyCompare(privdata,o1->ptr,o2->ptr);
413}
414
415unsigned int dictObjHash(const void *key) {
416 const robj *o = key;
417 return dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
418}
419
/* Dict hash callback for sds keys: hashes all the bytes of the string. */
unsigned int dictSdsHash(const void *key) {
    size_t len = sdslen((char*)key);

    return dictGenHashFunction((unsigned char*)key, len);
}
423
/* Dict hash callback for sds keys that uses dictGenCaseHashFunction(); it is
 * the hash function of the command table dict type, whose key comparison is
 * case insensitive. */
unsigned int dictSdsCaseHash(const void *key) {
    size_t len = sdslen((char*)key);

    return dictGenCaseHashFunction((unsigned char*)key, len);
}
427
e2641e09 428int dictEncObjKeyCompare(void *privdata, const void *key1,
429 const void *key2)
430{
431 robj *o1 = (robj*) key1, *o2 = (robj*) key2;
432 int cmp;
433
434 if (o1->encoding == REDIS_ENCODING_INT &&
435 o2->encoding == REDIS_ENCODING_INT)
436 return o1->ptr == o2->ptr;
437
438 o1 = getDecodedObject(o1);
439 o2 = getDecodedObject(o2);
440 cmp = dictSdsKeyCompare(privdata,o1->ptr,o2->ptr);
441 decrRefCount(o1);
442 decrRefCount(o2);
443 return cmp;
444}
445
446unsigned int dictEncObjHash(const void *key) {
447 robj *o = (robj*) key;
448
449 if (o->encoding == REDIS_ENCODING_RAW) {
450 return dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
451 } else {
452 if (o->encoding == REDIS_ENCODING_INT) {
453 char buf[32];
454 int len;
455
456 len = ll2string(buf,32,(long)o->ptr);
457 return dictGenHashFunction((unsigned char*)buf, len);
458 } else {
459 unsigned int hash;
460
461 o = getDecodedObject(o);
462 hash = dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
463 decrRefCount(o);
464 return hash;
465 }
466 }
467}
468
4dd444bb 469/* Sets type hash table */
e2641e09 470dictType setDictType = {
471 dictEncObjHash, /* hash function */
472 NULL, /* key dup */
473 NULL, /* val dup */
474 dictEncObjKeyCompare, /* key compare */
475 dictRedisObjectDestructor, /* key destructor */
476 NULL /* val destructor */
477};
478
479/* Sorted sets hash (note: a skiplist is used in addition to the hash table) */
480dictType zsetDictType = {
481 dictEncObjHash, /* hash function */
482 NULL, /* key dup */
483 NULL, /* val dup */
484 dictEncObjKeyCompare, /* key compare */
485 dictRedisObjectDestructor, /* key destructor */
69ef89f2 486 NULL /* val destructor */
e2641e09 487};
488
489/* Db->dict, keys are sds strings, vals are Redis objects. */
490dictType dbDictType = {
491 dictSdsHash, /* hash function */
492 NULL, /* key dup */
493 NULL, /* val dup */
494 dictSdsKeyCompare, /* key compare */
495 dictSdsDestructor, /* key destructor */
496 dictRedisObjectDestructor /* val destructor */
497};
498
499/* Db->expires */
500dictType keyptrDictType = {
501 dictSdsHash, /* hash function */
502 NULL, /* key dup */
503 NULL, /* val dup */
504 dictSdsKeyCompare, /* key compare */
505 NULL, /* key destructor */
506 NULL /* val destructor */
507};
508
1b1f47c9 509/* Command table. sds string -> command struct pointer. */
510dictType commandTableDictType = {
511 dictSdsCaseHash, /* hash function */
512 NULL, /* key dup */
513 NULL, /* val dup */
514 dictSdsKeyCaseCompare, /* key compare */
515 dictSdsDestructor, /* key destructor */
516 NULL /* val destructor */
517};
518
e2641e09 519/* Hash type hash table (note that small hashes are represented with zimpaps) */
520dictType hashDictType = {
521 dictEncObjHash, /* hash function */
522 NULL, /* key dup */
523 NULL, /* val dup */
524 dictEncObjKeyCompare, /* key compare */
525 dictRedisObjectDestructor, /* key destructor */
526 dictRedisObjectDestructor /* val destructor */
527};
528
529/* Keylist hash table type has unencoded redis objects as keys and
530 * lists as values. It's used for blocking operations (BLPOP) and to
531 * map swapped keys to a list of clients waiting for this keys to be loaded. */
532dictType keylistDictType = {
533 dictObjHash, /* hash function */
534 NULL, /* key dup */
535 NULL, /* val dup */
536 dictObjKeyCompare, /* key compare */
537 dictRedisObjectDestructor, /* key destructor */
538 dictListDestructor /* val destructor */
539};
540
ecc91094 541/* Cluster nodes hash table, mapping nodes addresses 1.2.3.4:6379 to
542 * clusterNode structures. */
543dictType clusterNodesDictType = {
544 dictSdsHash, /* hash function */
545 NULL, /* key dup */
546 NULL, /* val dup */
547 dictSdsKeyCompare, /* key compare */
548 dictSdsDestructor, /* key destructor */
549 NULL /* val destructor */
550};
551
e2641e09 552int htNeedsResize(dict *dict) {
553 long long size, used;
554
555 size = dictSlots(dict);
556 used = dictSize(dict);
557 return (size && used && size > DICT_HT_INITIAL_SIZE &&
558 (used*100/size < REDIS_HT_MINFILL));
559}
560
561/* If the percentage of used slots in the HT reaches REDIS_HT_MINFILL
562 * we resize the hash table to save memory */
563void tryResizeHashTables(void) {
564 int j;
565
566 for (j = 0; j < server.dbnum; j++) {
567 if (htNeedsResize(server.db[j].dict))
568 dictResize(server.db[j].dict);
569 if (htNeedsResize(server.db[j].expires))
570 dictResize(server.db[j].expires);
571 }
572}
573
574/* Our hash table implementation performs rehashing incrementally while
575 * we write/read from the hash table. Still if the server is idle, the hash
576 * table will use two tables for a long time. So we try to use 1 millisecond
577 * of CPU time at every serverCron() loop in order to rehash some key. */
578void incrementallyRehash(void) {
579 int j;
580
581 for (j = 0; j < server.dbnum; j++) {
582 if (dictIsRehashing(server.db[j].dict)) {
583 dictRehashMilliseconds(server.db[j].dict,1);
584 break; /* already used our millisecond for this loop... */
585 }
586 }
587}
588
589/* This function is called once a background process of some kind terminates,
590 * as we want to avoid resizing the hash tables when there is a child in order
591 * to play well with copy-on-write (otherwise when a resize happens lots of
592 * memory pages are copied). The goal of this function is to update the ability
593 * for dict.c to resize the hash tables accordingly to the fact we have o not
594 * running childs. */
595void updateDictResizePolicy(void) {
f48cd4b9 596 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1)
e2641e09 597 dictEnableResize();
598 else
599 dictDisableResize();
600}
601
602/* ======================= Cron: called every 100 ms ======================== */
603
bcf2995c 604/* Try to expire a few timed out keys. The algorithm used is adaptive and
605 * will use few CPU cycles if there are few expiring keys, otherwise
606 * it will get more aggressive to avoid that too much memory is used by
607 * keys that can be removed from the keyspace. */
608void activeExpireCycle(void) {
609 int j;
610
611 for (j = 0; j < server.dbnum; j++) {
612 int expired;
613 redisDb *db = server.db+j;
614
615 /* Continue to expire if at the end of the cycle more than 25%
616 * of the keys were expired. */
617 do {
618 long num = dictSize(db->expires);
4be855e7 619 long long now = mstime();
bcf2995c 620
621 expired = 0;
622 if (num > REDIS_EXPIRELOOKUPS_PER_CRON)
623 num = REDIS_EXPIRELOOKUPS_PER_CRON;
624 while (num--) {
625 dictEntry *de;
4be855e7 626 long long t;
bcf2995c 627
628 if ((de = dictGetRandomKey(db->expires)) == NULL) break;
4be855e7 629 t = dictGetSignedIntegerVal(de);
bcf2995c 630 if (now > t) {
c0ba9ebe 631 sds key = dictGetKey(de);
bcf2995c 632 robj *keyobj = createStringObject(key,sdslen(key));
633
634 propagateExpire(db,keyobj);
635 dbDelete(db,keyobj);
636 decrRefCount(keyobj);
637 expired++;
638 server.stat_expiredkeys++;
639 }
640 }
641 } while (expired > REDIS_EXPIRELOOKUPS_PER_CRON/4);
642 }
643}
644
165346ca 645void updateLRUClock(void) {
d1949054 646 server.lruclock = (server.unixtime/REDIS_LRU_CLOCK_RESOLUTION) &
165346ca 647 REDIS_LRU_CLOCK_MAX;
648}
bcf2995c 649
250e7f69 650
651/* Add a sample to the operations per second array of samples. */
652void trackOperationsPerSecond(void) {
653 long long t = mstime() - server.ops_sec_last_sample_time;
654 long long ops = server.stat_numcommands - server.ops_sec_last_sample_ops;
655 long long ops_sec;
656
657 ops_sec = t > 0 ? (ops*1000/t) : 0;
658
659 server.ops_sec_samples[server.ops_sec_idx] = ops_sec;
660 server.ops_sec_idx = (server.ops_sec_idx+1) % REDIS_OPS_SEC_SAMPLES;
661 server.ops_sec_last_sample_time = mstime();
662 server.ops_sec_last_sample_ops = server.stat_numcommands;
663}
664
665/* Return the mean of all the samples. */
666long long getOperationsPerSecond(void) {
667 int j;
668 long long sum = 0;
669
670 for (j = 0; j < REDIS_OPS_SEC_SAMPLES; j++)
671 sum += server.ops_sec_samples[j];
672 return sum / REDIS_OPS_SEC_SAMPLES;
673}
674
c9d3dda2 675/* Check for timeouts. Returns non-zero if the client was terminated */
676int clientsCronHandleTimeout(redisClient *c) {
ae22bf1e 677 time_t now = server.unixtime;
d19015be 678
679 if (server.maxidletime &&
680 !(c->flags & REDIS_SLAVE) && /* no timeout for slaves */
681 !(c->flags & REDIS_MASTER) && /* no timeout for masters */
682 !(c->flags & REDIS_BLOCKED) && /* no timeout for BLPOP */
683 dictSize(c->pubsub_channels) == 0 && /* no timeout for pubsub */
684 listLength(c->pubsub_patterns) == 0 &&
685 (now - c->lastinteraction > server.maxidletime))
686 {
687 redisLog(REDIS_VERBOSE,"Closing idle client");
688 freeClient(c);
c9d3dda2 689 return 1;
d19015be 690 } else if (c->flags & REDIS_BLOCKED) {
691 if (c->bpop.timeout != 0 && c->bpop.timeout < now) {
692 addReply(c,shared.nullmultibulk);
693 unblockClientWaitingData(c);
694 }
695 }
c9d3dda2 696 return 0;
d19015be 697}
698
ae22bf1e 699/* The client query buffer is an sds.c string that can end with a lot of
c9d3dda2 700 * free space not used, this function reclaims space if needed.
701 *
702 * The funciton always returns 0 as it never terminates the client. */
703int clientsCronResizeQueryBuffer(redisClient *c) {
ae22bf1e 704 size_t querybuf_size = sdsAllocSize(c->querybuf);
705 time_t idletime = server.unixtime - c->lastinteraction;
706
707 /* There are two conditions to resize the query buffer:
708 * 1) Query buffer is > BIG_ARG and too big for latest peak.
709 * 2) Client is inactive and the buffer is bigger than 1k. */
710 if (((querybuf_size > REDIS_MBULK_BIG_ARG) &&
711 (querybuf_size/(c->querybuf_peak+1)) > 2) ||
712 (querybuf_size > 1024 && idletime > 2))
713 {
714 /* Only resize the query buffer if it is actually wasting space. */
715 if (sdsavail(c->querybuf) > 1024) {
716 c->querybuf = sdsRemoveFreeSpace(c->querybuf);
717 }
718 }
719 /* Reset the peak again to capture the peak memory usage in the next
720 * cycle. */
721 c->querybuf_peak = 0;
c9d3dda2 722 return 0;
ae22bf1e 723}
724
d19015be 725void clientsCron(void) {
726 /* Make sure to process at least 1/100 of clients per call.
727 * Since this function is called 10 times per second we are sure that
728 * in the worst case we process all the clients in 10 seconds.
729 * In normal conditions (a reasonable number of clients) we process
730 * all the clients in a shorter time. */
ae22bf1e 731 int numclients = listLength(server.clients);
732 int iterations = numclients/100;
d19015be 733
ae22bf1e 734 if (iterations < 50)
735 iterations = (numclients < 50) ? numclients : 50;
d19015be 736 while(listLength(server.clients) && iterations--) {
737 redisClient *c;
738 listNode *head;
739
740 /* Rotate the list, take the current head, process.
741 * This way if the client must be removed from the list it's the
742 * first element and we don't incur into O(N) computation. */
743 listRotate(server.clients);
744 head = listFirst(server.clients);
745 c = listNodeValue(head);
c9d3dda2 746 /* The following functions do different service checks on the client.
747 * The protocol is that they return non-zero if the client was
748 * terminated. */
749 if (clientsCronHandleTimeout(c)) continue;
750 if (clientsCronResizeQueryBuffer(c)) continue;
d19015be 751 }
752}
753
e2641e09 754int serverCron(struct aeEventLoop *eventLoop, long long id, void *clientData) {
89a1433e 755 int j, loops = server.cronloops;
e2641e09 756 REDIS_NOTUSED(eventLoop);
757 REDIS_NOTUSED(id);
758 REDIS_NOTUSED(clientData);
759
39bd025c 760 /* Software watchdog: deliver the SIGALRM that will reach the signal
761 * handler if we don't return here fast enough. */
762 if (server.watchdog_period) watchdogScheduleSignal(server.watchdog_period);
763
e2641e09 764 /* We take a cached value of the unix time in the global state because
765 * with virtual memory and aging there is to store the current time
766 * in objects at every object access, and accuracy is not needed.
767 * To access a global var is faster than calling time(NULL) */
768 server.unixtime = time(NULL);
4f06867a 769
250e7f69 770 trackOperationsPerSecond();
771
ef59a8bc 772 /* We have just 22 bits per object for LRU information.
165346ca 773 * So we use an (eventually wrapping) LRU clock with 10 seconds resolution.
774 * 2^22 bits with 10 seconds resoluton is more or less 1.5 years.
e2641e09 775 *
165346ca 776 * Note that even if this will wrap after 1.5 years it's not a problem,
ef59a8bc 777 * everything will still work but just some object will appear younger
165346ca 778 * to Redis. But for this to happen a given object should never be touched
779 * for 1.5 years.
780 *
781 * Note that you can change the resolution altering the
782 * REDIS_LRU_CLOCK_RESOLUTION define.
e2641e09 783 */
165346ca 784 updateLRUClock();
e2641e09 785
17b24ff3 786 /* Record the max memory used since the server was started. */
787 if (zmalloc_used_memory() > server.stat_peak_memory)
788 server.stat_peak_memory = zmalloc_used_memory();
789
e2641e09 790 /* We received a SIGTERM, shutting down here in a safe way, as it is
791 * not ok doing so inside the signal handler. */
792 if (server.shutdown_asap) {
4ab8695d 793 if (prepareForShutdown(0) == REDIS_OK) exit(0);
e2641e09 794 redisLog(REDIS_WARNING,"SIGTERM received but errors trying to shut down the server, check the logs for more information");
795 }
796
797 /* Show some info about non-empty databases */
798 for (j = 0; j < server.dbnum; j++) {
799 long long size, used, vkeys;
800
801 size = dictSlots(server.db[j].dict);
802 used = dictSize(server.db[j].dict);
803 vkeys = dictSize(server.db[j].expires);
804 if (!(loops % 50) && (used || vkeys)) {
805 redisLog(REDIS_VERBOSE,"DB %d: %lld keys (%lld volatile) in %lld slots HT.",j,used,vkeys,size);
806 /* dictPrintStats(server.dict); */
807 }
808 }
809
810 /* We don't want to resize the hash tables while a bacground saving
811 * is in progress: the saving child is created using fork() that is
812 * implemented with a copy-on-write semantic in most modern systems, so
813 * if we resize the HT while there is the saving child at work actually
814 * a lot of memory movements in the parent will cause a lot of pages
815 * copied. */
f48cd4b9 816 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1) {
e2641e09 817 if (!(loops % 10)) tryResizeHashTables();
818 if (server.activerehashing) incrementallyRehash();
819 }
820
821 /* Show information about connected clients */
822 if (!(loops % 50)) {
823 redisLog(REDIS_VERBOSE,"%d clients connected (%d slaves), %zu bytes in use",
824 listLength(server.clients)-listLength(server.slaves),
825 listLength(server.slaves),
ca734d17 826 zmalloc_used_memory());
e2641e09 827 }
828
d19015be 829 /* We need to do a few operations on clients asynchronously. */
830 clientsCron();
e2641e09 831
b333e239 832 /* Start a scheduled AOF rewrite if this was requested by the user while
833 * a BGSAVE was in progress. */
f48cd4b9 834 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1 &&
2c915bcf 835 server.aof_rewrite_scheduled)
b333e239 836 {
837 rewriteAppendOnlyFileBackground();
838 }
839
f03fe802 840 /* Check if a background saving or AOF rewrite in progress terminated. */
f48cd4b9 841 if (server.rdb_child_pid != -1 || server.aof_child_pid != -1) {
e2641e09 842 int statloc;
843 pid_t pid;
844
845 if ((pid = wait3(&statloc,WNOHANG,NULL)) != 0) {
36c17a53 846 int exitcode = WEXITSTATUS(statloc);
847 int bysignal = 0;
848
849 if (WIFSIGNALED(statloc)) bysignal = WTERMSIG(statloc);
850
f48cd4b9 851 if (pid == server.rdb_child_pid) {
36c17a53 852 backgroundSaveDoneHandler(exitcode,bysignal);
e2641e09 853 } else {
36c17a53 854 backgroundRewriteDoneHandler(exitcode,bysignal);
e2641e09 855 }
856 updateDictResizePolicy();
857 }
c9d0c362 858 } else {
b333e239 859 /* If there is not a background saving/rewrite in progress check if
860 * we have to save/rewrite now */
e2641e09 861 for (j = 0; j < server.saveparamslen; j++) {
862 struct saveparam *sp = server.saveparams+j;
863
864 if (server.dirty >= sp->changes &&
d1949054 865 server.unixtime-server.lastsave > sp->seconds) {
e2641e09 866 redisLog(REDIS_NOTICE,"%d changes in %d seconds. Saving...",
867 sp->changes, sp->seconds);
f48cd4b9 868 rdbSaveBackground(server.rdb_filename);
e2641e09 869 break;
870 }
871 }
b333e239 872
873 /* Trigger an AOF rewrite if needed */
f48cd4b9 874 if (server.rdb_child_pid == -1 &&
ff2145ad 875 server.aof_child_pid == -1 &&
2c915bcf 876 server.aof_rewrite_perc &&
877 server.aof_current_size > server.aof_rewrite_min_size)
b333e239 878 {
2c915bcf 879 long long base = server.aof_rewrite_base_size ?
880 server.aof_rewrite_base_size : 1;
881 long long growth = (server.aof_current_size*100/base) - 100;
882 if (growth >= server.aof_rewrite_perc) {
19b46c9a 883 redisLog(REDIS_NOTICE,"Starting automatic rewriting of AOF on %lld%% growth",growth);
b333e239 884 rewriteAppendOnlyFileBackground();
885 }
886 }
e2641e09 887 }
888
db3c2a4f 889
890 /* If we postponed an AOF buffer flush, let's try to do it every time the
891 * cron function is called. */
892 if (server.aof_flush_postponed_start) flushAppendOnlyFile(0);
893
bcf2995c 894 /* Expire a few keys per cycle, only if this is a master.
895 * On slaves we wait for DEL operations synthesized by the master
896 * in order to guarantee a strict consistency. */
897 if (server.masterhost == NULL) activeExpireCycle();
e2641e09 898
8c43e663 899 /* Close clients that need to be closed asynchronous */
900 freeClientsInAsyncFreeQueue();
901
f4aa600b 902 /* Replication cron function -- used to reconnect to master and
903 * to detect transfer failures. */
62ec599c 904 if (!(loops % 10)) replicationCron();
f4aa600b 905
ecc91094 906 /* Run other sub-systems specific cron jobs */
907 if (server.cluster_enabled && !(loops % 10)) clusterCron();
908
89a1433e 909 server.cronloops++;
e2641e09 910 return 100;
911}
912
913/* This function gets called every time Redis is entering the
914 * main loop of the event driven library, that is, before to sleep
915 * for ready file descriptors. */
916void beforeSleep(struct aeEventLoop *eventLoop) {
917 REDIS_NOTUSED(eventLoop);
a4ce7581
PN
918 listNode *ln;
919 redisClient *c;
e2641e09 920
a4ce7581
PN
921 /* Try to process pending commands for clients that were just unblocked. */
922 while (listLength(server.unblocked_clients)) {
923 ln = listFirst(server.unblocked_clients);
924 redisAssert(ln != NULL);
925 c = ln->value;
926 listDelNode(server.unblocked_clients,ln);
3bcffcbe 927 c->flags &= ~REDIS_UNBLOCKED;
a4ce7581
PN
928
929 /* Process remaining data in the input buffer. */
00010fa9 930 if (c->querybuf && sdslen(c->querybuf) > 0) {
931 server.current_client = c;
a4ce7581 932 processInputBuffer(c);
00010fa9 933 server.current_client = NULL;
934 }
a4ce7581
PN
935 }
936
e2641e09 937 /* Write the AOF buffer on disk */
db3c2a4f 938 flushAppendOnlyFile(0);
e2641e09 939}
940
941/* =========================== Server initialization ======================== */
942
943void createSharedObjects(void) {
944 int j;
945
946 shared.crlf = createObject(REDIS_STRING,sdsnew("\r\n"));
947 shared.ok = createObject(REDIS_STRING,sdsnew("+OK\r\n"));
948 shared.err = createObject(REDIS_STRING,sdsnew("-ERR\r\n"));
949 shared.emptybulk = createObject(REDIS_STRING,sdsnew("$0\r\n\r\n"));
950 shared.czero = createObject(REDIS_STRING,sdsnew(":0\r\n"));
951 shared.cone = createObject(REDIS_STRING,sdsnew(":1\r\n"));
952 shared.cnegone = createObject(REDIS_STRING,sdsnew(":-1\r\n"));
953 shared.nullbulk = createObject(REDIS_STRING,sdsnew("$-1\r\n"));
954 shared.nullmultibulk = createObject(REDIS_STRING,sdsnew("*-1\r\n"));
955 shared.emptymultibulk = createObject(REDIS_STRING,sdsnew("*0\r\n"));
956 shared.pong = createObject(REDIS_STRING,sdsnew("+PONG\r\n"));
957 shared.queued = createObject(REDIS_STRING,sdsnew("+QUEUED\r\n"));
958 shared.wrongtypeerr = createObject(REDIS_STRING,sdsnew(
959 "-ERR Operation against a key holding the wrong kind of value\r\n"));
960 shared.nokeyerr = createObject(REDIS_STRING,sdsnew(
961 "-ERR no such key\r\n"));
962 shared.syntaxerr = createObject(REDIS_STRING,sdsnew(
963 "-ERR syntax error\r\n"));
964 shared.sameobjecterr = createObject(REDIS_STRING,sdsnew(
965 "-ERR source and destination objects are the same\r\n"));
966 shared.outofrangeerr = createObject(REDIS_STRING,sdsnew(
967 "-ERR index out of range\r\n"));
7229d60d 968 shared.noscripterr = createObject(REDIS_STRING,sdsnew(
969 "-NOSCRIPT No matching script. Please use EVAL.\r\n"));
97e7f8ae 970 shared.loadingerr = createObject(REDIS_STRING,sdsnew(
971 "-LOADING Redis is loading the dataset in memory\r\n"));
115e3ff3 972 shared.slowscripterr = createObject(REDIS_STRING,sdsnew(
4ab8695d 973 "-BUSY Redis is busy running a script. You can only call SCRIPT KILL or SHUTDOWN NOSAVE.\r\n"));
c25e7eaf 974 shared.bgsaveerr = createObject(REDIS_STRING,sdsnew(
f3fd419f 975 "-MISCONF Redis is configured to save RDB snapshots, but is currently not able to persist on disk. Commands that may modify the data set are disabled. Please check Redis logs for details about the error.\r\n"));
976 shared.roslaveerr = createObject(REDIS_STRING,sdsnew(
977 "-READONLY You can't write against a read only slave.\r\n"));
b22eab8f 978 shared.oomerr = createObject(REDIS_STRING,sdsnew(
979 "-OOM command not allowed when used memory > 'maxmemory'.\r\n"));
e2641e09 980 shared.space = createObject(REDIS_STRING,sdsnew(" "));
981 shared.colon = createObject(REDIS_STRING,sdsnew(":"));
982 shared.plus = createObject(REDIS_STRING,sdsnew("+"));
f892797e
JJ
983
984 for (j = 0; j < REDIS_SHARED_SELECT_CMDS; j++) {
985 shared.select[j] = createObject(REDIS_STRING,
986 sdscatprintf(sdsempty(),"select %d\r\n", j));
987 }
e2641e09 988 shared.messagebulk = createStringObject("$7\r\nmessage\r\n",13);
989 shared.pmessagebulk = createStringObject("$8\r\npmessage\r\n",14);
990 shared.subscribebulk = createStringObject("$9\r\nsubscribe\r\n",15);
991 shared.unsubscribebulk = createStringObject("$11\r\nunsubscribe\r\n",18);
992 shared.psubscribebulk = createStringObject("$10\r\npsubscribe\r\n",17);
993 shared.punsubscribebulk = createStringObject("$12\r\npunsubscribe\r\n",19);
355f8591 994 shared.del = createStringObject("DEL",3);
c1db214e 995 shared.rpop = createStringObject("RPOP",4);
996 shared.lpop = createStringObject("LPOP",4);
e2641e09 997 for (j = 0; j < REDIS_SHARED_INTEGERS; j++) {
998 shared.integers[j] = createObject(REDIS_STRING,(void*)(long)j);
999 shared.integers[j]->encoding = REDIS_ENCODING_INT;
1000 }
355f8591 1001 for (j = 0; j < REDIS_SHARED_BULKHDR_LEN; j++) {
1002 shared.mbulkhdr[j] = createObject(REDIS_STRING,
1003 sdscatprintf(sdsempty(),"*%d\r\n",j));
1004 shared.bulkhdr[j] = createObject(REDIS_STRING,
1005 sdscatprintf(sdsempty(),"$%d\r\n",j));
1006 }
e2641e09 1007}
1008
1009void initServerConfig() {
91d664d6 1010 getRandomHexChars(server.runid,REDIS_RUN_ID_SIZE);
1011 server.runid[REDIS_RUN_ID_SIZE] = '\0';
75eaac5c 1012 server.arch_bits = (sizeof(long) == 8) ? 64 : 32;
e2641e09 1013 server.port = REDIS_SERVERPORT;
a5639e7d 1014 server.bindaddr = NULL;
5d10923f 1015 server.unixsocket = NULL;
85238765 1016 server.unixsocketperm = 0;
a5639e7d
PN
1017 server.ipfd = -1;
1018 server.sofd = -1;
1019 server.dbnum = REDIS_DEFAULT_DBNUM;
c6f9ee88 1020 server.verbosity = REDIS_NOTICE;
e2641e09 1021 server.maxidletime = REDIS_MAXIDLETIME;
becf5fdb 1022 server.client_max_querybuf_len = REDIS_MAX_QUERYBUF_LEN;
e2641e09 1023 server.saveparams = NULL;
97e7f8ae 1024 server.loading = 0;
e2641e09 1025 server.logfile = NULL; /* NULL = log on standard output */
e1a586ee
JH
1026 server.syslog_enabled = 0;
1027 server.syslog_ident = zstrdup("redis");
1028 server.syslog_facility = LOG_LOCAL0;
e2641e09 1029 server.daemonize = 0;
e394114d 1030 server.aof_state = REDIS_AOF_OFF;
2c915bcf 1031 server.aof_fsync = AOF_FSYNC_EVERYSEC;
1032 server.aof_no_fsync_on_rewrite = 0;
1033 server.aof_rewrite_perc = REDIS_AOF_REWRITE_PERC;
1034 server.aof_rewrite_min_size = REDIS_AOF_REWRITE_MIN_SIZE;
1035 server.aof_rewrite_base_size = 0;
1036 server.aof_rewrite_scheduled = 0;
ff2145ad 1037 server.aof_last_fsync = time(NULL);
c1d01b3c 1038 server.aof_delayed_fsync = 0;
ff2145ad 1039 server.aof_fd = -1;
1040 server.aof_selected_db = -1; /* Make sure the first time will not match */
db3c2a4f 1041 server.aof_flush_postponed_start = 0;
e2641e09 1042 server.pidfile = zstrdup("/var/run/redis.pid");
f48cd4b9 1043 server.rdb_filename = zstrdup("dump.rdb");
2c915bcf 1044 server.aof_filename = zstrdup("appendonly.aof");
e2641e09 1045 server.requirepass = NULL;
f48cd4b9 1046 server.rdb_compression = 1;
e2641e09 1047 server.activerehashing = 1;
58732c23 1048 server.maxclients = REDIS_MAX_CLIENTS;
5fa95ad7 1049 server.bpop_blocked_clients = 0;
e2641e09 1050 server.maxmemory = 0;
165346ca 1051 server.maxmemory_policy = REDIS_MAXMEMORY_VOLATILE_LRU;
1052 server.maxmemory_samples = 3;
ebd85e9a
PN
1053 server.hash_max_ziplist_entries = REDIS_HASH_MAX_ZIPLIST_ENTRIES;
1054 server.hash_max_ziplist_value = REDIS_HASH_MAX_ZIPLIST_VALUE;
e2641e09 1055 server.list_max_ziplist_entries = REDIS_LIST_MAX_ZIPLIST_ENTRIES;
1056 server.list_max_ziplist_value = REDIS_LIST_MAX_ZIPLIST_VALUE;
96ffb2fe 1057 server.set_max_intset_entries = REDIS_SET_MAX_INTSET_ENTRIES;
3ea204e1
PN
1058 server.zset_max_ziplist_entries = REDIS_ZSET_MAX_ZIPLIST_ENTRIES;
1059 server.zset_max_ziplist_value = REDIS_ZSET_MAX_ZIPLIST_VALUE;
e2641e09 1060 server.shutdown_asap = 0;
aeecbdfa 1061 server.repl_ping_slave_period = REDIS_REPL_PING_SLAVE_PERIOD;
1062 server.repl_timeout = REDIS_REPL_TIMEOUT;
ecc91094 1063 server.cluster_enabled = 0;
ef21ab96 1064 server.cluster.configfile = zstrdup("nodes.conf");
4ab8695d 1065 server.lua_caller = NULL;
eeffcf38 1066 server.lua_time_limit = REDIS_LUA_TIME_LIMIT;
070e3945 1067 server.lua_client = NULL;
115e3ff3 1068 server.lua_timedout = 0;
e2641e09 1069
95506e46 1070 updateLRUClock();
e2641e09 1071 resetServerSaveParams();
1072
1073 appendServerSaveParams(60*60,1); /* save after 1 hour and 1 change */
1074 appendServerSaveParams(300,100); /* save after 5 minutes and 100 changes */
1075 appendServerSaveParams(60,10000); /* save after 1 minute and 10000 changes */
1076 /* Replication related */
e2641e09 1077 server.masterauth = NULL;
1078 server.masterhost = NULL;
1079 server.masterport = 6379;
1080 server.master = NULL;
1844f990 1081 server.repl_state = REDIS_REPL_NONE;
890a2ed9 1082 server.repl_syncio_timeout = REDIS_REPL_SYNCIO_TIMEOUT;
4ebfc455 1083 server.repl_serve_stale_data = 1;
f3fd419f 1084 server.repl_slave_ro = 1;
07486df6 1085 server.repl_down_since = -1;
e2641e09 1086
7eac2a75 1087 /* Client output buffer limits */
1088 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].hard_limit_bytes = 0;
1089 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].soft_limit_bytes = 0;
1090 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].soft_limit_seconds = 0;
c8a607f2 1091 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].hard_limit_bytes = 1024*1024*256;
1092 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].soft_limit_bytes = 1024*1024*64;
7eac2a75 1093 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].soft_limit_seconds = 60;
c8a607f2 1094 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].hard_limit_bytes = 1024*1024*32;
1095 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].soft_limit_bytes = 1024*1024*8;
7eac2a75 1096 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].soft_limit_seconds = 60;
1097
e2641e09 1098 /* Double constants initialization */
1099 R_Zero = 0.0;
1100 R_PosInf = 1.0/R_Zero;
1101 R_NegInf = -1.0/R_Zero;
1102 R_Nan = R_Zero/R_Zero;
8d3e063a 1103
1104 /* Command table -- we intiialize it here as it is part of the
1105 * initial configuration, since command names may be changed via
1106 * redis.conf using the rename-command directive. */
1107 server.commands = dictCreate(&commandTableDictType,NULL);
1108 populateCommandTable();
1109 server.delCommand = lookupCommandByCString("del");
1110 server.multiCommand = lookupCommandByCString("multi");
eeb34eff 1111 server.lpushCommand = lookupCommandByCString("lpush");
daa70b17 1112
1113 /* Slow log */
1114 server.slowlog_log_slower_than = REDIS_SLOWLOG_LOG_SLOWER_THAN;
1115 server.slowlog_max_len = REDIS_SLOWLOG_MAX_LEN;
fa5af017 1116
39bd025c 1117 /* Debugging */
fa5af017 1118 server.assert_failed = "<no assertion failed>";
1119 server.assert_file = "<no file>";
1120 server.assert_line = 0;
1121 server.bug_report_start = 0;
39bd025c 1122 server.watchdog_period = 0;
e2641e09 1123}
1124
e074416b 1125/* This function will try to raise the max number of open files accordingly to
1126 * the configured max number of clients. It will also account for 32 additional
1127 * file descriptors as we need a few more for persistence, listening
1128 * sockets, log files and so forth.
1129 *
1130 * If it will not be possible to set the limit accordingly to the configured
1131 * max number of clients, the function will do the reverse setting
1132 * server.maxclients to the value that we can actually handle. */
1133void adjustOpenFilesLimit(void) {
1134 rlim_t maxfiles = server.maxclients+32;
1135 struct rlimit limit;
1136
1137 if (maxfiles < 1024) maxfiles = 1024;
1138 if (getrlimit(RLIMIT_NOFILE,&limit) == -1) {
1139 redisLog(REDIS_WARNING,"Unable to obtain the current NOFILE limit (%s), assuming 1024 and setting the max clients configuration accordingly.",
1140 strerror(errno));
1141 server.maxclients = 1024-32;
1142 } else {
1143 rlim_t oldlimit = limit.rlim_cur;
1144
1145 /* Set the max number of files if the current limit is not enough
1146 * for our needs. */
1147 if (oldlimit < maxfiles) {
e7957ca6 1148 rlim_t f;
1149
1150 f = maxfiles;
1151 while(f > oldlimit) {
1152 limit.rlim_cur = f;
1153 limit.rlim_max = f;
1154 if (setrlimit(RLIMIT_NOFILE,&limit) != -1) break;
1155 f -= 128;
1156 }
1157 if (f < oldlimit) f = oldlimit;
1158 if (f != maxfiles) {
1159 server.maxclients = f-32;
e074416b 1160 redisLog(REDIS_WARNING,"Unable to set the max number of files limit to %d (%s), setting the max clients configuration to %d.",
1161 (int) maxfiles, strerror(errno), (int) server.maxclients);
1162 } else {
1163 redisLog(REDIS_NOTICE,"Max number of open files set to %d",
1164 (int) maxfiles);
1165 }
1166 }
1167 }
1168}
1169
e2641e09 1170void initServer() {
1171 int j;
1172
1173 signal(SIGHUP, SIG_IGN);
1174 signal(SIGPIPE, SIG_IGN);
633a9410 1175 setupSignalHandlers();
e2641e09 1176
e1a586ee
JH
1177 if (server.syslog_enabled) {
1178 openlog(server.syslog_ident, LOG_PID | LOG_NDELAY | LOG_NOWAIT,
1179 server.syslog_facility);
1180 }
1181
00010fa9 1182 server.current_client = NULL;
e2641e09 1183 server.clients = listCreate();
7eac2a75 1184 server.clients_to_close = listCreate();
e2641e09 1185 server.slaves = listCreate();
1186 server.monitors = listCreate();
a4ce7581 1187 server.unblocked_clients = listCreate();
cea8c5cd 1188
e2641e09 1189 createSharedObjects();
e074416b 1190 adjustOpenFilesLimit();
1191 server.el = aeCreateEventLoop(server.maxclients+1024);
e2641e09 1192 server.db = zmalloc(sizeof(redisDb)*server.dbnum);
68d6345d 1193
a53b4c24 1194 if (server.port != 0) {
68d6345d 1195 server.ipfd = anetTcpServer(server.neterr,server.port,server.bindaddr);
a53b4c24 1196 if (server.ipfd == ANET_ERR) {
eef17490 1197 redisLog(REDIS_WARNING, "Opening port %d: %s",
1198 server.port, server.neterr);
a53b4c24 1199 exit(1);
1200 }
a5639e7d 1201 }
5d10923f
PN
1202 if (server.unixsocket != NULL) {
1203 unlink(server.unixsocket); /* don't care if this fails */
85238765 1204 server.sofd = anetUnixServer(server.neterr,server.unixsocket,server.unixsocketperm);
a5639e7d
PN
1205 if (server.sofd == ANET_ERR) {
1206 redisLog(REDIS_WARNING, "Opening socket: %s", server.neterr);
1207 exit(1);
1208 }
c61e6925 1209 }
a5639e7d
PN
1210 if (server.ipfd < 0 && server.sofd < 0) {
1211 redisLog(REDIS_WARNING, "Configured to not listen anywhere, exiting.");
e2641e09 1212 exit(1);
1213 }
1214 for (j = 0; j < server.dbnum; j++) {
1215 server.db[j].dict = dictCreate(&dbDictType,NULL);
1216 server.db[j].expires = dictCreate(&keyptrDictType,NULL);
1217 server.db[j].blocking_keys = dictCreate(&keylistDictType,NULL);
1218 server.db[j].watched_keys = dictCreate(&keylistDictType,NULL);
e2641e09 1219 server.db[j].id = j;
1220 }
1221 server.pubsub_channels = dictCreate(&keylistDictType,NULL);
1222 server.pubsub_patterns = listCreate();
1223 listSetFreeMethod(server.pubsub_patterns,freePubsubPattern);
1224 listSetMatchMethod(server.pubsub_patterns,listMatchPubsubPattern);
1225 server.cronloops = 0;
f48cd4b9 1226 server.rdb_child_pid = -1;
ff2145ad 1227 server.aof_child_pid = -1;
1228 server.aof_rewrite_buf = sdsempty();
1229 server.aof_buf = sdsempty();
e2641e09 1230 server.lastsave = time(NULL);
1231 server.dirty = 0;
1232 server.stat_numcommands = 0;
1233 server.stat_numconnections = 0;
1234 server.stat_expiredkeys = 0;
f21779ff 1235 server.stat_evictedkeys = 0;
e2641e09 1236 server.stat_starttime = time(NULL);
53eeeaff 1237 server.stat_keyspace_misses = 0;
1238 server.stat_keyspace_hits = 0;
17b24ff3 1239 server.stat_peak_memory = 0;
615e414c 1240 server.stat_fork_time = 0;
3c95e721 1241 server.stat_rejected_conn = 0;
250e7f69 1242 memset(server.ops_sec_samples,0,sizeof(server.ops_sec_samples));
1243 server.ops_sec_idx = 0;
1244 server.ops_sec_last_sample_time = mstime();
1245 server.ops_sec_last_sample_ops = 0;
e2641e09 1246 server.unixtime = time(NULL);
c25e7eaf 1247 server.lastbgsave_status = REDIS_OK;
4d3bbf35 1248 server.stop_writes_on_bgsave_err = 1;
e2641e09 1249 aeCreateTimeEvent(server.el, 1, serverCron, NULL, NULL);
a5639e7d 1250 if (server.ipfd > 0 && aeCreateFileEvent(server.el,server.ipfd,AE_READABLE,
ab17b909 1251 acceptTcpHandler,NULL) == AE_ERR) oom("creating file event");
a5639e7d 1252 if (server.sofd > 0 && aeCreateFileEvent(server.el,server.sofd,AE_READABLE,
ab17b909 1253 acceptUnixHandler,NULL) == AE_ERR) oom("creating file event");
e2641e09 1254
e394114d 1255 if (server.aof_state == REDIS_AOF_ON) {
ff2145ad 1256 server.aof_fd = open(server.aof_filename,
e394114d 1257 O_WRONLY|O_APPEND|O_CREAT,0644);
ff2145ad 1258 if (server.aof_fd == -1) {
e2641e09 1259 redisLog(REDIS_WARNING, "Can't open the append-only file: %s",
1260 strerror(errno));
1261 exit(1);
1262 }
1263 }
1264
d876678b 1265 /* 32 bit instances are limited to 4GB of address space, so if there is
1266 * no explicit limit in the user provided configuration we set a limit
1267 * at 3.5GB using maxmemory with 'noeviction' policy'. This saves
1268 * useless crashes of the Redis instance. */
1269 if (server.arch_bits == 32 && server.maxmemory == 0) {
1270 redisLog(REDIS_WARNING,"Warning: 32 bit instance detected but no memory limit set. Setting 3.5 GB maxmemory limit with 'noeviction' policy now.");
1271 server.maxmemory = 3584LL*(1024*1024); /* 3584 MB = 3.5 GB */
1272 server.maxmemory_policy = REDIS_MAXMEMORY_NO_EVICTION;
1273 }
1274
ecc91094 1275 if (server.cluster_enabled) clusterInit();
7585836e 1276 scriptingInit();
daa70b17 1277 slowlogInit();
8f61a72f 1278 bioInit();
e2641e09 1279}
1280
1b1f47c9 1281/* Populates the Redis Command Table starting from the hard coded list
1282 * we have on top of redis.c file. */
1283void populateCommandTable(void) {
1284 int j;
d7ed7fd2 1285 int numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1b1f47c9 1286
1287 for (j = 0; j < numcommands; j++) {
d7ed7fd2 1288 struct redisCommand *c = redisCommandTable+j;
5d02b00f 1289 char *f = c->sflags;
1b1f47c9 1290 int retval;
e2641e09 1291
5d02b00f 1292 while(*f != '\0') {
1293 switch(*f) {
1294 case 'w': c->flags |= REDIS_CMD_WRITE; break;
1295 case 'r': c->flags |= REDIS_CMD_READONLY; break;
1296 case 'm': c->flags |= REDIS_CMD_DENYOOM; break;
1297 case 'a': c->flags |= REDIS_CMD_ADMIN; break;
1298 case 'p': c->flags |= REDIS_CMD_PUBSUB; break;
1299 case 'f': c->flags |= REDIS_CMD_FORCE_REPLICATION; break;
b60ed6e8 1300 case 's': c->flags |= REDIS_CMD_NOSCRIPT; break;
1301 case 'R': c->flags |= REDIS_CMD_RANDOM; break;
548efd91 1302 case 'S': c->flags |= REDIS_CMD_SORT_FOR_SCRIPT; break;
5d02b00f 1303 default: redisPanic("Unsupported command flag"); break;
1304 }
1305 f++;
1306 }
1307
1b1f47c9 1308 retval = dictAdd(server.commands, sdsnew(c->name), c);
1309 assert(retval == DICT_OK);
1310 }
e2641e09 1311}
1312
d7ed7fd2 1313void resetCommandTableStats(void) {
1314 int numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1315 int j;
1316
1317 for (j = 0; j < numcommands; j++) {
1318 struct redisCommand *c = redisCommandTable+j;
1319
1320 c->microseconds = 0;
1321 c->calls = 0;
1322 }
1323}
1324
78d6a22d 1325/* ========================== Redis OP Array API ============================ */
1326
1327void redisOpArrayInit(redisOpArray *oa) {
1328 oa->ops = NULL;
1329 oa->numops = 0;
1330}
1331
1332int redisOpArrayAppend(redisOpArray *oa, struct redisCommand *cmd, int dbid,
1333 robj **argv, int argc, int target)
1334{
1335 redisOp *op;
1336
1337 oa->ops = zrealloc(oa->ops,sizeof(redisOp)*(oa->numops+1));
1338 op = oa->ops+oa->numops;
1339 op->cmd = cmd;
1340 op->dbid = dbid;
1341 op->argv = argv;
1342 op->argc = argc;
1343 op->target = target;
1344 oa->numops++;
1345 return oa->numops;
1346}
1347
1348void redisOpArrayFree(redisOpArray *oa) {
1349 while(oa->numops) {
1350 int j;
1351 redisOp *op;
1352
1353 oa->numops--;
1354 op = oa->ops+oa->numops;
1355 for (j = 0; j < op->argc; j++)
1356 decrRefCount(op->argv[j]);
1357 zfree(op->argv);
1358 }
1359 zfree(oa->ops);
1360}
1361
e2641e09 1362/* ====================== Commands lookup and execution ===================== */
1363
1b1f47c9 1364struct redisCommand *lookupCommand(sds name) {
1365 return dictFetchValue(server.commands, name);
1366}
1367
1368struct redisCommand *lookupCommandByCString(char *s) {
1369 struct redisCommand *cmd;
1370 sds name = sdsnew(s);
1371
1372 cmd = dictFetchValue(server.commands, name);
1373 sdsfree(name);
1374 return cmd;
e2641e09 1375}
1376
ad08d059 1377/* Propagate the specified command (in the context of the specified database id)
1378 * to AOF, Slaves and Monitors.
1379 *
1380 * flags are an xor between:
1381 * + REDIS_PROPAGATE_NONE (no propagation of command at all)
1382 * + REDIS_PROPAGATE_AOF (propagate into the AOF file if is enabled)
1383 * + REDIS_PROPAGATE_REPL (propagate into the replication link)
1384 */
1385void propagate(struct redisCommand *cmd, int dbid, robj **argv, int argc,
1386 int flags)
1387{
1388 if (server.aof_state != REDIS_AOF_OFF && flags & REDIS_PROPAGATE_AOF)
1389 feedAppendOnlyFile(cmd,dbid,argv,argc);
1390 if (flags & REDIS_PROPAGATE_REPL && listLength(server.slaves))
1391 replicationFeedSlaves(server.slaves,dbid,argv,argc);
1392}
1393
78d6a22d 1394/* Used inside commands to schedule the propagation of additional commands
1395 * after the current command is propagated to AOF / Replication. */
eeb34eff 1396void alsoPropagate(struct redisCommand *cmd, int dbid, robj **argv, int argc,
1397 int target)
1398{
78d6a22d 1399 redisOpArrayAppend(&server.also_propagate,cmd,dbid,argv,argc,target);
eeb34eff 1400}
1401
e2641e09 1402/* Call() is the core of Redis execution of a command */
ce8b772b 1403void call(redisClient *c, int flags) {
daa70b17 1404 long long dirty, start = ustime(), duration;
e2641e09 1405
ad08d059 1406 /* Sent the command to clients in MONITOR mode, only if the commands are
1407 * not geneated from reading an AOF. */
1408 if (listLength(server.monitors) && !server.loading)
e31b615e 1409 replicationFeedMonitors(c,server.monitors,c->db->id,c->argv,c->argc);
ad08d059 1410
1411 /* Call the command. */
78d6a22d 1412 redisOpArrayInit(&server.also_propagate);
e2641e09 1413 dirty = server.dirty;
09e2d9ee 1414 c->cmd->proc(c);
e2641e09 1415 dirty = server.dirty-dirty;
daa70b17 1416 duration = ustime()-start;
ce8b772b 1417
1418 /* When EVAL is called loading the AOF we don't want commands called
1419 * from Lua to go into the slowlog or to populate statistics. */
1420 if (server.loading && c->flags & REDIS_LUA_CLIENT)
1421 flags &= ~(REDIS_CALL_SLOWLOG | REDIS_CALL_STATS);
1422
ad08d059 1423 /* Log the command into the Slow log if needed, and populate the
1424 * per-command statistics that we show in INFO commandstats. */
ce8b772b 1425 if (flags & REDIS_CALL_SLOWLOG)
1426 slowlogPushEntryIfNeeded(c->argv,c->argc,duration);
1427 if (flags & REDIS_CALL_STATS) {
1428 c->cmd->microseconds += duration;
1429 c->cmd->calls++;
1430 }
ad08d059 1431
1432 /* Propagate the command into the AOF and replication link */
ce8b772b 1433 if (flags & REDIS_CALL_PROPAGATE) {
ad08d059 1434 int flags = REDIS_PROPAGATE_NONE;
1435
1436 if (c->cmd->flags & REDIS_CMD_FORCE_REPLICATION)
1437 flags |= REDIS_PROPAGATE_REPL;
1438 if (dirty)
1439 flags |= (REDIS_PROPAGATE_REPL | REDIS_PROPAGATE_AOF);
1440 if (flags != REDIS_PROPAGATE_NONE)
1441 propagate(c->cmd,c->db->id,c->argv,c->argc,flags);
ce8b772b 1442 }
eeb34eff 1443 /* Commands such as LPUSH or BRPOPLPUSH may propagate an additional
1444 * PUSH command. */
78d6a22d 1445 if (server.also_propagate.numops) {
eeb34eff 1446 int j;
78d6a22d 1447 redisOp *rop;
eeb34eff 1448
78d6a22d 1449 for (j = 0; j < server.also_propagate.numops; j++) {
1450 rop = &server.also_propagate.ops[j];
1451 propagate(rop->cmd, rop->dbid, rop->argv, rop->argc, rop->target);
1452 }
1453 redisOpArrayFree(&server.also_propagate);
eeb34eff 1454 }
e2641e09 1455 server.stat_numcommands++;
1456}
1457
1458/* If this function gets called we already read a whole
1459 * command, arguments are in the client argv/argc fields.
1460 * processCommand() executes the command or prepares the
1461 * server for a bulk read from the client.
1462 *
1463 * If 1 is returned the client is still alive and valid and
1464 * other operations can be performed by the caller. Otherwise
1465 * if 0 is returned the client was destroyed (i.e. after QUIT). */
1466int processCommand(redisClient *c) {
941c9fa2
PN
1467 /* The QUIT command is handled separately. Normal command procs will
1468 * go through checking for replication and QUIT will cause trouble
1469 * when FORCE_REPLICATION is enabled and would be implemented in
1470 * a regular command proc. */
e2641e09 1471 if (!strcasecmp(c->argv[0]->ptr,"quit")) {
941c9fa2 1472 addReply(c,shared.ok);
5e78edb3 1473 c->flags |= REDIS_CLOSE_AFTER_REPLY;
cd8788f2 1474 return REDIS_ERR;
e2641e09 1475 }
1476
1477 /* Now lookup the command and check ASAP about trivial error conditions
09e2d9ee 1478 * such as wrong arity, bad command name and so forth. */
2c74a9f9 1479 c->cmd = c->lastcmd = lookupCommand(c->argv[0]->ptr);
09e2d9ee 1480 if (!c->cmd) {
3ab20376
PN
1481 addReplyErrorFormat(c,"unknown command '%s'",
1482 (char*)c->argv[0]->ptr);
cd8788f2 1483 return REDIS_OK;
09e2d9ee 1484 } else if ((c->cmd->arity > 0 && c->cmd->arity != c->argc) ||
1485 (c->argc < -c->cmd->arity)) {
3ab20376 1486 addReplyErrorFormat(c,"wrong number of arguments for '%s' command",
09e2d9ee 1487 c->cmd->name);
cd8788f2 1488 return REDIS_OK;
e2641e09 1489 }
e2641e09 1490
1491 /* Check if the user is authenticated */
09e2d9ee 1492 if (server.requirepass && !c->authenticated && c->cmd->proc != authCommand)
1493 {
3ab20376 1494 addReplyError(c,"operation not permitted");
cd8788f2 1495 return REDIS_OK;
e2641e09 1496 }
1497
ecc91094 1498 /* If cluster is enabled, redirect here */
1499 if (server.cluster_enabled &&
09e2d9ee 1500 !(c->cmd->getkeys_proc == NULL && c->cmd->firstkey == 0)) {
ecc91094 1501 int hashslot;
1502
1503 if (server.cluster.state != REDIS_CLUSTER_OK) {
1504 addReplyError(c,"The cluster is down. Check with CLUSTER INFO for more information");
1505 return REDIS_OK;
1506 } else {
eda827f8 1507 int ask;
09e2d9ee 1508 clusterNode *n = getNodeByQuery(c,c->cmd,c->argv,c->argc,&hashslot,&ask);
ecc91094 1509 if (n == NULL) {
eda827f8 1510 addReplyError(c,"Multi keys request invalid in cluster");
ecc91094 1511 return REDIS_OK;
1512 } else if (n != server.cluster.myself) {
1513 addReplySds(c,sdscatprintf(sdsempty(),
eda827f8 1514 "-%s %d %s:%d\r\n", ask ? "ASK" : "MOVED",
1515 hashslot,n->ip,n->port));
ecc91094 1516 return REDIS_OK;
1517 }
1518 }
1519 }
1520
1dd10ca2 1521 /* Handle the maxmemory directive.
1522 *
1523 * First we try to free some memory if possible (if there are volatile
1524 * keys in the dataset). If there are not the only thing we can do
1525 * is returning an error. */
f6b32c14 1526 if (server.maxmemory) {
1527 int retval = freeMemoryIfNeeded();
1528 if ((c->cmd->flags & REDIS_CMD_DENYOOM) && retval == REDIS_ERR) {
f3fd419f 1529 addReply(c, shared.oomerr);
f6b32c14 1530 return REDIS_OK;
1531 }
e2641e09 1532 }
1533
c25e7eaf 1534 /* Don't accept write commands if there are problems persisting on disk. */
4d3bbf35 1535 if (server.stop_writes_on_bgsave_err &&
1536 server.saveparamslen > 0
1537 && server.lastbgsave_status == REDIS_ERR &&
c25e7eaf 1538 c->cmd->flags & REDIS_CMD_WRITE)
1539 {
1540 addReply(c, shared.bgsaveerr);
1541 return REDIS_OK;
1542 }
1543
f3fd419f 1544 /* Don't accept wirte commands if this is a read only slave. But
1545 * accept write commands if this is our master. */
1546 if (server.masterhost && server.repl_slave_ro &&
1547 !(c->flags & REDIS_MASTER) &&
1548 c->cmd->flags & REDIS_CMD_WRITE)
1549 {
1550 addReply(c, shared.roslaveerr);
1551 return REDIS_OK;
1552 }
1553
e2641e09 1554 /* Only allow SUBSCRIBE and UNSUBSCRIBE in the context of Pub/Sub */
1555 if ((dictSize(c->pubsub_channels) > 0 || listLength(c->pubsub_patterns) > 0)
1556 &&
09e2d9ee 1557 c->cmd->proc != subscribeCommand &&
1558 c->cmd->proc != unsubscribeCommand &&
1559 c->cmd->proc != psubscribeCommand &&
1560 c->cmd->proc != punsubscribeCommand) {
3ab20376 1561 addReplyError(c,"only (P)SUBSCRIBE / (P)UNSUBSCRIBE / QUIT allowed in this context");
cd8788f2 1562 return REDIS_OK;
e2641e09 1563 }
1564
4ebfc455 1565 /* Only allow INFO and SLAVEOF when slave-serve-stale-data is no and
1566 * we are a slave with a broken link with master. */
1844f990 1567 if (server.masterhost && server.repl_state != REDIS_REPL_CONNECTED &&
4ebfc455 1568 server.repl_serve_stale_data == 0 &&
09e2d9ee 1569 c->cmd->proc != infoCommand && c->cmd->proc != slaveofCommand)
4ebfc455 1570 {
1571 addReplyError(c,
1572 "link with MASTER is down and slave-serve-stale-data is set to no");
1573 return REDIS_OK;
1574 }
1575
97e7f8ae 1576 /* Loading DB? Return an error if the command is not INFO */
09e2d9ee 1577 if (server.loading && c->cmd->proc != infoCommand) {
97e7f8ae 1578 addReply(c, shared.loadingerr);
1579 return REDIS_OK;
1580 }
1581
4ab8695d 1582 /* Lua script too slow? Only allow SHUTDOWN NOSAVE and SCRIPT KILL. */
1583 if (server.lua_timedout &&
1584 !(c->cmd->proc != shutdownCommand &&
1585 c->argc == 2 &&
1586 tolower(((char*)c->argv[1]->ptr)[0]) == 'n') &&
1587 !(c->cmd->proc == scriptCommand &&
1588 c->argc == 2 &&
1589 tolower(((char*)c->argv[1]->ptr)[0]) == 'k'))
1590 {
115e3ff3 1591 addReply(c, shared.slowscripterr);
1592 return REDIS_OK;
1593 }
1594
e2641e09 1595 /* Exec the command */
1596 if (c->flags & REDIS_MULTI &&
09e2d9ee 1597 c->cmd->proc != execCommand && c->cmd->proc != discardCommand &&
1598 c->cmd->proc != multiCommand && c->cmd->proc != watchCommand)
e2641e09 1599 {
09e2d9ee 1600 queueMultiCommand(c);
e2641e09 1601 addReply(c,shared.queued);
1602 } else {
ce8b772b 1603 call(c,REDIS_CALL_FULL);
e2641e09 1604 }
cd8788f2 1605 return REDIS_OK;
e2641e09 1606}
1607
1608/*================================== Shutdown =============================== */
1609
4ab8695d 1610int prepareForShutdown(int flags) {
1611 int save = flags & REDIS_SHUTDOWN_SAVE;
1612 int nosave = flags & REDIS_SHUTDOWN_NOSAVE;
1613
adae85cd 1614 redisLog(REDIS_WARNING,"User requested shutdown...");
e2641e09 1615 /* Kill the saving child if there is a background saving in progress.
1616 We want to avoid race conditions, for instance our saving child may
1617 overwrite the synchronous saving did by SHUTDOWN. */
f48cd4b9 1618 if (server.rdb_child_pid != -1) {
adae85cd 1619 redisLog(REDIS_WARNING,"There is a child saving an .rdb. Killing it!");
f48cd4b9 1620 kill(server.rdb_child_pid,SIGKILL);
1621 rdbRemoveTempFile(server.rdb_child_pid);
e2641e09 1622 }
e394114d 1623 if (server.aof_state != REDIS_AOF_OFF) {
adae85cd 1624 /* Kill the AOF saving child as the AOF we already have may be longer
1625 * but contains the full dataset anyway. */
ff2145ad 1626 if (server.aof_child_pid != -1) {
adae85cd 1627 redisLog(REDIS_WARNING,
1628 "There is a child rewriting the AOF. Killing it!");
ff2145ad 1629 kill(server.aof_child_pid,SIGKILL);
adae85cd 1630 }
e2641e09 1631 /* Append only file: fsync() the AOF and exit */
adae85cd 1632 redisLog(REDIS_NOTICE,"Calling fsync() on the AOF file.");
ff2145ad 1633 aof_fsync(server.aof_fd);
adae85cd 1634 }
4ab8695d 1635 if ((server.saveparamslen > 0 && !nosave) || save) {
adae85cd 1636 redisLog(REDIS_NOTICE,"Saving the final RDB snapshot before exiting.");
e2641e09 1637 /* Snapshotting. Perform a SYNC SAVE and exit */
f48cd4b9 1638 if (rdbSave(server.rdb_filename) != REDIS_OK) {
e2641e09 1639 /* Ooops.. error saving! The best we can do is to continue
1640 * operating. Note that if there was a background saving process,
1641 * in the next cron() Redis will be notified that the background
1642 * saving aborted, handling special stuff like slaves pending for
1643 * synchronization... */
adae85cd 1644 redisLog(REDIS_WARNING,"Error trying to save the DB, can't exit.");
e2641e09 1645 return REDIS_ERR;
1646 }
1647 }
adae85cd 1648 if (server.daemonize) {
1649 redisLog(REDIS_NOTICE,"Removing the pid file.");
1650 unlink(server.pidfile);
1651 }
80e87a46 1652 /* Close the listening sockets. Apparently this allows faster restarts. */
1653 if (server.ipfd != -1) close(server.ipfd);
1654 if (server.sofd != -1) close(server.sofd);
56209f72
NF
1655 if (server.unixsocket) {
1656 redisLog(REDIS_NOTICE,"Removing the unix socket file.");
1657 unlink(server.unixsocket); /* don't care if this fails */
1658 }
80e87a46 1659
adae85cd 1660 redisLog(REDIS_WARNING,"Redis is now ready to exit, bye bye...");
e2641e09 1661 return REDIS_OK;
1662}
1663
1664/*================================== Commands =============================== */
1665
1666void authCommand(redisClient *c) {
ab52d1f4 1667 if (!server.requirepass) {
1668 addReplyError(c,"Client sent AUTH, but no password is set");
1669 } else if (!strcmp(c->argv[1]->ptr, server.requirepass)) {
e2641e09 1670 c->authenticated = 1;
1671 addReply(c,shared.ok);
1672 } else {
1673 c->authenticated = 0;
3ab20376 1674 addReplyError(c,"invalid password");
e2641e09 1675 }
1676}
1677
1678void pingCommand(redisClient *c) {
1679 addReply(c,shared.pong);
1680}
1681
1682void echoCommand(redisClient *c) {
1683 addReplyBulk(c,c->argv[1]);
1684}
1685
9494f1f1 1686void timeCommand(redisClient *c) {
1687 struct timeval tv;
1688
1689 /* gettimeofday() can only fail if &tv is a bad addresss so we
1690 * don't check for errors. */
1691 gettimeofday(&tv,NULL);
1692 addReplyMultiBulkLen(c,2);
1693 addReplyBulkLongLong(c,tv.tv_sec);
1694 addReplyBulkLongLong(c,tv.tv_usec);
1695}
1696
/* Convert an amount of bytes into a human readable string in the form
 * of 100B, 2G, 100M, 4K, and so forth.
 *
 * 's' is the destination buffer and must be large enough for the result
 * (the function has no way to check its size). Values below 1024 are
 * printed as an integer followed by 'B'; larger values are divided by the
 * biggest power of 1024 not exceeding them and printed with two decimals
 * followed by K, M, G, T, P or E.
 *
 * Every possible value of 'n' writes a string into 's'. */
void bytesToHuman(char *s, unsigned long long n) {
    static const char units[] = "KMGTPE";
    unsigned long long scale = 1024;
    size_t unit = 0;

    if (n < 1024) {
        /* Bytes */
        sprintf(s,"%lluB",n);
        return;
    }

    /* Pick the largest unit such that the scaled value stays below 1024.
     * The comparison is done on integers so the unit boundaries are exact;
     * 'scale' tops out at 1024^6 which still fits in 64 bits. */
    while (unit < sizeof(units)-2 && n/scale >= 1024) {
        scale *= 1024;
        unit++;
    }
    sprintf(s,"%.2f%c",(double)n/(double)scale,units[unit]);
}
1717
1718/* Create the string returned by the INFO command. This is decoupled
1719 * by the INFO command itself as we need to report the same information
1720 * on memory corruption problems. */
1b085c9f 1721sds genRedisInfoString(char *section) {
1722 sds info = sdsempty();
d1949054 1723 time_t uptime = server.unixtime-server.stat_starttime;
d9cb288c 1724 int j, numcommands;
2b00385d 1725 struct rusage self_ru, c_ru;
7a1fd61e 1726 unsigned long lol, bib;
1b085c9f 1727 int allsections = 0, defsections = 0;
1728 int sections = 0;
1729
1730 if (section) {
1731 allsections = strcasecmp(section,"all") == 0;
0d808ef2 1732 defsections = strcasecmp(section,"default") == 0;
1b085c9f 1733 }
2b00385d 1734
1735 getrusage(RUSAGE_SELF, &self_ru);
1736 getrusage(RUSAGE_CHILDREN, &c_ru);
7a1fd61e 1737 getClientsMaxBuffers(&lol,&bib);
1b085c9f 1738
1739 /* Server */
1740 if (allsections || defsections || !strcasecmp(section,"server")) {
1741 if (sections++) info = sdscat(info,"\r\n");
e2641e09 1742 info = sdscatprintf(info,
1b085c9f 1743 "# Server\r\n"
1744 "redis_version:%s\r\n"
1745 "redis_git_sha1:%s\r\n"
1746 "redis_git_dirty:%d\r\n"
75eaac5c 1747 "arch_bits:%d\r\n"
1b085c9f 1748 "multiplexing_api:%s\r\n"
5db904bd 1749 "gcc_version:%d.%d.%d\r\n"
1b085c9f 1750 "process_id:%ld\r\n"
91d664d6 1751 "run_id:%s\r\n"
1b085c9f 1752 "tcp_port:%d\r\n"
1753 "uptime_in_seconds:%ld\r\n"
1754 "uptime_in_days:%ld\r\n"
1755 "lru_clock:%ld\r\n",
1756 REDIS_VERSION,
1757 redisGitSHA1(),
1758 strtol(redisGitDirty(),NULL,10) > 0,
75eaac5c 1759 server.arch_bits,
1b085c9f 1760 aeGetApiName(),
5db904bd 1761#ifdef __GNUC__
1762 __GNUC__,__GNUC_MINOR__,__GNUC_PATCHLEVEL__,
1763#else
1764 0,0,0,
1765#endif
1b085c9f 1766 (long) getpid(),
91d664d6 1767 server.runid,
1b085c9f 1768 server.port,
1769 uptime,
1770 uptime/(3600*24),
1771 (unsigned long) server.lruclock);
1772 }
1773
1774 /* Clients */
1775 if (allsections || defsections || !strcasecmp(section,"clients")) {
1776 if (sections++) info = sdscat(info,"\r\n");
1777 info = sdscatprintf(info,
1778 "# Clients\r\n"
3c08fdae 1779 "connected_clients:%lu\r\n"
1b085c9f 1780 "client_longest_output_list:%lu\r\n"
1781 "client_biggest_input_buf:%lu\r\n"
1782 "blocked_clients:%d\r\n",
1783 listLength(server.clients)-listLength(server.slaves),
1784 lol, bib,
1785 server.bpop_blocked_clients);
1786 }
1787
1788 /* Memory */
1789 if (allsections || defsections || !strcasecmp(section,"memory")) {
17b24ff3 1790 char hmem[64];
1791 char peak_hmem[64];
1792
1793 bytesToHuman(hmem,zmalloc_used_memory());
1794 bytesToHuman(peak_hmem,server.stat_peak_memory);
1b085c9f 1795 if (sections++) info = sdscat(info,"\r\n");
1796 info = sdscatprintf(info,
1797 "# Memory\r\n"
1798 "used_memory:%zu\r\n"
1799 "used_memory_human:%s\r\n"
1800 "used_memory_rss:%zu\r\n"
17b24ff3 1801 "used_memory_peak:%zu\r\n"
1802 "used_memory_peak_human:%s\r\n"
8c3402df 1803 "used_memory_lua:%lld\r\n"
1b085c9f 1804 "mem_fragmentation_ratio:%.2f\r\n"
32f99c51 1805 "mem_allocator:%s\r\n",
1b085c9f 1806 zmalloc_used_memory(),
1807 hmem,
1808 zmalloc_get_rss(),
17b24ff3 1809 server.stat_peak_memory,
1810 peak_hmem,
8c3402df 1811 ((long long)lua_gc(server.lua,LUA_GCCOUNT,0))*1024LL,
1b085c9f 1812 zmalloc_get_fragmentation_ratio(),
fec5a664 1813 ZMALLOC_LIB
12ebe2ac 1814 );
0d808ef2 1815 }
1816
1b085c9f 1817 /* Persistence */
1818 if (allsections || defsections || !strcasecmp(section,"persistence")) {
1819 if (sections++) info = sdscat(info,"\r\n");
e2641e09 1820 info = sdscatprintf(info,
1b085c9f 1821 "# Persistence\r\n"
1822 "loading:%d\r\n"
1823 "aof_enabled:%d\r\n"
1824 "changes_since_last_save:%lld\r\n"
1825 "bgsave_in_progress:%d\r\n"
1826 "last_save_time:%ld\r\n"
c25e7eaf 1827 "last_bgsave_status:%s\r\n"
1b085c9f 1828 "bgrewriteaof_in_progress:%d\r\n",
1829 server.loading,
e394114d 1830 server.aof_state != REDIS_AOF_OFF,
1b085c9f 1831 server.dirty,
f48cd4b9 1832 server.rdb_child_pid != -1,
1b085c9f 1833 server.lastsave,
c25e7eaf 1834 server.lastbgsave_status == REDIS_OK ? "ok" : "err",
ff2145ad 1835 server.aof_child_pid != -1);
1b085c9f 1836
e394114d 1837 if (server.aof_state != REDIS_AOF_OFF) {
d630abcd 1838 info = sdscatprintf(info,
1839 "aof_current_size:%lld\r\n"
1840 "aof_base_size:%lld\r\n"
e7ef418c 1841 "aof_pending_rewrite:%d\r\n"
1842 "aof_buffer_length:%zu\r\n"
c1d01b3c 1843 "aof_pending_bio_fsync:%llu\r\n"
1844 "aof_delayed_fsync:%lu\r\n",
2c915bcf 1845 (long long) server.aof_current_size,
1846 (long long) server.aof_rewrite_base_size,
1847 server.aof_rewrite_scheduled,
ff2145ad 1848 sdslen(server.aof_buf),
c1d01b3c 1849 bioPendingJobsOfType(REDIS_BIO_AOF_FSYNC),
1850 server.aof_delayed_fsync);
d630abcd 1851 }
1852
1b085c9f 1853 if (server.loading) {
1854 double perc;
1855 time_t eta, elapsed;
1856 off_t remaining_bytes = server.loading_total_bytes-
1857 server.loading_loaded_bytes;
1858
1859 perc = ((double)server.loading_loaded_bytes /
1860 server.loading_total_bytes) * 100;
1861
d1949054 1862 elapsed = server.unixtime-server.loading_start_time;
1b085c9f 1863 if (elapsed == 0) {
1864 eta = 1; /* A fake 1 second figure if we don't have
1865 enough info */
1866 } else {
1867 eta = (elapsed*remaining_bytes)/server.loading_loaded_bytes;
1868 }
1869
1870 info = sdscatprintf(info,
1871 "loading_start_time:%ld\r\n"
1872 "loading_total_bytes:%llu\r\n"
1873 "loading_loaded_bytes:%llu\r\n"
1874 "loading_loaded_perc:%.2f\r\n"
1875 "loading_eta_seconds:%ld\r\n"
1876 ,(unsigned long) server.loading_start_time,
1877 (unsigned long long) server.loading_total_bytes,
1878 (unsigned long long) server.loading_loaded_bytes,
1879 perc,
1880 eta
1881 );
1882 }
e2641e09 1883 }
1b085c9f 1884
1b085c9f 1885 /* Stats */
1886 if (allsections || defsections || !strcasecmp(section,"stats")) {
1887 if (sections++) info = sdscat(info,"\r\n");
97e7f8ae 1888 info = sdscatprintf(info,
1b085c9f 1889 "# Stats\r\n"
1890 "total_connections_received:%lld\r\n"
1891 "total_commands_processed:%lld\r\n"
250e7f69 1892 "instantaneous_ops_per_sec:%lld\r\n"
3c95e721 1893 "rejected_connections:%lld\r\n"
1b085c9f 1894 "expired_keys:%lld\r\n"
1895 "evicted_keys:%lld\r\n"
1896 "keyspace_hits:%lld\r\n"
1897 "keyspace_misses:%lld\r\n"
1898 "pubsub_channels:%ld\r\n"
3c08fdae 1899 "pubsub_patterns:%lu\r\n"
615e414c 1900 "latest_fork_usec:%lld\r\n",
1b085c9f 1901 server.stat_numconnections,
1902 server.stat_numcommands,
250e7f69 1903 getOperationsPerSecond(),
3c95e721 1904 server.stat_rejected_conn,
1b085c9f 1905 server.stat_expiredkeys,
1906 server.stat_evictedkeys,
1907 server.stat_keyspace_hits,
1908 server.stat_keyspace_misses,
1909 dictSize(server.pubsub_channels),
615e414c 1910 listLength(server.pubsub_patterns),
1911 server.stat_fork_time);
97e7f8ae 1912 }
67a1810b 1913
1b085c9f 1914 /* Replication */
1915 if (allsections || defsections || !strcasecmp(section,"replication")) {
1916 if (sections++) info = sdscat(info,"\r\n");
1917 info = sdscatprintf(info,
1918 "# Replication\r\n"
1919 "role:%s\r\n",
1920 server.masterhost == NULL ? "master" : "slave");
1921 if (server.masterhost) {
1922 info = sdscatprintf(info,
1923 "master_host:%s\r\n"
1924 "master_port:%d\r\n"
1925 "master_link_status:%s\r\n"
1926 "master_last_io_seconds_ago:%d\r\n"
1927 "master_sync_in_progress:%d\r\n"
1928 ,server.masterhost,
1929 server.masterport,
1844f990 1930 (server.repl_state == REDIS_REPL_CONNECTED) ?
1b085c9f 1931 "up" : "down",
1932 server.master ?
d1949054 1933 ((int)(server.unixtime-server.master->lastinteraction)) : -1,
1844f990 1934 server.repl_state == REDIS_REPL_TRANSFER
1b085c9f 1935 );
1936
1844f990 1937 if (server.repl_state == REDIS_REPL_TRANSFER) {
1b085c9f 1938 info = sdscatprintf(info,
1939 "master_sync_left_bytes:%ld\r\n"
1940 "master_sync_last_io_seconds_ago:%d\r\n"
1941 ,(long)server.repl_transfer_left,
d1949054 1942 (int)(server.unixtime-server.repl_transfer_lastio)
1b085c9f 1943 );
1944 }
07486df6 1945
1844f990 1946 if (server.repl_state != REDIS_REPL_CONNECTED) {
07486df6 1947 info = sdscatprintf(info,
1948 "master_link_down_since_seconds:%ld\r\n",
d1949054 1949 (long)server.unixtime-server.repl_down_since);
07486df6 1950 }
67a1810b 1951 }
1b085c9f 1952 info = sdscatprintf(info,
3c08fdae 1953 "connected_slaves:%lu\r\n",
1b085c9f 1954 listLength(server.slaves));
503d87a8 1955 if (listLength(server.slaves)) {
1956 int slaveid = 0;
1957 listNode *ln;
1958 listIter li;
1959
1960 listRewind(server.slaves,&li);
1961 while((ln = listNext(&li))) {
1962 redisClient *slave = listNodeValue(ln);
1963 char *state = NULL;
1964 char ip[32];
1965 int port;
1966
1967 if (anetPeerToString(slave->fd,ip,&port) == -1) continue;
1968 switch(slave->replstate) {
1969 case REDIS_REPL_WAIT_BGSAVE_START:
1970 case REDIS_REPL_WAIT_BGSAVE_END:
1971 state = "wait_bgsave";
1972 break;
1973 case REDIS_REPL_SEND_BULK:
1974 state = "send_bulk";
1975 break;
1976 case REDIS_REPL_ONLINE:
1977 state = "online";
1978 break;
1979 }
1980 if (state == NULL) continue;
1981 info = sdscatprintf(info,"slave%d:%s,%d,%s\r\n",
1982 slaveid,ip,port,state);
1983 slaveid++;
1984 }
1985 }
67a1810b 1986 }
67a1810b 1987
0d808ef2 1988 /* CPU */
1989 if (allsections || defsections || !strcasecmp(section,"cpu")) {
1b085c9f 1990 if (sections++) info = sdscat(info,"\r\n");
1991 info = sdscatprintf(info,
0d808ef2 1992 "# CPU\r\n"
1b085c9f 1993 "used_cpu_sys:%.2f\r\n"
1994 "used_cpu_user:%.2f\r\n"
5a9dd97c 1995 "used_cpu_sys_children:%.2f\r\n"
1996 "used_cpu_user_children:%.2f\r\n",
1b085c9f 1997 (float)self_ru.ru_stime.tv_sec+(float)self_ru.ru_stime.tv_usec/1000000,
d83eda48 1998 (float)self_ru.ru_utime.tv_sec+(float)self_ru.ru_utime.tv_usec/1000000,
1999 (float)c_ru.ru_stime.tv_sec+(float)c_ru.ru_stime.tv_usec/1000000,
2000 (float)c_ru.ru_utime.tv_sec+(float)c_ru.ru_utime.tv_usec/1000000);
0d808ef2 2001 }
1b085c9f 2002
0d808ef2 2003 /* cmdtime */
2004 if (allsections || !strcasecmp(section,"commandstats")) {
2005 if (sections++) info = sdscat(info,"\r\n");
2006 info = sdscatprintf(info, "# Commandstats\r\n");
d7ed7fd2 2007 numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1b085c9f 2008 for (j = 0; j < numcommands; j++) {
d7ed7fd2 2009 struct redisCommand *c = redisCommandTable+j;
0d808ef2 2010
d7ed7fd2 2011 if (!c->calls) continue;
2012 info = sdscatprintf(info,
2013 "cmdstat_%s:calls=%lld,usec=%lld,usec_per_call=%.2f\r\n",
2014 c->name, c->calls, c->microseconds,
2015 (c->calls == 0) ? 0 : ((float)c->microseconds/c->calls));
1b085c9f 2016 }
d9cb288c 2017 }
2018
1c708b25
SS
2019 /* Clusetr */
2020 if (allsections || defsections || !strcasecmp(section,"cluster")) {
2021 if (sections++) info = sdscat(info,"\r\n");
2022 info = sdscatprintf(info,
2023 "# Cluster\r\n"
2024 "cluster_enabled:%d\r\n",
2025 server.cluster_enabled);
2026 }
2027
1b085c9f 2028 /* Key space */
2029 if (allsections || defsections || !strcasecmp(section,"keyspace")) {
2030 if (sections++) info = sdscat(info,"\r\n");
2031 info = sdscatprintf(info, "# Keyspace\r\n");
2032 for (j = 0; j < server.dbnum; j++) {
2033 long long keys, vkeys;
e2641e09 2034
1b085c9f 2035 keys = dictSize(server.db[j].dict);
2036 vkeys = dictSize(server.db[j].expires);
2037 if (keys || vkeys) {
2038 info = sdscatprintf(info, "db%d:keys=%lld,expires=%lld\r\n",
2039 j, keys, vkeys);
2040 }
e2641e09 2041 }
2042 }
2043 return info;
2044}
2045
2046void infoCommand(redisClient *c) {
1b085c9f 2047 char *section = c->argc == 2 ? c->argv[1]->ptr : "default";
2048
2049 if (c->argc > 2) {
2050 addReply(c,shared.syntaxerr);
2051 return;
2052 }
2053 sds info = genRedisInfoString(section);
e2641e09 2054 addReplySds(c,sdscatprintf(sdsempty(),"$%lu\r\n",
2055 (unsigned long)sdslen(info)));
2056 addReplySds(c,info);
2057 addReply(c,shared.crlf);
2058}
2059
2060void monitorCommand(redisClient *c) {
2061 /* ignore MONITOR if aleady slave or in monitor mode */
2062 if (c->flags & REDIS_SLAVE) return;
2063
2064 c->flags |= (REDIS_SLAVE|REDIS_MONITOR);
2065 c->slaveseldb = 0;
2066 listAddNodeTail(server.monitors,c);
2067 addReply(c,shared.ok);
2068}
2069
2070/* ============================ Maxmemory directive ======================== */
2071
e2641e09 2072/* This function gets called when 'maxmemory' is set on the config file to limit
f6b32c14 2073 * the max memory used by the server, before processing a command.
e2641e09 2074 *
f6b32c14 2075 * The goal of the function is to free enough memory to keep Redis under the
2076 * configured memory limit.
e2641e09 2077 *
f6b32c14 2078 * The function starts calculating how many bytes should be freed to keep
2079 * Redis under the limit, and enters a loop selecting the best keys to
2080 * evict accordingly to the configured policy.
2081 *
2082 * If all the bytes needed to return back under the limit were freed the
2083 * function returns REDIS_OK, otherwise REDIS_ERR is returned, and the caller
2084 * should block the execution of commands that will result in more memory
2085 * used by the server.
e2641e09 2086 */
f6b32c14 2087int freeMemoryIfNeeded(void) {
2088 size_t mem_used, mem_tofree, mem_freed;
2089 int slaves = listLength(server.slaves);
2090
c1ef6ffe 2091 /* Remove the size of slaves output buffers and AOF buffer from the
2092 * count of used memory. */
f6b32c14 2093 mem_used = zmalloc_used_memory();
2094 if (slaves) {
2095 listIter li;
2096 listNode *ln;
2097
2098 listRewind(server.slaves,&li);
2099 while((ln = listNext(&li))) {
2100 redisClient *slave = listNodeValue(ln);
2101 unsigned long obuf_bytes = getClientOutputBufferMemoryUsage(slave);
2102 if (obuf_bytes > mem_used)
2103 mem_used = 0;
2104 else
2105 mem_used -= obuf_bytes;
2106 }
2107 }
c1ef6ffe 2108 if (server.aof_state != REDIS_AOF_OFF) {
2109 mem_used -= sdslen(server.aof_buf);
2110 mem_used -= sdslen(server.aof_rewrite_buf);
2111 }
5402c426 2112
f6b32c14 2113 /* Check if we are over the memory limit. */
2114 if (mem_used <= server.maxmemory) return REDIS_OK;
2115
2116 if (server.maxmemory_policy == REDIS_MAXMEMORY_NO_EVICTION)
2117 return REDIS_ERR; /* We need to free memory, but policy forbids. */
2118
2119 /* Compute how much memory we need to free. */
2120 mem_tofree = mem_used - server.maxmemory;
f6b32c14 2121 mem_freed = 0;
2122 while (mem_freed < mem_tofree) {
2123 int j, k, keys_freed = 0;
e2641e09 2124
165346ca 2125 for (j = 0; j < server.dbnum; j++) {
10c12171 2126 long bestval = 0; /* just to prevent warning */
165346ca 2127 sds bestkey = NULL;
2128 struct dictEntry *de;
2129 redisDb *db = server.db+j;
2130 dict *dict;
2131
2132 if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_LRU ||
2133 server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_RANDOM)
2134 {
2135 dict = server.db[j].dict;
2136 } else {
2137 dict = server.db[j].expires;
2138 }
2139 if (dictSize(dict) == 0) continue;
2140
2141 /* volatile-random and allkeys-random policy */
2142 if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_RANDOM ||
2143 server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_RANDOM)
2144 {
2145 de = dictGetRandomKey(dict);
c0ba9ebe 2146 bestkey = dictGetKey(de);
165346ca 2147 }
2148
2149 /* volatile-lru and allkeys-lru policy */
2150 else if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_LRU ||
2151 server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_LRU)
2152 {
2153 for (k = 0; k < server.maxmemory_samples; k++) {
2154 sds thiskey;
2155 long thisval;
2156 robj *o;
2157
2158 de = dictGetRandomKey(dict);
c0ba9ebe 2159 thiskey = dictGetKey(de);
0c2f75c6 2160 /* When policy is volatile-lru we need an additonal lookup
2161 * to locate the real key, as dict is set to db->expires. */
2162 if (server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_LRU)
2163 de = dictFind(db->dict, thiskey);
c0ba9ebe 2164 o = dictGetVal(de);
165346ca 2165 thisval = estimateObjectIdleTime(o);
2166
2167 /* Higher idle time is better candidate for deletion */
2168 if (bestkey == NULL || thisval > bestval) {
2169 bestkey = thiskey;
2170 bestval = thisval;
2171 }
2172 }
2173 }
2174
2175 /* volatile-ttl */
2176 else if (server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_TTL) {
2177 for (k = 0; k < server.maxmemory_samples; k++) {
2178 sds thiskey;
2179 long thisval;
2180
2181 de = dictGetRandomKey(dict);
c0ba9ebe 2182 thiskey = dictGetKey(de);
2183 thisval = (long) dictGetVal(de);
165346ca 2184
2185 /* Expire sooner (minor expire unix timestamp) is better
2186 * candidate for deletion */
2187 if (bestkey == NULL || thisval < bestval) {
2188 bestkey = thiskey;
2189 bestval = thisval;
2190 }
2191 }
2192 }
2193
2194 /* Finally remove the selected key. */
2195 if (bestkey) {
f6b32c14 2196 long long delta;
2197
165346ca 2198 robj *keyobj = createStringObject(bestkey,sdslen(bestkey));
452229b6 2199 propagateExpire(db,keyobj);
f6b32c14 2200 /* We compute the amount of memory freed by dbDelete() alone.
2201 * It is possible that actually the memory needed to propagate
2202 * the DEL in AOF and replication link is greater than the one
2203 * we are freeing removing the key, but we can't account for
2204 * that otherwise we would never exit the loop.
2205 *
2206 * AOF and Output buffer memory will be freed eventually so
2207 * we only care about memory used by the key space. */
2208 delta = (long long) zmalloc_used_memory();
165346ca 2209 dbDelete(db,keyobj);
f6b32c14 2210 delta -= (long long) zmalloc_used_memory();
f6b32c14 2211 mem_freed += delta;
f21779ff 2212 server.stat_evictedkeys++;
165346ca 2213 decrRefCount(keyobj);
f6b32c14 2214 keys_freed++;
2215
2216 /* When the memory to free starts to be big enough, we may
2217 * start spending so much time here that is impossible to
2218 * deliver data to the slaves fast enough, so we force the
2219 * transmission here inside the loop. */
8b7c3455 2220 if (slaves) flushSlavesOutputBuffers();
165346ca 2221 }
2222 }
b129c6df 2223 if (!keys_freed) return REDIS_ERR; /* nothing to free... */
165346ca 2224 }
f6b32c14 2225 return REDIS_OK;
e2641e09 2226}
2227
2228/* =================================== Main! ================================ */
2229
2230#ifdef __linux__
/* Read /proc/sys/vm/overcommit_memory and return its first line converted
 * with atoi(). Returns -1 if the file can't be opened or no line can be
 * read from it. */
int linuxOvercommitMemoryValue(void) {
    char line[64];
    int value = -1;
    FILE *fp;

    fp = fopen("/proc/sys/vm/overcommit_memory","r");
    if (fp == NULL) return -1;

    if (fgets(line,sizeof(line),fp) != NULL) value = atoi(line);
    fclose(fp);
    return value;
}
2244
2245void linuxOvercommitMemoryWarning(void) {
2246 if (linuxOvercommitMemoryValue() == 0) {
2247 redisLog(REDIS_WARNING,"WARNING overcommit_memory is set to 0! Background save may fail under low memory condition. To fix this issue add 'vm.overcommit_memory = 1' to /etc/sysctl.conf and then reboot or run the command 'sysctl vm.overcommit_memory=1' for this to take effect.");
2248 }
2249}
2250#endif /* __linux__ */
2251
695fe874 2252void createPidFile(void) {
2253 /* Try to write the pid file in a best-effort way. */
2254 FILE *fp = fopen(server.pidfile,"w");
2255 if (fp) {
8ce39260 2256 fprintf(fp,"%d\n",(int)getpid());
695fe874 2257 fclose(fp);
2258 }
2259}
2260
/* Detach the process: fork, let the process where fork() returns non-zero
 * exit with status 0, start a new session, and point stdin, stdout and
 * stderr to /dev/null. */
void daemonize(void) {
    int devnull;

    if (fork() != 0) exit(0); /* parent exits */
    setsid(); /* create a new session */

    /* Every output goes to /dev/null. If Redis is daemonized but
     * the 'logfile' is set to 'stdout' in the configuration file
     * it will not log at all. */
    devnull = open("/dev/null", O_RDWR, 0);
    if (devnull == -1) return;

    dup2(devnull, STDIN_FILENO);
    dup2(devnull, STDOUT_FILENO);
    dup2(devnull, STDERR_FILENO);
    /* Keep the descriptor open if it is itself one of the standard
     * streams. */
    if (devnull > STDERR_FILENO) close(devnull);
}
2277
2278void version() {
1b247d13 2279 printf("Redis server v=%s sha=%s:%d malloc=%s\n", REDIS_VERSION,
2280 redisGitSHA1(), atoi(redisGitDirty()) > 0, ZMALLOC_LIB);
e2641e09 2281 exit(0);
2282}
2283
/* Print the command line help on stderr and terminate the process with
 * status 1. */
void usage() {
    static const char help[] =
        "Usage: ./redis-server [/path/to/redis.conf] [options]\n"
        " ./redis-server - (read config from stdin)\n"
        " ./redis-server -v or --version\n"
        " ./redis-server -h or --help\n"
        " ./redis-server --test-memory <megabytes>\n\n"
        "Examples:\n"
        " ./redis-server (run the server with default conf)\n"
        " ./redis-server /etc/redis/6379.conf\n"
        " ./redis-server --port 7777\n"
        " ./redis-server --port 7777 --slaveof 127.0.0.1 8888\n"
        " ./redis-server /etc/myredis.conf --loglevel verbose\n";

    fputs(help,stderr);
    exit(1);
}
2298
996d503d 2299void redisAsciiArt(void) {
2300#include "asciilogo.h"
2301 char *buf = zmalloc(1024*16);
2302
2303 snprintf(buf,1024*16,ascii_logo,
2304 REDIS_VERSION,
2305 redisGitSHA1(),
2306 strtol(redisGitDirty(),NULL,10) > 0,
2307 (sizeof(long) == 8) ? "64" : "32",
2308 server.cluster_enabled ? "cluster" : "stand alone",
2309 server.port,
2310 (long) getpid()
2311 );
2312 redisLogRaw(REDIS_NOTICE|REDIS_LOG_RAW,buf);
2313 zfree(buf);
2314}
2315
633a9410 2316static void sigtermHandler(int sig) {
e2641e09 2317 REDIS_NOTUSED(sig);
2318
a7d12cba 2319 redisLogFromHandler(REDIS_WARNING,"Received SIGTERM, scheduling shutdown...");
e2641e09 2320 server.shutdown_asap = 1;
2321}
2322
633a9410 2323void setupSignalHandlers(void) {
e2641e09 2324 struct sigaction act;
c5757662
PH
2325 stack_t stack;
2326
2327 stack.ss_sp = altstack;
2328 stack.ss_flags = 0;
2329 stack.ss_size = SIGSTKSZ;
2330
2331 sigaltstack(&stack, NULL);
e2641e09 2332
633a9410
PN
2333 /* When the SA_SIGINFO flag is set in sa_flags then sa_sigaction is used.
2334 * Otherwise, sa_handler is used. */
2335 sigemptyset(&act.sa_mask);
c5757662 2336 act.sa_flags = 0;
e2641e09 2337 act.sa_handler = sigtermHandler;
633a9410 2338 sigaction(SIGTERM, &act, NULL);
e2641e09 2339
633a9410 2340#ifdef HAVE_BACKTRACE
c5757662
PH
2341 /* Use alternate stack so we don't clobber stack in case of segv, or when we run out of stack ..
2342 * also resethand & nodefer so we can get interrupted (and killed) if we cause SEGV during SEGV handler */
633a9410
PN
2343 sigemptyset(&act.sa_mask);
2344 act.sa_flags = SA_NODEFER | SA_ONSTACK | SA_RESETHAND | SA_SIGINFO;
2345 act.sa_sigaction = sigsegvHandler;
2346 sigaction(SIGSEGV, &act, NULL);
2347 sigaction(SIGBUS, &act, NULL);
2348 sigaction(SIGFPE, &act, NULL);
2349 sigaction(SIGILL, &act, NULL);
2350#endif
2351 return;
e2641e09 2352}
e2641e09 2353
c5166e3f 2354void memtest(size_t megabytes, int passes);
2355
39ca1713 2356int main(int argc, char **argv) {
2357 long long start;
a48c8d87 2358 struct timeval tv;
39ca1713 2359
06c5523a 2360 /* We need to initialize our libraries, and the server configuration. */
39ca1713 2361 zmalloc_enable_thread_safeness();
a48c8d87 2362 srand(time(NULL)^getpid());
2363 gettimeofday(&tv,NULL);
2364 dictSetHashFunctionSeed(tv.tv_sec^tv.tv_usec^getpid());
39ca1713 2365 initServerConfig();
a48c8d87 2366
67c6f0f6 2367 if (argc >= 2) {
2368 int j = 1; /* First option to parse in argv[] */
2369 sds options = sdsempty();
2370 char *configfile = NULL;
2371
2372 /* Handle special options --help and --version */
39ca1713 2373 if (strcmp(argv[1], "-v") == 0 ||
2374 strcmp(argv[1], "--version") == 0) version();
4c8bd905 2375 if (strcmp(argv[1], "--help") == 0 ||
2376 strcmp(argv[1], "-h") == 0) usage();
c5166e3f 2377 if (strcmp(argv[1], "--test-memory") == 0) {
2378 if (argc == 3) {
d033ccb0 2379 memtest(atoi(argv[2]),50);
c5166e3f 2380 exit(0);
2381 } else {
2382 fprintf(stderr,"Please specify the amount of memory to test in megabytes.\n");
2383 fprintf(stderr,"Example: ./redis-server --test-memory 4096\n\n");
2384 exit(1);
2385 }
2386 }
2387
67c6f0f6 2388 /* First argument is the config file name? */
2389 if (argv[j][0] != '-' || argv[j][1] != '-')
2390 configfile = argv[j++];
2391 /* All the other options are parsed and conceptually appended to the
2392 * configuration file. For instance --port 6380 will generate the
2393 * string "port 6380\n" to be parsed after the actual file name
2394 * is parsed, if any. */
2395 while(j != argc) {
2396 if (argv[j][0] == '-' && argv[j][1] == '-') {
2397 /* Option name */
2398 if (sdslen(options)) options = sdscat(options,"\n");
2399 options = sdscat(options,argv[j]+2);
2400 options = sdscat(options," ");
2401 } else {
2402 /* Option argument */
2403 options = sdscatrepr(options,argv[j],strlen(argv[j]));
2404 options = sdscat(options," ");
2405 }
2406 j++;
2407 }
39ca1713 2408 resetServerSaveParams();
67c6f0f6 2409 loadServerConfig(configfile,options);
2410 sdsfree(options);
39ca1713 2411 } else {
2412 redisLog(REDIS_WARNING,"Warning: no config file specified, using the default config. In order to specify a config file use 'redis-server /path/to/redis.conf'");
2413 }
2414 if (server.daemonize) daemonize();
2415 initServer();
2416 if (server.daemonize) createPidFile();
2417 redisAsciiArt();
27ccb94a 2418 redisLog(REDIS_WARNING,"Server started, Redis version " REDIS_VERSION);
39ca1713 2419#ifdef __linux__
2420 linuxOvercommitMemoryWarning();
2421#endif
2422 start = ustime();
e394114d 2423 if (server.aof_state == REDIS_AOF_ON) {
2c915bcf 2424 if (loadAppendOnlyFile(server.aof_filename) == REDIS_OK)
39ca1713 2425 redisLog(REDIS_NOTICE,"DB loaded from append only file: %.3f seconds",(float)(ustime()-start)/1000000);
2426 } else {
f48cd4b9 2427 if (rdbLoad(server.rdb_filename) == REDIS_OK) {
39ca1713 2428 redisLog(REDIS_NOTICE,"DB loaded from disk: %.3f seconds",
2429 (float)(ustime()-start)/1000000);
2430 } else if (errno != ENOENT) {
2431 redisLog(REDIS_WARNING,"Fatal error loading the DB. Exiting.");
2432 exit(1);
2433 }
2434 }
2435 if (server.ipfd > 0)
2436 redisLog(REDIS_NOTICE,"The server is now ready to accept connections on port %d", server.port);
2437 if (server.sofd > 0)
2438 redisLog(REDIS_NOTICE,"The server is now ready to accept connections at %s", server.unixsocket);
2439 aeSetBeforeSleepProc(server.el,beforeSleep);
2440 aeMain(server.el);
2441 aeDeleteEventLoop(server.el);
2442 return 0;
2443}
2444
e2641e09 2445/* The End */