]> git.saurik.com Git - redis.git/blob - src/redis.c
When the user-provided 'maxclients' value is too big for the max number of files...
[redis.git] / src / redis.c
1 /*
2 * Copyright (c) 2009-2010, Salvatore Sanfilippo <antirez at gmail dot com>
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are met:
7 *
8 * * Redistributions of source code must retain the above copyright notice,
9 * this list of conditions and the following disclaimer.
10 * * Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
13 * * Neither the name of Redis nor the names of its contributors may be used
14 * to endorse or promote products derived from this software without
15 * specific prior written permission.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
18 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
21 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
22 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
23 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
24 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
25 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
26 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
27 * POSSIBILITY OF SUCH DAMAGE.
28 */
29
30 #include "redis.h"
31 #include "slowlog.h"
32 #include "bio.h"
33
34 #include <time.h>
35 #include <signal.h>
36 #include <sys/wait.h>
37 #include <errno.h>
38 #include <assert.h>
39 #include <ctype.h>
40 #include <stdarg.h>
41 #include <arpa/inet.h>
42 #include <sys/stat.h>
43 #include <fcntl.h>
44 #include <sys/time.h>
45 #include <sys/resource.h>
46 #include <sys/uio.h>
47 #include <limits.h>
48 #include <float.h>
49 #include <math.h>
50 #include <sys/resource.h>
51
52 /* Our shared "common" objects */
53
54 struct sharedObjectsStruct shared;
55
56 /* Global vars that are actually used as constants. The following double
57 * values are used for double on-disk serialization, and are initialized
58 * at runtime to avoid strange compiler optimizations. */
59
60 double R_Zero, R_PosInf, R_NegInf, R_Nan;
61
62 /*================================= Globals ================================= */
63
64 /* Global vars */
65 struct redisServer server; /* server global state */
66 struct redisCommand *commandTable;
67
68 /* Our command table.
69 *
70 * Every entry is composed of the following fields:
71 *
72 * name: a string representing the command name.
73 * function: pointer to the C function implementing the command.
74 * arity: number of arguments, it is possible to use -N to say >= N
75 * sflags: command flags as string. See below for a table of flags.
76 * flags: flags as bitmask. Computed by Redis using the 'sflags' field.
77 * get_keys_proc: an optional function to get key arguments from a command.
78 * This is only used when the following three fields are not
79 * enough to specify what arguments are keys.
80 * first_key_index: first argument that is a key
81 * last_key_index: last argument that is a key
82 * key_step: step to get all the keys from first to last argument. For instance
83 * in MSET the step is two since arguments are key,val,key,val,...
84 * microseconds: microseconds of total execution time for this command.
85 * calls: total number of calls of this command.
86 *
87 * The flags, microseconds and calls fields are computed by Redis and should
88 * always be set to zero.
89 *
90 * Command flags are expressed using strings where every character represents
91 * a flag. Later the populateCommandTable() function will take care of
92 * populating the real 'flags' field using this characters.
93 *
94 * This is the meaning of the flags:
95 *
96 * w: write command (may modify the key space).
97 * r: read command (will never modify the key space).
98 * m: may increase memory usage once called. Don't allow if out of memory.
99 * a: admin command, like SAVE or SHUTDOWN.
100 * p: Pub/Sub related command.
101 * f: force replication of this command, regarless of server.dirty.
102 * s: command not allowed in scripts.
103 * R: random command. Command is not deterministic, that is, the same command
104 * with the same arguments, with the same key space, may have different
105 * results. For instance SPOP and RANDOMKEY are two random commands.
106 * S: Sort command output array if called from script, so that the output
107 * is deterministic.
108 */
109 struct redisCommand redisCommandTable[] = {
110 {"get",getCommand,2,"r",0,NULL,1,1,1,0,0},
111 {"set",setCommand,3,"wm",0,noPreloadGetKeys,1,1,1,0,0},
112 {"setnx",setnxCommand,3,"wm",0,noPreloadGetKeys,1,1,1,0,0},
113 {"setex",setexCommand,4,"wm",0,noPreloadGetKeys,1,1,1,0,0},
114 {"psetex",psetexCommand,4,"wm",0,noPreloadGetKeys,1,1,1,0,0},
115 {"append",appendCommand,3,"wm",0,NULL,1,1,1,0,0},
116 {"strlen",strlenCommand,2,"r",0,NULL,1,1,1,0,0},
117 {"del",delCommand,-2,"w",0,noPreloadGetKeys,1,-1,1,0,0},
118 {"exists",existsCommand,2,"r",0,NULL,1,1,1,0,0},
119 {"setbit",setbitCommand,4,"wm",0,NULL,1,1,1,0,0},
120 {"getbit",getbitCommand,3,"r",0,NULL,1,1,1,0,0},
121 {"setrange",setrangeCommand,4,"wm",0,NULL,1,1,1,0,0},
122 {"getrange",getrangeCommand,4,"r",0,NULL,1,1,1,0,0},
123 {"substr",getrangeCommand,4,"r",0,NULL,1,1,1,0,0},
124 {"incr",incrCommand,2,"wm",0,NULL,1,1,1,0,0},
125 {"decr",decrCommand,2,"wm",0,NULL,1,1,1,0,0},
126 {"mget",mgetCommand,-2,"r",0,NULL,1,-1,1,0,0},
127 {"rpush",rpushCommand,-3,"wm",0,NULL,1,1,1,0,0},
128 {"lpush",lpushCommand,-3,"wm",0,NULL,1,1,1,0,0},
129 {"rpushx",rpushxCommand,3,"wm",0,NULL,1,1,1,0,0},
130 {"lpushx",lpushxCommand,3,"wm",0,NULL,1,1,1,0,0},
131 {"linsert",linsertCommand,5,"wm",0,NULL,1,1,1,0,0},
132 {"rpop",rpopCommand,2,"w",0,NULL,1,1,1,0,0},
133 {"lpop",lpopCommand,2,"w",0,NULL,1,1,1,0,0},
134 {"brpop",brpopCommand,-3,"ws",0,NULL,1,1,1,0,0},
135 {"brpoplpush",brpoplpushCommand,4,"wms",0,NULL,1,2,1,0,0},
136 {"blpop",blpopCommand,-3,"ws",0,NULL,1,-2,1,0,0},
137 {"llen",llenCommand,2,"r",0,NULL,1,1,1,0,0},
138 {"lindex",lindexCommand,3,"r",0,NULL,1,1,1,0,0},
139 {"lset",lsetCommand,4,"wm",0,NULL,1,1,1,0,0},
140 {"lrange",lrangeCommand,4,"r",0,NULL,1,1,1,0,0},
141 {"ltrim",ltrimCommand,4,"w",0,NULL,1,1,1,0,0},
142 {"lrem",lremCommand,4,"w",0,NULL,1,1,1,0,0},
143 {"rpoplpush",rpoplpushCommand,3,"wm",0,NULL,1,2,1,0,0},
144 {"sadd",saddCommand,-3,"wm",0,NULL,1,1,1,0,0},
145 {"srem",sremCommand,-3,"w",0,NULL,1,1,1,0,0},
146 {"smove",smoveCommand,4,"w",0,NULL,1,2,1,0,0},
147 {"sismember",sismemberCommand,3,"r",0,NULL,1,1,1,0,0},
148 {"scard",scardCommand,2,"r",0,NULL,1,1,1,0,0},
149 {"spop",spopCommand,2,"wRs",0,NULL,1,1,1,0,0},
150 {"srandmember",srandmemberCommand,2,"rR",0,NULL,1,1,1,0,0},
151 {"sinter",sinterCommand,-2,"rS",0,NULL,1,-1,1,0,0},
152 {"sinterstore",sinterstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
153 {"sunion",sunionCommand,-2,"rS",0,NULL,1,-1,1,0,0},
154 {"sunionstore",sunionstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
155 {"sdiff",sdiffCommand,-2,"rS",0,NULL,1,-1,1,0,0},
156 {"sdiffstore",sdiffstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
157 {"smembers",sinterCommand,2,"rS",0,NULL,1,1,1,0,0},
158 {"zadd",zaddCommand,-4,"wm",0,NULL,1,1,1,0,0},
159 {"zincrby",zincrbyCommand,4,"wm",0,NULL,1,1,1,0,0},
160 {"zrem",zremCommand,-3,"w",0,NULL,1,1,1,0,0},
161 {"zremrangebyscore",zremrangebyscoreCommand,4,"w",0,NULL,1,1,1,0,0},
162 {"zremrangebyrank",zremrangebyrankCommand,4,"w",0,NULL,1,1,1,0,0},
163 {"zunionstore",zunionstoreCommand,-4,"wm",0,zunionInterGetKeys,0,0,0,0,0},
164 {"zinterstore",zinterstoreCommand,-4,"wm",0,zunionInterGetKeys,0,0,0,0,0},
165 {"zrange",zrangeCommand,-4,"r",0,NULL,1,1,1,0,0},
166 {"zrangebyscore",zrangebyscoreCommand,-4,"r",0,NULL,1,1,1,0,0},
167 {"zrevrangebyscore",zrevrangebyscoreCommand,-4,"r",0,NULL,1,1,1,0,0},
168 {"zcount",zcountCommand,4,"r",0,NULL,1,1,1,0,0},
169 {"zrevrange",zrevrangeCommand,-4,"r",0,NULL,1,1,1,0,0},
170 {"zcard",zcardCommand,2,"r",0,NULL,1,1,1,0,0},
171 {"zscore",zscoreCommand,3,"r",0,NULL,1,1,1,0,0},
172 {"zrank",zrankCommand,3,"r",0,NULL,1,1,1,0,0},
173 {"zrevrank",zrevrankCommand,3,"r",0,NULL,1,1,1,0,0},
174 {"hset",hsetCommand,4,"wm",0,NULL,1,1,1,0,0},
175 {"hsetnx",hsetnxCommand,4,"wm",0,NULL,1,1,1,0,0},
176 {"hget",hgetCommand,3,"r",0,NULL,1,1,1,0,0},
177 {"hmset",hmsetCommand,-4,"wm",0,NULL,1,1,1,0,0},
178 {"hmget",hmgetCommand,-3,"r",0,NULL,1,1,1,0,0},
179 {"hincrby",hincrbyCommand,4,"wm",0,NULL,1,1,1,0,0},
180 {"hincrbyfloat",hincrbyfloatCommand,4,"wm",0,NULL,1,1,1,0,0},
181 {"hdel",hdelCommand,-3,"w",0,NULL,1,1,1,0,0},
182 {"hlen",hlenCommand,2,"r",0,NULL,1,1,1,0,0},
183 {"hkeys",hkeysCommand,2,"rS",0,NULL,1,1,1,0,0},
184 {"hvals",hvalsCommand,2,"rS",0,NULL,1,1,1,0,0},
185 {"hgetall",hgetallCommand,2,"r",0,NULL,1,1,1,0,0},
186 {"hexists",hexistsCommand,3,"r",0,NULL,1,1,1,0,0},
187 {"incrby",incrbyCommand,3,"wm",0,NULL,1,1,1,0,0},
188 {"decrby",decrbyCommand,3,"wm",0,NULL,1,1,1,0,0},
189 {"incrbyfloat",incrbyfloatCommand,3,"wm",0,NULL,1,1,1,0,0},
190 {"getset",getsetCommand,3,"wm",0,NULL,1,1,1,0,0},
191 {"mset",msetCommand,-3,"wm",0,NULL,1,-1,2,0,0},
192 {"msetnx",msetnxCommand,-3,"wm",0,NULL,1,-1,2,0,0},
193 {"randomkey",randomkeyCommand,1,"rR",0,NULL,0,0,0,0,0},
194 {"select",selectCommand,2,"r",0,NULL,0,0,0,0,0},
195 {"move",moveCommand,3,"w",0,NULL,1,1,1,0,0},
196 {"rename",renameCommand,3,"w",0,renameGetKeys,1,2,1,0,0},
197 {"renamenx",renamenxCommand,3,"w",0,renameGetKeys,1,2,1,0,0},
198 {"expire",expireCommand,3,"w",0,NULL,1,1,1,0,0},
199 {"expireat",expireatCommand,3,"w",0,NULL,1,1,1,0,0},
200 {"pexpire",pexpireCommand,3,"w",0,NULL,1,1,1,0,0},
201 {"pexpireat",pexpireatCommand,3,"w",0,NULL,1,1,1,0,0},
202 {"keys",keysCommand,2,"rS",0,NULL,0,0,0,0,0},
203 {"dbsize",dbsizeCommand,1,"r",0,NULL,0,0,0,0,0},
204 {"auth",authCommand,2,"rs",0,NULL,0,0,0,0,0},
205 {"ping",pingCommand,1,"r",0,NULL,0,0,0,0,0},
206 {"echo",echoCommand,2,"r",0,NULL,0,0,0,0,0},
207 {"save",saveCommand,1,"ars",0,NULL,0,0,0,0,0},
208 {"bgsave",bgsaveCommand,1,"ar",0,NULL,0,0,0,0,0},
209 {"bgrewriteaof",bgrewriteaofCommand,1,"ar",0,NULL,0,0,0,0,0},
210 {"shutdown",shutdownCommand,-1,"ar",0,NULL,0,0,0,0,0},
211 {"lastsave",lastsaveCommand,1,"r",0,NULL,0,0,0,0,0},
212 {"type",typeCommand,2,"r",0,NULL,1,1,1,0,0},
213 {"multi",multiCommand,1,"rs",0,NULL,0,0,0,0,0},
214 {"exec",execCommand,1,"s",0,NULL,0,0,0,0,0},
215 {"discard",discardCommand,1,"rs",0,NULL,0,0,0,0,0},
216 {"sync",syncCommand,1,"ars",0,NULL,0,0,0,0,0},
217 {"flushdb",flushdbCommand,1,"w",0,NULL,0,0,0,0,0},
218 {"flushall",flushallCommand,1,"w",0,NULL,0,0,0,0,0},
219 {"sort",sortCommand,-2,"wmS",0,NULL,1,1,1,0,0},
220 {"info",infoCommand,-1,"r",0,NULL,0,0,0,0,0},
221 {"monitor",monitorCommand,1,"ars",0,NULL,0,0,0,0,0},
222 {"ttl",ttlCommand,2,"r",0,NULL,1,1,1,0,0},
223 {"pttl",pttlCommand,2,"r",0,NULL,1,1,1,0,0},
224 {"persist",persistCommand,2,"w",0,NULL,1,1,1,0,0},
225 {"slaveof",slaveofCommand,3,"aws",0,NULL,0,0,0,0,0},
226 {"debug",debugCommand,-2,"as",0,NULL,0,0,0,0,0},
227 {"config",configCommand,-2,"ar",0,NULL,0,0,0,0,0},
228 {"subscribe",subscribeCommand,-2,"rps",0,NULL,0,0,0,0,0},
229 {"unsubscribe",unsubscribeCommand,-1,"rps",0,NULL,0,0,0,0,0},
230 {"psubscribe",psubscribeCommand,-2,"rps",0,NULL,0,0,0,0,0},
231 {"punsubscribe",punsubscribeCommand,-1,"rps",0,NULL,0,0,0,0,0},
232 {"publish",publishCommand,3,"pf",0,NULL,0,0,0,0,0},
233 {"watch",watchCommand,-2,"rs",0,noPreloadGetKeys,1,-1,1,0,0},
234 {"unwatch",unwatchCommand,1,"rs",0,NULL,0,0,0,0,0},
235 {"restore",restoreCommand,4,"awm",0,NULL,1,1,1,0,0},
236 {"migrate",migrateCommand,6,"aw",0,NULL,0,0,0,0,0},
237 {"dump",dumpCommand,2,"ar",0,NULL,1,1,1,0,0},
238 {"object",objectCommand,-2,"r",0,NULL,2,2,2,0,0},
239 {"client",clientCommand,-2,"ar",0,NULL,0,0,0,0,0},
240 {"eval",evalCommand,-3,"s",0,zunionInterGetKeys,0,0,0,0,0},
241 {"evalsha",evalShaCommand,-3,"s",0,zunionInterGetKeys,0,0,0,0,0},
242 {"slowlog",slowlogCommand,-2,"r",0,NULL,0,0,0,0,0},
243 {"script",scriptCommand,-2,"ras",0,NULL,0,0,0,0,0},
244 {"time",timeCommand,1,"rR",0,NULL,0,0,0,0,0}
245 };
246
247 /*============================ Utility functions ============================ */
248
249 /* Low level logging. To use only for very big messages, otherwise
250 * redisLog() is to prefer. */
251 void redisLogRaw(int level, const char *msg) {
252 const int syslogLevelMap[] = { LOG_DEBUG, LOG_INFO, LOG_NOTICE, LOG_WARNING };
253 const char *c = ".-*#";
254 time_t now = time(NULL);
255 FILE *fp;
256 char buf[64];
257 int rawmode = (level & REDIS_LOG_RAW);
258
259 level &= 0xff; /* clear flags */
260 if (level < server.verbosity) return;
261
262 fp = (server.logfile == NULL) ? stdout : fopen(server.logfile,"a");
263 if (!fp) return;
264
265 if (rawmode) {
266 fprintf(fp,"%s",msg);
267 } else {
268 strftime(buf,sizeof(buf),"%d %b %H:%M:%S",localtime(&now));
269 fprintf(fp,"[%d] %s %c %s\n",(int)getpid(),buf,c[level],msg);
270 }
271 fflush(fp);
272
273 if (server.logfile) fclose(fp);
274
275 if (server.syslog_enabled) syslog(syslogLevelMap[level], "%s", msg);
276 }
277
278 /* Like redisLogRaw() but with printf-alike support. This is the funciton that
279 * is used across the code. The raw version is only used in order to dump
280 * the INFO output on crash. */
281 void redisLog(int level, const char *fmt, ...) {
282 va_list ap;
283 char msg[REDIS_MAX_LOGMSG_LEN];
284
285 if ((level&0xff) < server.verbosity) return;
286
287 va_start(ap, fmt);
288 vsnprintf(msg, sizeof(msg), fmt, ap);
289 va_end(ap);
290
291 redisLogRaw(level,msg);
292 }
293
294 /* Log a fixed message without printf-alike capabilities, in a way that is
295 * safe to call from a signal handler.
296 *
297 * We actually use this only for signals that are not fatal from the point
298 * of view of Redis. Signals that are going to kill the server anyway and
299 * where we need printf-alike features are served by redisLog(). */
300 void redisLogFromHandler(int level, const char *msg) {
301 int fd;
302 char buf[64];
303
304 if ((level&0xff) < server.verbosity ||
305 (server.logfile == NULL && server.daemonize)) return;
306 fd = server.logfile ?
307 open(server.logfile, O_APPEND|O_CREAT|O_WRONLY, 0644) :
308 STDOUT_FILENO;
309 if (fd == -1) return;
310 ll2string(buf,sizeof(buf),getpid());
311 write(fd,"[",1);
312 write(fd,buf,strlen(buf));
313 write(fd," | signal handler] (",20);
314 ll2string(buf,sizeof(buf),time(NULL));
315 write(fd,buf,strlen(buf));
316 write(fd,") ",2);
317 write(fd,msg,strlen(msg));
318 write(fd,"\n",1);
319 if (server.logfile) close(fd);
320 }
321
322 /* Redis generally does not try to recover from out of memory conditions
323 * when allocating objects or strings, it is not clear if it will be possible
324 * to report this condition to the client since the networking layer itself
325 * is based on heap allocation for send buffers, so we simply abort.
326 * At least the code will be simpler to read... */
327 void oom(const char *msg) {
328 redisLog(REDIS_WARNING, "%s: Out of memory\n",msg);
329 sleep(1);
330 abort();
331 }
332
/* Return the UNIX time in microseconds, as reported by gettimeofday().
 * The seconds field is widened to long long before the multiplication. */
long long ustime(void) {
    struct timeval tv;

    gettimeofday(&tv, NULL);
    return ((long long)tv.tv_sec)*1000000 + tv.tv_usec;
}
343
/* Return the UNIX time in milliseconds: ustime() divided by 1000 with
 * integer division. */
long long mstime(void) {
    long long usec = ustime();

    return usec/1000;
}
348
349 /*====================== Hash table type implementation ==================== */
350
351 /* This is a hash table type that uses the SDS dynamic strings library as
352 * keys and redis objects as values (objects can hold SDS strings,
353 * lists, sets). */
354
/* Dict destructor callback that releases 'val' with zfree().
 * 'privdata' is ignored. */
void dictVanillaFree(void *privdata, void *val) {
    DICT_NOTUSED(privdata);

    zfree(val);
}
360
361 void dictListDestructor(void *privdata, void *val)
362 {
363 DICT_NOTUSED(privdata);
364 listRelease((list*)val);
365 }
366
367 int dictSdsKeyCompare(void *privdata, const void *key1,
368 const void *key2)
369 {
370 int l1,l2;
371 DICT_NOTUSED(privdata);
372
373 l1 = sdslen((sds)key1);
374 l2 = sdslen((sds)key2);
375 if (l1 != l2) return 0;
376 return memcmp(key1, key2, l1) == 0;
377 }
378
/* Case insensitive key comparison, used for the command lookup table.
 * Returns 1 when strcasecmp() reports the two keys as equal, 0 otherwise.
 * 'privdata' is ignored. */
int dictSdsKeyCaseCompare(void *privdata, const void *key1,
        const void *key2)
{
    int differ;

    DICT_NOTUSED(privdata);

    differ = strcasecmp(key1, key2);
    return differ == 0;
}
387
/* Dict destructor callback for Redis objects: drops one reference with
 * decrRefCount(). NULL is accepted and ignored (values of swapped out keys
 * are set to NULL). 'privdata' is ignored. */
void dictRedisObjectDestructor(void *privdata, void *val) {
    DICT_NOTUSED(privdata);

    if (val != NULL) decrRefCount(val);
}
395
/* Dict destructor callback for sds strings: 'val' is released with
 * sdsfree(). 'privdata' is ignored. */
void dictSdsDestructor(void *privdata, void *val) {
    DICT_NOTUSED(privdata);
    sdsfree(val);
}
402
403 int dictObjKeyCompare(void *privdata, const void *key1,
404 const void *key2)
405 {
406 const robj *o1 = key1, *o2 = key2;
407 return dictSdsKeyCompare(privdata,o1->ptr,o2->ptr);
408 }
409
410 unsigned int dictObjHash(const void *key) {
411 const robj *o = key;
412 return dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
413 }
414
/* Dict hash callback for sds keys: hashes sdslen(key) bytes with
 * dictGenHashFunction(). */
unsigned int dictSdsHash(const void *key) {
    return dictGenHashFunction((unsigned char*)key,
                               sdslen((char*)key));
}
418
/* Dict hash callback for sds keys that uses dictGenCaseHashFunction() over
 * sdslen(key) bytes; paired with dictSdsKeyCaseCompare() in the command
 * table dict type. */
unsigned int dictSdsCaseHash(const void *key) {
    return dictGenCaseHashFunction((unsigned char*)key,
                                   sdslen((char*)key));
}
422
423 int dictEncObjKeyCompare(void *privdata, const void *key1,
424 const void *key2)
425 {
426 robj *o1 = (robj*) key1, *o2 = (robj*) key2;
427 int cmp;
428
429 if (o1->encoding == REDIS_ENCODING_INT &&
430 o2->encoding == REDIS_ENCODING_INT)
431 return o1->ptr == o2->ptr;
432
433 o1 = getDecodedObject(o1);
434 o2 = getDecodedObject(o2);
435 cmp = dictSdsKeyCompare(privdata,o1->ptr,o2->ptr);
436 decrRefCount(o1);
437 decrRefCount(o2);
438 return cmp;
439 }
440
441 unsigned int dictEncObjHash(const void *key) {
442 robj *o = (robj*) key;
443
444 if (o->encoding == REDIS_ENCODING_RAW) {
445 return dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
446 } else {
447 if (o->encoding == REDIS_ENCODING_INT) {
448 char buf[32];
449 int len;
450
451 len = ll2string(buf,32,(long)o->ptr);
452 return dictGenHashFunction((unsigned char*)buf, len);
453 } else {
454 unsigned int hash;
455
456 o = getDecodedObject(o);
457 hash = dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
458 decrRefCount(o);
459 return hash;
460 }
461 }
462 }
463
464 /* Sets type hash table */
465 dictType setDictType = {
466 dictEncObjHash, /* hash function */
467 NULL, /* key dup */
468 NULL, /* val dup */
469 dictEncObjKeyCompare, /* key compare */
470 dictRedisObjectDestructor, /* key destructor */
471 NULL /* val destructor */
472 };
473
474 /* Sorted sets hash (note: a skiplist is used in addition to the hash table) */
475 dictType zsetDictType = {
476 dictEncObjHash, /* hash function */
477 NULL, /* key dup */
478 NULL, /* val dup */
479 dictEncObjKeyCompare, /* key compare */
480 dictRedisObjectDestructor, /* key destructor */
481 NULL /* val destructor */
482 };
483
484 /* Db->dict, keys are sds strings, vals are Redis objects. */
485 dictType dbDictType = {
486 dictSdsHash, /* hash function */
487 NULL, /* key dup */
488 NULL, /* val dup */
489 dictSdsKeyCompare, /* key compare */
490 dictSdsDestructor, /* key destructor */
491 dictRedisObjectDestructor /* val destructor */
492 };
493
494 /* Db->expires */
495 dictType keyptrDictType = {
496 dictSdsHash, /* hash function */
497 NULL, /* key dup */
498 NULL, /* val dup */
499 dictSdsKeyCompare, /* key compare */
500 NULL, /* key destructor */
501 NULL /* val destructor */
502 };
503
504 /* Command table. sds string -> command struct pointer. */
505 dictType commandTableDictType = {
506 dictSdsCaseHash, /* hash function */
507 NULL, /* key dup */
508 NULL, /* val dup */
509 dictSdsKeyCaseCompare, /* key compare */
510 dictSdsDestructor, /* key destructor */
511 NULL /* val destructor */
512 };
513
514 /* Hash type hash table (note that small hashes are represented with zimpaps) */
515 dictType hashDictType = {
516 dictEncObjHash, /* hash function */
517 NULL, /* key dup */
518 NULL, /* val dup */
519 dictEncObjKeyCompare, /* key compare */
520 dictRedisObjectDestructor, /* key destructor */
521 dictRedisObjectDestructor /* val destructor */
522 };
523
524 /* Keylist hash table type has unencoded redis objects as keys and
525 * lists as values. It's used for blocking operations (BLPOP) and to
526 * map swapped keys to a list of clients waiting for this keys to be loaded. */
527 dictType keylistDictType = {
528 dictObjHash, /* hash function */
529 NULL, /* key dup */
530 NULL, /* val dup */
531 dictObjKeyCompare, /* key compare */
532 dictRedisObjectDestructor, /* key destructor */
533 dictListDestructor /* val destructor */
534 };
535
536 int htNeedsResize(dict *dict) {
537 long long size, used;
538
539 size = dictSlots(dict);
540 used = dictSize(dict);
541 return (size && used && size > DICT_HT_INITIAL_SIZE &&
542 (used*100/size < REDIS_HT_MINFILL));
543 }
544
545 /* If the percentage of used slots in the HT reaches REDIS_HT_MINFILL
546 * we resize the hash table to save memory */
547 void tryResizeHashTables(void) {
548 int j;
549
550 for (j = 0; j < server.dbnum; j++) {
551 if (htNeedsResize(server.db[j].dict))
552 dictResize(server.db[j].dict);
553 if (htNeedsResize(server.db[j].expires))
554 dictResize(server.db[j].expires);
555 }
556 }
557
558 /* Our hash table implementation performs rehashing incrementally while
559 * we write/read from the hash table. Still if the server is idle, the hash
560 * table will use two tables for a long time. So we try to use 1 millisecond
561 * of CPU time at every serverCron() loop in order to rehash some key. */
562 void incrementallyRehash(void) {
563 int j;
564
565 for (j = 0; j < server.dbnum; j++) {
566 if (dictIsRehashing(server.db[j].dict)) {
567 dictRehashMilliseconds(server.db[j].dict,1);
568 break; /* already used our millisecond for this loop... */
569 }
570 }
571 }
572
573 /* This function is called once a background process of some kind terminates,
574 * as we want to avoid resizing the hash tables when there is a child in order
575 * to play well with copy-on-write (otherwise when a resize happens lots of
576 * memory pages are copied). The goal of this function is to update the ability
577 * for dict.c to resize the hash tables accordingly to the fact we have o not
578 * running childs. */
579 void updateDictResizePolicy(void) {
580 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1)
581 dictEnableResize();
582 else
583 dictDisableResize();
584 }
585
586 /* ======================= Cron: called every 100 ms ======================== */
587
588 /* Try to expire a few timed out keys. The algorithm used is adaptive and
589 * will use few CPU cycles if there are few expiring keys, otherwise
590 * it will get more aggressive to avoid that too much memory is used by
591 * keys that can be removed from the keyspace. */
592 void activeExpireCycle(void) {
593 int j;
594
595 for (j = 0; j < server.dbnum; j++) {
596 int expired;
597 redisDb *db = server.db+j;
598
599 /* Continue to expire if at the end of the cycle more than 25%
600 * of the keys were expired. */
601 do {
602 long num = dictSize(db->expires);
603 long long now = mstime();
604
605 expired = 0;
606 if (num > REDIS_EXPIRELOOKUPS_PER_CRON)
607 num = REDIS_EXPIRELOOKUPS_PER_CRON;
608 while (num--) {
609 dictEntry *de;
610 long long t;
611
612 if ((de = dictGetRandomKey(db->expires)) == NULL) break;
613 t = dictGetSignedIntegerVal(de);
614 if (now > t) {
615 sds key = dictGetKey(de);
616 robj *keyobj = createStringObject(key,sdslen(key));
617
618 propagateExpire(db,keyobj);
619 dbDelete(db,keyobj);
620 decrRefCount(keyobj);
621 expired++;
622 server.stat_expiredkeys++;
623 }
624 }
625 } while (expired > REDIS_EXPIRELOOKUPS_PER_CRON/4);
626 }
627 }
628
629 void updateLRUClock(void) {
630 server.lruclock = (server.unixtime/REDIS_LRU_CLOCK_RESOLUTION) &
631 REDIS_LRU_CLOCK_MAX;
632 }
633
634
635 /* Add a sample to the operations per second array of samples. */
636 void trackOperationsPerSecond(void) {
637 long long t = mstime() - server.ops_sec_last_sample_time;
638 long long ops = server.stat_numcommands - server.ops_sec_last_sample_ops;
639 long long ops_sec;
640
641 ops_sec = t > 0 ? (ops*1000/t) : 0;
642
643 server.ops_sec_samples[server.ops_sec_idx] = ops_sec;
644 server.ops_sec_idx = (server.ops_sec_idx+1) % REDIS_OPS_SEC_SAMPLES;
645 server.ops_sec_last_sample_time = mstime();
646 server.ops_sec_last_sample_ops = server.stat_numcommands;
647 }
648
649 /* Return the mean of all the samples. */
650 long long getOperationsPerSecond(void) {
651 int j;
652 long long sum = 0;
653
654 for (j = 0; j < REDIS_OPS_SEC_SAMPLES; j++)
655 sum += server.ops_sec_samples[j];
656 return sum / REDIS_OPS_SEC_SAMPLES;
657 }
658
659 /* Check for timeouts. Returns non-zero if the client was terminated */
660 int clientsCronHandleTimeout(redisClient *c) {
661 time_t now = server.unixtime;
662
663 if (server.maxidletime &&
664 !(c->flags & REDIS_SLAVE) && /* no timeout for slaves */
665 !(c->flags & REDIS_MASTER) && /* no timeout for masters */
666 !(c->flags & REDIS_BLOCKED) && /* no timeout for BLPOP */
667 dictSize(c->pubsub_channels) == 0 && /* no timeout for pubsub */
668 listLength(c->pubsub_patterns) == 0 &&
669 (now - c->lastinteraction > server.maxidletime))
670 {
671 redisLog(REDIS_VERBOSE,"Closing idle client");
672 freeClient(c);
673 return 1;
674 } else if (c->flags & REDIS_BLOCKED) {
675 if (c->bpop.timeout != 0 && c->bpop.timeout < now) {
676 addReply(c,shared.nullmultibulk);
677 unblockClientWaitingData(c);
678 }
679 }
680 return 0;
681 }
682
683 /* The client query buffer is an sds.c string that can end with a lot of
684 * free space not used, this function reclaims space if needed.
685 *
686 * The funciton always returns 0 as it never terminates the client. */
687 int clientsCronResizeQueryBuffer(redisClient *c) {
688 size_t querybuf_size = sdsAllocSize(c->querybuf);
689 time_t idletime = server.unixtime - c->lastinteraction;
690
691 /* There are two conditions to resize the query buffer:
692 * 1) Query buffer is > BIG_ARG and too big for latest peak.
693 * 2) Client is inactive and the buffer is bigger than 1k. */
694 if (((querybuf_size > REDIS_MBULK_BIG_ARG) &&
695 (querybuf_size/(c->querybuf_peak+1)) > 2) ||
696 (querybuf_size > 1024 && idletime > 2))
697 {
698 /* Only resize the query buffer if it is actually wasting space. */
699 if (sdsavail(c->querybuf) > 1024) {
700 c->querybuf = sdsRemoveFreeSpace(c->querybuf);
701 }
702 }
703 /* Reset the peak again to capture the peak memory usage in the next
704 * cycle. */
705 c->querybuf_peak = 0;
706 return 0;
707 }
708
709 void clientsCron(void) {
710 /* Make sure to process at least 1/100 of clients per call.
711 * Since this function is called 10 times per second we are sure that
712 * in the worst case we process all the clients in 10 seconds.
713 * In normal conditions (a reasonable number of clients) we process
714 * all the clients in a shorter time. */
715 int numclients = listLength(server.clients);
716 int iterations = numclients/100;
717
718 if (iterations < 50)
719 iterations = (numclients < 50) ? numclients : 50;
720 while(listLength(server.clients) && iterations--) {
721 redisClient *c;
722 listNode *head;
723
724 /* Rotate the list, take the current head, process.
725 * This way if the client must be removed from the list it's the
726 * first element and we don't incur into O(N) computation. */
727 listRotate(server.clients);
728 head = listFirst(server.clients);
729 c = listNodeValue(head);
730 /* The following functions do different service checks on the client.
731 * The protocol is that they return non-zero if the client was
732 * terminated. */
733 if (clientsCronHandleTimeout(c)) continue;
734 if (clientsCronResizeQueryBuffer(c)) continue;
735 }
736 }
737
738 int serverCron(struct aeEventLoop *eventLoop, long long id, void *clientData) {
739 int j, loops = server.cronloops;
740 REDIS_NOTUSED(eventLoop);
741 REDIS_NOTUSED(id);
742 REDIS_NOTUSED(clientData);
743
744 /* Software watchdog: deliver the SIGALRM that will reach the signal
745 * handler if we don't return here fast enough. */
746 if (server.watchdog_period) watchdogScheduleSignal(server.watchdog_period);
747
748 /* We take a cached value of the unix time in the global state because
749 * with virtual memory and aging there is to store the current time
750 * in objects at every object access, and accuracy is not needed.
751 * To access a global var is faster than calling time(NULL) */
752 server.unixtime = time(NULL);
753
754 trackOperationsPerSecond();
755
756 /* We have just 22 bits per object for LRU information.
757 * So we use an (eventually wrapping) LRU clock with 10 seconds resolution.
758 * 2^22 bits with 10 seconds resoluton is more or less 1.5 years.
759 *
760 * Note that even if this will wrap after 1.5 years it's not a problem,
761 * everything will still work but just some object will appear younger
762 * to Redis. But for this to happen a given object should never be touched
763 * for 1.5 years.
764 *
765 * Note that you can change the resolution altering the
766 * REDIS_LRU_CLOCK_RESOLUTION define.
767 */
768 updateLRUClock();
769
770 /* Record the max memory used since the server was started. */
771 if (zmalloc_used_memory() > server.stat_peak_memory)
772 server.stat_peak_memory = zmalloc_used_memory();
773
774 /* We received a SIGTERM, shutting down here in a safe way, as it is
775 * not ok doing so inside the signal handler. */
776 if (server.shutdown_asap) {
777 if (prepareForShutdown(0) == REDIS_OK) exit(0);
778 redisLog(REDIS_WARNING,"SIGTERM received but errors trying to shut down the server, check the logs for more information");
779 }
780
781 /* Show some info about non-empty databases */
782 for (j = 0; j < server.dbnum; j++) {
783 long long size, used, vkeys;
784
785 size = dictSlots(server.db[j].dict);
786 used = dictSize(server.db[j].dict);
787 vkeys = dictSize(server.db[j].expires);
788 if (!(loops % 50) && (used || vkeys)) {
789 redisLog(REDIS_VERBOSE,"DB %d: %lld keys (%lld volatile) in %lld slots HT.",j,used,vkeys,size);
790 /* dictPrintStats(server.dict); */
791 }
792 }
793
794 /* We don't want to resize the hash tables while a bacground saving
795 * is in progress: the saving child is created using fork() that is
796 * implemented with a copy-on-write semantic in most modern systems, so
797 * if we resize the HT while there is the saving child at work actually
798 * a lot of memory movements in the parent will cause a lot of pages
799 * copied. */
800 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1) {
801 if (!(loops % 10)) tryResizeHashTables();
802 if (server.activerehashing) incrementallyRehash();
803 }
804
805 /* Show information about connected clients */
806 if (!(loops % 50)) {
807 redisLog(REDIS_VERBOSE,"%d clients connected (%d slaves), %zu bytes in use",
808 listLength(server.clients)-listLength(server.slaves),
809 listLength(server.slaves),
810 zmalloc_used_memory());
811 }
812
813 /* We need to do a few operations on clients asynchronously. */
814 clientsCron();
815
816 /* Start a scheduled AOF rewrite if this was requested by the user while
817 * a BGSAVE was in progress. */
818 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1 &&
819 server.aof_rewrite_scheduled)
820 {
821 rewriteAppendOnlyFileBackground();
822 }
823
824 /* Check if a background saving or AOF rewrite in progress terminated. */
825 if (server.rdb_child_pid != -1 || server.aof_child_pid != -1) {
826 int statloc;
827 pid_t pid;
828
829 if ((pid = wait3(&statloc,WNOHANG,NULL)) != 0) {
830 int exitcode = WEXITSTATUS(statloc);
831 int bysignal = 0;
832
833 if (WIFSIGNALED(statloc)) bysignal = WTERMSIG(statloc);
834
835 if (pid == server.rdb_child_pid) {
836 backgroundSaveDoneHandler(exitcode,bysignal);
837 } else {
838 backgroundRewriteDoneHandler(exitcode,bysignal);
839 }
840 updateDictResizePolicy();
841 }
842 } else {
843 /* If there is not a background saving/rewrite in progress check if
844 * we have to save/rewrite now */
845 for (j = 0; j < server.saveparamslen; j++) {
846 struct saveparam *sp = server.saveparams+j;
847
848 if (server.dirty >= sp->changes &&
849 server.unixtime-server.lastsave > sp->seconds) {
850 redisLog(REDIS_NOTICE,"%d changes in %d seconds. Saving...",
851 sp->changes, sp->seconds);
852 rdbSaveBackground(server.rdb_filename);
853 break;
854 }
855 }
856
857 /* Trigger an AOF rewrite if needed */
858 if (server.rdb_child_pid == -1 &&
859 server.aof_child_pid == -1 &&
860 server.aof_rewrite_perc &&
861 server.aof_current_size > server.aof_rewrite_min_size)
862 {
863 long long base = server.aof_rewrite_base_size ?
864 server.aof_rewrite_base_size : 1;
865 long long growth = (server.aof_current_size*100/base) - 100;
866 if (growth >= server.aof_rewrite_perc) {
867 redisLog(REDIS_NOTICE,"Starting automatic rewriting of AOF on %lld%% growth",growth);
868 rewriteAppendOnlyFileBackground();
869 }
870 }
871 }
872
873
874 /* If we postponed an AOF buffer flush, let's try to do it every time the
875 * cron function is called. */
876 if (server.aof_flush_postponed_start) flushAppendOnlyFile(0);
877
878 /* Expire a few keys per cycle, only if this is a master.
879 * On slaves we wait for DEL operations synthesized by the master
880 * in order to guarantee a strict consistency. */
881 if (server.masterhost == NULL) activeExpireCycle();
882
883 /* Close clients that need to be closed asynchronous */
884 freeClientsInAsyncFreeQueue();
885
886 /* Replication cron function -- used to reconnect to master and
887 * to detect transfer failures. */
888 if (!(loops % 10)) replicationCron();
889
890 server.cronloops++;
891 return 100;
892 }
893
894 /* This function gets called every time Redis is entering the
895 * main loop of the event driven library, that is, before to sleep
896 * for ready file descriptors. */
897 void beforeSleep(struct aeEventLoop *eventLoop) {
898 REDIS_NOTUSED(eventLoop);
899 listNode *ln;
900 redisClient *c;
901
902 /* Try to process pending commands for clients that were just unblocked. */
903 while (listLength(server.unblocked_clients)) {
904 ln = listFirst(server.unblocked_clients);
905 redisAssert(ln != NULL);
906 c = ln->value;
907 listDelNode(server.unblocked_clients,ln);
908 c->flags &= ~REDIS_UNBLOCKED;
909
910 /* Process remaining data in the input buffer. */
911 if (c->querybuf && sdslen(c->querybuf) > 0) {
912 server.current_client = c;
913 processInputBuffer(c);
914 server.current_client = NULL;
915 }
916 }
917
918 /* Write the AOF buffer on disk */
919 flushAppendOnlyFile(0);
920 }
921
922 /* =========================== Server initialization ======================== */
923
924 void createSharedObjects(void) {
925 int j;
926
927 shared.crlf = createObject(REDIS_STRING,sdsnew("\r\n"));
928 shared.ok = createObject(REDIS_STRING,sdsnew("+OK\r\n"));
929 shared.err = createObject(REDIS_STRING,sdsnew("-ERR\r\n"));
930 shared.emptybulk = createObject(REDIS_STRING,sdsnew("$0\r\n\r\n"));
931 shared.czero = createObject(REDIS_STRING,sdsnew(":0\r\n"));
932 shared.cone = createObject(REDIS_STRING,sdsnew(":1\r\n"));
933 shared.cnegone = createObject(REDIS_STRING,sdsnew(":-1\r\n"));
934 shared.nullbulk = createObject(REDIS_STRING,sdsnew("$-1\r\n"));
935 shared.nullmultibulk = createObject(REDIS_STRING,sdsnew("*-1\r\n"));
936 shared.emptymultibulk = createObject(REDIS_STRING,sdsnew("*0\r\n"));
937 shared.pong = createObject(REDIS_STRING,sdsnew("+PONG\r\n"));
938 shared.queued = createObject(REDIS_STRING,sdsnew("+QUEUED\r\n"));
939 shared.wrongtypeerr = createObject(REDIS_STRING,sdsnew(
940 "-ERR Operation against a key holding the wrong kind of value\r\n"));
941 shared.nokeyerr = createObject(REDIS_STRING,sdsnew(
942 "-ERR no such key\r\n"));
943 shared.syntaxerr = createObject(REDIS_STRING,sdsnew(
944 "-ERR syntax error\r\n"));
945 shared.sameobjecterr = createObject(REDIS_STRING,sdsnew(
946 "-ERR source and destination objects are the same\r\n"));
947 shared.outofrangeerr = createObject(REDIS_STRING,sdsnew(
948 "-ERR index out of range\r\n"));
949 shared.noscripterr = createObject(REDIS_STRING,sdsnew(
950 "-NOSCRIPT No matching script. Please use EVAL.\r\n"));
951 shared.loadingerr = createObject(REDIS_STRING,sdsnew(
952 "-LOADING Redis is loading the dataset in memory\r\n"));
953 shared.slowscripterr = createObject(REDIS_STRING,sdsnew(
954 "-BUSY Redis is busy running a script. You can only call SCRIPT KILL or SHUTDOWN NOSAVE.\r\n"));
955 shared.bgsaveerr = createObject(REDIS_STRING,sdsnew(
956 "-MISCONF Redis is configured to save RDB snapshots, but is currently not able to persist on disk. Commands that may modify the data set are disabled. Please check Redis logs for details about the error.\r\n"));
957 shared.roslaveerr = createObject(REDIS_STRING,sdsnew(
958 "-READONLY You can't write against a read only slave.\r\n"));
959 shared.oomerr = createObject(REDIS_STRING,sdsnew(
960 "-OOM command not allowed when used memory > 'maxmemory'.\r\n"));
961 shared.space = createObject(REDIS_STRING,sdsnew(" "));
962 shared.colon = createObject(REDIS_STRING,sdsnew(":"));
963 shared.plus = createObject(REDIS_STRING,sdsnew("+"));
964
965 for (j = 0; j < REDIS_SHARED_SELECT_CMDS; j++) {
966 shared.select[j] = createObject(REDIS_STRING,
967 sdscatprintf(sdsempty(),"select %d\r\n", j));
968 }
969 shared.messagebulk = createStringObject("$7\r\nmessage\r\n",13);
970 shared.pmessagebulk = createStringObject("$8\r\npmessage\r\n",14);
971 shared.subscribebulk = createStringObject("$9\r\nsubscribe\r\n",15);
972 shared.unsubscribebulk = createStringObject("$11\r\nunsubscribe\r\n",18);
973 shared.psubscribebulk = createStringObject("$10\r\npsubscribe\r\n",17);
974 shared.punsubscribebulk = createStringObject("$12\r\npunsubscribe\r\n",19);
975 shared.del = createStringObject("DEL",3);
976 shared.rpop = createStringObject("RPOP",4);
977 shared.lpop = createStringObject("LPOP",4);
978 for (j = 0; j < REDIS_SHARED_INTEGERS; j++) {
979 shared.integers[j] = createObject(REDIS_STRING,(void*)(long)j);
980 shared.integers[j]->encoding = REDIS_ENCODING_INT;
981 }
982 for (j = 0; j < REDIS_SHARED_BULKHDR_LEN; j++) {
983 shared.mbulkhdr[j] = createObject(REDIS_STRING,
984 sdscatprintf(sdsempty(),"*%d\r\n",j));
985 shared.bulkhdr[j] = createObject(REDIS_STRING,
986 sdscatprintf(sdsempty(),"$%d\r\n",j));
987 }
988 }
989
990 void initServerConfig() {
991 getRandomHexChars(server.runid,REDIS_RUN_ID_SIZE);
992 server.runid[REDIS_RUN_ID_SIZE] = '\0';
993 server.arch_bits = (sizeof(long) == 8) ? 64 : 32;
994 server.port = REDIS_SERVERPORT;
995 server.bindaddr = NULL;
996 server.unixsocket = NULL;
997 server.unixsocketperm = 0;
998 server.ipfd = -1;
999 server.sofd = -1;
1000 server.dbnum = REDIS_DEFAULT_DBNUM;
1001 server.verbosity = REDIS_NOTICE;
1002 server.maxidletime = REDIS_MAXIDLETIME;
1003 server.client_max_querybuf_len = REDIS_MAX_QUERYBUF_LEN;
1004 server.saveparams = NULL;
1005 server.loading = 0;
1006 server.logfile = NULL; /* NULL = log on standard output */
1007 server.syslog_enabled = 0;
1008 server.syslog_ident = zstrdup("redis");
1009 server.syslog_facility = LOG_LOCAL0;
1010 server.daemonize = 0;
1011 server.aof_state = REDIS_AOF_OFF;
1012 server.aof_fsync = AOF_FSYNC_EVERYSEC;
1013 server.aof_no_fsync_on_rewrite = 0;
1014 server.aof_rewrite_perc = REDIS_AOF_REWRITE_PERC;
1015 server.aof_rewrite_min_size = REDIS_AOF_REWRITE_MIN_SIZE;
1016 server.aof_rewrite_base_size = 0;
1017 server.aof_rewrite_scheduled = 0;
1018 server.aof_last_fsync = time(NULL);
1019 server.aof_delayed_fsync = 0;
1020 server.aof_fd = -1;
1021 server.aof_selected_db = -1; /* Make sure the first time will not match */
1022 server.aof_flush_postponed_start = 0;
1023 server.pidfile = zstrdup("/var/run/redis.pid");
1024 server.rdb_filename = zstrdup("dump.rdb");
1025 server.aof_filename = zstrdup("appendonly.aof");
1026 server.requirepass = NULL;
1027 server.rdb_compression = 1;
1028 server.activerehashing = 1;
1029 server.maxclients = REDIS_MAX_CLIENTS;
1030 server.bpop_blocked_clients = 0;
1031 server.maxmemory = 0;
1032 server.maxmemory_policy = REDIS_MAXMEMORY_VOLATILE_LRU;
1033 server.maxmemory_samples = 3;
1034 server.hash_max_ziplist_entries = REDIS_HASH_MAX_ZIPLIST_ENTRIES;
1035 server.hash_max_ziplist_value = REDIS_HASH_MAX_ZIPLIST_VALUE;
1036 server.list_max_ziplist_entries = REDIS_LIST_MAX_ZIPLIST_ENTRIES;
1037 server.list_max_ziplist_value = REDIS_LIST_MAX_ZIPLIST_VALUE;
1038 server.set_max_intset_entries = REDIS_SET_MAX_INTSET_ENTRIES;
1039 server.zset_max_ziplist_entries = REDIS_ZSET_MAX_ZIPLIST_ENTRIES;
1040 server.zset_max_ziplist_value = REDIS_ZSET_MAX_ZIPLIST_VALUE;
1041 server.shutdown_asap = 0;
1042 server.repl_ping_slave_period = REDIS_REPL_PING_SLAVE_PERIOD;
1043 server.repl_timeout = REDIS_REPL_TIMEOUT;
1044 server.lua_caller = NULL;
1045 server.lua_time_limit = REDIS_LUA_TIME_LIMIT;
1046 server.lua_client = NULL;
1047 server.lua_timedout = 0;
1048
1049 updateLRUClock();
1050 resetServerSaveParams();
1051
1052 appendServerSaveParams(60*60,1); /* save after 1 hour and 1 change */
1053 appendServerSaveParams(300,100); /* save after 5 minutes and 100 changes */
1054 appendServerSaveParams(60,10000); /* save after 1 minute and 10000 changes */
1055 /* Replication related */
1056 server.masterauth = NULL;
1057 server.masterhost = NULL;
1058 server.masterport = 6379;
1059 server.master = NULL;
1060 server.repl_state = REDIS_REPL_NONE;
1061 server.repl_syncio_timeout = REDIS_REPL_SYNCIO_TIMEOUT;
1062 server.repl_serve_stale_data = 1;
1063 server.repl_slave_ro = 1;
1064 server.repl_down_since = -1;
1065
1066 /* Client output buffer limits */
1067 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].hard_limit_bytes = 0;
1068 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].soft_limit_bytes = 0;
1069 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].soft_limit_seconds = 0;
1070 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].hard_limit_bytes = 1024*1024*256;
1071 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].soft_limit_bytes = 1024*1024*64;
1072 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].soft_limit_seconds = 60;
1073 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].hard_limit_bytes = 1024*1024*32;
1074 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].soft_limit_bytes = 1024*1024*8;
1075 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].soft_limit_seconds = 60;
1076
1077 /* Double constants initialization */
1078 R_Zero = 0.0;
1079 R_PosInf = 1.0/R_Zero;
1080 R_NegInf = -1.0/R_Zero;
1081 R_Nan = R_Zero/R_Zero;
1082
1083 /* Command table -- we intiialize it here as it is part of the
1084 * initial configuration, since command names may be changed via
1085 * redis.conf using the rename-command directive. */
1086 server.commands = dictCreate(&commandTableDictType,NULL);
1087 populateCommandTable();
1088 server.delCommand = lookupCommandByCString("del");
1089 server.multiCommand = lookupCommandByCString("multi");
1090 server.lpushCommand = lookupCommandByCString("lpush");
1091
1092 /* Slow log */
1093 server.slowlog_log_slower_than = REDIS_SLOWLOG_LOG_SLOWER_THAN;
1094 server.slowlog_max_len = REDIS_SLOWLOG_MAX_LEN;
1095
1096 /* Debugging */
1097 server.assert_failed = "<no assertion failed>";
1098 server.assert_file = "<no file>";
1099 server.assert_line = 0;
1100 server.bug_report_start = 0;
1101 server.watchdog_period = 0;
1102 }
1103
1104 /* This function will try to raise the max number of open files accordingly to
1105 * the configured max number of clients. It will also account for 32 additional
1106 * file descriptors as we need a few more for persistence, listening
1107 * sockets, log files and so forth.
1108 *
1109 * If it will not be possible to set the limit accordingly to the configured
1110 * max number of clients, the function will do the reverse setting
1111 * server.maxclients to the value that we can actually handle. */
1112 void adjustOpenFilesLimit(void) {
1113 rlim_t maxfiles = server.maxclients+32;
1114 struct rlimit limit;
1115
1116 if (maxfiles < 1024) maxfiles = 1024;
1117 if (getrlimit(RLIMIT_NOFILE,&limit) == -1) {
1118 redisLog(REDIS_WARNING,"Unable to obtain the current NOFILE limit (%s), assuming 1024 and setting the max clients configuration accordingly.",
1119 strerror(errno));
1120 server.maxclients = 1024-32;
1121 } else {
1122 rlim_t oldlimit = limit.rlim_cur;
1123
1124 /* Set the max number of files if the current limit is not enough
1125 * for our needs. */
1126 if (oldlimit < maxfiles) {
1127 rlim_t f;
1128
1129 f = maxfiles;
1130 while(f > oldlimit) {
1131 limit.rlim_cur = f;
1132 limit.rlim_max = f;
1133 if (setrlimit(RLIMIT_NOFILE,&limit) != -1) break;
1134 f -= 128;
1135 }
1136 if (f < oldlimit) f = oldlimit;
1137 if (f != maxfiles) {
1138 server.maxclients = f-32;
1139 redisLog(REDIS_WARNING,"Unable to set the max number of files limit to %d (%s), setting the max clients configuration to %d.",
1140 (int) maxfiles, strerror(errno), (int) server.maxclients);
1141 } else {
1142 redisLog(REDIS_NOTICE,"Max number of open files set to %d",
1143 (int) maxfiles);
1144 }
1145 }
1146 }
1147 }
1148
1149 void initServer() {
1150 int j;
1151
1152 signal(SIGHUP, SIG_IGN);
1153 signal(SIGPIPE, SIG_IGN);
1154 setupSignalHandlers();
1155
1156 if (server.syslog_enabled) {
1157 openlog(server.syslog_ident, LOG_PID | LOG_NDELAY | LOG_NOWAIT,
1158 server.syslog_facility);
1159 }
1160
1161 server.current_client = NULL;
1162 server.clients = listCreate();
1163 server.clients_to_close = listCreate();
1164 server.slaves = listCreate();
1165 server.monitors = listCreate();
1166 server.unblocked_clients = listCreate();
1167
1168 createSharedObjects();
1169 adjustOpenFilesLimit();
1170 server.el = aeCreateEventLoop(server.maxclients+1024);
1171 server.db = zmalloc(sizeof(redisDb)*server.dbnum);
1172
1173 if (server.port != 0) {
1174 server.ipfd = anetTcpServer(server.neterr,server.port,server.bindaddr);
1175 if (server.ipfd == ANET_ERR) {
1176 redisLog(REDIS_WARNING, "Opening port %d: %s",
1177 server.port, server.neterr);
1178 exit(1);
1179 }
1180 }
1181 if (server.unixsocket != NULL) {
1182 unlink(server.unixsocket); /* don't care if this fails */
1183 server.sofd = anetUnixServer(server.neterr,server.unixsocket,server.unixsocketperm);
1184 if (server.sofd == ANET_ERR) {
1185 redisLog(REDIS_WARNING, "Opening socket: %s", server.neterr);
1186 exit(1);
1187 }
1188 }
1189 if (server.ipfd < 0 && server.sofd < 0) {
1190 redisLog(REDIS_WARNING, "Configured to not listen anywhere, exiting.");
1191 exit(1);
1192 }
1193 for (j = 0; j < server.dbnum; j++) {
1194 server.db[j].dict = dictCreate(&dbDictType,NULL);
1195 server.db[j].expires = dictCreate(&keyptrDictType,NULL);
1196 server.db[j].blocking_keys = dictCreate(&keylistDictType,NULL);
1197 server.db[j].watched_keys = dictCreate(&keylistDictType,NULL);
1198 server.db[j].id = j;
1199 }
1200 server.pubsub_channels = dictCreate(&keylistDictType,NULL);
1201 server.pubsub_patterns = listCreate();
1202 listSetFreeMethod(server.pubsub_patterns,freePubsubPattern);
1203 listSetMatchMethod(server.pubsub_patterns,listMatchPubsubPattern);
1204 server.cronloops = 0;
1205 server.rdb_child_pid = -1;
1206 server.aof_child_pid = -1;
1207 server.aof_rewrite_buf = sdsempty();
1208 server.aof_buf = sdsempty();
1209 server.lastsave = time(NULL);
1210 server.dirty = 0;
1211 server.stat_numcommands = 0;
1212 server.stat_numconnections = 0;
1213 server.stat_expiredkeys = 0;
1214 server.stat_evictedkeys = 0;
1215 server.stat_starttime = time(NULL);
1216 server.stat_keyspace_misses = 0;
1217 server.stat_keyspace_hits = 0;
1218 server.stat_peak_memory = 0;
1219 server.stat_fork_time = 0;
1220 server.stat_rejected_conn = 0;
1221 memset(server.ops_sec_samples,0,sizeof(server.ops_sec_samples));
1222 server.ops_sec_idx = 0;
1223 server.ops_sec_last_sample_time = mstime();
1224 server.ops_sec_last_sample_ops = 0;
1225 server.unixtime = time(NULL);
1226 server.lastbgsave_status = REDIS_OK;
1227 server.stop_writes_on_bgsave_err = 1;
1228 aeCreateTimeEvent(server.el, 1, serverCron, NULL, NULL);
1229 if (server.ipfd > 0 && aeCreateFileEvent(server.el,server.ipfd,AE_READABLE,
1230 acceptTcpHandler,NULL) == AE_ERR) oom("creating file event");
1231 if (server.sofd > 0 && aeCreateFileEvent(server.el,server.sofd,AE_READABLE,
1232 acceptUnixHandler,NULL) == AE_ERR) oom("creating file event");
1233
1234 if (server.aof_state == REDIS_AOF_ON) {
1235 server.aof_fd = open(server.aof_filename,
1236 O_WRONLY|O_APPEND|O_CREAT,0644);
1237 if (server.aof_fd == -1) {
1238 redisLog(REDIS_WARNING, "Can't open the append-only file: %s",
1239 strerror(errno));
1240 exit(1);
1241 }
1242 }
1243
1244 /* 32 bit instances are limited to 4GB of address space, so if there is
1245 * no explicit limit in the user provided configuration we set a limit
1246 * at 3.5GB using maxmemory with 'noeviction' policy'. This saves
1247 * useless crashes of the Redis instance. */
1248 if (server.arch_bits == 32 && server.maxmemory == 0) {
1249 redisLog(REDIS_WARNING,"Warning: 32 bit instance detected but no memory limit set. Setting 3.5 GB maxmemory limit with 'noeviction' policy now.");
1250 server.maxmemory = 3584LL*(1024*1024); /* 3584 MB = 3.5 GB */
1251 server.maxmemory_policy = REDIS_MAXMEMORY_NO_EVICTION;
1252 }
1253
1254 scriptingInit();
1255 slowlogInit();
1256 bioInit();
1257 }
1258
1259 /* Populates the Redis Command Table starting from the hard coded list
1260 * we have on top of redis.c file. */
1261 void populateCommandTable(void) {
1262 int j;
1263 int numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1264
1265 for (j = 0; j < numcommands; j++) {
1266 struct redisCommand *c = redisCommandTable+j;
1267 char *f = c->sflags;
1268 int retval;
1269
1270 while(*f != '\0') {
1271 switch(*f) {
1272 case 'w': c->flags |= REDIS_CMD_WRITE; break;
1273 case 'r': c->flags |= REDIS_CMD_READONLY; break;
1274 case 'm': c->flags |= REDIS_CMD_DENYOOM; break;
1275 case 'a': c->flags |= REDIS_CMD_ADMIN; break;
1276 case 'p': c->flags |= REDIS_CMD_PUBSUB; break;
1277 case 'f': c->flags |= REDIS_CMD_FORCE_REPLICATION; break;
1278 case 's': c->flags |= REDIS_CMD_NOSCRIPT; break;
1279 case 'R': c->flags |= REDIS_CMD_RANDOM; break;
1280 case 'S': c->flags |= REDIS_CMD_SORT_FOR_SCRIPT; break;
1281 default: redisPanic("Unsupported command flag"); break;
1282 }
1283 f++;
1284 }
1285
1286 retval = dictAdd(server.commands, sdsnew(c->name), c);
1287 assert(retval == DICT_OK);
1288 }
1289 }
1290
1291 void resetCommandTableStats(void) {
1292 int numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1293 int j;
1294
1295 for (j = 0; j < numcommands; j++) {
1296 struct redisCommand *c = redisCommandTable+j;
1297
1298 c->microseconds = 0;
1299 c->calls = 0;
1300 }
1301 }
1302
1303 /* ========================== Redis OP Array API ============================ */
1304
1305 void redisOpArrayInit(redisOpArray *oa) {
1306 oa->ops = NULL;
1307 oa->numops = 0;
1308 }
1309
1310 int redisOpArrayAppend(redisOpArray *oa, struct redisCommand *cmd, int dbid,
1311 robj **argv, int argc, int target)
1312 {
1313 redisOp *op;
1314
1315 oa->ops = zrealloc(oa->ops,sizeof(redisOp)*(oa->numops+1));
1316 op = oa->ops+oa->numops;
1317 op->cmd = cmd;
1318 op->dbid = dbid;
1319 op->argv = argv;
1320 op->argc = argc;
1321 op->target = target;
1322 oa->numops++;
1323 return oa->numops;
1324 }
1325
1326 void redisOpArrayFree(redisOpArray *oa) {
1327 while(oa->numops) {
1328 int j;
1329 redisOp *op;
1330
1331 oa->numops--;
1332 op = oa->ops+oa->numops;
1333 for (j = 0; j < op->argc; j++)
1334 decrRefCount(op->argv[j]);
1335 zfree(op->argv);
1336 }
1337 zfree(oa->ops);
1338 }
1339
1340 /* ====================== Commands lookup and execution ===================== */
1341
1342 struct redisCommand *lookupCommand(sds name) {
1343 return dictFetchValue(server.commands, name);
1344 }
1345
1346 struct redisCommand *lookupCommandByCString(char *s) {
1347 struct redisCommand *cmd;
1348 sds name = sdsnew(s);
1349
1350 cmd = dictFetchValue(server.commands, name);
1351 sdsfree(name);
1352 return cmd;
1353 }
1354
1355 /* Propagate the specified command (in the context of the specified database id)
1356 * to AOF, Slaves and Monitors.
1357 *
1358 * flags are an xor between:
1359 * + REDIS_PROPAGATE_NONE (no propagation of command at all)
1360 * + REDIS_PROPAGATE_AOF (propagate into the AOF file if is enabled)
1361 * + REDIS_PROPAGATE_REPL (propagate into the replication link)
1362 */
1363 void propagate(struct redisCommand *cmd, int dbid, robj **argv, int argc,
1364 int flags)
1365 {
1366 if (server.aof_state != REDIS_AOF_OFF && flags & REDIS_PROPAGATE_AOF)
1367 feedAppendOnlyFile(cmd,dbid,argv,argc);
1368 if (flags & REDIS_PROPAGATE_REPL && listLength(server.slaves))
1369 replicationFeedSlaves(server.slaves,dbid,argv,argc);
1370 }
1371
1372 /* Used inside commands to schedule the propagation of additional commands
1373 * after the current command is propagated to AOF / Replication. */
1374 void alsoPropagate(struct redisCommand *cmd, int dbid, robj **argv, int argc,
1375 int target)
1376 {
1377 redisOpArrayAppend(&server.also_propagate,cmd,dbid,argv,argc,target);
1378 }
1379
1380 /* Call() is the core of Redis execution of a command */
1381 void call(redisClient *c, int flags) {
1382 long long dirty, start = ustime(), duration;
1383
1384 /* Sent the command to clients in MONITOR mode, only if the commands are
1385 * not geneated from reading an AOF. */
1386 if (listLength(server.monitors) && !server.loading)
1387 replicationFeedMonitors(c,server.monitors,c->db->id,c->argv,c->argc);
1388
1389 /* Call the command. */
1390 redisOpArrayInit(&server.also_propagate);
1391 dirty = server.dirty;
1392 c->cmd->proc(c);
1393 dirty = server.dirty-dirty;
1394 duration = ustime()-start;
1395
1396 /* When EVAL is called loading the AOF we don't want commands called
1397 * from Lua to go into the slowlog or to populate statistics. */
1398 if (server.loading && c->flags & REDIS_LUA_CLIENT)
1399 flags &= ~(REDIS_CALL_SLOWLOG | REDIS_CALL_STATS);
1400
1401 /* Log the command into the Slow log if needed, and populate the
1402 * per-command statistics that we show in INFO commandstats. */
1403 if (flags & REDIS_CALL_SLOWLOG)
1404 slowlogPushEntryIfNeeded(c->argv,c->argc,duration);
1405 if (flags & REDIS_CALL_STATS) {
1406 c->cmd->microseconds += duration;
1407 c->cmd->calls++;
1408 }
1409
1410 /* Propagate the command into the AOF and replication link */
1411 if (flags & REDIS_CALL_PROPAGATE) {
1412 int flags = REDIS_PROPAGATE_NONE;
1413
1414 if (c->cmd->flags & REDIS_CMD_FORCE_REPLICATION)
1415 flags |= REDIS_PROPAGATE_REPL;
1416 if (dirty)
1417 flags |= (REDIS_PROPAGATE_REPL | REDIS_PROPAGATE_AOF);
1418 if (flags != REDIS_PROPAGATE_NONE)
1419 propagate(c->cmd,c->db->id,c->argv,c->argc,flags);
1420 }
1421 /* Commands such as LPUSH or BRPOPLPUSH may propagate an additional
1422 * PUSH command. */
1423 if (server.also_propagate.numops) {
1424 int j;
1425 redisOp *rop;
1426
1427 for (j = 0; j < server.also_propagate.numops; j++) {
1428 rop = &server.also_propagate.ops[j];
1429 propagate(rop->cmd, rop->dbid, rop->argv, rop->argc, rop->target);
1430 }
1431 redisOpArrayFree(&server.also_propagate);
1432 }
1433 server.stat_numcommands++;
1434 }
1435
1436 /* If this function gets called we already read a whole
1437 * command, argments are in the client argv/argc fields.
1438 * processCommand() execute the command or prepare the
1439 * server for a bulk read from the client.
1440 *
1441 * If 1 is returned the client is still alive and valid and
1442 * and other operations can be performed by the caller. Otherwise
1443 * if 0 is returned the client was destroied (i.e. after QUIT). */
1444 int processCommand(redisClient *c) {
1445 /* The QUIT command is handled separately. Normal command procs will
1446 * go through checking for replication and QUIT will cause trouble
1447 * when FORCE_REPLICATION is enabled and would be implemented in
1448 * a regular command proc. */
1449 if (!strcasecmp(c->argv[0]->ptr,"quit")) {
1450 addReply(c,shared.ok);
1451 c->flags |= REDIS_CLOSE_AFTER_REPLY;
1452 return REDIS_ERR;
1453 }
1454
1455 /* Now lookup the command and check ASAP about trivial error conditions
1456 * such as wrong arity, bad command name and so forth. */
1457 c->cmd = c->lastcmd = lookupCommand(c->argv[0]->ptr);
1458 if (!c->cmd) {
1459 addReplyErrorFormat(c,"unknown command '%s'",
1460 (char*)c->argv[0]->ptr);
1461 return REDIS_OK;
1462 } else if ((c->cmd->arity > 0 && c->cmd->arity != c->argc) ||
1463 (c->argc < -c->cmd->arity)) {
1464 addReplyErrorFormat(c,"wrong number of arguments for '%s' command",
1465 c->cmd->name);
1466 return REDIS_OK;
1467 }
1468
1469 /* Check if the user is authenticated */
1470 if (server.requirepass && !c->authenticated && c->cmd->proc != authCommand)
1471 {
1472 addReplyError(c,"operation not permitted");
1473 return REDIS_OK;
1474 }
1475
1476 /* Handle the maxmemory directive.
1477 *
1478 * First we try to free some memory if possible (if there are volatile
1479 * keys in the dataset). If there are not the only thing we can do
1480 * is returning an error. */
1481 if (server.maxmemory) {
1482 int retval = freeMemoryIfNeeded();
1483 if ((c->cmd->flags & REDIS_CMD_DENYOOM) && retval == REDIS_ERR) {
1484 addReply(c, shared.oomerr);
1485 return REDIS_OK;
1486 }
1487 }
1488
1489 /* Don't accept write commands if there are problems persisting on disk. */
1490 if (server.stop_writes_on_bgsave_err &&
1491 server.saveparamslen > 0
1492 && server.lastbgsave_status == REDIS_ERR &&
1493 c->cmd->flags & REDIS_CMD_WRITE)
1494 {
1495 addReply(c, shared.bgsaveerr);
1496 return REDIS_OK;
1497 }
1498
1499 /* Don't accept wirte commands if this is a read only slave. But
1500 * accept write commands if this is our master. */
1501 if (server.masterhost && server.repl_slave_ro &&
1502 !(c->flags & REDIS_MASTER) &&
1503 c->cmd->flags & REDIS_CMD_WRITE)
1504 {
1505 addReply(c, shared.roslaveerr);
1506 return REDIS_OK;
1507 }
1508
1509 /* Only allow SUBSCRIBE and UNSUBSCRIBE in the context of Pub/Sub */
1510 if ((dictSize(c->pubsub_channels) > 0 || listLength(c->pubsub_patterns) > 0)
1511 &&
1512 c->cmd->proc != subscribeCommand &&
1513 c->cmd->proc != unsubscribeCommand &&
1514 c->cmd->proc != psubscribeCommand &&
1515 c->cmd->proc != punsubscribeCommand) {
1516 addReplyError(c,"only (P)SUBSCRIBE / (P)UNSUBSCRIBE / QUIT allowed in this context");
1517 return REDIS_OK;
1518 }
1519
1520 /* Only allow INFO and SLAVEOF when slave-serve-stale-data is no and
1521 * we are a slave with a broken link with master. */
1522 if (server.masterhost && server.repl_state != REDIS_REPL_CONNECTED &&
1523 server.repl_serve_stale_data == 0 &&
1524 c->cmd->proc != infoCommand && c->cmd->proc != slaveofCommand)
1525 {
1526 addReplyError(c,
1527 "link with MASTER is down and slave-serve-stale-data is set to no");
1528 return REDIS_OK;
1529 }
1530
1531 /* Loading DB? Return an error if the command is not INFO */
1532 if (server.loading && c->cmd->proc != infoCommand) {
1533 addReply(c, shared.loadingerr);
1534 return REDIS_OK;
1535 }
1536
1537 /* Lua script too slow? Only allow SHUTDOWN NOSAVE and SCRIPT KILL. */
1538 if (server.lua_timedout &&
1539 !(c->cmd->proc != shutdownCommand &&
1540 c->argc == 2 &&
1541 tolower(((char*)c->argv[1]->ptr)[0]) == 'n') &&
1542 !(c->cmd->proc == scriptCommand &&
1543 c->argc == 2 &&
1544 tolower(((char*)c->argv[1]->ptr)[0]) == 'k'))
1545 {
1546 addReply(c, shared.slowscripterr);
1547 return REDIS_OK;
1548 }
1549
1550 /* Exec the command */
1551 if (c->flags & REDIS_MULTI &&
1552 c->cmd->proc != execCommand && c->cmd->proc != discardCommand &&
1553 c->cmd->proc != multiCommand && c->cmd->proc != watchCommand)
1554 {
1555 queueMultiCommand(c);
1556 addReply(c,shared.queued);
1557 } else {
1558 call(c,REDIS_CALL_FULL);
1559 }
1560 return REDIS_OK;
1561 }
1562
1563 /*================================== Shutdown =============================== */
1564
1565 int prepareForShutdown(int flags) {
1566 int save = flags & REDIS_SHUTDOWN_SAVE;
1567 int nosave = flags & REDIS_SHUTDOWN_NOSAVE;
1568
1569 redisLog(REDIS_WARNING,"User requested shutdown...");
1570 /* Kill the saving child if there is a background saving in progress.
1571 We want to avoid race conditions, for instance our saving child may
1572 overwrite the synchronous saving did by SHUTDOWN. */
1573 if (server.rdb_child_pid != -1) {
1574 redisLog(REDIS_WARNING,"There is a child saving an .rdb. Killing it!");
1575 kill(server.rdb_child_pid,SIGKILL);
1576 rdbRemoveTempFile(server.rdb_child_pid);
1577 }
1578 if (server.aof_state != REDIS_AOF_OFF) {
1579 /* Kill the AOF saving child as the AOF we already have may be longer
1580 * but contains the full dataset anyway. */
1581 if (server.aof_child_pid != -1) {
1582 redisLog(REDIS_WARNING,
1583 "There is a child rewriting the AOF. Killing it!");
1584 kill(server.aof_child_pid,SIGKILL);
1585 }
1586 /* Append only file: fsync() the AOF and exit */
1587 redisLog(REDIS_NOTICE,"Calling fsync() on the AOF file.");
1588 aof_fsync(server.aof_fd);
1589 }
1590 if ((server.saveparamslen > 0 && !nosave) || save) {
1591 redisLog(REDIS_NOTICE,"Saving the final RDB snapshot before exiting.");
1592 /* Snapshotting. Perform a SYNC SAVE and exit */
1593 if (rdbSave(server.rdb_filename) != REDIS_OK) {
1594 /* Ooops.. error saving! The best we can do is to continue
1595 * operating. Note that if there was a background saving process,
1596 * in the next cron() Redis will be notified that the background
1597 * saving aborted, handling special stuff like slaves pending for
1598 * synchronization... */
1599 redisLog(REDIS_WARNING,"Error trying to save the DB, can't exit.");
1600 return REDIS_ERR;
1601 }
1602 }
1603 if (server.daemonize) {
1604 redisLog(REDIS_NOTICE,"Removing the pid file.");
1605 unlink(server.pidfile);
1606 }
1607 /* Close the listening sockets. Apparently this allows faster restarts. */
1608 if (server.ipfd != -1) close(server.ipfd);
1609 if (server.sofd != -1) close(server.sofd);
1610 if (server.unixsocket) {
1611 redisLog(REDIS_NOTICE,"Removing the unix socket file.");
1612 unlink(server.unixsocket); /* don't care if this fails */
1613 }
1614
1615 redisLog(REDIS_WARNING,"Redis is now ready to exit, bye bye...");
1616 return REDIS_OK;
1617 }
1618
1619 /*================================== Commands =============================== */
1620
1621 void authCommand(redisClient *c) {
1622 if (!server.requirepass) {
1623 addReplyError(c,"Client sent AUTH, but no password is set");
1624 } else if (!strcmp(c->argv[1]->ptr, server.requirepass)) {
1625 c->authenticated = 1;
1626 addReply(c,shared.ok);
1627 } else {
1628 c->authenticated = 0;
1629 addReplyError(c,"invalid password");
1630 }
1631 }
1632
1633 void pingCommand(redisClient *c) {
1634 addReply(c,shared.pong);
1635 }
1636
1637 void echoCommand(redisClient *c) {
1638 addReplyBulk(c,c->argv[1]);
1639 }
1640
1641 void timeCommand(redisClient *c) {
1642 struct timeval tv;
1643
1644 /* gettimeofday() can only fail if &tv is a bad addresss so we
1645 * don't check for errors. */
1646 gettimeofday(&tv,NULL);
1647 addReplyMultiBulkLen(c,2);
1648 addReplyBulkLongLong(c,tv.tv_sec);
1649 addReplyBulkLongLong(c,tv.tv_usec);
1650 }
1651
/* Convert an amount of bytes into a human readable string in the form
 * of 100B, 2G, 100M, 4K, and so forth.
 *
 * 's' is the output buffer: it must be large enough for the result (the
 * longest output is the fallback below, 20 digits plus "B" plus the null
 * terminator). 'n' is the number of bytes to convert.
 *
 * Values below 1024 are printed as an integer followed by "B". Larger
 * values are divided by the biggest power of 1024 not exceeding them and
 * printed with two decimal digits followed by K, M, G, T or P. Values of
 * 1024 PiB or more are printed again as a plain byte count, so that 's'
 * always contains a valid string when the function returns. */
void bytesToHuman(char *s, unsigned long long n) {
    const unsigned long long kib = 1024ULL;
    const unsigned long long mib = kib*1024;
    const unsigned long long gib = mib*1024;
    const unsigned long long tib = gib*1024;
    const unsigned long long pib = tib*1024;
    const unsigned long long eib = pib*1024;

    if (n < kib) {
        /* Bytes */
        sprintf(s,"%lluB",n);
    } else if (n < mib) {
        sprintf(s,"%.2fK",(double)n/kib);
    } else if (n < gib) {
        sprintf(s,"%.2fM",(double)n/mib);
    } else if (n < tib) {
        sprintf(s,"%.2fG",(double)n/gib);
    } else if (n < pib) {
        sprintf(s,"%.2fT",(double)n/tib);
    } else if (n < eib) {
        sprintf(s,"%.2fP",(double)n/pib);
    } else {
        /* No bigger unit available: fall back to the raw byte count. */
        sprintf(s,"%lluB",n);
    }
}
1672
1673 /* Create the string returned by the INFO command. This is decoupled
1674 * by the INFO command itself as we need to report the same information
1675 * on memory corruption problems. */
1676 sds genRedisInfoString(char *section) {
1677 sds info = sdsempty();
1678 time_t uptime = server.unixtime-server.stat_starttime;
1679 int j, numcommands;
1680 struct rusage self_ru, c_ru;
1681 unsigned long lol, bib;
1682 int allsections = 0, defsections = 0;
1683 int sections = 0;
1684
1685 if (section) {
1686 allsections = strcasecmp(section,"all") == 0;
1687 defsections = strcasecmp(section,"default") == 0;
1688 }
1689
1690 getrusage(RUSAGE_SELF, &self_ru);
1691 getrusage(RUSAGE_CHILDREN, &c_ru);
1692 getClientsMaxBuffers(&lol,&bib);
1693
1694 /* Server */
1695 if (allsections || defsections || !strcasecmp(section,"server")) {
1696 if (sections++) info = sdscat(info,"\r\n");
1697 info = sdscatprintf(info,
1698 "# Server\r\n"
1699 "redis_version:%s\r\n"
1700 "redis_git_sha1:%s\r\n"
1701 "redis_git_dirty:%d\r\n"
1702 "arch_bits:%d\r\n"
1703 "multiplexing_api:%s\r\n"
1704 "gcc_version:%d.%d.%d\r\n"
1705 "process_id:%ld\r\n"
1706 "run_id:%s\r\n"
1707 "tcp_port:%d\r\n"
1708 "uptime_in_seconds:%ld\r\n"
1709 "uptime_in_days:%ld\r\n"
1710 "lru_clock:%ld\r\n",
1711 REDIS_VERSION,
1712 redisGitSHA1(),
1713 strtol(redisGitDirty(),NULL,10) > 0,
1714 server.arch_bits,
1715 aeGetApiName(),
1716 #ifdef __GNUC__
1717 __GNUC__,__GNUC_MINOR__,__GNUC_PATCHLEVEL__,
1718 #else
1719 0,0,0,
1720 #endif
1721 (long) getpid(),
1722 server.runid,
1723 server.port,
1724 uptime,
1725 uptime/(3600*24),
1726 (unsigned long) server.lruclock);
1727 }
1728
1729 /* Clients */
1730 if (allsections || defsections || !strcasecmp(section,"clients")) {
1731 if (sections++) info = sdscat(info,"\r\n");
1732 info = sdscatprintf(info,
1733 "# Clients\r\n"
1734 "connected_clients:%lu\r\n"
1735 "client_longest_output_list:%lu\r\n"
1736 "client_biggest_input_buf:%lu\r\n"
1737 "blocked_clients:%d\r\n",
1738 listLength(server.clients)-listLength(server.slaves),
1739 lol, bib,
1740 server.bpop_blocked_clients);
1741 }
1742
1743 /* Memory */
1744 if (allsections || defsections || !strcasecmp(section,"memory")) {
1745 char hmem[64];
1746 char peak_hmem[64];
1747
1748 bytesToHuman(hmem,zmalloc_used_memory());
1749 bytesToHuman(peak_hmem,server.stat_peak_memory);
1750 if (sections++) info = sdscat(info,"\r\n");
1751 info = sdscatprintf(info,
1752 "# Memory\r\n"
1753 "used_memory:%zu\r\n"
1754 "used_memory_human:%s\r\n"
1755 "used_memory_rss:%zu\r\n"
1756 "used_memory_peak:%zu\r\n"
1757 "used_memory_peak_human:%s\r\n"
1758 "used_memory_lua:%lld\r\n"
1759 "mem_fragmentation_ratio:%.2f\r\n"
1760 "mem_allocator:%s\r\n",
1761 zmalloc_used_memory(),
1762 hmem,
1763 zmalloc_get_rss(),
1764 server.stat_peak_memory,
1765 peak_hmem,
1766 ((long long)lua_gc(server.lua,LUA_GCCOUNT,0))*1024LL,
1767 zmalloc_get_fragmentation_ratio(),
1768 ZMALLOC_LIB
1769 );
1770 }
1771
1772 /* Persistence */
1773 if (allsections || defsections || !strcasecmp(section,"persistence")) {
1774 if (sections++) info = sdscat(info,"\r\n");
1775 info = sdscatprintf(info,
1776 "# Persistence\r\n"
1777 "loading:%d\r\n"
1778 "aof_enabled:%d\r\n"
1779 "changes_since_last_save:%lld\r\n"
1780 "bgsave_in_progress:%d\r\n"
1781 "last_save_time:%ld\r\n"
1782 "last_bgsave_status:%s\r\n"
1783 "bgrewriteaof_in_progress:%d\r\n",
1784 server.loading,
1785 server.aof_state != REDIS_AOF_OFF,
1786 server.dirty,
1787 server.rdb_child_pid != -1,
1788 server.lastsave,
1789 server.lastbgsave_status == REDIS_OK ? "ok" : "err",
1790 server.aof_child_pid != -1);
1791
1792 if (server.aof_state != REDIS_AOF_OFF) {
1793 info = sdscatprintf(info,
1794 "aof_current_size:%lld\r\n"
1795 "aof_base_size:%lld\r\n"
1796 "aof_pending_rewrite:%d\r\n"
1797 "aof_buffer_length:%zu\r\n"
1798 "aof_pending_bio_fsync:%llu\r\n"
1799 "aof_delayed_fsync:%lu\r\n",
1800 (long long) server.aof_current_size,
1801 (long long) server.aof_rewrite_base_size,
1802 server.aof_rewrite_scheduled,
1803 sdslen(server.aof_buf),
1804 bioPendingJobsOfType(REDIS_BIO_AOF_FSYNC),
1805 server.aof_delayed_fsync);
1806 }
1807
1808 if (server.loading) {
1809 double perc;
1810 time_t eta, elapsed;
1811 off_t remaining_bytes = server.loading_total_bytes-
1812 server.loading_loaded_bytes;
1813
1814 perc = ((double)server.loading_loaded_bytes /
1815 server.loading_total_bytes) * 100;
1816
1817 elapsed = server.unixtime-server.loading_start_time;
1818 if (elapsed == 0) {
1819 eta = 1; /* A fake 1 second figure if we don't have
1820 enough info */
1821 } else {
1822 eta = (elapsed*remaining_bytes)/server.loading_loaded_bytes;
1823 }
1824
1825 info = sdscatprintf(info,
1826 "loading_start_time:%ld\r\n"
1827 "loading_total_bytes:%llu\r\n"
1828 "loading_loaded_bytes:%llu\r\n"
1829 "loading_loaded_perc:%.2f\r\n"
1830 "loading_eta_seconds:%ld\r\n"
1831 ,(unsigned long) server.loading_start_time,
1832 (unsigned long long) server.loading_total_bytes,
1833 (unsigned long long) server.loading_loaded_bytes,
1834 perc,
1835 eta
1836 );
1837 }
1838 }
1839
1840 /* Stats */
1841 if (allsections || defsections || !strcasecmp(section,"stats")) {
1842 if (sections++) info = sdscat(info,"\r\n");
1843 info = sdscatprintf(info,
1844 "# Stats\r\n"
1845 "total_connections_received:%lld\r\n"
1846 "total_commands_processed:%lld\r\n"
1847 "instantaneous_ops_per_sec:%lld\r\n"
1848 "rejected_connections:%lld\r\n"
1849 "expired_keys:%lld\r\n"
1850 "evicted_keys:%lld\r\n"
1851 "keyspace_hits:%lld\r\n"
1852 "keyspace_misses:%lld\r\n"
1853 "pubsub_channels:%ld\r\n"
1854 "pubsub_patterns:%lu\r\n"
1855 "latest_fork_usec:%lld\r\n",
1856 server.stat_numconnections,
1857 server.stat_numcommands,
1858 getOperationsPerSecond(),
1859 server.stat_rejected_conn,
1860 server.stat_expiredkeys,
1861 server.stat_evictedkeys,
1862 server.stat_keyspace_hits,
1863 server.stat_keyspace_misses,
1864 dictSize(server.pubsub_channels),
1865 listLength(server.pubsub_patterns),
1866 server.stat_fork_time);
1867 }
1868
1869 /* Replication */
1870 if (allsections || defsections || !strcasecmp(section,"replication")) {
1871 if (sections++) info = sdscat(info,"\r\n");
1872 info = sdscatprintf(info,
1873 "# Replication\r\n"
1874 "role:%s\r\n",
1875 server.masterhost == NULL ? "master" : "slave");
1876 if (server.masterhost) {
1877 info = sdscatprintf(info,
1878 "master_host:%s\r\n"
1879 "master_port:%d\r\n"
1880 "master_link_status:%s\r\n"
1881 "master_last_io_seconds_ago:%d\r\n"
1882 "master_sync_in_progress:%d\r\n"
1883 ,server.masterhost,
1884 server.masterport,
1885 (server.repl_state == REDIS_REPL_CONNECTED) ?
1886 "up" : "down",
1887 server.master ?
1888 ((int)(server.unixtime-server.master->lastinteraction)) : -1,
1889 server.repl_state == REDIS_REPL_TRANSFER
1890 );
1891
1892 if (server.repl_state == REDIS_REPL_TRANSFER) {
1893 info = sdscatprintf(info,
1894 "master_sync_left_bytes:%ld\r\n"
1895 "master_sync_last_io_seconds_ago:%d\r\n"
1896 ,(long)server.repl_transfer_left,
1897 (int)(server.unixtime-server.repl_transfer_lastio)
1898 );
1899 }
1900
1901 if (server.repl_state != REDIS_REPL_CONNECTED) {
1902 info = sdscatprintf(info,
1903 "master_link_down_since_seconds:%ld\r\n",
1904 (long)server.unixtime-server.repl_down_since);
1905 }
1906 }
1907 info = sdscatprintf(info,
1908 "connected_slaves:%lu\r\n",
1909 listLength(server.slaves));
1910 if (listLength(server.slaves)) {
1911 int slaveid = 0;
1912 listNode *ln;
1913 listIter li;
1914
1915 listRewind(server.slaves,&li);
1916 while((ln = listNext(&li))) {
1917 redisClient *slave = listNodeValue(ln);
1918 char *state = NULL;
1919 char ip[32];
1920 int port;
1921
1922 if (anetPeerToString(slave->fd,ip,&port) == -1) continue;
1923 switch(slave->replstate) {
1924 case REDIS_REPL_WAIT_BGSAVE_START:
1925 case REDIS_REPL_WAIT_BGSAVE_END:
1926 state = "wait_bgsave";
1927 break;
1928 case REDIS_REPL_SEND_BULK:
1929 state = "send_bulk";
1930 break;
1931 case REDIS_REPL_ONLINE:
1932 state = "online";
1933 break;
1934 }
1935 if (state == NULL) continue;
1936 info = sdscatprintf(info,"slave%d:%s,%d,%s\r\n",
1937 slaveid,ip,port,state);
1938 slaveid++;
1939 }
1940 }
1941 }
1942
1943 /* CPU */
1944 if (allsections || defsections || !strcasecmp(section,"cpu")) {
1945 if (sections++) info = sdscat(info,"\r\n");
1946 info = sdscatprintf(info,
1947 "# CPU\r\n"
1948 "used_cpu_sys:%.2f\r\n"
1949 "used_cpu_user:%.2f\r\n"
1950 "used_cpu_sys_children:%.2f\r\n"
1951 "used_cpu_user_children:%.2f\r\n",
1952 (float)self_ru.ru_stime.tv_sec+(float)self_ru.ru_stime.tv_usec/1000000,
1953 (float)self_ru.ru_utime.tv_sec+(float)self_ru.ru_utime.tv_usec/1000000,
1954 (float)c_ru.ru_stime.tv_sec+(float)c_ru.ru_stime.tv_usec/1000000,
1955 (float)c_ru.ru_utime.tv_sec+(float)c_ru.ru_utime.tv_usec/1000000);
1956 }
1957
1958 /* cmdtime */
1959 if (allsections || !strcasecmp(section,"commandstats")) {
1960 if (sections++) info = sdscat(info,"\r\n");
1961 info = sdscatprintf(info, "# Commandstats\r\n");
1962 numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1963 for (j = 0; j < numcommands; j++) {
1964 struct redisCommand *c = redisCommandTable+j;
1965
1966 if (!c->calls) continue;
1967 info = sdscatprintf(info,
1968 "cmdstat_%s:calls=%lld,usec=%lld,usec_per_call=%.2f\r\n",
1969 c->name, c->calls, c->microseconds,
1970 (c->calls == 0) ? 0 : ((float)c->microseconds/c->calls));
1971 }
1972 }
1973
1974 /* Key space */
1975 if (allsections || defsections || !strcasecmp(section,"keyspace")) {
1976 if (sections++) info = sdscat(info,"\r\n");
1977 info = sdscatprintf(info, "# Keyspace\r\n");
1978 for (j = 0; j < server.dbnum; j++) {
1979 long long keys, vkeys;
1980
1981 keys = dictSize(server.db[j].dict);
1982 vkeys = dictSize(server.db[j].expires);
1983 if (keys || vkeys) {
1984 info = sdscatprintf(info, "db%d:keys=%lld,expires=%lld\r\n",
1985 j, keys, vkeys);
1986 }
1987 }
1988 }
1989 return info;
1990 }
1991
1992 void infoCommand(redisClient *c) {
1993 char *section = c->argc == 2 ? c->argv[1]->ptr : "default";
1994
1995 if (c->argc > 2) {
1996 addReply(c,shared.syntaxerr);
1997 return;
1998 }
1999 sds info = genRedisInfoString(section);
2000 addReplySds(c,sdscatprintf(sdsempty(),"$%lu\r\n",
2001 (unsigned long)sdslen(info)));
2002 addReplySds(c,info);
2003 addReply(c,shared.crlf);
2004 }
2005
2006 void monitorCommand(redisClient *c) {
2007 /* ignore MONITOR if aleady slave or in monitor mode */
2008 if (c->flags & REDIS_SLAVE) return;
2009
2010 c->flags |= (REDIS_SLAVE|REDIS_MONITOR);
2011 c->slaveseldb = 0;
2012 listAddNodeTail(server.monitors,c);
2013 addReply(c,shared.ok);
2014 }
2015
2016 /* ============================ Maxmemory directive ======================== */
2017
2018 /* This function gets called when 'maxmemory' is set on the config file to limit
2019 * the max memory used by the server, before processing a command.
2020 *
2021 * The goal of the function is to free enough memory to keep Redis under the
2022 * configured memory limit.
2023 *
2024 * The function starts calculating how many bytes should be freed to keep
2025 * Redis under the limit, and enters a loop selecting the best keys to
2026 * evict accordingly to the configured policy.
2027 *
2028 * If all the bytes needed to return back under the limit were freed the
2029 * function returns REDIS_OK, otherwise REDIS_ERR is returned, and the caller
2030 * should block the execution of commands that will result in more memory
2031 * used by the server.
2032 */
2033 int freeMemoryIfNeeded(void) {
2034 size_t mem_used, mem_tofree, mem_freed;
2035 int slaves = listLength(server.slaves);
2036
2037 /* Remove the size of slaves output buffers and AOF buffer from the
2038 * count of used memory. */
2039 mem_used = zmalloc_used_memory();
2040 if (slaves) {
2041 listIter li;
2042 listNode *ln;
2043
2044 listRewind(server.slaves,&li);
2045 while((ln = listNext(&li))) {
2046 redisClient *slave = listNodeValue(ln);
2047 unsigned long obuf_bytes = getClientOutputBufferMemoryUsage(slave);
2048 if (obuf_bytes > mem_used)
2049 mem_used = 0;
2050 else
2051 mem_used -= obuf_bytes;
2052 }
2053 }
2054 if (server.aof_state != REDIS_AOF_OFF) {
2055 mem_used -= sdslen(server.aof_buf);
2056 mem_used -= sdslen(server.aof_rewrite_buf);
2057 }
2058
2059 /* Check if we are over the memory limit. */
2060 if (mem_used <= server.maxmemory) return REDIS_OK;
2061
2062 if (server.maxmemory_policy == REDIS_MAXMEMORY_NO_EVICTION)
2063 return REDIS_ERR; /* We need to free memory, but policy forbids. */
2064
2065 /* Compute how much memory we need to free. */
2066 mem_tofree = mem_used - server.maxmemory;
2067 mem_freed = 0;
2068 while (mem_freed < mem_tofree) {
2069 int j, k, keys_freed = 0;
2070
2071 for (j = 0; j < server.dbnum; j++) {
2072 long bestval = 0; /* just to prevent warning */
2073 sds bestkey = NULL;
2074 struct dictEntry *de;
2075 redisDb *db = server.db+j;
2076 dict *dict;
2077
2078 if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_LRU ||
2079 server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_RANDOM)
2080 {
2081 dict = server.db[j].dict;
2082 } else {
2083 dict = server.db[j].expires;
2084 }
2085 if (dictSize(dict) == 0) continue;
2086
2087 /* volatile-random and allkeys-random policy */
2088 if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_RANDOM ||
2089 server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_RANDOM)
2090 {
2091 de = dictGetRandomKey(dict);
2092 bestkey = dictGetKey(de);
2093 }
2094
2095 /* volatile-lru and allkeys-lru policy */
2096 else if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_LRU ||
2097 server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_LRU)
2098 {
2099 for (k = 0; k < server.maxmemory_samples; k++) {
2100 sds thiskey;
2101 long thisval;
2102 robj *o;
2103
2104 de = dictGetRandomKey(dict);
2105 thiskey = dictGetKey(de);
2106 /* When policy is volatile-lru we need an additonal lookup
2107 * to locate the real key, as dict is set to db->expires. */
2108 if (server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_LRU)
2109 de = dictFind(db->dict, thiskey);
2110 o = dictGetVal(de);
2111 thisval = estimateObjectIdleTime(o);
2112
2113 /* Higher idle time is better candidate for deletion */
2114 if (bestkey == NULL || thisval > bestval) {
2115 bestkey = thiskey;
2116 bestval = thisval;
2117 }
2118 }
2119 }
2120
2121 /* volatile-ttl */
2122 else if (server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_TTL) {
2123 for (k = 0; k < server.maxmemory_samples; k++) {
2124 sds thiskey;
2125 long thisval;
2126
2127 de = dictGetRandomKey(dict);
2128 thiskey = dictGetKey(de);
2129 thisval = (long) dictGetVal(de);
2130
2131 /* Expire sooner (minor expire unix timestamp) is better
2132 * candidate for deletion */
2133 if (bestkey == NULL || thisval < bestval) {
2134 bestkey = thiskey;
2135 bestval = thisval;
2136 }
2137 }
2138 }
2139
2140 /* Finally remove the selected key. */
2141 if (bestkey) {
2142 long long delta;
2143
2144 robj *keyobj = createStringObject(bestkey,sdslen(bestkey));
2145 propagateExpire(db,keyobj);
2146 /* We compute the amount of memory freed by dbDelete() alone.
2147 * It is possible that actually the memory needed to propagate
2148 * the DEL in AOF and replication link is greater than the one
2149 * we are freeing removing the key, but we can't account for
2150 * that otherwise we would never exit the loop.
2151 *
2152 * AOF and Output buffer memory will be freed eventually so
2153 * we only care about memory used by the key space. */
2154 delta = (long long) zmalloc_used_memory();
2155 dbDelete(db,keyobj);
2156 delta -= (long long) zmalloc_used_memory();
2157 mem_freed += delta;
2158 server.stat_evictedkeys++;
2159 decrRefCount(keyobj);
2160 keys_freed++;
2161
2162 /* When the memory to free starts to be big enough, we may
2163 * start spending so much time here that is impossible to
2164 * deliver data to the slaves fast enough, so we force the
2165 * transmission here inside the loop. */
2166 if (slaves) flushSlavesOutputBuffers();
2167 }
2168 }
2169 if (!keys_freed) return REDIS_ERR; /* nothing to free... */
2170 }
2171 return REDIS_OK;
2172 }
2173
2174 /* =================================== Main! ================================ */
2175
2176 #ifdef __linux__
/* Read the current overcommit policy from /proc/sys/vm/overcommit_memory.
 *
 * Returns the number found at the beginning of the file, or -1 if the
 * file can't be opened, can't be read, or does not start with a number.
 * Reporting unparsable content as -1 (rather than as 0, which is what
 * atoi() would yield) matters because the caller treats 0 as "overcommit
 * disabled" and logs a warning for it. */
int linuxOvercommitMemoryValue(void) {
    FILE *fp = fopen("/proc/sys/vm/overcommit_memory","r");
    char buf[64];
    char *end;
    long value;

    if (!fp) return -1;
    if (fgets(buf,sizeof(buf),fp) == NULL) {
        fclose(fp);
        return -1;
    }
    fclose(fp);

    errno = 0;
    value = strtol(buf,&end,10);
    /* end == buf means no digits were consumed at all. */
    if (end == buf || errno == ERANGE) return -1;
    return (int)value;
}
2190
2191 void linuxOvercommitMemoryWarning(void) {
2192 if (linuxOvercommitMemoryValue() == 0) {
2193 redisLog(REDIS_WARNING,"WARNING overcommit_memory is set to 0! Background save may fail under low memory condition. To fix this issue add 'vm.overcommit_memory = 1' to /etc/sysctl.conf and then reboot or run the command 'sysctl vm.overcommit_memory=1' for this to take effect.");
2194 }
2195 }
2196 #endif /* __linux__ */
2197
2198 void createPidFile(void) {
2199 /* Try to write the pid file in a best-effort way. */
2200 FILE *fp = fopen(server.pidfile,"w");
2201 if (fp) {
2202 fprintf(fp,"%d\n",(int)getpid());
2203 fclose(fp);
2204 }
2205 }
2206
2207 void daemonize(void) {
2208 int fd;
2209
2210 if (fork() != 0) exit(0); /* parent exits */
2211 setsid(); /* create a new session */
2212
2213 /* Every output goes to /dev/null. If Redis is daemonized but
2214 * the 'logfile' is set to 'stdout' in the configuration file
2215 * it will not log at all. */
2216 if ((fd = open("/dev/null", O_RDWR, 0)) != -1) {
2217 dup2(fd, STDIN_FILENO);
2218 dup2(fd, STDOUT_FILENO);
2219 dup2(fd, STDERR_FILENO);
2220 if (fd > STDERR_FILENO) close(fd);
2221 }
2222 }
2223
2224 void version() {
2225 printf("Redis server v=%s sha=%s:%d malloc=%s\n", REDIS_VERSION,
2226 redisGitSHA1(), atoi(redisGitDirty()) > 0, ZMALLOC_LIB);
2227 exit(0);
2228 }
2229
/* Print the command line help to standard error and exit with status 1. */
void usage() {
    static const char *help[] = {
        "Usage: ./redis-server [/path/to/redis.conf] [options]\n",
        " ./redis-server - (read config from stdin)\n",
        " ./redis-server -v or --version\n",
        " ./redis-server -h or --help\n",
        " ./redis-server --test-memory <megabytes>\n\n",
        "Examples:\n",
        " ./redis-server (run the server with default conf)\n",
        " ./redis-server /etc/redis/6379.conf\n",
        " ./redis-server --port 7777\n",
        " ./redis-server --port 7777 --slaveof 127.0.0.1 8888\n",
        " ./redis-server /etc/myredis.conf --loglevel verbose\n"
    };
    size_t i;

    /* None of the lines contains a conversion specification, so they can
     * be written verbatim. */
    for (i = 0; i < sizeof(help)/sizeof(help[0]); i++)
        fputs(help[i],stderr);
    exit(1);
}
2244
2245 void redisAsciiArt(void) {
2246 #include "asciilogo.h"
2247 char *buf = zmalloc(1024*16);
2248
2249 snprintf(buf,1024*16,ascii_logo,
2250 REDIS_VERSION,
2251 redisGitSHA1(),
2252 strtol(redisGitDirty(),NULL,10) > 0,
2253 (sizeof(long) == 8) ? "64" : "32",
2254 "stand alone",
2255 server.port,
2256 (long) getpid()
2257 );
2258 redisLogRaw(REDIS_NOTICE|REDIS_LOG_RAW,buf);
2259 zfree(buf);
2260 }
2261
2262 static void sigtermHandler(int sig) {
2263 REDIS_NOTUSED(sig);
2264
2265 redisLogFromHandler(REDIS_WARNING,"Received SIGTERM, scheduling shutdown...");
2266 server.shutdown_asap = 1;
2267 }
2268
2269 void setupSignalHandlers(void) {
2270 struct sigaction act;
2271
2272 /* When the SA_SIGINFO flag is set in sa_flags then sa_sigaction is used.
2273 * Otherwise, sa_handler is used. */
2274 sigemptyset(&act.sa_mask);
2275 act.sa_flags = SA_NODEFER | SA_ONSTACK | SA_RESETHAND;
2276 act.sa_handler = sigtermHandler;
2277 sigaction(SIGTERM, &act, NULL);
2278
2279 #ifdef HAVE_BACKTRACE
2280 sigemptyset(&act.sa_mask);
2281 act.sa_flags = SA_NODEFER | SA_ONSTACK | SA_RESETHAND | SA_SIGINFO;
2282 act.sa_sigaction = sigsegvHandler;
2283 sigaction(SIGSEGV, &act, NULL);
2284 sigaction(SIGBUS, &act, NULL);
2285 sigaction(SIGFPE, &act, NULL);
2286 sigaction(SIGILL, &act, NULL);
2287 #endif
2288 return;
2289 }
2290
2291 void memtest(size_t megabytes, int passes);
2292
2293 int main(int argc, char **argv) {
2294 long long start;
2295 struct timeval tv;
2296
2297 /* We need to initialize our libraries, and the server configuration. */
2298 zmalloc_enable_thread_safeness();
2299 srand(time(NULL)^getpid());
2300 gettimeofday(&tv,NULL);
2301 dictSetHashFunctionSeed(tv.tv_sec^tv.tv_usec^getpid());
2302 initServerConfig();
2303
2304 if (argc >= 2) {
2305 int j = 1; /* First option to parse in argv[] */
2306 sds options = sdsempty();
2307 char *configfile = NULL;
2308
2309 /* Handle special options --help and --version */
2310 if (strcmp(argv[1], "-v") == 0 ||
2311 strcmp(argv[1], "--version") == 0) version();
2312 if (strcmp(argv[1], "--help") == 0 ||
2313 strcmp(argv[1], "-h") == 0) usage();
2314 if (strcmp(argv[1], "--test-memory") == 0) {
2315 if (argc == 3) {
2316 memtest(atoi(argv[2]),50);
2317 exit(0);
2318 } else {
2319 fprintf(stderr,"Please specify the amount of memory to test in megabytes.\n");
2320 fprintf(stderr,"Example: ./redis-server --test-memory 4096\n\n");
2321 exit(1);
2322 }
2323 }
2324
2325 /* First argument is the config file name? */
2326 if (argv[j][0] != '-' || argv[j][1] != '-')
2327 configfile = argv[j++];
2328 /* All the other options are parsed and conceptually appended to the
2329 * configuration file. For instance --port 6380 will generate the
2330 * string "port 6380\n" to be parsed after the actual file name
2331 * is parsed, if any. */
2332 while(j != argc) {
2333 if (argv[j][0] == '-' && argv[j][1] == '-') {
2334 /* Option name */
2335 if (sdslen(options)) options = sdscat(options,"\n");
2336 options = sdscat(options,argv[j]+2);
2337 options = sdscat(options," ");
2338 } else {
2339 /* Option argument */
2340 options = sdscatrepr(options,argv[j],strlen(argv[j]));
2341 options = sdscat(options," ");
2342 }
2343 j++;
2344 }
2345 resetServerSaveParams();
2346 loadServerConfig(configfile,options);
2347 sdsfree(options);
2348 } else {
2349 redisLog(REDIS_WARNING,"Warning: no config file specified, using the default config. In order to specify a config file use 'redis-server /path/to/redis.conf'");
2350 }
2351 if (server.daemonize) daemonize();
2352 initServer();
2353 if (server.daemonize) createPidFile();
2354 redisAsciiArt();
2355 redisLog(REDIS_WARNING,"Server started, Redis version " REDIS_VERSION);
2356 #ifdef __linux__
2357 linuxOvercommitMemoryWarning();
2358 #endif
2359 start = ustime();
2360 if (server.aof_state == REDIS_AOF_ON) {
2361 if (loadAppendOnlyFile(server.aof_filename) == REDIS_OK)
2362 redisLog(REDIS_NOTICE,"DB loaded from append only file: %.3f seconds",(float)(ustime()-start)/1000000);
2363 } else {
2364 if (rdbLoad(server.rdb_filename) == REDIS_OK) {
2365 redisLog(REDIS_NOTICE,"DB loaded from disk: %.3f seconds",
2366 (float)(ustime()-start)/1000000);
2367 } else if (errno != ENOENT) {
2368 redisLog(REDIS_WARNING,"Fatal error loading the DB. Exiting.");
2369 exit(1);
2370 }
2371 }
2372 if (server.ipfd > 0)
2373 redisLog(REDIS_NOTICE,"The server is now ready to accept connections on port %d", server.port);
2374 if (server.sofd > 0)
2375 redisLog(REDIS_NOTICE,"The server is now ready to accept connections at %s", server.unixsocket);
2376 aeSetBeforeSleepProc(server.el,beforeSleep);
2377 aeMain(server.el);
2378 aeDeleteEventLoop(server.el);
2379 return 0;
2380 }
2381
2382 /* The End */