]> git.saurik.com Git - redis.git/blob - src/redis.c
fix time() instead of mstime() in expireIfNeeded
[redis.git] / src / redis.c
1 /*
2 * Copyright (c) 2009-2010, Salvatore Sanfilippo <antirez at gmail dot com>
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are met:
7 *
8 * * Redistributions of source code must retain the above copyright notice,
9 * this list of conditions and the following disclaimer.
10 * * Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
13 * * Neither the name of Redis nor the names of its contributors may be used
14 * to endorse or promote products derived from this software without
15 * specific prior written permission.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
18 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
21 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
22 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
23 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
24 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
25 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
26 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
27 * POSSIBILITY OF SUCH DAMAGE.
28 */
29
30 #include "redis.h"
31 #include "slowlog.h"
32 #include "bio.h"
33
34 #include <time.h>
35 #include <signal.h>
36 #include <sys/wait.h>
37 #include <errno.h>
38 #include <assert.h>
39 #include <ctype.h>
40 #include <stdarg.h>
41 #include <arpa/inet.h>
42 #include <sys/stat.h>
43 #include <fcntl.h>
44 #include <sys/time.h>
45 #include <sys/resource.h>
46 #include <sys/uio.h>
47 #include <limits.h>
48 #include <float.h>
49 #include <math.h>
50 #include <sys/resource.h>
51
52 /* Our shared "common" objects */
53
54 struct sharedObjectsStruct shared;
55
56 /* Global vars that are actually used as constants. The following double
57 * values are used for double on-disk serialization, and are initialized
58 * at runtime to avoid strange compiler optimizations. */
59
60 double R_Zero, R_PosInf, R_NegInf, R_Nan;
61
62 /*================================= Globals ================================= */
63
64 /* Global vars */
65 struct redisServer server; /* server global state */
66 struct redisCommand *commandTable;
67
68 /* Our command table.
69 *
70 * Every entry is composed of the following fields:
71 *
72 * name: a string representing the command name.
73 * function: pointer to the C function implementing the command.
74 * arity: number of arguments, it is possible to use -N to say >= N
75 * sflags: command flags as string. See below for a table of flags.
76 * flags: flags as bitmask. Computed by Redis using the 'sflags' field.
77 * get_keys_proc: an optional function to get key arguments from a command.
78 * This is only used when the following three fields are not
79 * enough to specify what arguments are keys.
80 * first_key_index: first argument that is a key
81 * last_key_index: last argument that is a key
82 * key_step: step to get all the keys from first to last argument. For instance
83 * in MSET the step is two since arguments are key,val,key,val,...
84 * microseconds: microseconds of total execution time for this command.
85 * calls: total number of calls of this command.
86 *
87 * The flags, microseconds and calls fields are computed by Redis and should
88 * always be set to zero.
89 *
90 * Command flags are expressed using strings where every character represents
91 * a flag. Later the populateCommandTable() function will take care of
92 * populating the real 'flags' field using these characters.
93 *
94 * This is the meaning of the flags:
95 *
96 * w: write command (may modify the key space).
97 * r: read command (will never modify the key space).
98 * m: may increase memory usage once called. Don't allow if out of memory.
99 * a: admin command, like SAVE or SHUTDOWN.
100 * p: Pub/Sub related command.
101 * f: force replication of this command, regardless of server.dirty.
102 * s: command not allowed in scripts.
103 * R: random command. Command is not deterministic, that is, the same command
104 * with the same arguments, with the same key space, may have different
105 * results. For instance SPOP and RANDOMKEY are two random commands.
106 * S: Sort command output array if called from script, so that the output
107 * is deterministic.
108 */
109 struct redisCommand redisCommandTable[] = {
110 {"get",getCommand,2,"r",0,NULL,1,1,1,0,0},
111 {"set",setCommand,3,"wm",0,noPreloadGetKeys,1,1,1,0,0},
112 {"setnx",setnxCommand,3,"wm",0,noPreloadGetKeys,1,1,1,0,0},
113 {"setex",setexCommand,4,"wm",0,noPreloadGetKeys,1,1,1,0,0},
114 {"psetex",psetexCommand,4,"wm",0,noPreloadGetKeys,1,1,1,0,0},
115 {"append",appendCommand,3,"wm",0,NULL,1,1,1,0,0},
116 {"strlen",strlenCommand,2,"r",0,NULL,1,1,1,0,0},
117 {"del",delCommand,-2,"w",0,noPreloadGetKeys,1,-1,1,0,0},
118 {"exists",existsCommand,2,"r",0,NULL,1,1,1,0,0},
119 {"setbit",setbitCommand,4,"wm",0,NULL,1,1,1,0,0},
120 {"getbit",getbitCommand,3,"r",0,NULL,1,1,1,0,0},
121 {"setrange",setrangeCommand,4,"wm",0,NULL,1,1,1,0,0},
122 {"getrange",getrangeCommand,4,"r",0,NULL,1,1,1,0,0},
123 {"substr",getrangeCommand,4,"r",0,NULL,1,1,1,0,0},
124 {"incr",incrCommand,2,"wm",0,NULL,1,1,1,0,0},
125 {"decr",decrCommand,2,"wm",0,NULL,1,1,1,0,0},
126 {"mget",mgetCommand,-2,"r",0,NULL,1,-1,1,0,0},
127 {"rpush",rpushCommand,-3,"wm",0,NULL,1,1,1,0,0},
128 {"lpush",lpushCommand,-3,"wm",0,NULL,1,1,1,0,0},
129 {"rpushx",rpushxCommand,3,"wm",0,NULL,1,1,1,0,0},
130 {"lpushx",lpushxCommand,3,"wm",0,NULL,1,1,1,0,0},
131 {"linsert",linsertCommand,5,"wm",0,NULL,1,1,1,0,0},
132 {"rpop",rpopCommand,2,"w",0,NULL,1,1,1,0,0},
133 {"lpop",lpopCommand,2,"w",0,NULL,1,1,1,0,0},
134 {"brpop",brpopCommand,-3,"ws",0,NULL,1,1,1,0,0},
135 {"brpoplpush",brpoplpushCommand,4,"wms",0,NULL,1,2,1,0,0},
136 {"blpop",blpopCommand,-3,"ws",0,NULL,1,-2,1,0,0},
137 {"llen",llenCommand,2,"r",0,NULL,1,1,1,0,0},
138 {"lindex",lindexCommand,3,"r",0,NULL,1,1,1,0,0},
139 {"lset",lsetCommand,4,"wm",0,NULL,1,1,1,0,0},
140 {"lrange",lrangeCommand,4,"r",0,NULL,1,1,1,0,0},
141 {"ltrim",ltrimCommand,4,"w",0,NULL,1,1,1,0,0},
142 {"lrem",lremCommand,4,"w",0,NULL,1,1,1,0,0},
143 {"rpoplpush",rpoplpushCommand,3,"wm",0,NULL,1,2,1,0,0},
144 {"sadd",saddCommand,-3,"wm",0,NULL,1,1,1,0,0},
145 {"srem",sremCommand,-3,"w",0,NULL,1,1,1,0,0},
146 {"smove",smoveCommand,4,"w",0,NULL,1,2,1,0,0},
147 {"sismember",sismemberCommand,3,"r",0,NULL,1,1,1,0,0},
148 {"scard",scardCommand,2,"r",0,NULL,1,1,1,0,0},
149 {"spop",spopCommand,2,"wRs",0,NULL,1,1,1,0,0},
150 {"srandmember",srandmemberCommand,2,"rR",0,NULL,1,1,1,0,0},
151 {"sinter",sinterCommand,-2,"rS",0,NULL,1,-1,1,0,0},
152 {"sinterstore",sinterstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
153 {"sunion",sunionCommand,-2,"rS",0,NULL,1,-1,1,0,0},
154 {"sunionstore",sunionstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
155 {"sdiff",sdiffCommand,-2,"rS",0,NULL,1,-1,1,0,0},
156 {"sdiffstore",sdiffstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
157 {"smembers",sinterCommand,2,"rS",0,NULL,1,1,1,0,0},
158 {"zadd",zaddCommand,-4,"wm",0,NULL,1,1,1,0,0},
159 {"zincrby",zincrbyCommand,4,"wm",0,NULL,1,1,1,0,0},
160 {"zrem",zremCommand,-3,"w",0,NULL,1,1,1,0,0},
161 {"zremrangebyscore",zremrangebyscoreCommand,4,"w",0,NULL,1,1,1,0,0},
162 {"zremrangebyrank",zremrangebyrankCommand,4,"w",0,NULL,1,1,1,0,0},
163 {"zunionstore",zunionstoreCommand,-4,"wm",0,zunionInterGetKeys,0,0,0,0,0},
164 {"zinterstore",zinterstoreCommand,-4,"wm",0,zunionInterGetKeys,0,0,0,0,0},
165 {"zrange",zrangeCommand,-4,"r",0,NULL,1,1,1,0,0},
166 {"zrangebyscore",zrangebyscoreCommand,-4,"r",0,NULL,1,1,1,0,0},
167 {"zrevrangebyscore",zrevrangebyscoreCommand,-4,"r",0,NULL,1,1,1,0,0},
168 {"zcount",zcountCommand,4,"r",0,NULL,1,1,1,0,0},
169 {"zrevrange",zrevrangeCommand,-4,"r",0,NULL,1,1,1,0,0},
170 {"zcard",zcardCommand,2,"r",0,NULL,1,1,1,0,0},
171 {"zscore",zscoreCommand,3,"r",0,NULL,1,1,1,0,0},
172 {"zrank",zrankCommand,3,"r",0,NULL,1,1,1,0,0},
173 {"zrevrank",zrevrankCommand,3,"r",0,NULL,1,1,1,0,0},
174 {"hset",hsetCommand,4,"wm",0,NULL,1,1,1,0,0},
175 {"hsetnx",hsetnxCommand,4,"wm",0,NULL,1,1,1,0,0},
176 {"hget",hgetCommand,3,"r",0,NULL,1,1,1,0,0},
177 {"hmset",hmsetCommand,-4,"wm",0,NULL,1,1,1,0,0},
178 {"hmget",hmgetCommand,-3,"r",0,NULL,1,1,1,0,0},
179 {"hincrby",hincrbyCommand,4,"wm",0,NULL,1,1,1,0,0},
180 {"hincrbyfloat",hincrbyfloatCommand,4,"wm",0,NULL,1,1,1,0,0},
181 {"hdel",hdelCommand,-3,"w",0,NULL,1,1,1,0,0},
182 {"hlen",hlenCommand,2,"r",0,NULL,1,1,1,0,0},
183 {"hkeys",hkeysCommand,2,"rS",0,NULL,1,1,1,0,0},
184 {"hvals",hvalsCommand,2,"rS",0,NULL,1,1,1,0,0},
185 {"hgetall",hgetallCommand,2,"r",0,NULL,1,1,1,0,0},
186 {"hexists",hexistsCommand,3,"r",0,NULL,1,1,1,0,0},
187 {"incrby",incrbyCommand,3,"wm",0,NULL,1,1,1,0,0},
188 {"decrby",decrbyCommand,3,"wm",0,NULL,1,1,1,0,0},
189 {"incrbyfloat",incrbyfloatCommand,3,"wm",0,NULL,1,1,1,0,0},
190 {"getset",getsetCommand,3,"wm",0,NULL,1,1,1,0,0},
191 {"mset",msetCommand,-3,"wm",0,NULL,1,-1,2,0,0},
192 {"msetnx",msetnxCommand,-3,"wm",0,NULL,1,-1,2,0,0},
193 {"randomkey",randomkeyCommand,1,"rR",0,NULL,0,0,0,0,0},
194 {"select",selectCommand,2,"r",0,NULL,0,0,0,0,0},
195 {"move",moveCommand,3,"w",0,NULL,1,1,1,0,0},
196 {"rename",renameCommand,3,"w",0,renameGetKeys,1,2,1,0,0},
197 {"renamenx",renamenxCommand,3,"w",0,renameGetKeys,1,2,1,0,0},
198 {"expire",expireCommand,3,"w",0,NULL,1,1,1,0,0},
199 {"expireat",expireatCommand,3,"w",0,NULL,1,1,1,0,0},
200 {"pexpire",pexpireCommand,3,"w",0,NULL,1,1,1,0,0},
201 {"pexpireat",pexpireatCommand,3,"w",0,NULL,1,1,1,0,0},
202 {"keys",keysCommand,2,"rS",0,NULL,0,0,0,0,0},
203 {"dbsize",dbsizeCommand,1,"r",0,NULL,0,0,0,0,0},
204 {"auth",authCommand,2,"rs",0,NULL,0,0,0,0,0},
205 {"ping",pingCommand,1,"r",0,NULL,0,0,0,0,0},
206 {"echo",echoCommand,2,"r",0,NULL,0,0,0,0,0},
207 {"save",saveCommand,1,"ars",0,NULL,0,0,0,0,0},
208 {"bgsave",bgsaveCommand,1,"ar",0,NULL,0,0,0,0,0},
209 {"bgrewriteaof",bgrewriteaofCommand,1,"ar",0,NULL,0,0,0,0,0},
210 {"shutdown",shutdownCommand,-1,"ar",0,NULL,0,0,0,0,0},
211 {"lastsave",lastsaveCommand,1,"r",0,NULL,0,0,0,0,0},
212 {"type",typeCommand,2,"r",0,NULL,1,1,1,0,0},
213 {"multi",multiCommand,1,"rs",0,NULL,0,0,0,0,0},
214 {"exec",execCommand,1,"s",0,NULL,0,0,0,0,0},
215 {"discard",discardCommand,1,"rs",0,NULL,0,0,0,0,0},
216 {"sync",syncCommand,1,"ars",0,NULL,0,0,0,0,0},
217 {"flushdb",flushdbCommand,1,"w",0,NULL,0,0,0,0,0},
218 {"flushall",flushallCommand,1,"w",0,NULL,0,0,0,0,0},
219 {"sort",sortCommand,-2,"wmS",0,NULL,1,1,1,0,0},
220 {"info",infoCommand,-1,"r",0,NULL,0,0,0,0,0},
221 {"monitor",monitorCommand,1,"ars",0,NULL,0,0,0,0,0},
222 {"ttl",ttlCommand,2,"r",0,NULL,1,1,1,0,0},
223 {"pttl",pttlCommand,2,"r",0,NULL,1,1,1,0,0},
224 {"persist",persistCommand,2,"w",0,NULL,1,1,1,0,0},
225 {"slaveof",slaveofCommand,3,"aws",0,NULL,0,0,0,0,0},
226 {"debug",debugCommand,-2,"as",0,NULL,0,0,0,0,0},
227 {"config",configCommand,-2,"ar",0,NULL,0,0,0,0,0},
228 {"subscribe",subscribeCommand,-2,"rps",0,NULL,0,0,0,0,0},
229 {"unsubscribe",unsubscribeCommand,-1,"rps",0,NULL,0,0,0,0,0},
230 {"psubscribe",psubscribeCommand,-2,"rps",0,NULL,0,0,0,0,0},
231 {"punsubscribe",punsubscribeCommand,-1,"rps",0,NULL,0,0,0,0,0},
232 {"publish",publishCommand,3,"pf",0,NULL,0,0,0,0,0},
233 {"watch",watchCommand,-2,"rs",0,noPreloadGetKeys,1,-1,1,0,0},
234 {"unwatch",unwatchCommand,1,"rs",0,NULL,0,0,0,0,0},
235 {"restore",restoreCommand,4,"awm",0,NULL,1,1,1,0,0},
236 {"migrate",migrateCommand,6,"aw",0,NULL,0,0,0,0,0},
237 {"dump",dumpCommand,2,"ar",0,NULL,1,1,1,0,0},
238 {"object",objectCommand,-2,"r",0,NULL,2,2,2,0,0},
239 {"client",clientCommand,-2,"ar",0,NULL,0,0,0,0,0},
240 {"eval",evalCommand,-3,"s",0,zunionInterGetKeys,0,0,0,0,0},
241 {"evalsha",evalShaCommand,-3,"s",0,zunionInterGetKeys,0,0,0,0,0},
242 {"slowlog",slowlogCommand,-2,"r",0,NULL,0,0,0,0,0},
243 {"script",scriptCommand,-2,"ras",0,NULL,0,0,0,0,0},
244 {"time",timeCommand,1,"rR",0,NULL,0,0,0,0,0}
245 };
246
247 /*============================ Utility functions ============================ */
248
249 /* Low level logging. To use only for very big messages, otherwise
250 * redisLog() is to prefer. */
251 void redisLogRaw(int level, const char *msg) {
252 const int syslogLevelMap[] = { LOG_DEBUG, LOG_INFO, LOG_NOTICE, LOG_WARNING };
253 const char *c = ".-*#";
254 time_t now = time(NULL);
255 FILE *fp;
256 char buf[64];
257 int rawmode = (level & REDIS_LOG_RAW);
258
259 level &= 0xff; /* clear flags */
260 if (level < server.verbosity) return;
261
262 fp = (server.logfile == NULL) ? stdout : fopen(server.logfile,"a");
263 if (!fp) return;
264
265 if (rawmode) {
266 fprintf(fp,"%s",msg);
267 } else {
268 strftime(buf,sizeof(buf),"%d %b %H:%M:%S",localtime(&now));
269 fprintf(fp,"[%d] %s %c %s\n",(int)getpid(),buf,c[level],msg);
270 }
271 fflush(fp);
272
273 if (server.logfile) fclose(fp);
274
275 if (server.syslog_enabled) syslog(syslogLevelMap[level], "%s", msg);
276 }
277
278 /* Like redisLogRaw() but with printf-alike support. This is the funciton that
279 * is used across the code. The raw version is only used in order to dump
280 * the INFO output on crash. */
281 void redisLog(int level, const char *fmt, ...) {
282 va_list ap;
283 char msg[REDIS_MAX_LOGMSG_LEN];
284
285 if ((level&0xff) < server.verbosity) return;
286
287 va_start(ap, fmt);
288 vsnprintf(msg, sizeof(msg), fmt, ap);
289 va_end(ap);
290
291 redisLogRaw(level,msg);
292 }
293
294 /* Redis generally does not try to recover from out of memory conditions
295 * when allocating objects or strings, it is not clear if it will be possible
296 * to report this condition to the client since the networking layer itself
297 * is based on heap allocation for send buffers, so we simply abort.
298 * At least the code will be simpler to read... */
299 void oom(const char *msg) {
300 redisLog(REDIS_WARNING, "%s: Out of memory\n",msg);
301 sleep(1);
302 abort();
303 }
304
/* Return the current UNIX time in microseconds, as read by gettimeofday(). */
long long ustime(void) {
    struct timeval now;

    gettimeofday(&now, NULL);
    /* Widen the seconds before scaling so the product is computed as
     * long long. */
    return ((long long)now.tv_sec)*1000000 + now.tv_usec;
}
315
/* Return the current UNIX time in milliseconds (ustime() scaled down,
 * fractional milliseconds truncated). */
long long mstime(void) {
    long long usec = ustime();

    return usec/1000;
}
320
321 /*====================== Hash table type implementation ==================== */
322
323 /* This is a hash table type that uses the SDS dynamic strings library as
324 * keys and Redis objects as values (objects can hold SDS strings,
325 * lists, sets). */
326
/* Dict destructor callback: releases 'val' with zfree().
 * 'privdata' is ignored. */
void dictVanillaFree(void *privdata, void *val) {
    DICT_NOTUSED(privdata);

    zfree(val);
}
332
333 void dictListDestructor(void *privdata, void *val)
334 {
335 DICT_NOTUSED(privdata);
336 listRelease((list*)val);
337 }
338
339 int dictSdsKeyCompare(void *privdata, const void *key1,
340 const void *key2)
341 {
342 int l1,l2;
343 DICT_NOTUSED(privdata);
344
345 l1 = sdslen((sds)key1);
346 l2 = sdslen((sds)key2);
347 if (l1 != l2) return 0;
348 return memcmp(key1, key2, l1) == 0;
349 }
350
/* Case insensitive key comparison, used for the command lookup table.
 * The keys are compared as C strings with strcasecmp().
 * Returns 1 if they match, 0 otherwise. 'privdata' is ignored. */
int dictSdsKeyCaseCompare(void *privdata, const void *key1, const void *key2) {
    int differ;
    DICT_NOTUSED(privdata);

    differ = strcasecmp(key1, key2);
    return !differ;
}
359
/* Dict destructor callback for Redis objects: drops one reference with
 * decrRefCount(). NULL is accepted and ignored, since values of swapped out
 * keys are set to NULL. 'privdata' is ignored. */
void dictRedisObjectDestructor(void *privdata, void *val) {
    DICT_NOTUSED(privdata);

    if (val != NULL) decrRefCount(val);
}
367
/* Dict destructor callback for sds strings: releases 'val' with sdsfree().
 * 'privdata' is ignored. */
void dictSdsDestructor(void *privdata, void *val) {
    DICT_NOTUSED(privdata);
    sdsfree(val);
}
374
375 int dictObjKeyCompare(void *privdata, const void *key1,
376 const void *key2)
377 {
378 const robj *o1 = key1, *o2 = key2;
379 return dictSdsKeyCompare(privdata,o1->ptr,o2->ptr);
380 }
381
382 unsigned int dictObjHash(const void *key) {
383 const robj *o = key;
384 return dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
385 }
386
/* Dict hash callback for sds keys: hashes the full sds length, so the
 * result does not stop at an embedded NUL byte. */
unsigned int dictSdsHash(const void *key)
{
    return dictGenHashFunction((unsigned char*)key, sdslen((char*)key));
}
390
/* Dict hash callback for sds keys, using the case variant of the generic
 * hash function (dictGenCaseHashFunction). Paired with
 * dictSdsKeyCaseCompare() in the command table dict type. */
unsigned int dictSdsCaseHash(const void *key)
{
    return dictGenCaseHashFunction((unsigned char*)key, sdslen((char*)key));
}
394
395 int dictEncObjKeyCompare(void *privdata, const void *key1,
396 const void *key2)
397 {
398 robj *o1 = (robj*) key1, *o2 = (robj*) key2;
399 int cmp;
400
401 if (o1->encoding == REDIS_ENCODING_INT &&
402 o2->encoding == REDIS_ENCODING_INT)
403 return o1->ptr == o2->ptr;
404
405 o1 = getDecodedObject(o1);
406 o2 = getDecodedObject(o2);
407 cmp = dictSdsKeyCompare(privdata,o1->ptr,o2->ptr);
408 decrRefCount(o1);
409 decrRefCount(o2);
410 return cmp;
411 }
412
413 unsigned int dictEncObjHash(const void *key) {
414 robj *o = (robj*) key;
415
416 if (o->encoding == REDIS_ENCODING_RAW) {
417 return dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
418 } else {
419 if (o->encoding == REDIS_ENCODING_INT) {
420 char buf[32];
421 int len;
422
423 len = ll2string(buf,32,(long)o->ptr);
424 return dictGenHashFunction((unsigned char*)buf, len);
425 } else {
426 unsigned int hash;
427
428 o = getDecodedObject(o);
429 hash = dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
430 decrRefCount(o);
431 return hash;
432 }
433 }
434 }
435
436 /* Sets type hash table */
437 dictType setDictType = {
438 dictEncObjHash, /* hash function */
439 NULL, /* key dup */
440 NULL, /* val dup */
441 dictEncObjKeyCompare, /* key compare */
442 dictRedisObjectDestructor, /* key destructor */
443 NULL /* val destructor */
444 };
445
446 /* Sorted sets hash (note: a skiplist is used in addition to the hash table) */
447 dictType zsetDictType = {
448 dictEncObjHash, /* hash function */
449 NULL, /* key dup */
450 NULL, /* val dup */
451 dictEncObjKeyCompare, /* key compare */
452 dictRedisObjectDestructor, /* key destructor */
453 NULL /* val destructor */
454 };
455
456 /* Db->dict, keys are sds strings, vals are Redis objects. */
457 dictType dbDictType = {
458 dictSdsHash, /* hash function */
459 NULL, /* key dup */
460 NULL, /* val dup */
461 dictSdsKeyCompare, /* key compare */
462 dictSdsDestructor, /* key destructor */
463 dictRedisObjectDestructor /* val destructor */
464 };
465
466 /* Db->expires */
467 dictType keyptrDictType = {
468 dictSdsHash, /* hash function */
469 NULL, /* key dup */
470 NULL, /* val dup */
471 dictSdsKeyCompare, /* key compare */
472 NULL, /* key destructor */
473 NULL /* val destructor */
474 };
475
476 /* Command table. sds string -> command struct pointer. */
477 dictType commandTableDictType = {
478 dictSdsCaseHash, /* hash function */
479 NULL, /* key dup */
480 NULL, /* val dup */
481 dictSdsKeyCaseCompare, /* key compare */
482 dictSdsDestructor, /* key destructor */
483 NULL /* val destructor */
484 };
485
486 /* Hash type hash table (note that small hashes are represented with zimpaps) */
487 dictType hashDictType = {
488 dictEncObjHash, /* hash function */
489 NULL, /* key dup */
490 NULL, /* val dup */
491 dictEncObjKeyCompare, /* key compare */
492 dictRedisObjectDestructor, /* key destructor */
493 dictRedisObjectDestructor /* val destructor */
494 };
495
496 /* Keylist hash table type has unencoded redis objects as keys and
497 * lists as values. It's used for blocking operations (BLPOP) and to
498 * map swapped keys to a list of clients waiting for this keys to be loaded. */
499 dictType keylistDictType = {
500 dictObjHash, /* hash function */
501 NULL, /* key dup */
502 NULL, /* val dup */
503 dictObjKeyCompare, /* key compare */
504 dictRedisObjectDestructor, /* key destructor */
505 dictListDestructor /* val destructor */
506 };
507
508 int htNeedsResize(dict *dict) {
509 long long size, used;
510
511 size = dictSlots(dict);
512 used = dictSize(dict);
513 return (size && used && size > DICT_HT_INITIAL_SIZE &&
514 (used*100/size < REDIS_HT_MINFILL));
515 }
516
517 /* If the percentage of used slots in the HT reaches REDIS_HT_MINFILL
518 * we resize the hash table to save memory */
519 void tryResizeHashTables(void) {
520 int j;
521
522 for (j = 0; j < server.dbnum; j++) {
523 if (htNeedsResize(server.db[j].dict))
524 dictResize(server.db[j].dict);
525 if (htNeedsResize(server.db[j].expires))
526 dictResize(server.db[j].expires);
527 }
528 }
529
530 /* Our hash table implementation performs rehashing incrementally while
531 * we write/read from the hash table. Still if the server is idle, the hash
532 * table will use two tables for a long time. So we try to use 1 millisecond
533 * of CPU time at every serverCron() loop in order to rehash some key. */
534 void incrementallyRehash(void) {
535 int j;
536
537 for (j = 0; j < server.dbnum; j++) {
538 if (dictIsRehashing(server.db[j].dict)) {
539 dictRehashMilliseconds(server.db[j].dict,1);
540 break; /* already used our millisecond for this loop... */
541 }
542 }
543 }
544
545 /* This function is called once a background process of some kind terminates,
546 * as we want to avoid resizing the hash tables when there is a child in order
547 * to play well with copy-on-write (otherwise when a resize happens lots of
548 * memory pages are copied). The goal of this function is to update the ability
549 * for dict.c to resize the hash tables accordingly to the fact we have o not
550 * running childs. */
551 void updateDictResizePolicy(void) {
552 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1)
553 dictEnableResize();
554 else
555 dictDisableResize();
556 }
557
558 /* ======================= Cron: called every 100 ms ======================== */
559
560 /* Try to expire a few timed out keys. The algorithm used is adaptive and
561 * will use few CPU cycles if there are few expiring keys, otherwise
562 * it will get more aggressive to avoid that too much memory is used by
563 * keys that can be removed from the keyspace. */
564 void activeExpireCycle(void) {
565 int j;
566
567 for (j = 0; j < server.dbnum; j++) {
568 int expired;
569 redisDb *db = server.db+j;
570
571 /* Continue to expire if at the end of the cycle more than 25%
572 * of the keys were expired. */
573 do {
574 long num = dictSize(db->expires);
575 long long now = mstime();
576
577 expired = 0;
578 if (num > REDIS_EXPIRELOOKUPS_PER_CRON)
579 num = REDIS_EXPIRELOOKUPS_PER_CRON;
580 while (num--) {
581 dictEntry *de;
582 long long t;
583
584 if ((de = dictGetRandomKey(db->expires)) == NULL) break;
585 t = dictGetSignedIntegerVal(de);
586 if (now > t) {
587 sds key = dictGetKey(de);
588 robj *keyobj = createStringObject(key,sdslen(key));
589
590 propagateExpire(db,keyobj);
591 dbDelete(db,keyobj);
592 decrRefCount(keyobj);
593 expired++;
594 server.stat_expiredkeys++;
595 }
596 }
597 } while (expired > REDIS_EXPIRELOOKUPS_PER_CRON/4);
598 }
599 }
600
601 void updateLRUClock(void) {
602 server.lruclock = (server.unixtime/REDIS_LRU_CLOCK_RESOLUTION) &
603 REDIS_LRU_CLOCK_MAX;
604 }
605
606
607 /* Add a sample to the operations per second array of samples. */
608 void trackOperationsPerSecond(void) {
609 long long t = mstime() - server.ops_sec_last_sample_time;
610 long long ops = server.stat_numcommands - server.ops_sec_last_sample_ops;
611 long long ops_sec;
612
613 ops_sec = t > 0 ? (ops*1000/t) : 0;
614
615 server.ops_sec_samples[server.ops_sec_idx] = ops_sec;
616 server.ops_sec_idx = (server.ops_sec_idx+1) % REDIS_OPS_SEC_SAMPLES;
617 server.ops_sec_last_sample_time = mstime();
618 server.ops_sec_last_sample_ops = server.stat_numcommands;
619 }
620
621 /* Return the mean of all the samples. */
622 long long getOperationsPerSecond(void) {
623 int j;
624 long long sum = 0;
625
626 for (j = 0; j < REDIS_OPS_SEC_SAMPLES; j++)
627 sum += server.ops_sec_samples[j];
628 return sum / REDIS_OPS_SEC_SAMPLES;
629 }
630
631 /* Check for timeouts. Returns non-zero if the client was terminated */
632 int clientsCronHandleTimeout(redisClient *c) {
633 time_t now = server.unixtime;
634
635 if (server.maxidletime &&
636 !(c->flags & REDIS_SLAVE) && /* no timeout for slaves */
637 !(c->flags & REDIS_MASTER) && /* no timeout for masters */
638 !(c->flags & REDIS_BLOCKED) && /* no timeout for BLPOP */
639 dictSize(c->pubsub_channels) == 0 && /* no timeout for pubsub */
640 listLength(c->pubsub_patterns) == 0 &&
641 (now - c->lastinteraction > server.maxidletime))
642 {
643 redisLog(REDIS_VERBOSE,"Closing idle client");
644 freeClient(c);
645 return 1;
646 } else if (c->flags & REDIS_BLOCKED) {
647 if (c->bpop.timeout != 0 && c->bpop.timeout < now) {
648 addReply(c,shared.nullmultibulk);
649 unblockClientWaitingData(c);
650 }
651 }
652 return 0;
653 }
654
655 /* The client query buffer is an sds.c string that can end with a lot of
656 * free space not used, this function reclaims space if needed.
657 *
658 * The funciton always returns 0 as it never terminates the client. */
659 int clientsCronResizeQueryBuffer(redisClient *c) {
660 size_t querybuf_size = sdsAllocSize(c->querybuf);
661 time_t idletime = server.unixtime - c->lastinteraction;
662
663 /* There are two conditions to resize the query buffer:
664 * 1) Query buffer is > BIG_ARG and too big for latest peak.
665 * 2) Client is inactive and the buffer is bigger than 1k. */
666 if (((querybuf_size > REDIS_MBULK_BIG_ARG) &&
667 (querybuf_size/(c->querybuf_peak+1)) > 2) ||
668 (querybuf_size > 1024 && idletime > 2))
669 {
670 /* Only resize the query buffer if it is actually wasting space. */
671 if (sdsavail(c->querybuf) > 1024) {
672 c->querybuf = sdsRemoveFreeSpace(c->querybuf);
673 }
674 }
675 /* Reset the peak again to capture the peak memory usage in the next
676 * cycle. */
677 c->querybuf_peak = 0;
678 return 0;
679 }
680
681 void clientsCron(void) {
682 /* Make sure to process at least 1/100 of clients per call.
683 * Since this function is called 10 times per second we are sure that
684 * in the worst case we process all the clients in 10 seconds.
685 * In normal conditions (a reasonable number of clients) we process
686 * all the clients in a shorter time. */
687 int numclients = listLength(server.clients);
688 int iterations = numclients/100;
689
690 if (iterations < 50)
691 iterations = (numclients < 50) ? numclients : 50;
692 while(listLength(server.clients) && iterations--) {
693 redisClient *c;
694 listNode *head;
695
696 /* Rotate the list, take the current head, process.
697 * This way if the client must be removed from the list it's the
698 * first element and we don't incur into O(N) computation. */
699 listRotate(server.clients);
700 head = listFirst(server.clients);
701 c = listNodeValue(head);
702 /* The following functions do different service checks on the client.
703 * The protocol is that they return non-zero if the client was
704 * terminated. */
705 if (clientsCronHandleTimeout(c)) continue;
706 if (clientsCronResizeQueryBuffer(c)) continue;
707 }
708 }
709
710 int serverCron(struct aeEventLoop *eventLoop, long long id, void *clientData) {
711 int j, loops = server.cronloops;
712 REDIS_NOTUSED(eventLoop);
713 REDIS_NOTUSED(id);
714 REDIS_NOTUSED(clientData);
715
716 /* We take a cached value of the unix time in the global state because
717 * with virtual memory and aging there is to store the current time
718 * in objects at every object access, and accuracy is not needed.
719 * To access a global var is faster than calling time(NULL) */
720 server.unixtime = time(NULL);
721
722 trackOperationsPerSecond();
723
724 /* We have just 22 bits per object for LRU information.
725 * So we use an (eventually wrapping) LRU clock with 10 seconds resolution.
726 * 2^22 bits with 10 seconds resoluton is more or less 1.5 years.
727 *
728 * Note that even if this will wrap after 1.5 years it's not a problem,
729 * everything will still work but just some object will appear younger
730 * to Redis. But for this to happen a given object should never be touched
731 * for 1.5 years.
732 *
733 * Note that you can change the resolution altering the
734 * REDIS_LRU_CLOCK_RESOLUTION define.
735 */
736 updateLRUClock();
737
738 /* Record the max memory used since the server was started. */
739 if (zmalloc_used_memory() > server.stat_peak_memory)
740 server.stat_peak_memory = zmalloc_used_memory();
741
742 /* We received a SIGTERM, shutting down here in a safe way, as it is
743 * not ok doing so inside the signal handler. */
744 if (server.shutdown_asap) {
745 if (prepareForShutdown(0) == REDIS_OK) exit(0);
746 redisLog(REDIS_WARNING,"SIGTERM received but errors trying to shut down the server, check the logs for more information");
747 }
748
749 /* Show some info about non-empty databases */
750 for (j = 0; j < server.dbnum; j++) {
751 long long size, used, vkeys;
752
753 size = dictSlots(server.db[j].dict);
754 used = dictSize(server.db[j].dict);
755 vkeys = dictSize(server.db[j].expires);
756 if (!(loops % 50) && (used || vkeys)) {
757 redisLog(REDIS_VERBOSE,"DB %d: %lld keys (%lld volatile) in %lld slots HT.",j,used,vkeys,size);
758 /* dictPrintStats(server.dict); */
759 }
760 }
761
762 /* We don't want to resize the hash tables while a bacground saving
763 * is in progress: the saving child is created using fork() that is
764 * implemented with a copy-on-write semantic in most modern systems, so
765 * if we resize the HT while there is the saving child at work actually
766 * a lot of memory movements in the parent will cause a lot of pages
767 * copied. */
768 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1) {
769 if (!(loops % 10)) tryResizeHashTables();
770 if (server.activerehashing) incrementallyRehash();
771 }
772
773 /* Show information about connected clients */
774 if (!(loops % 50)) {
775 redisLog(REDIS_VERBOSE,"%d clients connected (%d slaves), %zu bytes in use",
776 listLength(server.clients)-listLength(server.slaves),
777 listLength(server.slaves),
778 zmalloc_used_memory());
779 }
780
781 /* We need to do a few operations on clients asynchronously. */
782 clientsCron();
783
784 /* Start a scheduled AOF rewrite if this was requested by the user while
785 * a BGSAVE was in progress. */
786 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1 &&
787 server.aof_rewrite_scheduled)
788 {
789 rewriteAppendOnlyFileBackground();
790 }
791
792 /* Check if a background saving or AOF rewrite in progress terminated. */
793 if (server.rdb_child_pid != -1 || server.aof_child_pid != -1) {
794 int statloc;
795 pid_t pid;
796
797 if ((pid = wait3(&statloc,WNOHANG,NULL)) != 0) {
798 int exitcode = WEXITSTATUS(statloc);
799 int bysignal = 0;
800
801 if (WIFSIGNALED(statloc)) bysignal = WTERMSIG(statloc);
802
803 if (pid == server.rdb_child_pid) {
804 backgroundSaveDoneHandler(exitcode,bysignal);
805 } else {
806 backgroundRewriteDoneHandler(exitcode,bysignal);
807 }
808 updateDictResizePolicy();
809 }
810 } else {
811 /* If there is not a background saving/rewrite in progress check if
812 * we have to save/rewrite now */
813 for (j = 0; j < server.saveparamslen; j++) {
814 struct saveparam *sp = server.saveparams+j;
815
816 if (server.dirty >= sp->changes &&
817 server.unixtime-server.lastsave > sp->seconds) {
818 redisLog(REDIS_NOTICE,"%d changes in %d seconds. Saving...",
819 sp->changes, sp->seconds);
820 rdbSaveBackground(server.rdb_filename);
821 break;
822 }
823 }
824
825 /* Trigger an AOF rewrite if needed */
826 if (server.rdb_child_pid == -1 &&
827 server.aof_child_pid == -1 &&
828 server.aof_rewrite_perc &&
829 server.aof_current_size > server.aof_rewrite_min_size)
830 {
831 long long base = server.aof_rewrite_base_size ?
832 server.aof_rewrite_base_size : 1;
833 long long growth = (server.aof_current_size*100/base) - 100;
834 if (growth >= server.aof_rewrite_perc) {
835 redisLog(REDIS_NOTICE,"Starting automatic rewriting of AOF on %lld%% growth",growth);
836 rewriteAppendOnlyFileBackground();
837 }
838 }
839 }
840
841
842 /* If we postponed an AOF buffer flush, let's try to do it every time the
843 * cron function is called. */
844 if (server.aof_flush_postponed_start) flushAppendOnlyFile(0);
845
846 /* Expire a few keys per cycle, only if this is a master.
847 * On slaves we wait for DEL operations synthesized by the master
848 * in order to guarantee a strict consistency. */
849 if (server.masterhost == NULL) activeExpireCycle();
850
851 /* Close clients that need to be closed asynchronous */
852 freeClientsInAsyncFreeQueue();
853
854 /* Replication cron function -- used to reconnect to master and
855 * to detect transfer failures. */
856 if (!(loops % 10)) replicationCron();
857
858 server.cronloops++;
859 return 100;
860 }
861
862 /* This function gets called every time Redis is entering the
863 * main loop of the event driven library, that is, before to sleep
864 * for ready file descriptors. */
865 void beforeSleep(struct aeEventLoop *eventLoop) {
866 REDIS_NOTUSED(eventLoop);
867 listNode *ln;
868 redisClient *c;
869
870 /* Try to process pending commands for clients that were just unblocked. */
871 while (listLength(server.unblocked_clients)) {
872 ln = listFirst(server.unblocked_clients);
873 redisAssert(ln != NULL);
874 c = ln->value;
875 listDelNode(server.unblocked_clients,ln);
876 c->flags &= ~REDIS_UNBLOCKED;
877
878 /* Process remaining data in the input buffer. */
879 if (c->querybuf && sdslen(c->querybuf) > 0) {
880 server.current_client = c;
881 processInputBuffer(c);
882 server.current_client = NULL;
883 }
884 }
885
886 /* Write the AOF buffer on disk */
887 flushAppendOnlyFile(0);
888 }
889
890 /* =========================== Server initialization ======================== */
891
892 void createSharedObjects(void) {
893 int j;
894
895 shared.crlf = createObject(REDIS_STRING,sdsnew("\r\n"));
896 shared.ok = createObject(REDIS_STRING,sdsnew("+OK\r\n"));
897 shared.err = createObject(REDIS_STRING,sdsnew("-ERR\r\n"));
898 shared.emptybulk = createObject(REDIS_STRING,sdsnew("$0\r\n\r\n"));
899 shared.czero = createObject(REDIS_STRING,sdsnew(":0\r\n"));
900 shared.cone = createObject(REDIS_STRING,sdsnew(":1\r\n"));
901 shared.cnegone = createObject(REDIS_STRING,sdsnew(":-1\r\n"));
902 shared.nullbulk = createObject(REDIS_STRING,sdsnew("$-1\r\n"));
903 shared.nullmultibulk = createObject(REDIS_STRING,sdsnew("*-1\r\n"));
904 shared.emptymultibulk = createObject(REDIS_STRING,sdsnew("*0\r\n"));
905 shared.pong = createObject(REDIS_STRING,sdsnew("+PONG\r\n"));
906 shared.queued = createObject(REDIS_STRING,sdsnew("+QUEUED\r\n"));
907 shared.wrongtypeerr = createObject(REDIS_STRING,sdsnew(
908 "-ERR Operation against a key holding the wrong kind of value\r\n"));
909 shared.nokeyerr = createObject(REDIS_STRING,sdsnew(
910 "-ERR no such key\r\n"));
911 shared.syntaxerr = createObject(REDIS_STRING,sdsnew(
912 "-ERR syntax error\r\n"));
913 shared.sameobjecterr = createObject(REDIS_STRING,sdsnew(
914 "-ERR source and destination objects are the same\r\n"));
915 shared.outofrangeerr = createObject(REDIS_STRING,sdsnew(
916 "-ERR index out of range\r\n"));
917 shared.noscripterr = createObject(REDIS_STRING,sdsnew(
918 "-NOSCRIPT No matching script. Please use EVAL.\r\n"));
919 shared.loadingerr = createObject(REDIS_STRING,sdsnew(
920 "-LOADING Redis is loading the dataset in memory\r\n"));
921 shared.slowscripterr = createObject(REDIS_STRING,sdsnew(
922 "-BUSY Redis is busy running a script. You can only call SCRIPT KILL or SHUTDOWN NOSAVE.\r\n"));
923 shared.bgsaveerr = createObject(REDIS_STRING,sdsnew(
924 "-MISCONF Redis is configured to save RDB snapshots, but is currently not able to persist on disk. Commands that may modify the data set are disabled. Please check Redis logs for details about the error.\r\n"));
925 shared.roslaveerr = createObject(REDIS_STRING,sdsnew(
926 "-READONLY You can't write against a read only slave.\r\n"));
927 shared.oomerr = createObject(REDIS_STRING,sdsnew(
928 "-OOM command not allowed when used memory > 'maxmemory'.\r\n"));
929 shared.space = createObject(REDIS_STRING,sdsnew(" "));
930 shared.colon = createObject(REDIS_STRING,sdsnew(":"));
931 shared.plus = createObject(REDIS_STRING,sdsnew("+"));
932 shared.select0 = createStringObject("select 0\r\n",10);
933 shared.select1 = createStringObject("select 1\r\n",10);
934 shared.select2 = createStringObject("select 2\r\n",10);
935 shared.select3 = createStringObject("select 3\r\n",10);
936 shared.select4 = createStringObject("select 4\r\n",10);
937 shared.select5 = createStringObject("select 5\r\n",10);
938 shared.select6 = createStringObject("select 6\r\n",10);
939 shared.select7 = createStringObject("select 7\r\n",10);
940 shared.select8 = createStringObject("select 8\r\n",10);
941 shared.select9 = createStringObject("select 9\r\n",10);
942 shared.messagebulk = createStringObject("$7\r\nmessage\r\n",13);
943 shared.pmessagebulk = createStringObject("$8\r\npmessage\r\n",14);
944 shared.subscribebulk = createStringObject("$9\r\nsubscribe\r\n",15);
945 shared.unsubscribebulk = createStringObject("$11\r\nunsubscribe\r\n",18);
946 shared.psubscribebulk = createStringObject("$10\r\npsubscribe\r\n",17);
947 shared.punsubscribebulk = createStringObject("$12\r\npunsubscribe\r\n",19);
948 shared.del = createStringObject("DEL",3);
949 shared.rpop = createStringObject("RPOP",4);
950 shared.lpop = createStringObject("LPOP",4);
951 for (j = 0; j < REDIS_SHARED_INTEGERS; j++) {
952 shared.integers[j] = createObject(REDIS_STRING,(void*)(long)j);
953 shared.integers[j]->encoding = REDIS_ENCODING_INT;
954 }
955 for (j = 0; j < REDIS_SHARED_BULKHDR_LEN; j++) {
956 shared.mbulkhdr[j] = createObject(REDIS_STRING,
957 sdscatprintf(sdsempty(),"*%d\r\n",j));
958 shared.bulkhdr[j] = createObject(REDIS_STRING,
959 sdscatprintf(sdsempty(),"$%d\r\n",j));
960 }
961 }
962
963 void initServerConfig() {
964 getRandomHexChars(server.runid,REDIS_RUN_ID_SIZE);
965 server.runid[REDIS_RUN_ID_SIZE] = '\0';
966 server.arch_bits = (sizeof(long) == 8) ? 64 : 32;
967 server.port = REDIS_SERVERPORT;
968 server.bindaddr = NULL;
969 server.unixsocket = NULL;
970 server.unixsocketperm = 0;
971 server.ipfd = -1;
972 server.sofd = -1;
973 server.dbnum = REDIS_DEFAULT_DBNUM;
974 server.verbosity = REDIS_NOTICE;
975 server.maxidletime = REDIS_MAXIDLETIME;
976 server.client_max_querybuf_len = REDIS_MAX_QUERYBUF_LEN;
977 server.saveparams = NULL;
978 server.loading = 0;
979 server.logfile = NULL; /* NULL = log on standard output */
980 server.syslog_enabled = 0;
981 server.syslog_ident = zstrdup("redis");
982 server.syslog_facility = LOG_LOCAL0;
983 server.daemonize = 0;
984 server.aof_state = REDIS_AOF_OFF;
985 server.aof_fsync = AOF_FSYNC_EVERYSEC;
986 server.aof_no_fsync_on_rewrite = 0;
987 server.aof_rewrite_perc = REDIS_AOF_REWRITE_PERC;
988 server.aof_rewrite_min_size = REDIS_AOF_REWRITE_MIN_SIZE;
989 server.aof_rewrite_base_size = 0;
990 server.aof_rewrite_scheduled = 0;
991 server.aof_last_fsync = time(NULL);
992 server.aof_delayed_fsync = 0;
993 server.aof_fd = -1;
994 server.aof_selected_db = -1; /* Make sure the first time will not match */
995 server.aof_flush_postponed_start = 0;
996 server.pidfile = zstrdup("/var/run/redis.pid");
997 server.rdb_filename = zstrdup("dump.rdb");
998 server.aof_filename = zstrdup("appendonly.aof");
999 server.requirepass = NULL;
1000 server.rdb_compression = 1;
1001 server.activerehashing = 1;
1002 server.maxclients = REDIS_MAX_CLIENTS;
1003 server.bpop_blocked_clients = 0;
1004 server.maxmemory = 0;
1005 server.maxmemory_policy = REDIS_MAXMEMORY_VOLATILE_LRU;
1006 server.maxmemory_samples = 3;
1007 server.hash_max_ziplist_entries = REDIS_HASH_MAX_ZIPLIST_ENTRIES;
1008 server.hash_max_ziplist_value = REDIS_HASH_MAX_ZIPLIST_VALUE;
1009 server.list_max_ziplist_entries = REDIS_LIST_MAX_ZIPLIST_ENTRIES;
1010 server.list_max_ziplist_value = REDIS_LIST_MAX_ZIPLIST_VALUE;
1011 server.set_max_intset_entries = REDIS_SET_MAX_INTSET_ENTRIES;
1012 server.zset_max_ziplist_entries = REDIS_ZSET_MAX_ZIPLIST_ENTRIES;
1013 server.zset_max_ziplist_value = REDIS_ZSET_MAX_ZIPLIST_VALUE;
1014 server.shutdown_asap = 0;
1015 server.repl_ping_slave_period = REDIS_REPL_PING_SLAVE_PERIOD;
1016 server.repl_timeout = REDIS_REPL_TIMEOUT;
1017 server.lua_caller = NULL;
1018 server.lua_time_limit = REDIS_LUA_TIME_LIMIT;
1019 server.lua_client = NULL;
1020 server.lua_timedout = 0;
1021
1022 updateLRUClock();
1023 resetServerSaveParams();
1024
1025 appendServerSaveParams(60*60,1); /* save after 1 hour and 1 change */
1026 appendServerSaveParams(300,100); /* save after 5 minutes and 100 changes */
1027 appendServerSaveParams(60,10000); /* save after 1 minute and 10000 changes */
1028 /* Replication related */
1029 server.masterauth = NULL;
1030 server.masterhost = NULL;
1031 server.masterport = 6379;
1032 server.master = NULL;
1033 server.repl_state = REDIS_REPL_NONE;
1034 server.repl_syncio_timeout = REDIS_REPL_SYNCIO_TIMEOUT;
1035 server.repl_serve_stale_data = 1;
1036 server.repl_slave_ro = 1;
1037 server.repl_down_since = -1;
1038
1039 /* Client output buffer limits */
1040 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].hard_limit_bytes = 0;
1041 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].soft_limit_bytes = 0;
1042 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].soft_limit_seconds = 0;
1043 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].hard_limit_bytes = 1024*1024*256;
1044 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].soft_limit_bytes = 1024*1024*64;
1045 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].soft_limit_seconds = 60;
1046 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].hard_limit_bytes = 1024*1024*32;
1047 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].soft_limit_bytes = 1024*1024*8;
1048 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].soft_limit_seconds = 60;
1049
1050 /* Double constants initialization */
1051 R_Zero = 0.0;
1052 R_PosInf = 1.0/R_Zero;
1053 R_NegInf = -1.0/R_Zero;
1054 R_Nan = R_Zero/R_Zero;
1055
1056 /* Command table -- we intiialize it here as it is part of the
1057 * initial configuration, since command names may be changed via
1058 * redis.conf using the rename-command directive. */
1059 server.commands = dictCreate(&commandTableDictType,NULL);
1060 populateCommandTable();
1061 server.delCommand = lookupCommandByCString("del");
1062 server.multiCommand = lookupCommandByCString("multi");
1063 server.lpushCommand = lookupCommandByCString("lpush");
1064
1065 /* Slow log */
1066 server.slowlog_log_slower_than = REDIS_SLOWLOG_LOG_SLOWER_THAN;
1067 server.slowlog_max_len = REDIS_SLOWLOG_MAX_LEN;
1068
1069 /* Assert */
1070 server.assert_failed = "<no assertion failed>";
1071 server.assert_file = "<no file>";
1072 server.assert_line = 0;
1073 server.bug_report_start = 0;
1074 }
1075
1076 /* This function will try to raise the max number of open files accordingly to
1077 * the configured max number of clients. It will also account for 32 additional
1078 * file descriptors as we need a few more for persistence, listening
1079 * sockets, log files and so forth.
1080 *
1081 * If it will not be possible to set the limit accordingly to the configured
1082 * max number of clients, the function will do the reverse setting
1083 * server.maxclients to the value that we can actually handle. */
1084 void adjustOpenFilesLimit(void) {
1085 rlim_t maxfiles = server.maxclients+32;
1086 struct rlimit limit;
1087
1088 if (maxfiles < 1024) maxfiles = 1024;
1089 if (getrlimit(RLIMIT_NOFILE,&limit) == -1) {
1090 redisLog(REDIS_WARNING,"Unable to obtain the current NOFILE limit (%s), assuming 1024 and setting the max clients configuration accordingly.",
1091 strerror(errno));
1092 server.maxclients = 1024-32;
1093 } else {
1094 rlim_t oldlimit = limit.rlim_cur;
1095
1096 /* Set the max number of files if the current limit is not enough
1097 * for our needs. */
1098 if (oldlimit < maxfiles) {
1099 limit.rlim_cur = maxfiles;
1100 limit.rlim_max = maxfiles;
1101 if (setrlimit(RLIMIT_NOFILE,&limit) == -1) {
1102 server.maxclients = oldlimit-32;
1103 redisLog(REDIS_WARNING,"Unable to set the max number of files limit to %d (%s), setting the max clients configuration to %d.",
1104 (int) maxfiles, strerror(errno), (int) server.maxclients);
1105 } else {
1106 redisLog(REDIS_NOTICE,"Max number of open files set to %d",
1107 (int) maxfiles);
1108 }
1109 }
1110 }
1111 }
1112
1113 void initServer() {
1114 int j;
1115
1116 signal(SIGHUP, SIG_IGN);
1117 signal(SIGPIPE, SIG_IGN);
1118 setupSignalHandlers();
1119
1120 if (server.syslog_enabled) {
1121 openlog(server.syslog_ident, LOG_PID | LOG_NDELAY | LOG_NOWAIT,
1122 server.syslog_facility);
1123 }
1124
1125 server.current_client = NULL;
1126 server.clients = listCreate();
1127 server.clients_to_close = listCreate();
1128 server.slaves = listCreate();
1129 server.monitors = listCreate();
1130 server.unblocked_clients = listCreate();
1131
1132 createSharedObjects();
1133 adjustOpenFilesLimit();
1134 server.el = aeCreateEventLoop(server.maxclients+1024);
1135 server.db = zmalloc(sizeof(redisDb)*server.dbnum);
1136
1137 if (server.port != 0) {
1138 server.ipfd = anetTcpServer(server.neterr,server.port,server.bindaddr);
1139 if (server.ipfd == ANET_ERR) {
1140 redisLog(REDIS_WARNING, "Opening port %d: %s",
1141 server.port, server.neterr);
1142 exit(1);
1143 }
1144 }
1145 if (server.unixsocket != NULL) {
1146 unlink(server.unixsocket); /* don't care if this fails */
1147 server.sofd = anetUnixServer(server.neterr,server.unixsocket,server.unixsocketperm);
1148 if (server.sofd == ANET_ERR) {
1149 redisLog(REDIS_WARNING, "Opening socket: %s", server.neterr);
1150 exit(1);
1151 }
1152 }
1153 if (server.ipfd < 0 && server.sofd < 0) {
1154 redisLog(REDIS_WARNING, "Configured to not listen anywhere, exiting.");
1155 exit(1);
1156 }
1157 for (j = 0; j < server.dbnum; j++) {
1158 server.db[j].dict = dictCreate(&dbDictType,NULL);
1159 server.db[j].expires = dictCreate(&keyptrDictType,NULL);
1160 server.db[j].blocking_keys = dictCreate(&keylistDictType,NULL);
1161 server.db[j].watched_keys = dictCreate(&keylistDictType,NULL);
1162 server.db[j].id = j;
1163 }
1164 server.pubsub_channels = dictCreate(&keylistDictType,NULL);
1165 server.pubsub_patterns = listCreate();
1166 listSetFreeMethod(server.pubsub_patterns,freePubsubPattern);
1167 listSetMatchMethod(server.pubsub_patterns,listMatchPubsubPattern);
1168 server.cronloops = 0;
1169 server.rdb_child_pid = -1;
1170 server.aof_child_pid = -1;
1171 server.aof_rewrite_buf = sdsempty();
1172 server.aof_buf = sdsempty();
1173 server.lastsave = time(NULL);
1174 server.dirty = 0;
1175 server.stat_numcommands = 0;
1176 server.stat_numconnections = 0;
1177 server.stat_expiredkeys = 0;
1178 server.stat_evictedkeys = 0;
1179 server.stat_starttime = time(NULL);
1180 server.stat_keyspace_misses = 0;
1181 server.stat_keyspace_hits = 0;
1182 server.stat_peak_memory = 0;
1183 server.stat_fork_time = 0;
1184 server.stat_rejected_conn = 0;
1185 memset(server.ops_sec_samples,0,sizeof(server.ops_sec_samples));
1186 server.ops_sec_idx = 0;
1187 server.ops_sec_last_sample_time = mstime();
1188 server.ops_sec_last_sample_ops = 0;
1189 server.unixtime = time(NULL);
1190 server.lastbgsave_status = REDIS_OK;
1191 server.stop_writes_on_bgsave_err = 1;
1192 aeCreateTimeEvent(server.el, 1, serverCron, NULL, NULL);
1193 if (server.ipfd > 0 && aeCreateFileEvent(server.el,server.ipfd,AE_READABLE,
1194 acceptTcpHandler,NULL) == AE_ERR) oom("creating file event");
1195 if (server.sofd > 0 && aeCreateFileEvent(server.el,server.sofd,AE_READABLE,
1196 acceptUnixHandler,NULL) == AE_ERR) oom("creating file event");
1197
1198 if (server.aof_state == REDIS_AOF_ON) {
1199 server.aof_fd = open(server.aof_filename,
1200 O_WRONLY|O_APPEND|O_CREAT,0644);
1201 if (server.aof_fd == -1) {
1202 redisLog(REDIS_WARNING, "Can't open the append-only file: %s",
1203 strerror(errno));
1204 exit(1);
1205 }
1206 }
1207
1208 /* 32 bit instances are limited to 4GB of address space, so if there is
1209 * no explicit limit in the user provided configuration we set a limit
1210 * at 3.5GB using maxmemory with 'noeviction' policy'. This saves
1211 * useless crashes of the Redis instance. */
1212 if (server.arch_bits == 32 && server.maxmemory == 0) {
1213 redisLog(REDIS_WARNING,"Warning: 32 bit instance detected but no memory limit set. Setting 3.5 GB maxmemory limit with 'noeviction' policy now.");
1214 server.maxmemory = 3584LL*(1024*1024); /* 3584 MB = 3.5 GB */
1215 server.maxmemory_policy = REDIS_MAXMEMORY_NO_EVICTION;
1216 }
1217
1218 scriptingInit();
1219 slowlogInit();
1220 bioInit();
1221 }
1222
1223 /* Populates the Redis Command Table starting from the hard coded list
1224 * we have on top of redis.c file. */
1225 void populateCommandTable(void) {
1226 int j;
1227 int numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1228
1229 for (j = 0; j < numcommands; j++) {
1230 struct redisCommand *c = redisCommandTable+j;
1231 char *f = c->sflags;
1232 int retval;
1233
1234 while(*f != '\0') {
1235 switch(*f) {
1236 case 'w': c->flags |= REDIS_CMD_WRITE; break;
1237 case 'r': c->flags |= REDIS_CMD_READONLY; break;
1238 case 'm': c->flags |= REDIS_CMD_DENYOOM; break;
1239 case 'a': c->flags |= REDIS_CMD_ADMIN; break;
1240 case 'p': c->flags |= REDIS_CMD_PUBSUB; break;
1241 case 'f': c->flags |= REDIS_CMD_FORCE_REPLICATION; break;
1242 case 's': c->flags |= REDIS_CMD_NOSCRIPT; break;
1243 case 'R': c->flags |= REDIS_CMD_RANDOM; break;
1244 case 'S': c->flags |= REDIS_CMD_SORT_FOR_SCRIPT; break;
1245 default: redisPanic("Unsupported command flag"); break;
1246 }
1247 f++;
1248 }
1249
1250 retval = dictAdd(server.commands, sdsnew(c->name), c);
1251 assert(retval == DICT_OK);
1252 }
1253 }
1254
1255 void resetCommandTableStats(void) {
1256 int numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1257 int j;
1258
1259 for (j = 0; j < numcommands; j++) {
1260 struct redisCommand *c = redisCommandTable+j;
1261
1262 c->microseconds = 0;
1263 c->calls = 0;
1264 }
1265 }
1266
1267 /* ========================== Redis OP Array API ============================ */
1268
1269 void redisOpArrayInit(redisOpArray *oa) {
1270 oa->ops = NULL;
1271 oa->numops = 0;
1272 }
1273
1274 int redisOpArrayAppend(redisOpArray *oa, struct redisCommand *cmd, int dbid,
1275 robj **argv, int argc, int target)
1276 {
1277 redisOp *op;
1278
1279 oa->ops = zrealloc(oa->ops,sizeof(redisOp)*(oa->numops+1));
1280 op = oa->ops+oa->numops;
1281 op->cmd = cmd;
1282 op->dbid = dbid;
1283 op->argv = argv;
1284 op->argc = argc;
1285 op->target = target;
1286 oa->numops++;
1287 return oa->numops;
1288 }
1289
1290 void redisOpArrayFree(redisOpArray *oa) {
1291 while(oa->numops) {
1292 int j;
1293 redisOp *op;
1294
1295 oa->numops--;
1296 op = oa->ops+oa->numops;
1297 for (j = 0; j < op->argc; j++)
1298 decrRefCount(op->argv[j]);
1299 zfree(op->argv);
1300 }
1301 zfree(oa->ops);
1302 }
1303
1304 /* ====================== Commands lookup and execution ===================== */
1305
1306 struct redisCommand *lookupCommand(sds name) {
1307 return dictFetchValue(server.commands, name);
1308 }
1309
1310 struct redisCommand *lookupCommandByCString(char *s) {
1311 struct redisCommand *cmd;
1312 sds name = sdsnew(s);
1313
1314 cmd = dictFetchValue(server.commands, name);
1315 sdsfree(name);
1316 return cmd;
1317 }
1318
1319 /* Propagate the specified command (in the context of the specified database id)
1320 * to AOF, Slaves and Monitors.
1321 *
1322 * flags are an xor between:
1323 * + REDIS_PROPAGATE_NONE (no propagation of command at all)
1324 * + REDIS_PROPAGATE_AOF (propagate into the AOF file if is enabled)
1325 * + REDIS_PROPAGATE_REPL (propagate into the replication link)
1326 */
1327 void propagate(struct redisCommand *cmd, int dbid, robj **argv, int argc,
1328 int flags)
1329 {
1330 if (server.aof_state != REDIS_AOF_OFF && flags & REDIS_PROPAGATE_AOF)
1331 feedAppendOnlyFile(cmd,dbid,argv,argc);
1332 if (flags & REDIS_PROPAGATE_REPL && listLength(server.slaves))
1333 replicationFeedSlaves(server.slaves,dbid,argv,argc);
1334 }
1335
1336 /* Used inside commands to schedule the propagation of additional commands
1337 * after the current command is propagated to AOF / Replication. */
1338 void alsoPropagate(struct redisCommand *cmd, int dbid, robj **argv, int argc,
1339 int target)
1340 {
1341 redisOpArrayAppend(&server.also_propagate,cmd,dbid,argv,argc,target);
1342 }
1343
1344 /* Call() is the core of Redis execution of a command */
1345 void call(redisClient *c, int flags) {
1346 long long dirty, start = ustime(), duration;
1347
1348 /* Sent the command to clients in MONITOR mode, only if the commands are
1349 * not geneated from reading an AOF. */
1350 if (listLength(server.monitors) && !server.loading)
1351 replicationFeedMonitors(c,server.monitors,c->db->id,c->argv,c->argc);
1352
1353 /* Call the command. */
1354 redisOpArrayInit(&server.also_propagate);
1355 dirty = server.dirty;
1356 c->cmd->proc(c);
1357 dirty = server.dirty-dirty;
1358 duration = ustime()-start;
1359
1360 /* When EVAL is called loading the AOF we don't want commands called
1361 * from Lua to go into the slowlog or to populate statistics. */
1362 if (server.loading && c->flags & REDIS_LUA_CLIENT)
1363 flags &= ~(REDIS_CALL_SLOWLOG | REDIS_CALL_STATS);
1364
1365 /* Log the command into the Slow log if needed, and populate the
1366 * per-command statistics that we show in INFO commandstats. */
1367 if (flags & REDIS_CALL_SLOWLOG)
1368 slowlogPushEntryIfNeeded(c->argv,c->argc,duration);
1369 if (flags & REDIS_CALL_STATS) {
1370 c->cmd->microseconds += duration;
1371 c->cmd->calls++;
1372 }
1373
1374 /* Propagate the command into the AOF and replication link */
1375 if (flags & REDIS_CALL_PROPAGATE) {
1376 int flags = REDIS_PROPAGATE_NONE;
1377
1378 if (c->cmd->flags & REDIS_CMD_FORCE_REPLICATION)
1379 flags |= REDIS_PROPAGATE_REPL;
1380 if (dirty)
1381 flags |= (REDIS_PROPAGATE_REPL | REDIS_PROPAGATE_AOF);
1382 if (flags != REDIS_PROPAGATE_NONE)
1383 propagate(c->cmd,c->db->id,c->argv,c->argc,flags);
1384 }
1385 /* Commands such as LPUSH or BRPOPLPUSH may propagate an additional
1386 * PUSH command. */
1387 if (server.also_propagate.numops) {
1388 int j;
1389 redisOp *rop;
1390
1391 for (j = 0; j < server.also_propagate.numops; j++) {
1392 rop = &server.also_propagate.ops[j];
1393 propagate(rop->cmd, rop->dbid, rop->argv, rop->argc, rop->target);
1394 }
1395 redisOpArrayFree(&server.also_propagate);
1396 }
1397 server.stat_numcommands++;
1398 }
1399
1400 /* If this function gets called we already read a whole
1401 * command, argments are in the client argv/argc fields.
1402 * processCommand() execute the command or prepare the
1403 * server for a bulk read from the client.
1404 *
1405 * If 1 is returned the client is still alive and valid and
1406 * and other operations can be performed by the caller. Otherwise
1407 * if 0 is returned the client was destroied (i.e. after QUIT). */
1408 int processCommand(redisClient *c) {
1409 /* The QUIT command is handled separately. Normal command procs will
1410 * go through checking for replication and QUIT will cause trouble
1411 * when FORCE_REPLICATION is enabled and would be implemented in
1412 * a regular command proc. */
1413 if (!strcasecmp(c->argv[0]->ptr,"quit")) {
1414 addReply(c,shared.ok);
1415 c->flags |= REDIS_CLOSE_AFTER_REPLY;
1416 return REDIS_ERR;
1417 }
1418
1419 /* Now lookup the command and check ASAP about trivial error conditions
1420 * such as wrong arity, bad command name and so forth. */
1421 c->cmd = c->lastcmd = lookupCommand(c->argv[0]->ptr);
1422 if (!c->cmd) {
1423 addReplyErrorFormat(c,"unknown command '%s'",
1424 (char*)c->argv[0]->ptr);
1425 return REDIS_OK;
1426 } else if ((c->cmd->arity > 0 && c->cmd->arity != c->argc) ||
1427 (c->argc < -c->cmd->arity)) {
1428 addReplyErrorFormat(c,"wrong number of arguments for '%s' command",
1429 c->cmd->name);
1430 return REDIS_OK;
1431 }
1432
1433 /* Check if the user is authenticated */
1434 if (server.requirepass && !c->authenticated && c->cmd->proc != authCommand)
1435 {
1436 addReplyError(c,"operation not permitted");
1437 return REDIS_OK;
1438 }
1439
1440 /* Handle the maxmemory directive.
1441 *
1442 * First we try to free some memory if possible (if there are volatile
1443 * keys in the dataset). If there are not the only thing we can do
1444 * is returning an error. */
1445 if (server.maxmemory) {
1446 int retval = freeMemoryIfNeeded();
1447 if ((c->cmd->flags & REDIS_CMD_DENYOOM) && retval == REDIS_ERR) {
1448 addReply(c, shared.oomerr);
1449 return REDIS_OK;
1450 }
1451 }
1452
1453 /* Don't accept write commands if there are problems persisting on disk. */
1454 if (server.stop_writes_on_bgsave_err &&
1455 server.saveparamslen > 0
1456 && server.lastbgsave_status == REDIS_ERR &&
1457 c->cmd->flags & REDIS_CMD_WRITE)
1458 {
1459 addReply(c, shared.bgsaveerr);
1460 return REDIS_OK;
1461 }
1462
1463 /* Don't accept wirte commands if this is a read only slave. But
1464 * accept write commands if this is our master. */
1465 if (server.masterhost && server.repl_slave_ro &&
1466 !(c->flags & REDIS_MASTER) &&
1467 c->cmd->flags & REDIS_CMD_WRITE)
1468 {
1469 addReply(c, shared.roslaveerr);
1470 return REDIS_OK;
1471 }
1472
1473 /* Only allow SUBSCRIBE and UNSUBSCRIBE in the context of Pub/Sub */
1474 if ((dictSize(c->pubsub_channels) > 0 || listLength(c->pubsub_patterns) > 0)
1475 &&
1476 c->cmd->proc != subscribeCommand &&
1477 c->cmd->proc != unsubscribeCommand &&
1478 c->cmd->proc != psubscribeCommand &&
1479 c->cmd->proc != punsubscribeCommand) {
1480 addReplyError(c,"only (P)SUBSCRIBE / (P)UNSUBSCRIBE / QUIT allowed in this context");
1481 return REDIS_OK;
1482 }
1483
1484 /* Only allow INFO and SLAVEOF when slave-serve-stale-data is no and
1485 * we are a slave with a broken link with master. */
1486 if (server.masterhost && server.repl_state != REDIS_REPL_CONNECTED &&
1487 server.repl_serve_stale_data == 0 &&
1488 c->cmd->proc != infoCommand && c->cmd->proc != slaveofCommand)
1489 {
1490 addReplyError(c,
1491 "link with MASTER is down and slave-serve-stale-data is set to no");
1492 return REDIS_OK;
1493 }
1494
1495 /* Loading DB? Return an error if the command is not INFO */
1496 if (server.loading && c->cmd->proc != infoCommand) {
1497 addReply(c, shared.loadingerr);
1498 return REDIS_OK;
1499 }
1500
1501 /* Lua script too slow? Only allow SHUTDOWN NOSAVE and SCRIPT KILL. */
1502 if (server.lua_timedout &&
1503 !(c->cmd->proc != shutdownCommand &&
1504 c->argc == 2 &&
1505 tolower(((char*)c->argv[1]->ptr)[0]) == 'n') &&
1506 !(c->cmd->proc == scriptCommand &&
1507 c->argc == 2 &&
1508 tolower(((char*)c->argv[1]->ptr)[0]) == 'k'))
1509 {
1510 addReply(c, shared.slowscripterr);
1511 return REDIS_OK;
1512 }
1513
1514 /* Exec the command */
1515 if (c->flags & REDIS_MULTI &&
1516 c->cmd->proc != execCommand && c->cmd->proc != discardCommand &&
1517 c->cmd->proc != multiCommand && c->cmd->proc != watchCommand)
1518 {
1519 queueMultiCommand(c);
1520 addReply(c,shared.queued);
1521 } else {
1522 call(c,REDIS_CALL_FULL);
1523 }
1524 return REDIS_OK;
1525 }
1526
1527 /*================================== Shutdown =============================== */
1528
1529 int prepareForShutdown(int flags) {
1530 int save = flags & REDIS_SHUTDOWN_SAVE;
1531 int nosave = flags & REDIS_SHUTDOWN_NOSAVE;
1532
1533 redisLog(REDIS_WARNING,"User requested shutdown...");
1534 /* Kill the saving child if there is a background saving in progress.
1535 We want to avoid race conditions, for instance our saving child may
1536 overwrite the synchronous saving did by SHUTDOWN. */
1537 if (server.rdb_child_pid != -1) {
1538 redisLog(REDIS_WARNING,"There is a child saving an .rdb. Killing it!");
1539 kill(server.rdb_child_pid,SIGKILL);
1540 rdbRemoveTempFile(server.rdb_child_pid);
1541 }
1542 if (server.aof_state != REDIS_AOF_OFF) {
1543 /* Kill the AOF saving child as the AOF we already have may be longer
1544 * but contains the full dataset anyway. */
1545 if (server.aof_child_pid != -1) {
1546 redisLog(REDIS_WARNING,
1547 "There is a child rewriting the AOF. Killing it!");
1548 kill(server.aof_child_pid,SIGKILL);
1549 }
1550 /* Append only file: fsync() the AOF and exit */
1551 redisLog(REDIS_NOTICE,"Calling fsync() on the AOF file.");
1552 aof_fsync(server.aof_fd);
1553 }
1554 if ((server.saveparamslen > 0 && !nosave) || save) {
1555 redisLog(REDIS_NOTICE,"Saving the final RDB snapshot before exiting.");
1556 /* Snapshotting. Perform a SYNC SAVE and exit */
1557 if (rdbSave(server.rdb_filename) != REDIS_OK) {
1558 /* Ooops.. error saving! The best we can do is to continue
1559 * operating. Note that if there was a background saving process,
1560 * in the next cron() Redis will be notified that the background
1561 * saving aborted, handling special stuff like slaves pending for
1562 * synchronization... */
1563 redisLog(REDIS_WARNING,"Error trying to save the DB, can't exit.");
1564 return REDIS_ERR;
1565 }
1566 }
1567 if (server.daemonize) {
1568 redisLog(REDIS_NOTICE,"Removing the pid file.");
1569 unlink(server.pidfile);
1570 }
1571 /* Close the listening sockets. Apparently this allows faster restarts. */
1572 if (server.ipfd != -1) close(server.ipfd);
1573 if (server.sofd != -1) close(server.sofd);
1574 if (server.unixsocket) {
1575 redisLog(REDIS_NOTICE,"Removing the unix socket file.");
1576 unlink(server.unixsocket); /* don't care if this fails */
1577 }
1578
1579 redisLog(REDIS_WARNING,"Redis is now ready to exit, bye bye...");
1580 return REDIS_OK;
1581 }
1582
1583 /*================================== Commands =============================== */
1584
1585 void authCommand(redisClient *c) {
1586 if (!server.requirepass) {
1587 addReplyError(c,"Client sent AUTH, but no password is set");
1588 } else if (!strcmp(c->argv[1]->ptr, server.requirepass)) {
1589 c->authenticated = 1;
1590 addReply(c,shared.ok);
1591 } else {
1592 c->authenticated = 0;
1593 addReplyError(c,"invalid password");
1594 }
1595 }
1596
1597 void pingCommand(redisClient *c) {
1598 addReply(c,shared.pong);
1599 }
1600
1601 void echoCommand(redisClient *c) {
1602 addReplyBulk(c,c->argv[1]);
1603 }
1604
1605 void timeCommand(redisClient *c) {
1606 struct timeval tv;
1607
1608 /* gettimeofday() can only fail if &tv is a bad addresss so we
1609 * don't check for errors. */
1610 gettimeofday(&tv,NULL);
1611 addReplyMultiBulkLen(c,2);
1612 addReplyBulkLongLong(c,tv.tv_sec);
1613 addReplyBulkLongLong(c,tv.tv_usec);
1614 }
1615
/* Convert an amount of bytes into a human readable string in the form
 * of 100B, 4.00K, 100.00M, 2.00G, and so forth.
 *
 * Values below 1024 are printed as an integer followed by 'B'. Larger
 * values are divided by the biggest power of 1024 not exceeding them and
 * printed with two decimals followed by the unit (K, M, G, T, P). Values
 * of 1024^6 bytes or more are printed as a plain number of bytes.
 *
 * 's' must point to a buffer able to hold the result: 32 bytes are enough
 * for every possible value of 'n'. The buffer is always written, so the
 * caller never ends up with an uninitialized string. */
void bytesToHuman(char *s, unsigned long long n) {
    double d;

    if (n < 1024) {
        /* Bytes */
        sprintf(s,"%lluB",n);
    } else if (n < (1024ULL*1024)) {
        d = (double)n/(1024);
        sprintf(s,"%.2fK",d);
    } else if (n < (1024ULL*1024*1024)) {
        d = (double)n/(1024*1024);
        sprintf(s,"%.2fM",d);
    } else if (n < (1024ULL*1024*1024*1024)) {
        d = (double)n/(1024ULL*1024*1024);
        sprintf(s,"%.2fG",d);
    } else if (n < (1024ULL*1024*1024*1024*1024)) {
        d = (double)n/(1024ULL*1024*1024*1024);
        sprintf(s,"%.2fT",d);
    } else if (n < (1024ULL*1024*1024*1024*1024*1024)) {
        d = (double)n/(1024ULL*1024*1024*1024*1024);
        sprintf(s,"%.2fP",d);
    } else {
        /* Too big for the units we know about: fall back to bytes. */
        sprintf(s,"%lluB",n);
    }
}
1636
1637 /* Create the string returned by the INFO command. This is decoupled
1638 * by the INFO command itself as we need to report the same information
1639 * on memory corruption problems. */
1640 sds genRedisInfoString(char *section) {
1641 sds info = sdsempty();
1642 time_t uptime = server.unixtime-server.stat_starttime;
1643 int j, numcommands;
1644 struct rusage self_ru, c_ru;
1645 unsigned long lol, bib;
1646 int allsections = 0, defsections = 0;
1647 int sections = 0;
1648
1649 if (section) {
1650 allsections = strcasecmp(section,"all") == 0;
1651 defsections = strcasecmp(section,"default") == 0;
1652 }
1653
1654 getrusage(RUSAGE_SELF, &self_ru);
1655 getrusage(RUSAGE_CHILDREN, &c_ru);
1656 getClientsMaxBuffers(&lol,&bib);
1657
1658 /* Server */
1659 if (allsections || defsections || !strcasecmp(section,"server")) {
1660 if (sections++) info = sdscat(info,"\r\n");
1661 info = sdscatprintf(info,
1662 "# Server\r\n"
1663 "redis_version:%s\r\n"
1664 "redis_git_sha1:%s\r\n"
1665 "redis_git_dirty:%d\r\n"
1666 "arch_bits:%d\r\n"
1667 "multiplexing_api:%s\r\n"
1668 "gcc_version:%d.%d.%d\r\n"
1669 "process_id:%ld\r\n"
1670 "run_id:%s\r\n"
1671 "tcp_port:%d\r\n"
1672 "uptime_in_seconds:%ld\r\n"
1673 "uptime_in_days:%ld\r\n"
1674 "lru_clock:%ld\r\n",
1675 REDIS_VERSION,
1676 redisGitSHA1(),
1677 strtol(redisGitDirty(),NULL,10) > 0,
1678 server.arch_bits,
1679 aeGetApiName(),
1680 #ifdef __GNUC__
1681 __GNUC__,__GNUC_MINOR__,__GNUC_PATCHLEVEL__,
1682 #else
1683 0,0,0,
1684 #endif
1685 (long) getpid(),
1686 server.runid,
1687 server.port,
1688 uptime,
1689 uptime/(3600*24),
1690 (unsigned long) server.lruclock);
1691 }
1692
1693 /* Clients */
1694 if (allsections || defsections || !strcasecmp(section,"clients")) {
1695 if (sections++) info = sdscat(info,"\r\n");
1696 info = sdscatprintf(info,
1697 "# Clients\r\n"
1698 "connected_clients:%lu\r\n"
1699 "client_longest_output_list:%lu\r\n"
1700 "client_biggest_input_buf:%lu\r\n"
1701 "blocked_clients:%d\r\n",
1702 listLength(server.clients)-listLength(server.slaves),
1703 lol, bib,
1704 server.bpop_blocked_clients);
1705 }
1706
1707 /* Memory */
1708 if (allsections || defsections || !strcasecmp(section,"memory")) {
1709 char hmem[64];
1710 char peak_hmem[64];
1711
1712 bytesToHuman(hmem,zmalloc_used_memory());
1713 bytesToHuman(peak_hmem,server.stat_peak_memory);
1714 if (sections++) info = sdscat(info,"\r\n");
1715 info = sdscatprintf(info,
1716 "# Memory\r\n"
1717 "used_memory:%zu\r\n"
1718 "used_memory_human:%s\r\n"
1719 "used_memory_rss:%zu\r\n"
1720 "used_memory_peak:%zu\r\n"
1721 "used_memory_peak_human:%s\r\n"
1722 "used_memory_lua:%lld\r\n"
1723 "mem_fragmentation_ratio:%.2f\r\n"
1724 "mem_allocator:%s\r\n",
1725 zmalloc_used_memory(),
1726 hmem,
1727 zmalloc_get_rss(),
1728 server.stat_peak_memory,
1729 peak_hmem,
1730 ((long long)lua_gc(server.lua,LUA_GCCOUNT,0))*1024LL,
1731 zmalloc_get_fragmentation_ratio(),
1732 ZMALLOC_LIB
1733 );
1734 }
1735
1736 /* Persistence */
1737 if (allsections || defsections || !strcasecmp(section,"persistence")) {
1738 if (sections++) info = sdscat(info,"\r\n");
1739 info = sdscatprintf(info,
1740 "# Persistence\r\n"
1741 "loading:%d\r\n"
1742 "aof_enabled:%d\r\n"
1743 "changes_since_last_save:%lld\r\n"
1744 "bgsave_in_progress:%d\r\n"
1745 "last_save_time:%ld\r\n"
1746 "last_bgsave_status:%s\r\n"
1747 "bgrewriteaof_in_progress:%d\r\n",
1748 server.loading,
1749 server.aof_state != REDIS_AOF_OFF,
1750 server.dirty,
1751 server.rdb_child_pid != -1,
1752 server.lastsave,
1753 server.lastbgsave_status == REDIS_OK ? "ok" : "err",
1754 server.aof_child_pid != -1);
1755
1756 if (server.aof_state != REDIS_AOF_OFF) {
1757 info = sdscatprintf(info,
1758 "aof_current_size:%lld\r\n"
1759 "aof_base_size:%lld\r\n"
1760 "aof_pending_rewrite:%d\r\n"
1761 "aof_buffer_length:%zu\r\n"
1762 "aof_pending_bio_fsync:%llu\r\n"
1763 "aof_delayed_fsync:%lu\r\n",
1764 (long long) server.aof_current_size,
1765 (long long) server.aof_rewrite_base_size,
1766 server.aof_rewrite_scheduled,
1767 sdslen(server.aof_buf),
1768 bioPendingJobsOfType(REDIS_BIO_AOF_FSYNC),
1769 server.aof_delayed_fsync);
1770 }
1771
1772 if (server.loading) {
1773 double perc;
1774 time_t eta, elapsed;
1775 off_t remaining_bytes = server.loading_total_bytes-
1776 server.loading_loaded_bytes;
1777
1778 perc = ((double)server.loading_loaded_bytes /
1779 server.loading_total_bytes) * 100;
1780
1781 elapsed = server.unixtime-server.loading_start_time;
1782 if (elapsed == 0) {
1783 eta = 1; /* A fake 1 second figure if we don't have
1784 enough info */
1785 } else {
1786 eta = (elapsed*remaining_bytes)/server.loading_loaded_bytes;
1787 }
1788
1789 info = sdscatprintf(info,
1790 "loading_start_time:%ld\r\n"
1791 "loading_total_bytes:%llu\r\n"
1792 "loading_loaded_bytes:%llu\r\n"
1793 "loading_loaded_perc:%.2f\r\n"
1794 "loading_eta_seconds:%ld\r\n"
1795 ,(unsigned long) server.loading_start_time,
1796 (unsigned long long) server.loading_total_bytes,
1797 (unsigned long long) server.loading_loaded_bytes,
1798 perc,
1799 eta
1800 );
1801 }
1802 }
1803
1804 /* Stats */
1805 if (allsections || defsections || !strcasecmp(section,"stats")) {
1806 if (sections++) info = sdscat(info,"\r\n");
1807 info = sdscatprintf(info,
1808 "# Stats\r\n"
1809 "total_connections_received:%lld\r\n"
1810 "total_commands_processed:%lld\r\n"
1811 "instantaneous_ops_per_sec:%lld\r\n"
1812 "rejected_connections:%lld\r\n"
1813 "expired_keys:%lld\r\n"
1814 "evicted_keys:%lld\r\n"
1815 "keyspace_hits:%lld\r\n"
1816 "keyspace_misses:%lld\r\n"
1817 "pubsub_channels:%ld\r\n"
1818 "pubsub_patterns:%lu\r\n"
1819 "latest_fork_usec:%lld\r\n",
1820 server.stat_numconnections,
1821 server.stat_numcommands,
1822 getOperationsPerSecond(),
1823 server.stat_rejected_conn,
1824 server.stat_expiredkeys,
1825 server.stat_evictedkeys,
1826 server.stat_keyspace_hits,
1827 server.stat_keyspace_misses,
1828 dictSize(server.pubsub_channels),
1829 listLength(server.pubsub_patterns),
1830 server.stat_fork_time);
1831 }
1832
1833 /* Replication */
1834 if (allsections || defsections || !strcasecmp(section,"replication")) {
1835 if (sections++) info = sdscat(info,"\r\n");
1836 info = sdscatprintf(info,
1837 "# Replication\r\n"
1838 "role:%s\r\n",
1839 server.masterhost == NULL ? "master" : "slave");
1840 if (server.masterhost) {
1841 info = sdscatprintf(info,
1842 "master_host:%s\r\n"
1843 "master_port:%d\r\n"
1844 "master_link_status:%s\r\n"
1845 "master_last_io_seconds_ago:%d\r\n"
1846 "master_sync_in_progress:%d\r\n"
1847 ,server.masterhost,
1848 server.masterport,
1849 (server.repl_state == REDIS_REPL_CONNECTED) ?
1850 "up" : "down",
1851 server.master ?
1852 ((int)(server.unixtime-server.master->lastinteraction)) : -1,
1853 server.repl_state == REDIS_REPL_TRANSFER
1854 );
1855
1856 if (server.repl_state == REDIS_REPL_TRANSFER) {
1857 info = sdscatprintf(info,
1858 "master_sync_left_bytes:%ld\r\n"
1859 "master_sync_last_io_seconds_ago:%d\r\n"
1860 ,(long)server.repl_transfer_left,
1861 (int)(server.unixtime-server.repl_transfer_lastio)
1862 );
1863 }
1864
1865 if (server.repl_state != REDIS_REPL_CONNECTED) {
1866 info = sdscatprintf(info,
1867 "master_link_down_since_seconds:%ld\r\n",
1868 (long)server.unixtime-server.repl_down_since);
1869 }
1870 }
1871 info = sdscatprintf(info,
1872 "connected_slaves:%lu\r\n",
1873 listLength(server.slaves));
1874 if (listLength(server.slaves)) {
1875 int slaveid = 0;
1876 listNode *ln;
1877 listIter li;
1878
1879 listRewind(server.slaves,&li);
1880 while((ln = listNext(&li))) {
1881 redisClient *slave = listNodeValue(ln);
1882 char *state = NULL;
1883 char ip[32];
1884 int port;
1885
1886 if (anetPeerToString(slave->fd,ip,&port) == -1) continue;
1887 switch(slave->replstate) {
1888 case REDIS_REPL_WAIT_BGSAVE_START:
1889 case REDIS_REPL_WAIT_BGSAVE_END:
1890 state = "wait_bgsave";
1891 break;
1892 case REDIS_REPL_SEND_BULK:
1893 state = "send_bulk";
1894 break;
1895 case REDIS_REPL_ONLINE:
1896 state = "online";
1897 break;
1898 }
1899 if (state == NULL) continue;
1900 info = sdscatprintf(info,"slave%d:%s,%d,%s\r\n",
1901 slaveid,ip,port,state);
1902 slaveid++;
1903 }
1904 }
1905 }
1906
1907 /* CPU */
1908 if (allsections || defsections || !strcasecmp(section,"cpu")) {
1909 if (sections++) info = sdscat(info,"\r\n");
1910 info = sdscatprintf(info,
1911 "# CPU\r\n"
1912 "used_cpu_sys:%.2f\r\n"
1913 "used_cpu_user:%.2f\r\n"
1914 "used_cpu_sys_children:%.2f\r\n"
1915 "used_cpu_user_children:%.2f\r\n",
1916 (float)self_ru.ru_stime.tv_sec+(float)self_ru.ru_stime.tv_usec/1000000,
1917 (float)self_ru.ru_utime.tv_sec+(float)self_ru.ru_utime.tv_usec/1000000,
1918 (float)c_ru.ru_stime.tv_sec+(float)c_ru.ru_stime.tv_usec/1000000,
1919 (float)c_ru.ru_utime.tv_sec+(float)c_ru.ru_utime.tv_usec/1000000);
1920 }
1921
1922 /* cmdtime */
1923 if (allsections || !strcasecmp(section,"commandstats")) {
1924 if (sections++) info = sdscat(info,"\r\n");
1925 info = sdscatprintf(info, "# Commandstats\r\n");
1926 numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1927 for (j = 0; j < numcommands; j++) {
1928 struct redisCommand *c = redisCommandTable+j;
1929
1930 if (!c->calls) continue;
1931 info = sdscatprintf(info,
1932 "cmdstat_%s:calls=%lld,usec=%lld,usec_per_call=%.2f\r\n",
1933 c->name, c->calls, c->microseconds,
1934 (c->calls == 0) ? 0 : ((float)c->microseconds/c->calls));
1935 }
1936 }
1937
1938 /* Key space */
1939 if (allsections || defsections || !strcasecmp(section,"keyspace")) {
1940 if (sections++) info = sdscat(info,"\r\n");
1941 info = sdscatprintf(info, "# Keyspace\r\n");
1942 for (j = 0; j < server.dbnum; j++) {
1943 long long keys, vkeys;
1944
1945 keys = dictSize(server.db[j].dict);
1946 vkeys = dictSize(server.db[j].expires);
1947 if (keys || vkeys) {
1948 info = sdscatprintf(info, "db%d:keys=%lld,expires=%lld\r\n",
1949 j, keys, vkeys);
1950 }
1951 }
1952 }
1953 return info;
1954 }
1955
1956 void infoCommand(redisClient *c) {
1957 char *section = c->argc == 2 ? c->argv[1]->ptr : "default";
1958
1959 if (c->argc > 2) {
1960 addReply(c,shared.syntaxerr);
1961 return;
1962 }
1963 sds info = genRedisInfoString(section);
1964 addReplySds(c,sdscatprintf(sdsempty(),"$%lu\r\n",
1965 (unsigned long)sdslen(info)));
1966 addReplySds(c,info);
1967 addReply(c,shared.crlf);
1968 }
1969
1970 void monitorCommand(redisClient *c) {
1971 /* ignore MONITOR if aleady slave or in monitor mode */
1972 if (c->flags & REDIS_SLAVE) return;
1973
1974 c->flags |= (REDIS_SLAVE|REDIS_MONITOR);
1975 c->slaveseldb = 0;
1976 listAddNodeTail(server.monitors,c);
1977 addReply(c,shared.ok);
1978 }
1979
1980 /* ============================ Maxmemory directive ======================== */
1981
1982 /* This function gets called when 'maxmemory' is set on the config file to limit
1983 * the max memory used by the server, before processing a command.
1984 *
1985 * The goal of the function is to free enough memory to keep Redis under the
1986 * configured memory limit.
1987 *
1988 * The function starts calculating how many bytes should be freed to keep
1989 * Redis under the limit, and enters a loop selecting the best keys to
1990 * evict accordingly to the configured policy.
1991 *
1992 * If all the bytes needed to return back under the limit were freed the
1993 * function returns REDIS_OK, otherwise REDIS_ERR is returned, and the caller
1994 * should block the execution of commands that will result in more memory
1995 * used by the server.
1996 */
1997 int freeMemoryIfNeeded(void) {
1998 size_t mem_used, mem_tofree, mem_freed;
1999 int slaves = listLength(server.slaves);
2000
2001 /* Remove the size of slaves output buffers and AOF buffer from the
2002 * count of used memory. */
2003 mem_used = zmalloc_used_memory();
2004 if (slaves) {
2005 listIter li;
2006 listNode *ln;
2007
2008 listRewind(server.slaves,&li);
2009 while((ln = listNext(&li))) {
2010 redisClient *slave = listNodeValue(ln);
2011 unsigned long obuf_bytes = getClientOutputBufferMemoryUsage(slave);
2012 if (obuf_bytes > mem_used)
2013 mem_used = 0;
2014 else
2015 mem_used -= obuf_bytes;
2016 }
2017 }
2018 if (server.aof_state != REDIS_AOF_OFF) {
2019 mem_used -= sdslen(server.aof_buf);
2020 mem_used -= sdslen(server.aof_rewrite_buf);
2021 }
2022
2023 /* Check if we are over the memory limit. */
2024 if (mem_used <= server.maxmemory) return REDIS_OK;
2025
2026 if (server.maxmemory_policy == REDIS_MAXMEMORY_NO_EVICTION)
2027 return REDIS_ERR; /* We need to free memory, but policy forbids. */
2028
2029 /* Compute how much memory we need to free. */
2030 mem_tofree = mem_used - server.maxmemory;
2031 mem_freed = 0;
2032 while (mem_freed < mem_tofree) {
2033 int j, k, keys_freed = 0;
2034
2035 for (j = 0; j < server.dbnum; j++) {
2036 long bestval = 0; /* just to prevent warning */
2037 sds bestkey = NULL;
2038 struct dictEntry *de;
2039 redisDb *db = server.db+j;
2040 dict *dict;
2041
2042 if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_LRU ||
2043 server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_RANDOM)
2044 {
2045 dict = server.db[j].dict;
2046 } else {
2047 dict = server.db[j].expires;
2048 }
2049 if (dictSize(dict) == 0) continue;
2050
2051 /* volatile-random and allkeys-random policy */
2052 if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_RANDOM ||
2053 server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_RANDOM)
2054 {
2055 de = dictGetRandomKey(dict);
2056 bestkey = dictGetKey(de);
2057 }
2058
2059 /* volatile-lru and allkeys-lru policy */
2060 else if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_LRU ||
2061 server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_LRU)
2062 {
2063 for (k = 0; k < server.maxmemory_samples; k++) {
2064 sds thiskey;
2065 long thisval;
2066 robj *o;
2067
2068 de = dictGetRandomKey(dict);
2069 thiskey = dictGetKey(de);
2070 /* When policy is volatile-lru we need an additonal lookup
2071 * to locate the real key, as dict is set to db->expires. */
2072 if (server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_LRU)
2073 de = dictFind(db->dict, thiskey);
2074 o = dictGetVal(de);
2075 thisval = estimateObjectIdleTime(o);
2076
2077 /* Higher idle time is better candidate for deletion */
2078 if (bestkey == NULL || thisval > bestval) {
2079 bestkey = thiskey;
2080 bestval = thisval;
2081 }
2082 }
2083 }
2084
2085 /* volatile-ttl */
2086 else if (server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_TTL) {
2087 for (k = 0; k < server.maxmemory_samples; k++) {
2088 sds thiskey;
2089 long thisval;
2090
2091 de = dictGetRandomKey(dict);
2092 thiskey = dictGetKey(de);
2093 thisval = (long) dictGetVal(de);
2094
2095 /* Expire sooner (minor expire unix timestamp) is better
2096 * candidate for deletion */
2097 if (bestkey == NULL || thisval < bestval) {
2098 bestkey = thiskey;
2099 bestval = thisval;
2100 }
2101 }
2102 }
2103
2104 /* Finally remove the selected key. */
2105 if (bestkey) {
2106 long long delta;
2107
2108 robj *keyobj = createStringObject(bestkey,sdslen(bestkey));
2109 propagateExpire(db,keyobj);
2110 /* We compute the amount of memory freed by dbDelete() alone.
2111 * It is possible that actually the memory needed to propagate
2112 * the DEL in AOF and replication link is greater than the one
2113 * we are freeing removing the key, but we can't account for
2114 * that otherwise we would never exit the loop.
2115 *
2116 * AOF and Output buffer memory will be freed eventually so
2117 * we only care about memory used by the key space. */
2118 delta = (long long) zmalloc_used_memory();
2119 dbDelete(db,keyobj);
2120 delta -= (long long) zmalloc_used_memory();
2121 mem_freed += delta;
2122 server.stat_evictedkeys++;
2123 decrRefCount(keyobj);
2124 keys_freed++;
2125
2126 /* When the memory to free starts to be big enough, we may
2127 * start spending so much time here that is impossible to
2128 * deliver data to the slaves fast enough, so we force the
2129 * transmission here inside the loop. */
2130 if (slaves) flushSlavesOutputBuffers();
2131 }
2132 }
2133 if (!keys_freed) return REDIS_ERR; /* nothing to free... */
2134 }
2135 return REDIS_OK;
2136 }
2137
2138 /* =================================== Main! ================================ */
2139
2140 #ifdef __linux__
/* Read /proc/sys/vm/overcommit_memory and return its first line converted
 * with atoi(). Returns -1 when the file can't be opened or no line can be
 * read from it. */
int linuxOvercommitMemoryValue(void) {
    char line[64];
    int value = -1;
    FILE *procfile = fopen("/proc/sys/vm/overcommit_memory","r");

    if (procfile == NULL) return -1;
    if (fgets(line,64,procfile) != NULL) value = atoi(line);
    fclose(procfile);

    return value;
}
2154
2155 void linuxOvercommitMemoryWarning(void) {
2156 if (linuxOvercommitMemoryValue() == 0) {
2157 redisLog(REDIS_WARNING,"WARNING overcommit_memory is set to 0! Background save may fail under low memory condition. To fix this issue add 'vm.overcommit_memory = 1' to /etc/sysctl.conf and then reboot or run the command 'sysctl vm.overcommit_memory=1' for this to take effect.");
2158 }
2159 }
2160 #endif /* __linux__ */
2161
2162 void createPidFile(void) {
2163 /* Try to write the pid file in a best-effort way. */
2164 FILE *fp = fopen(server.pidfile,"w");
2165 if (fp) {
2166 fprintf(fp,"%d\n",(int)getpid());
2167 fclose(fp);
2168 }
2169 }
2170
/* Detach from the launching process: fork, let the caller's process exit,
 * start a new session in the surviving one and point the three standard
 * descriptors at /dev/null. */
void daemonize(void) {
    int devnull;

    /* Any non-zero return from fork() ends this process with status 0:
     * that is the parent on success, and also the only process left when
     * fork() fails with -1. */
    if (fork() != 0) exit(0);
    setsid(); /* create a new session */

    /* Every output goes to /dev/null. If Redis is daemonized but
     * the 'logfile' is set to 'stdout' in the configuration file
     * it will not log at all. */
    devnull = open("/dev/null", O_RDWR, 0);
    if (devnull == -1) return;

    dup2(devnull, STDIN_FILENO);
    dup2(devnull, STDOUT_FILENO);
    dup2(devnull, STDERR_FILENO);
    /* Close the extra descriptor unless it is one of the standard ones. */
    if (devnull > STDERR_FILENO) close(devnull);
}
2187
2188 void version() {
2189 printf("Redis server v=%s sha=%s:%d malloc=%s\n", REDIS_VERSION,
2190 redisGitSHA1(), atoi(redisGitDirty()) > 0, ZMALLOC_LIB);
2191 exit(0);
2192 }
2193
/* Print the command line help to standard error and exit with status 1. */
void usage() {
    /* Help text, one entry per output line. None of the entries contains a
     * conversion specification, so they are written out verbatim. */
    static const char *help[] = {
        "Usage: ./redis-server [/path/to/redis.conf] [options]\n",
        " ./redis-server - (read config from stdin)\n",
        " ./redis-server -v or --version\n",
        " ./redis-server -h or --help\n",
        " ./redis-server --test-memory <megabytes>\n\n",
        "Examples:\n",
        " ./redis-server (run the server with default conf)\n",
        " ./redis-server /etc/redis/6379.conf\n",
        " ./redis-server --port 7777\n",
        " ./redis-server --port 7777 --slaveof 127.0.0.1 8888\n",
        " ./redis-server /etc/myredis.conf --loglevel verbose\n"
    };
    size_t i;

    for (i = 0; i < sizeof(help)/sizeof(help[0]); i++)
        fputs(help[i],stderr);
    exit(1);
}
2208
2209 void redisAsciiArt(void) {
2210 #include "asciilogo.h"
2211 char *buf = zmalloc(1024*16);
2212
2213 snprintf(buf,1024*16,ascii_logo,
2214 REDIS_VERSION,
2215 redisGitSHA1(),
2216 strtol(redisGitDirty(),NULL,10) > 0,
2217 (sizeof(long) == 8) ? "64" : "32",
2218 "stand alone",
2219 server.port,
2220 (long) getpid()
2221 );
2222 redisLogRaw(REDIS_NOTICE|REDIS_LOG_RAW,buf);
2223 zfree(buf);
2224 }
2225
2226 static void sigtermHandler(int sig) {
2227 REDIS_NOTUSED(sig);
2228
2229 redisLog(REDIS_WARNING,"Received SIGTERM, scheduling shutdown...");
2230 server.shutdown_asap = 1;
2231 }
2232
2233 void setupSignalHandlers(void) {
2234 struct sigaction act;
2235
2236 /* When the SA_SIGINFO flag is set in sa_flags then sa_sigaction is used.
2237 * Otherwise, sa_handler is used. */
2238 sigemptyset(&act.sa_mask);
2239 act.sa_flags = SA_NODEFER | SA_ONSTACK | SA_RESETHAND;
2240 act.sa_handler = sigtermHandler;
2241 sigaction(SIGTERM, &act, NULL);
2242
2243 #ifdef HAVE_BACKTRACE
2244 sigemptyset(&act.sa_mask);
2245 act.sa_flags = SA_NODEFER | SA_ONSTACK | SA_RESETHAND | SA_SIGINFO;
2246 act.sa_sigaction = sigsegvHandler;
2247 sigaction(SIGSEGV, &act, NULL);
2248 sigaction(SIGBUS, &act, NULL);
2249 sigaction(SIGFPE, &act, NULL);
2250 sigaction(SIGILL, &act, NULL);
2251 #endif
2252 return;
2253 }
2254
2255 void memtest(size_t megabytes, int passes);
2256
2257 int main(int argc, char **argv) {
2258 long long start;
2259 struct timeval tv;
2260
2261 /* We need to initialize our libraries, and the server configuration. */
2262 zmalloc_enable_thread_safeness();
2263 srand(time(NULL)^getpid());
2264 gettimeofday(&tv,NULL);
2265 dictSetHashFunctionSeed(tv.tv_sec^tv.tv_usec^getpid());
2266 initServerConfig();
2267
2268 if (argc >= 2) {
2269 int j = 1; /* First option to parse in argv[] */
2270 sds options = sdsempty();
2271 char *configfile = NULL;
2272
2273 /* Handle special options --help and --version */
2274 if (strcmp(argv[1], "-v") == 0 ||
2275 strcmp(argv[1], "--version") == 0) version();
2276 if (strcmp(argv[1], "--help") == 0 ||
2277 strcmp(argv[1], "-h") == 0) usage();
2278 if (strcmp(argv[1], "--test-memory") == 0) {
2279 if (argc == 3) {
2280 memtest(atoi(argv[2]),50);
2281 exit(0);
2282 } else {
2283 fprintf(stderr,"Please specify the amount of memory to test in megabytes.\n");
2284 fprintf(stderr,"Example: ./redis-server --test-memory 4096\n\n");
2285 exit(1);
2286 }
2287 }
2288
2289 /* First argument is the config file name? */
2290 if (argv[j][0] != '-' || argv[j][1] != '-')
2291 configfile = argv[j++];
2292 /* All the other options are parsed and conceptually appended to the
2293 * configuration file. For instance --port 6380 will generate the
2294 * string "port 6380\n" to be parsed after the actual file name
2295 * is parsed, if any. */
2296 while(j != argc) {
2297 if (argv[j][0] == '-' && argv[j][1] == '-') {
2298 /* Option name */
2299 if (sdslen(options)) options = sdscat(options,"\n");
2300 options = sdscat(options,argv[j]+2);
2301 options = sdscat(options," ");
2302 } else {
2303 /* Option argument */
2304 options = sdscatrepr(options,argv[j],strlen(argv[j]));
2305 options = sdscat(options," ");
2306 }
2307 j++;
2308 }
2309 resetServerSaveParams();
2310 loadServerConfig(configfile,options);
2311 sdsfree(options);
2312 } else {
2313 redisLog(REDIS_WARNING,"Warning: no config file specified, using the default config. In order to specify a config file use 'redis-server /path/to/redis.conf'");
2314 }
2315 if (server.daemonize) daemonize();
2316 initServer();
2317 if (server.daemonize) createPidFile();
2318 redisAsciiArt();
2319 redisLog(REDIS_WARNING,"Server started, Redis version " REDIS_VERSION);
2320 #ifdef __linux__
2321 linuxOvercommitMemoryWarning();
2322 #endif
2323 start = ustime();
2324 if (server.aof_state == REDIS_AOF_ON) {
2325 if (loadAppendOnlyFile(server.aof_filename) == REDIS_OK)
2326 redisLog(REDIS_NOTICE,"DB loaded from append only file: %.3f seconds",(float)(ustime()-start)/1000000);
2327 } else {
2328 if (rdbLoad(server.rdb_filename) == REDIS_OK) {
2329 redisLog(REDIS_NOTICE,"DB loaded from disk: %.3f seconds",
2330 (float)(ustime()-start)/1000000);
2331 } else if (errno != ENOENT) {
2332 redisLog(REDIS_WARNING,"Fatal error loading the DB. Exiting.");
2333 exit(1);
2334 }
2335 }
2336 if (server.ipfd > 0)
2337 redisLog(REDIS_NOTICE,"The server is now ready to accept connections on port %d", server.port);
2338 if (server.sofd > 0)
2339 redisLog(REDIS_NOTICE,"The server is now ready to accept connections at %s", server.unixsocket);
2340 aeSetBeforeSleepProc(server.el,beforeSleep);
2341 aeMain(server.el);
2342 aeDeleteEventLoop(server.el);
2343 return 0;
2344 }
2345
2346 /* The End */