]> git.saurik.com Git - redis.git/blob - src/redis.c
declare hashDictType as external too
[redis.git] / src / redis.c
1 /*
2 * Copyright (c) 2009-2010, Salvatore Sanfilippo <antirez at gmail dot com>
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are met:
7 *
8 * * Redistributions of source code must retain the above copyright notice,
9 * this list of conditions and the following disclaimer.
10 * * Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
13 * * Neither the name of Redis nor the names of its contributors may be used
14 * to endorse or promote products derived from this software without
15 * specific prior written permission.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
18 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
21 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
22 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
23 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
24 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
25 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
26 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
27 * POSSIBILITY OF SUCH DAMAGE.
28 */
29
30 #include "redis.h"
31 #include "slowlog.h"
32 #include "bio.h"
33
34 #include <time.h>
35 #include <signal.h>
36 #include <sys/wait.h>
37 #include <errno.h>
38 #include <assert.h>
39 #include <ctype.h>
40 #include <stdarg.h>
41 #include <arpa/inet.h>
42 #include <sys/stat.h>
43 #include <fcntl.h>
44 #include <sys/time.h>
45 #include <sys/resource.h>
46 #include <sys/uio.h>
47 #include <limits.h>
48 #include <float.h>
49 #include <math.h>
50 #include <sys/resource.h>
51
52 /* Our shared "common" objects */
53
54 struct sharedObjectsStruct shared;
55
56 /* Global vars that are actually used as constants. The following double
57 * values are used for double on-disk serialization, and are initialized
58 * at runtime to avoid strange compiler optimizations. */
59
60 double R_Zero, R_PosInf, R_NegInf, R_Nan;
61
62 /*================================= Globals ================================= */
63
64 /* Global vars */
65 struct redisServer server; /* server global state */
66 struct redisCommand *commandTable;
67
68 /* Our command table.
69 *
70 * Every entry is composed of the following fields:
71 *
72 * name: a string representing the command name.
73 * function: pointer to the C function implementing the command.
74 * arity: number of arguments, it is possible to use -N to say >= N
75 * sflags: command flags as string. See below for a table of flags.
76 * flags: flags as bitmask. Computed by Redis using the 'sflags' field.
77 * get_keys_proc: an optional function to get key arguments from a command.
78 * This is only used when the following three fields are not
79 * enough to specify what arguments are keys.
80 * first_key_index: first argument that is a key
81 * last_key_index: last argument that is a key
82 * key_step: step to get all the keys from first to last argument. For instance
83 * in MSET the step is two since arguments are key,val,key,val,...
84 * microseconds: microseconds of total execution time for this command.
85 * calls: total number of calls of this command.
86 *
87 * The flags, microseconds and calls fields are computed by Redis and should
88 * always be set to zero.
89 *
90 * Command flags are expressed using strings where every character represents
91 * a flag. Later the populateCommandTable() function will take care of
92 * populating the real 'flags' field using this characters.
93 *
94 * This is the meaning of the flags:
95 *
96 * w: write command (may modify the key space).
97 * r: read command (will never modify the key space).
98 * m: may increase memory usage once called. Don't allow if out of memory.
99 * a: admin command, like SAVE or SHUTDOWN.
100 * p: Pub/Sub related command.
101 * f: force replication of this command, regarless of server.dirty.
102 * s: command not allowed in scripts.
103 * R: random command. Command is not deterministic, that is, the same command
104 * with the same arguments, with the same key space, may have different
105 * results. For instance SPOP and RANDOMKEY are two random commands.
106 * S: Sort command output array if called from script, so that the output
107 * is deterministic.
108 */
109 struct redisCommand redisCommandTable[] = {
110 {"get",getCommand,2,"r",0,NULL,1,1,1,0,0},
111 {"set",setCommand,3,"wm",0,noPreloadGetKeys,1,1,1,0,0},
112 {"setnx",setnxCommand,3,"wm",0,noPreloadGetKeys,1,1,1,0,0},
113 {"setex",setexCommand,4,"wm",0,noPreloadGetKeys,1,1,1,0,0},
114 {"psetex",psetexCommand,4,"wm",0,noPreloadGetKeys,1,1,1,0,0},
115 {"append",appendCommand,3,"wm",0,NULL,1,1,1,0,0},
116 {"strlen",strlenCommand,2,"r",0,NULL,1,1,1,0,0},
117 {"del",delCommand,-2,"w",0,noPreloadGetKeys,1,-1,1,0,0},
118 {"exists",existsCommand,2,"r",0,NULL,1,1,1,0,0},
119 {"setbit",setbitCommand,4,"wm",0,NULL,1,1,1,0,0},
120 {"getbit",getbitCommand,3,"r",0,NULL,1,1,1,0,0},
121 {"setrange",setrangeCommand,4,"wm",0,NULL,1,1,1,0,0},
122 {"getrange",getrangeCommand,4,"r",0,NULL,1,1,1,0,0},
123 {"substr",getrangeCommand,4,"r",0,NULL,1,1,1,0,0},
124 {"incr",incrCommand,2,"wm",0,NULL,1,1,1,0,0},
125 {"decr",decrCommand,2,"wm",0,NULL,1,1,1,0,0},
126 {"mget",mgetCommand,-2,"r",0,NULL,1,-1,1,0,0},
127 {"rpush",rpushCommand,-3,"wm",0,NULL,1,1,1,0,0},
128 {"lpush",lpushCommand,-3,"wm",0,NULL,1,1,1,0,0},
129 {"rpushx",rpushxCommand,3,"wm",0,NULL,1,1,1,0,0},
130 {"lpushx",lpushxCommand,3,"wm",0,NULL,1,1,1,0,0},
131 {"linsert",linsertCommand,5,"wm",0,NULL,1,1,1,0,0},
132 {"rpop",rpopCommand,2,"w",0,NULL,1,1,1,0,0},
133 {"lpop",lpopCommand,2,"w",0,NULL,1,1,1,0,0},
134 {"brpop",brpopCommand,-3,"ws",0,NULL,1,1,1,0,0},
135 {"brpoplpush",brpoplpushCommand,4,"wms",0,NULL,1,2,1,0,0},
136 {"blpop",blpopCommand,-3,"ws",0,NULL,1,-2,1,0,0},
137 {"llen",llenCommand,2,"r",0,NULL,1,1,1,0,0},
138 {"lindex",lindexCommand,3,"r",0,NULL,1,1,1,0,0},
139 {"lset",lsetCommand,4,"wm",0,NULL,1,1,1,0,0},
140 {"lrange",lrangeCommand,4,"r",0,NULL,1,1,1,0,0},
141 {"ltrim",ltrimCommand,4,"w",0,NULL,1,1,1,0,0},
142 {"lrem",lremCommand,4,"w",0,NULL,1,1,1,0,0},
143 {"rpoplpush",rpoplpushCommand,3,"wm",0,NULL,1,2,1,0,0},
144 {"sadd",saddCommand,-3,"wm",0,NULL,1,1,1,0,0},
145 {"srem",sremCommand,-3,"w",0,NULL,1,1,1,0,0},
146 {"smove",smoveCommand,4,"w",0,NULL,1,2,1,0,0},
147 {"sismember",sismemberCommand,3,"r",0,NULL,1,1,1,0,0},
148 {"scard",scardCommand,2,"r",0,NULL,1,1,1,0,0},
149 {"spop",spopCommand,2,"wRs",0,NULL,1,1,1,0,0},
150 {"srandmember",srandmemberCommand,2,"rR",0,NULL,1,1,1,0,0},
151 {"sinter",sinterCommand,-2,"rS",0,NULL,1,-1,1,0,0},
152 {"sinterstore",sinterstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
153 {"sunion",sunionCommand,-2,"rS",0,NULL,1,-1,1,0,0},
154 {"sunionstore",sunionstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
155 {"sdiff",sdiffCommand,-2,"rS",0,NULL,1,-1,1,0,0},
156 {"sdiffstore",sdiffstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
157 {"smembers",sinterCommand,2,"rS",0,NULL,1,1,1,0,0},
158 {"zadd",zaddCommand,-4,"wm",0,NULL,1,1,1,0,0},
159 {"zincrby",zincrbyCommand,4,"wm",0,NULL,1,1,1,0,0},
160 {"zrem",zremCommand,-3,"w",0,NULL,1,1,1,0,0},
161 {"zremrangebyscore",zremrangebyscoreCommand,4,"w",0,NULL,1,1,1,0,0},
162 {"zremrangebyrank",zremrangebyrankCommand,4,"w",0,NULL,1,1,1,0,0},
163 {"zunionstore",zunionstoreCommand,-4,"wm",0,zunionInterGetKeys,0,0,0,0,0},
164 {"zinterstore",zinterstoreCommand,-4,"wm",0,zunionInterGetKeys,0,0,0,0,0},
165 {"zrange",zrangeCommand,-4,"r",0,NULL,1,1,1,0,0},
166 {"zrangebyscore",zrangebyscoreCommand,-4,"r",0,NULL,1,1,1,0,0},
167 {"zrevrangebyscore",zrevrangebyscoreCommand,-4,"r",0,NULL,1,1,1,0,0},
168 {"zcount",zcountCommand,4,"r",0,NULL,1,1,1,0,0},
169 {"zrevrange",zrevrangeCommand,-4,"r",0,NULL,1,1,1,0,0},
170 {"zcard",zcardCommand,2,"r",0,NULL,1,1,1,0,0},
171 {"zscore",zscoreCommand,3,"r",0,NULL,1,1,1,0,0},
172 {"zrank",zrankCommand,3,"r",0,NULL,1,1,1,0,0},
173 {"zrevrank",zrevrankCommand,3,"r",0,NULL,1,1,1,0,0},
174 {"hset",hsetCommand,4,"wm",0,NULL,1,1,1,0,0},
175 {"hsetnx",hsetnxCommand,4,"wm",0,NULL,1,1,1,0,0},
176 {"hget",hgetCommand,3,"r",0,NULL,1,1,1,0,0},
177 {"hmset",hmsetCommand,-4,"wm",0,NULL,1,1,1,0,0},
178 {"hmget",hmgetCommand,-3,"r",0,NULL,1,1,1,0,0},
179 {"hincrby",hincrbyCommand,4,"wm",0,NULL,1,1,1,0,0},
180 {"hincrbyfloat",hincrbyfloatCommand,4,"wm",0,NULL,1,1,1,0,0},
181 {"hdel",hdelCommand,-3,"w",0,NULL,1,1,1,0,0},
182 {"hlen",hlenCommand,2,"r",0,NULL,1,1,1,0,0},
183 {"hkeys",hkeysCommand,2,"rS",0,NULL,1,1,1,0,0},
184 {"hvals",hvalsCommand,2,"rS",0,NULL,1,1,1,0,0},
185 {"hgetall",hgetallCommand,2,"r",0,NULL,1,1,1,0,0},
186 {"hexists",hexistsCommand,3,"r",0,NULL,1,1,1,0,0},
187 {"incrby",incrbyCommand,3,"wm",0,NULL,1,1,1,0,0},
188 {"decrby",decrbyCommand,3,"wm",0,NULL,1,1,1,0,0},
189 {"incrbyfloat",incrbyfloatCommand,3,"wm",0,NULL,1,1,1,0,0},
190 {"getset",getsetCommand,3,"wm",0,NULL,1,1,1,0,0},
191 {"mset",msetCommand,-3,"wm",0,NULL,1,-1,2,0,0},
192 {"msetnx",msetnxCommand,-3,"wm",0,NULL,1,-1,2,0,0},
193 {"randomkey",randomkeyCommand,1,"rR",0,NULL,0,0,0,0,0},
194 {"select",selectCommand,2,"r",0,NULL,0,0,0,0,0},
195 {"move",moveCommand,3,"w",0,NULL,1,1,1,0,0},
196 {"rename",renameCommand,3,"w",0,renameGetKeys,1,2,1,0,0},
197 {"renamenx",renamenxCommand,3,"w",0,renameGetKeys,1,2,1,0,0},
198 {"expire",expireCommand,3,"w",0,NULL,1,1,1,0,0},
199 {"expireat",expireatCommand,3,"w",0,NULL,1,1,1,0,0},
200 {"pexpire",pexpireCommand,3,"w",0,NULL,1,1,1,0,0},
201 {"pexpireat",pexpireatCommand,3,"w",0,NULL,1,1,1,0,0},
202 {"keys",keysCommand,2,"rS",0,NULL,0,0,0,0,0},
203 {"dbsize",dbsizeCommand,1,"r",0,NULL,0,0,0,0,0},
204 {"auth",authCommand,2,"rs",0,NULL,0,0,0,0,0},
205 {"ping",pingCommand,1,"r",0,NULL,0,0,0,0,0},
206 {"echo",echoCommand,2,"r",0,NULL,0,0,0,0,0},
207 {"save",saveCommand,1,"ars",0,NULL,0,0,0,0,0},
208 {"bgsave",bgsaveCommand,1,"ar",0,NULL,0,0,0,0,0},
209 {"bgrewriteaof",bgrewriteaofCommand,1,"ar",0,NULL,0,0,0,0,0},
210 {"shutdown",shutdownCommand,-1,"ar",0,NULL,0,0,0,0,0},
211 {"lastsave",lastsaveCommand,1,"r",0,NULL,0,0,0,0,0},
212 {"type",typeCommand,2,"r",0,NULL,1,1,1,0,0},
213 {"multi",multiCommand,1,"rs",0,NULL,0,0,0,0,0},
214 {"exec",execCommand,1,"s",0,NULL,0,0,0,0,0},
215 {"discard",discardCommand,1,"rs",0,NULL,0,0,0,0,0},
216 {"sync",syncCommand,1,"ars",0,NULL,0,0,0,0,0},
217 {"flushdb",flushdbCommand,1,"w",0,NULL,0,0,0,0,0},
218 {"flushall",flushallCommand,1,"w",0,NULL,0,0,0,0,0},
219 {"sort",sortCommand,-2,"wmS",0,NULL,1,1,1,0,0},
220 {"info",infoCommand,-1,"r",0,NULL,0,0,0,0,0},
221 {"monitor",monitorCommand,1,"ars",0,NULL,0,0,0,0,0},
222 {"ttl",ttlCommand,2,"r",0,NULL,1,1,1,0,0},
223 {"pttl",pttlCommand,2,"r",0,NULL,1,1,1,0,0},
224 {"persist",persistCommand,2,"w",0,NULL,1,1,1,0,0},
225 {"slaveof",slaveofCommand,3,"aws",0,NULL,0,0,0,0,0},
226 {"debug",debugCommand,-2,"as",0,NULL,0,0,0,0,0},
227 {"config",configCommand,-2,"ar",0,NULL,0,0,0,0,0},
228 {"subscribe",subscribeCommand,-2,"rps",0,NULL,0,0,0,0,0},
229 {"unsubscribe",unsubscribeCommand,-1,"rps",0,NULL,0,0,0,0,0},
230 {"psubscribe",psubscribeCommand,-2,"rps",0,NULL,0,0,0,0,0},
231 {"punsubscribe",punsubscribeCommand,-1,"rps",0,NULL,0,0,0,0,0},
232 {"publish",publishCommand,3,"pf",0,NULL,0,0,0,0,0},
233 {"watch",watchCommand,-2,"rs",0,noPreloadGetKeys,1,-1,1,0,0},
234 {"unwatch",unwatchCommand,1,"rs",0,NULL,0,0,0,0,0},
235 {"restore",restoreCommand,4,"awm",0,NULL,1,1,1,0,0},
236 {"migrate",migrateCommand,6,"aw",0,NULL,0,0,0,0,0},
237 {"dump",dumpCommand,2,"ar",0,NULL,1,1,1,0,0},
238 {"object",objectCommand,-2,"r",0,NULL,2,2,2,0,0},
239 {"client",clientCommand,-2,"ar",0,NULL,0,0,0,0,0},
240 {"eval",evalCommand,-3,"s",0,zunionInterGetKeys,0,0,0,0,0},
241 {"evalsha",evalShaCommand,-3,"s",0,zunionInterGetKeys,0,0,0,0,0},
242 {"slowlog",slowlogCommand,-2,"r",0,NULL,0,0,0,0,0},
243 {"script",scriptCommand,-2,"ras",0,NULL,0,0,0,0,0},
244 {"time",timeCommand,1,"rR",0,NULL,0,0,0,0,0}
245 };
246
247 /*============================ Utility functions ============================ */
248
249 /* Low level logging. To use only for very big messages, otherwise
250 * redisLog() is to prefer. */
251 void redisLogRaw(int level, const char *msg) {
252 const int syslogLevelMap[] = { LOG_DEBUG, LOG_INFO, LOG_NOTICE, LOG_WARNING };
253 const char *c = ".-*#";
254 time_t now = time(NULL);
255 FILE *fp;
256 char buf[64];
257 int rawmode = (level & REDIS_LOG_RAW);
258
259 level &= 0xff; /* clear flags */
260 if (level < server.verbosity) return;
261
262 fp = (server.logfile == NULL) ? stdout : fopen(server.logfile,"a");
263 if (!fp) return;
264
265 if (rawmode) {
266 fprintf(fp,"%s",msg);
267 } else {
268 strftime(buf,sizeof(buf),"%d %b %H:%M:%S",localtime(&now));
269 fprintf(fp,"[%d] %s %c %s\n",(int)getpid(),buf,c[level],msg);
270 }
271 fflush(fp);
272
273 if (server.logfile) fclose(fp);
274
275 if (server.syslog_enabled) syslog(syslogLevelMap[level], "%s", msg);
276 }
277
278 /* Like redisLogRaw() but with printf-alike support. This is the funciton that
279 * is used across the code. The raw version is only used in order to dump
280 * the INFO output on crash. */
281 void redisLog(int level, const char *fmt, ...) {
282 va_list ap;
283 char msg[REDIS_MAX_LOGMSG_LEN];
284
285 if ((level&0xff) < server.verbosity) return;
286
287 va_start(ap, fmt);
288 vsnprintf(msg, sizeof(msg), fmt, ap);
289 va_end(ap);
290
291 redisLogRaw(level,msg);
292 }
293
294 /* Redis generally does not try to recover from out of memory conditions
295 * when allocating objects or strings, it is not clear if it will be possible
296 * to report this condition to the client since the networking layer itself
297 * is based on heap allocation for send buffers, so we simply abort.
298 * At least the code will be simpler to read... */
299 void oom(const char *msg) {
300 redisLog(REDIS_WARNING, "%s: Out of memory\n",msg);
301 sleep(1);
302 abort();
303 }
304
/* Return the UNIX time in microseconds, as reported by gettimeofday(). */
long long ustime(void) {
    struct timeval tv;

    gettimeofday(&tv, NULL);
    return ((long long)tv.tv_sec)*1000000 + tv.tv_usec;
}
315
/* Return the UNIX time in milliseconds (ustime() divided by 1000). */
long long mstime(void) {
    long long usec = ustime();

    return usec/1000;
}
320
321 /*====================== Hash table type implementation ==================== */
322
/* This is a hash table type that uses the SDS dynamic strings library as
 * keys and Redis objects as values (objects can hold SDS strings,
 * lists, sets). */
326
/* Dict destructor callback that releases 'val' with zfree().
 * 'privdata' is unused. */
void dictVanillaFree(void *privdata, void *val)
{
    DICT_NOTUSED(privdata);

    zfree(val);
}
332
333 void dictListDestructor(void *privdata, void *val)
334 {
335 DICT_NOTUSED(privdata);
336 listRelease((list*)val);
337 }
338
339 int dictSdsKeyCompare(void *privdata, const void *key1,
340 const void *key2)
341 {
342 int l1,l2;
343 DICT_NOTUSED(privdata);
344
345 l1 = sdslen((sds)key1);
346 l2 = sdslen((sds)key2);
347 if (l1 != l2) return 0;
348 return memcmp(key1, key2, l1) == 0;
349 }
350
/* A case insensitive key comparison, used for the command lookup table.
 * Returns 1 when strcasecmp() reports the two keys as equal, 0 otherwise.
 * 'privdata' is unused. */
int dictSdsKeyCaseCompare(void *privdata, const void *key1,
        const void *key2)
{
    DICT_NOTUSED(privdata);

    return !strcasecmp(key1, key2);
}
359
/* Dict destructor callback for Redis objects: drops one reference from
 * 'val' with decrRefCount(). NULL values are ignored (values of swapped
 * out keys are set to NULL). 'privdata' is unused. */
void dictRedisObjectDestructor(void *privdata, void *val)
{
    DICT_NOTUSED(privdata);

    if (val != NULL) decrRefCount(val);
}
367
/* Dict destructor callback for sds strings: 'val' is released with
 * sdsfree(). 'privdata' is unused. */
void dictSdsDestructor(void *privdata, void *val)
{
    DICT_NOTUSED(privdata);
    sdsfree(val);
}
374
375 int dictObjKeyCompare(void *privdata, const void *key1,
376 const void *key2)
377 {
378 const robj *o1 = key1, *o2 = key2;
379 return dictSdsKeyCompare(privdata,o1->ptr,o2->ptr);
380 }
381
382 unsigned int dictObjHash(const void *key) {
383 const robj *o = key;
384 return dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
385 }
386
/* Hash an sds key over its whole sdslen() bytes. */
unsigned int dictSdsHash(const void *key) {
    unsigned char *bytes = (unsigned char*)key;

    return dictGenHashFunction(bytes, sdslen((char*)key));
}
390
/* Hash an sds key with dictGenCaseHashFunction(), the hash paired with
 * the case insensitive key compare in the command table dict type. */
unsigned int dictSdsCaseHash(const void *key) {
    unsigned char *bytes = (unsigned char*)key;

    return dictGenCaseHashFunction(bytes, sdslen((char*)key));
}
394
395 int dictEncObjKeyCompare(void *privdata, const void *key1,
396 const void *key2)
397 {
398 robj *o1 = (robj*) key1, *o2 = (robj*) key2;
399 int cmp;
400
401 if (o1->encoding == REDIS_ENCODING_INT &&
402 o2->encoding == REDIS_ENCODING_INT)
403 return o1->ptr == o2->ptr;
404
405 o1 = getDecodedObject(o1);
406 o2 = getDecodedObject(o2);
407 cmp = dictSdsKeyCompare(privdata,o1->ptr,o2->ptr);
408 decrRefCount(o1);
409 decrRefCount(o2);
410 return cmp;
411 }
412
413 unsigned int dictEncObjHash(const void *key) {
414 robj *o = (robj*) key;
415
416 if (o->encoding == REDIS_ENCODING_RAW) {
417 return dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
418 } else {
419 if (o->encoding == REDIS_ENCODING_INT) {
420 char buf[32];
421 int len;
422
423 len = ll2string(buf,32,(long)o->ptr);
424 return dictGenHashFunction((unsigned char*)buf, len);
425 } else {
426 unsigned int hash;
427
428 o = getDecodedObject(o);
429 hash = dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
430 decrRefCount(o);
431 return hash;
432 }
433 }
434 }
435
436 /* Sets type hash table */
437 dictType setDictType = {
438 dictEncObjHash, /* hash function */
439 NULL, /* key dup */
440 NULL, /* val dup */
441 dictEncObjKeyCompare, /* key compare */
442 dictRedisObjectDestructor, /* key destructor */
443 NULL /* val destructor */
444 };
445
446 /* Sorted sets hash (note: a skiplist is used in addition to the hash table) */
447 dictType zsetDictType = {
448 dictEncObjHash, /* hash function */
449 NULL, /* key dup */
450 NULL, /* val dup */
451 dictEncObjKeyCompare, /* key compare */
452 dictRedisObjectDestructor, /* key destructor */
453 NULL /* val destructor */
454 };
455
456 /* Db->dict, keys are sds strings, vals are Redis objects. */
457 dictType dbDictType = {
458 dictSdsHash, /* hash function */
459 NULL, /* key dup */
460 NULL, /* val dup */
461 dictSdsKeyCompare, /* key compare */
462 dictSdsDestructor, /* key destructor */
463 dictRedisObjectDestructor /* val destructor */
464 };
465
466 /* Db->expires */
467 dictType keyptrDictType = {
468 dictSdsHash, /* hash function */
469 NULL, /* key dup */
470 NULL, /* val dup */
471 dictSdsKeyCompare, /* key compare */
472 NULL, /* key destructor */
473 NULL /* val destructor */
474 };
475
476 /* Command table. sds string -> command struct pointer. */
477 dictType commandTableDictType = {
478 dictSdsCaseHash, /* hash function */
479 NULL, /* key dup */
480 NULL, /* val dup */
481 dictSdsKeyCaseCompare, /* key compare */
482 dictSdsDestructor, /* key destructor */
483 NULL /* val destructor */
484 };
485
486 /* Hash type hash table (note that small hashes are represented with zimpaps) */
487 dictType hashDictType = {
488 dictEncObjHash, /* hash function */
489 NULL, /* key dup */
490 NULL, /* val dup */
491 dictEncObjKeyCompare, /* key compare */
492 dictRedisObjectDestructor, /* key destructor */
493 dictRedisObjectDestructor /* val destructor */
494 };
495
496 /* Keylist hash table type has unencoded redis objects as keys and
497 * lists as values. It's used for blocking operations (BLPOP) and to
498 * map swapped keys to a list of clients waiting for this keys to be loaded. */
499 dictType keylistDictType = {
500 dictObjHash, /* hash function */
501 NULL, /* key dup */
502 NULL, /* val dup */
503 dictObjKeyCompare, /* key compare */
504 dictRedisObjectDestructor, /* key destructor */
505 dictListDestructor /* val destructor */
506 };
507
508 int htNeedsResize(dict *dict) {
509 long long size, used;
510
511 size = dictSlots(dict);
512 used = dictSize(dict);
513 return (size && used && size > DICT_HT_INITIAL_SIZE &&
514 (used*100/size < REDIS_HT_MINFILL));
515 }
516
517 /* If the percentage of used slots in the HT reaches REDIS_HT_MINFILL
518 * we resize the hash table to save memory */
519 void tryResizeHashTables(void) {
520 int j;
521
522 for (j = 0; j < server.dbnum; j++) {
523 if (htNeedsResize(server.db[j].dict))
524 dictResize(server.db[j].dict);
525 if (htNeedsResize(server.db[j].expires))
526 dictResize(server.db[j].expires);
527 }
528 }
529
530 /* Our hash table implementation performs rehashing incrementally while
531 * we write/read from the hash table. Still if the server is idle, the hash
532 * table will use two tables for a long time. So we try to use 1 millisecond
533 * of CPU time at every serverCron() loop in order to rehash some key. */
534 void incrementallyRehash(void) {
535 int j;
536
537 for (j = 0; j < server.dbnum; j++) {
538 if (dictIsRehashing(server.db[j].dict)) {
539 dictRehashMilliseconds(server.db[j].dict,1);
540 break; /* already used our millisecond for this loop... */
541 }
542 }
543 }
544
545 /* This function is called once a background process of some kind terminates,
546 * as we want to avoid resizing the hash tables when there is a child in order
547 * to play well with copy-on-write (otherwise when a resize happens lots of
548 * memory pages are copied). The goal of this function is to update the ability
549 * for dict.c to resize the hash tables accordingly to the fact we have o not
550 * running childs. */
551 void updateDictResizePolicy(void) {
552 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1)
553 dictEnableResize();
554 else
555 dictDisableResize();
556 }
557
558 /* ======================= Cron: called every 100 ms ======================== */
559
560 /* Try to expire a few timed out keys. The algorithm used is adaptive and
561 * will use few CPU cycles if there are few expiring keys, otherwise
562 * it will get more aggressive to avoid that too much memory is used by
563 * keys that can be removed from the keyspace. */
564 void activeExpireCycle(void) {
565 int j;
566
567 for (j = 0; j < server.dbnum; j++) {
568 int expired;
569 redisDb *db = server.db+j;
570
571 /* Continue to expire if at the end of the cycle more than 25%
572 * of the keys were expired. */
573 do {
574 long num = dictSize(db->expires);
575 long long now = mstime();
576
577 expired = 0;
578 if (num > REDIS_EXPIRELOOKUPS_PER_CRON)
579 num = REDIS_EXPIRELOOKUPS_PER_CRON;
580 while (num--) {
581 dictEntry *de;
582 long long t;
583
584 if ((de = dictGetRandomKey(db->expires)) == NULL) break;
585 t = dictGetSignedIntegerVal(de);
586 if (now > t) {
587 sds key = dictGetKey(de);
588 robj *keyobj = createStringObject(key,sdslen(key));
589
590 propagateExpire(db,keyobj);
591 dbDelete(db,keyobj);
592 decrRefCount(keyobj);
593 expired++;
594 server.stat_expiredkeys++;
595 }
596 }
597 } while (expired > REDIS_EXPIRELOOKUPS_PER_CRON/4);
598 }
599 }
600
601 void updateLRUClock(void) {
602 server.lruclock = (time(NULL)/REDIS_LRU_CLOCK_RESOLUTION) &
603 REDIS_LRU_CLOCK_MAX;
604 }
605
606
607 /* Add a sample to the operations per second array of samples. */
608 void trackOperationsPerSecond(void) {
609 long long t = mstime() - server.ops_sec_last_sample_time;
610 long long ops = server.stat_numcommands - server.ops_sec_last_sample_ops;
611 long long ops_sec;
612
613 ops_sec = t > 0 ? (ops*1000/t) : 0;
614
615 server.ops_sec_samples[server.ops_sec_idx] = ops_sec;
616 server.ops_sec_idx = (server.ops_sec_idx+1) % REDIS_OPS_SEC_SAMPLES;
617 server.ops_sec_last_sample_time = mstime();
618 server.ops_sec_last_sample_ops = server.stat_numcommands;
619 }
620
621 /* Return the mean of all the samples. */
622 long long getOperationsPerSecond(void) {
623 int j;
624 long long sum = 0;
625
626 for (j = 0; j < REDIS_OPS_SEC_SAMPLES; j++)
627 sum += server.ops_sec_samples[j];
628 return sum / REDIS_OPS_SEC_SAMPLES;
629 }
630
631 /* Check for timeouts. Returns non-zero if the client was terminated */
632 int clientsCronHandleTimeout(redisClient *c) {
633 time_t now = server.unixtime;
634
635 if (server.maxidletime &&
636 !(c->flags & REDIS_SLAVE) && /* no timeout for slaves */
637 !(c->flags & REDIS_MASTER) && /* no timeout for masters */
638 !(c->flags & REDIS_BLOCKED) && /* no timeout for BLPOP */
639 dictSize(c->pubsub_channels) == 0 && /* no timeout for pubsub */
640 listLength(c->pubsub_patterns) == 0 &&
641 (now - c->lastinteraction > server.maxidletime))
642 {
643 redisLog(REDIS_VERBOSE,"Closing idle client");
644 freeClient(c);
645 return 1;
646 } else if (c->flags & REDIS_BLOCKED) {
647 if (c->bpop.timeout != 0 && c->bpop.timeout < now) {
648 addReply(c,shared.nullmultibulk);
649 unblockClientWaitingData(c);
650 }
651 }
652 return 0;
653 }
654
655 /* The client query buffer is an sds.c string that can end with a lot of
656 * free space not used, this function reclaims space if needed.
657 *
658 * The funciton always returns 0 as it never terminates the client. */
659 int clientsCronResizeQueryBuffer(redisClient *c) {
660 size_t querybuf_size = sdsAllocSize(c->querybuf);
661 time_t idletime = server.unixtime - c->lastinteraction;
662
663 /* There are two conditions to resize the query buffer:
664 * 1) Query buffer is > BIG_ARG and too big for latest peak.
665 * 2) Client is inactive and the buffer is bigger than 1k. */
666 if (((querybuf_size > REDIS_MBULK_BIG_ARG) &&
667 (querybuf_size/(c->querybuf_peak+1)) > 2) ||
668 (querybuf_size > 1024 && idletime > 2))
669 {
670 /* Only resize the query buffer if it is actually wasting space. */
671 if (sdsavail(c->querybuf) > 1024) {
672 c->querybuf = sdsRemoveFreeSpace(c->querybuf);
673 }
674 }
675 /* Reset the peak again to capture the peak memory usage in the next
676 * cycle. */
677 c->querybuf_peak = 0;
678 return 0;
679 }
680
681 void clientsCron(void) {
682 /* Make sure to process at least 1/100 of clients per call.
683 * Since this function is called 10 times per second we are sure that
684 * in the worst case we process all the clients in 10 seconds.
685 * In normal conditions (a reasonable number of clients) we process
686 * all the clients in a shorter time. */
687 int numclients = listLength(server.clients);
688 int iterations = numclients/100;
689
690 if (iterations < 50)
691 iterations = (numclients < 50) ? numclients : 50;
692 while(listLength(server.clients) && iterations--) {
693 redisClient *c;
694 listNode *head;
695
696 /* Rotate the list, take the current head, process.
697 * This way if the client must be removed from the list it's the
698 * first element and we don't incur into O(N) computation. */
699 listRotate(server.clients);
700 head = listFirst(server.clients);
701 c = listNodeValue(head);
702 /* The following functions do different service checks on the client.
703 * The protocol is that they return non-zero if the client was
704 * terminated. */
705 if (clientsCronHandleTimeout(c)) continue;
706 if (clientsCronResizeQueryBuffer(c)) continue;
707 }
708 }
709
710 int serverCron(struct aeEventLoop *eventLoop, long long id, void *clientData) {
711 int j, loops = server.cronloops;
712 REDIS_NOTUSED(eventLoop);
713 REDIS_NOTUSED(id);
714 REDIS_NOTUSED(clientData);
715
716 /* We take a cached value of the unix time in the global state because
717 * with virtual memory and aging there is to store the current time
718 * in objects at every object access, and accuracy is not needed.
719 * To access a global var is faster than calling time(NULL) */
720 server.unixtime = time(NULL);
721
722 trackOperationsPerSecond();
723
724 /* We have just 22 bits per object for LRU information.
725 * So we use an (eventually wrapping) LRU clock with 10 seconds resolution.
726 * 2^22 bits with 10 seconds resoluton is more or less 1.5 years.
727 *
728 * Note that even if this will wrap after 1.5 years it's not a problem,
729 * everything will still work but just some object will appear younger
730 * to Redis. But for this to happen a given object should never be touched
731 * for 1.5 years.
732 *
733 * Note that you can change the resolution altering the
734 * REDIS_LRU_CLOCK_RESOLUTION define.
735 */
736 updateLRUClock();
737
738 /* Record the max memory used since the server was started. */
739 if (zmalloc_used_memory() > server.stat_peak_memory)
740 server.stat_peak_memory = zmalloc_used_memory();
741
742 /* We received a SIGTERM, shutting down here in a safe way, as it is
743 * not ok doing so inside the signal handler. */
744 if (server.shutdown_asap) {
745 if (prepareForShutdown(0) == REDIS_OK) exit(0);
746 redisLog(REDIS_WARNING,"SIGTERM received but errors trying to shut down the server, check the logs for more information");
747 }
748
749 /* Show some info about non-empty databases */
750 for (j = 0; j < server.dbnum; j++) {
751 long long size, used, vkeys;
752
753 size = dictSlots(server.db[j].dict);
754 used = dictSize(server.db[j].dict);
755 vkeys = dictSize(server.db[j].expires);
756 if (!(loops % 50) && (used || vkeys)) {
757 redisLog(REDIS_VERBOSE,"DB %d: %lld keys (%lld volatile) in %lld slots HT.",j,used,vkeys,size);
758 /* dictPrintStats(server.dict); */
759 }
760 }
761
762 /* We don't want to resize the hash tables while a bacground saving
763 * is in progress: the saving child is created using fork() that is
764 * implemented with a copy-on-write semantic in most modern systems, so
765 * if we resize the HT while there is the saving child at work actually
766 * a lot of memory movements in the parent will cause a lot of pages
767 * copied. */
768 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1) {
769 if (!(loops % 10)) tryResizeHashTables();
770 if (server.activerehashing) incrementallyRehash();
771 }
772
773 /* Show information about connected clients */
774 if (!(loops % 50)) {
775 redisLog(REDIS_VERBOSE,"%d clients connected (%d slaves), %zu bytes in use",
776 listLength(server.clients)-listLength(server.slaves),
777 listLength(server.slaves),
778 zmalloc_used_memory());
779 }
780
781 /* We need to do a few operations on clients asynchronously. */
782 clientsCron();
783
784 /* Start a scheduled AOF rewrite if this was requested by the user while
785 * a BGSAVE was in progress. */
786 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1 &&
787 server.aof_rewrite_scheduled)
788 {
789 rewriteAppendOnlyFileBackground();
790 }
791
792 /* Check if a background saving or AOF rewrite in progress terminated. */
793 if (server.rdb_child_pid != -1 || server.aof_child_pid != -1) {
794 int statloc;
795 pid_t pid;
796
797 if ((pid = wait3(&statloc,WNOHANG,NULL)) != 0) {
798 int exitcode = WEXITSTATUS(statloc);
799 int bysignal = 0;
800
801 if (WIFSIGNALED(statloc)) bysignal = WTERMSIG(statloc);
802
803 if (pid == server.rdb_child_pid) {
804 backgroundSaveDoneHandler(exitcode,bysignal);
805 } else {
806 backgroundRewriteDoneHandler(exitcode,bysignal);
807 }
808 updateDictResizePolicy();
809 }
810 } else {
811 time_t now = time(NULL);
812
813 /* If there is not a background saving/rewrite in progress check if
814 * we have to save/rewrite now */
815 for (j = 0; j < server.saveparamslen; j++) {
816 struct saveparam *sp = server.saveparams+j;
817
818 if (server.dirty >= sp->changes &&
819 now-server.lastsave > sp->seconds) {
820 redisLog(REDIS_NOTICE,"%d changes in %d seconds. Saving...",
821 sp->changes, sp->seconds);
822 rdbSaveBackground(server.rdb_filename);
823 break;
824 }
825 }
826
827 /* Trigger an AOF rewrite if needed */
828 if (server.rdb_child_pid == -1 &&
829 server.aof_child_pid == -1 &&
830 server.aof_rewrite_perc &&
831 server.aof_current_size > server.aof_rewrite_min_size)
832 {
833 long long base = server.aof_rewrite_base_size ?
834 server.aof_rewrite_base_size : 1;
835 long long growth = (server.aof_current_size*100/base) - 100;
836 if (growth >= server.aof_rewrite_perc) {
837 redisLog(REDIS_NOTICE,"Starting automatic rewriting of AOF on %lld%% growth",growth);
838 rewriteAppendOnlyFileBackground();
839 }
840 }
841 }
842
843
844 /* If we postponed an AOF buffer flush, let's try to do it every time the
845 * cron function is called. */
846 if (server.aof_flush_postponed_start) flushAppendOnlyFile(0);
847
848 /* Expire a few keys per cycle, only if this is a master.
849 * On slaves we wait for DEL operations synthesized by the master
850 * in order to guarantee a strict consistency. */
851 if (server.masterhost == NULL) activeExpireCycle();
852
853 /* Close clients that need to be closed asynchronous */
854 freeClientsInAsyncFreeQueue();
855
856 /* Replication cron function -- used to reconnect to master and
857 * to detect transfer failures. */
858 if (!(loops % 10)) replicationCron();
859
860 server.cronloops++;
861 return 100;
862 }
863
864 /* This function gets called every time Redis is entering the
865 * main loop of the event driven library, that is, before to sleep
866 * for ready file descriptors. */
867 void beforeSleep(struct aeEventLoop *eventLoop) {
868 REDIS_NOTUSED(eventLoop);
869 listNode *ln;
870 redisClient *c;
871
872 /* Try to process pending commands for clients that were just unblocked. */
873 while (listLength(server.unblocked_clients)) {
874 ln = listFirst(server.unblocked_clients);
875 redisAssert(ln != NULL);
876 c = ln->value;
877 listDelNode(server.unblocked_clients,ln);
878 c->flags &= ~REDIS_UNBLOCKED;
879
880 /* Process remaining data in the input buffer. */
881 if (c->querybuf && sdslen(c->querybuf) > 0) {
882 server.current_client = c;
883 processInputBuffer(c);
884 server.current_client = NULL;
885 }
886 }
887
888 /* Write the AOF buffer on disk */
889 flushAppendOnlyFile(0);
890 }
891
892 /* =========================== Server initialization ======================== */
893
894 void createSharedObjects(void) {
895 int j;
896
897 shared.crlf = createObject(REDIS_STRING,sdsnew("\r\n"));
898 shared.ok = createObject(REDIS_STRING,sdsnew("+OK\r\n"));
899 shared.err = createObject(REDIS_STRING,sdsnew("-ERR\r\n"));
900 shared.emptybulk = createObject(REDIS_STRING,sdsnew("$0\r\n\r\n"));
901 shared.czero = createObject(REDIS_STRING,sdsnew(":0\r\n"));
902 shared.cone = createObject(REDIS_STRING,sdsnew(":1\r\n"));
903 shared.cnegone = createObject(REDIS_STRING,sdsnew(":-1\r\n"));
904 shared.nullbulk = createObject(REDIS_STRING,sdsnew("$-1\r\n"));
905 shared.nullmultibulk = createObject(REDIS_STRING,sdsnew("*-1\r\n"));
906 shared.emptymultibulk = createObject(REDIS_STRING,sdsnew("*0\r\n"));
907 shared.pong = createObject(REDIS_STRING,sdsnew("+PONG\r\n"));
908 shared.queued = createObject(REDIS_STRING,sdsnew("+QUEUED\r\n"));
909 shared.wrongtypeerr = createObject(REDIS_STRING,sdsnew(
910 "-ERR Operation against a key holding the wrong kind of value\r\n"));
911 shared.nokeyerr = createObject(REDIS_STRING,sdsnew(
912 "-ERR no such key\r\n"));
913 shared.syntaxerr = createObject(REDIS_STRING,sdsnew(
914 "-ERR syntax error\r\n"));
915 shared.sameobjecterr = createObject(REDIS_STRING,sdsnew(
916 "-ERR source and destination objects are the same\r\n"));
917 shared.outofrangeerr = createObject(REDIS_STRING,sdsnew(
918 "-ERR index out of range\r\n"));
919 shared.noscripterr = createObject(REDIS_STRING,sdsnew(
920 "-NOSCRIPT No matching script. Please use EVAL.\r\n"));
921 shared.loadingerr = createObject(REDIS_STRING,sdsnew(
922 "-LOADING Redis is loading the dataset in memory\r\n"));
923 shared.slowscripterr = createObject(REDIS_STRING,sdsnew(
924 "-BUSY Redis is busy running a script. You can only call SCRIPT KILL or SHUTDOWN NOSAVE.\r\n"));
925 shared.bgsaveerr = createObject(REDIS_STRING,sdsnew(
926 "-MISCONF Redis is configured to save RDB snapshots, but is currently not able to persist on disk. Commands that may modify the data set are disabled. Please check Redis logs for details about the error.\r\n"));
927 shared.roslaveerr = createObject(REDIS_STRING,sdsnew(
928 "-READONLY You can't write against a read only slave.\r\n"));
929 shared.oomerr = createObject(REDIS_STRING,sdsnew(
930 "-OOM command not allowed when used memory > 'maxmemory'.\r\n"));
931 shared.space = createObject(REDIS_STRING,sdsnew(" "));
932 shared.colon = createObject(REDIS_STRING,sdsnew(":"));
933 shared.plus = createObject(REDIS_STRING,sdsnew("+"));
934 shared.select0 = createStringObject("select 0\r\n",10);
935 shared.select1 = createStringObject("select 1\r\n",10);
936 shared.select2 = createStringObject("select 2\r\n",10);
937 shared.select3 = createStringObject("select 3\r\n",10);
938 shared.select4 = createStringObject("select 4\r\n",10);
939 shared.select5 = createStringObject("select 5\r\n",10);
940 shared.select6 = createStringObject("select 6\r\n",10);
941 shared.select7 = createStringObject("select 7\r\n",10);
942 shared.select8 = createStringObject("select 8\r\n",10);
943 shared.select9 = createStringObject("select 9\r\n",10);
944 shared.messagebulk = createStringObject("$7\r\nmessage\r\n",13);
945 shared.pmessagebulk = createStringObject("$8\r\npmessage\r\n",14);
946 shared.subscribebulk = createStringObject("$9\r\nsubscribe\r\n",15);
947 shared.unsubscribebulk = createStringObject("$11\r\nunsubscribe\r\n",18);
948 shared.psubscribebulk = createStringObject("$10\r\npsubscribe\r\n",17);
949 shared.punsubscribebulk = createStringObject("$12\r\npunsubscribe\r\n",19);
950 shared.del = createStringObject("DEL",3);
951 shared.rpop = createStringObject("RPOP",4);
952 shared.lpop = createStringObject("LPOP",4);
953 for (j = 0; j < REDIS_SHARED_INTEGERS; j++) {
954 shared.integers[j] = createObject(REDIS_STRING,(void*)(long)j);
955 shared.integers[j]->encoding = REDIS_ENCODING_INT;
956 }
957 for (j = 0; j < REDIS_SHARED_BULKHDR_LEN; j++) {
958 shared.mbulkhdr[j] = createObject(REDIS_STRING,
959 sdscatprintf(sdsempty(),"*%d\r\n",j));
960 shared.bulkhdr[j] = createObject(REDIS_STRING,
961 sdscatprintf(sdsempty(),"$%d\r\n",j));
962 }
963 }
964
965 void initServerConfig() {
966 getRandomHexChars(server.runid,REDIS_RUN_ID_SIZE);
967 server.runid[REDIS_RUN_ID_SIZE] = '\0';
968 server.arch_bits = (sizeof(long) == 8) ? 64 : 32;
969 server.port = REDIS_SERVERPORT;
970 server.bindaddr = NULL;
971 server.unixsocket = NULL;
972 server.unixsocketperm = 0;
973 server.ipfd = -1;
974 server.sofd = -1;
975 server.dbnum = REDIS_DEFAULT_DBNUM;
976 server.verbosity = REDIS_NOTICE;
977 server.maxidletime = REDIS_MAXIDLETIME;
978 server.client_max_querybuf_len = REDIS_MAX_QUERYBUF_LEN;
979 server.saveparams = NULL;
980 server.loading = 0;
981 server.logfile = NULL; /* NULL = log on standard output */
982 server.syslog_enabled = 0;
983 server.syslog_ident = zstrdup("redis");
984 server.syslog_facility = LOG_LOCAL0;
985 server.daemonize = 0;
986 server.aof_state = REDIS_AOF_OFF;
987 server.aof_fsync = AOF_FSYNC_EVERYSEC;
988 server.aof_no_fsync_on_rewrite = 0;
989 server.aof_rewrite_perc = REDIS_AOF_REWRITE_PERC;
990 server.aof_rewrite_min_size = REDIS_AOF_REWRITE_MIN_SIZE;
991 server.aof_rewrite_base_size = 0;
992 server.aof_rewrite_scheduled = 0;
993 server.aof_last_fsync = time(NULL);
994 server.aof_delayed_fsync = 0;
995 server.aof_fd = -1;
996 server.aof_selected_db = -1; /* Make sure the first time will not match */
997 server.aof_flush_postponed_start = 0;
998 server.pidfile = zstrdup("/var/run/redis.pid");
999 server.rdb_filename = zstrdup("dump.rdb");
1000 server.aof_filename = zstrdup("appendonly.aof");
1001 server.requirepass = NULL;
1002 server.rdb_compression = 1;
1003 server.activerehashing = 1;
1004 server.maxclients = REDIS_MAX_CLIENTS;
1005 server.bpop_blocked_clients = 0;
1006 server.maxmemory = 0;
1007 server.maxmemory_policy = REDIS_MAXMEMORY_VOLATILE_LRU;
1008 server.maxmemory_samples = 3;
1009 server.hash_max_ziplist_entries = REDIS_HASH_MAX_ZIPLIST_ENTRIES;
1010 server.hash_max_ziplist_value = REDIS_HASH_MAX_ZIPLIST_VALUE;
1011 server.list_max_ziplist_entries = REDIS_LIST_MAX_ZIPLIST_ENTRIES;
1012 server.list_max_ziplist_value = REDIS_LIST_MAX_ZIPLIST_VALUE;
1013 server.set_max_intset_entries = REDIS_SET_MAX_INTSET_ENTRIES;
1014 server.zset_max_ziplist_entries = REDIS_ZSET_MAX_ZIPLIST_ENTRIES;
1015 server.zset_max_ziplist_value = REDIS_ZSET_MAX_ZIPLIST_VALUE;
1016 server.shutdown_asap = 0;
1017 server.repl_ping_slave_period = REDIS_REPL_PING_SLAVE_PERIOD;
1018 server.repl_timeout = REDIS_REPL_TIMEOUT;
1019 server.lua_caller = NULL;
1020 server.lua_time_limit = REDIS_LUA_TIME_LIMIT;
1021 server.lua_client = NULL;
1022 server.lua_timedout = 0;
1023
1024 updateLRUClock();
1025 resetServerSaveParams();
1026
1027 appendServerSaveParams(60*60,1); /* save after 1 hour and 1 change */
1028 appendServerSaveParams(300,100); /* save after 5 minutes and 100 changes */
1029 appendServerSaveParams(60,10000); /* save after 1 minute and 10000 changes */
1030 /* Replication related */
1031 server.masterauth = NULL;
1032 server.masterhost = NULL;
1033 server.masterport = 6379;
1034 server.master = NULL;
1035 server.repl_state = REDIS_REPL_NONE;
1036 server.repl_syncio_timeout = REDIS_REPL_SYNCIO_TIMEOUT;
1037 server.repl_serve_stale_data = 1;
1038 server.repl_slave_ro = 1;
1039 server.repl_down_since = -1;
1040
1041 /* Client output buffer limits */
1042 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].hard_limit_bytes = 0;
1043 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].soft_limit_bytes = 0;
1044 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].soft_limit_seconds = 0;
1045 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].hard_limit_bytes = 1024*1024*256;
1046 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].soft_limit_bytes = 1024*1024*64;
1047 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].soft_limit_seconds = 60;
1048 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].hard_limit_bytes = 1024*1024*32;
1049 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].soft_limit_bytes = 1024*1024*8;
1050 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].soft_limit_seconds = 60;
1051
1052 /* Double constants initialization */
1053 R_Zero = 0.0;
1054 R_PosInf = 1.0/R_Zero;
1055 R_NegInf = -1.0/R_Zero;
1056 R_Nan = R_Zero/R_Zero;
1057
1058 /* Command table -- we intiialize it here as it is part of the
1059 * initial configuration, since command names may be changed via
1060 * redis.conf using the rename-command directive. */
1061 server.commands = dictCreate(&commandTableDictType,NULL);
1062 populateCommandTable();
1063 server.delCommand = lookupCommandByCString("del");
1064 server.multiCommand = lookupCommandByCString("multi");
1065 server.lpushCommand = lookupCommandByCString("lpush");
1066
1067 /* Slow log */
1068 server.slowlog_log_slower_than = REDIS_SLOWLOG_LOG_SLOWER_THAN;
1069 server.slowlog_max_len = REDIS_SLOWLOG_MAX_LEN;
1070
1071 /* Assert */
1072 server.assert_failed = "<no assertion failed>";
1073 server.assert_file = "<no file>";
1074 server.assert_line = 0;
1075 server.bug_report_start = 0;
1076 }
1077
1078 /* This function will try to raise the max number of open files accordingly to
1079 * the configured max number of clients. It will also account for 32 additional
1080 * file descriptors as we need a few more for persistence, listening
1081 * sockets, log files and so forth.
1082 *
1083 * If it will not be possible to set the limit accordingly to the configured
1084 * max number of clients, the function will do the reverse setting
1085 * server.maxclients to the value that we can actually handle. */
1086 void adjustOpenFilesLimit(void) {
1087 rlim_t maxfiles = server.maxclients+32;
1088 struct rlimit limit;
1089
1090 if (maxfiles < 1024) maxfiles = 1024;
1091 if (getrlimit(RLIMIT_NOFILE,&limit) == -1) {
1092 redisLog(REDIS_WARNING,"Unable to obtain the current NOFILE limit (%s), assuming 1024 and setting the max clients configuration accordingly.",
1093 strerror(errno));
1094 server.maxclients = 1024-32;
1095 } else {
1096 rlim_t oldlimit = limit.rlim_cur;
1097
1098 /* Set the max number of files if the current limit is not enough
1099 * for our needs. */
1100 if (oldlimit < maxfiles) {
1101 limit.rlim_cur = maxfiles;
1102 limit.rlim_max = maxfiles;
1103 if (setrlimit(RLIMIT_NOFILE,&limit) == -1) {
1104 server.maxclients = oldlimit-32;
1105 redisLog(REDIS_WARNING,"Unable to set the max number of files limit to %d (%s), setting the max clients configuration to %d.",
1106 (int) maxfiles, strerror(errno), (int) server.maxclients);
1107 } else {
1108 redisLog(REDIS_NOTICE,"Max number of open files set to %d",
1109 (int) maxfiles);
1110 }
1111 }
1112 }
1113 }
1114
1115 void initServer() {
1116 int j;
1117
1118 signal(SIGHUP, SIG_IGN);
1119 signal(SIGPIPE, SIG_IGN);
1120 setupSignalHandlers();
1121
1122 if (server.syslog_enabled) {
1123 openlog(server.syslog_ident, LOG_PID | LOG_NDELAY | LOG_NOWAIT,
1124 server.syslog_facility);
1125 }
1126
1127 server.current_client = NULL;
1128 server.clients = listCreate();
1129 server.clients_to_close = listCreate();
1130 server.slaves = listCreate();
1131 server.monitors = listCreate();
1132 server.unblocked_clients = listCreate();
1133
1134 createSharedObjects();
1135 adjustOpenFilesLimit();
1136 server.el = aeCreateEventLoop(server.maxclients+1024);
1137 server.db = zmalloc(sizeof(redisDb)*server.dbnum);
1138
1139 if (server.port != 0) {
1140 server.ipfd = anetTcpServer(server.neterr,server.port,server.bindaddr);
1141 if (server.ipfd == ANET_ERR) {
1142 redisLog(REDIS_WARNING, "Opening port %d: %s",
1143 server.port, server.neterr);
1144 exit(1);
1145 }
1146 }
1147 if (server.unixsocket != NULL) {
1148 unlink(server.unixsocket); /* don't care if this fails */
1149 server.sofd = anetUnixServer(server.neterr,server.unixsocket,server.unixsocketperm);
1150 if (server.sofd == ANET_ERR) {
1151 redisLog(REDIS_WARNING, "Opening socket: %s", server.neterr);
1152 exit(1);
1153 }
1154 }
1155 if (server.ipfd < 0 && server.sofd < 0) {
1156 redisLog(REDIS_WARNING, "Configured to not listen anywhere, exiting.");
1157 exit(1);
1158 }
1159 for (j = 0; j < server.dbnum; j++) {
1160 server.db[j].dict = dictCreate(&dbDictType,NULL);
1161 server.db[j].expires = dictCreate(&keyptrDictType,NULL);
1162 server.db[j].blocking_keys = dictCreate(&keylistDictType,NULL);
1163 server.db[j].watched_keys = dictCreate(&keylistDictType,NULL);
1164 server.db[j].id = j;
1165 }
1166 server.pubsub_channels = dictCreate(&keylistDictType,NULL);
1167 server.pubsub_patterns = listCreate();
1168 listSetFreeMethod(server.pubsub_patterns,freePubsubPattern);
1169 listSetMatchMethod(server.pubsub_patterns,listMatchPubsubPattern);
1170 server.cronloops = 0;
1171 server.rdb_child_pid = -1;
1172 server.aof_child_pid = -1;
1173 server.aof_rewrite_buf = sdsempty();
1174 server.aof_buf = sdsempty();
1175 server.lastsave = time(NULL);
1176 server.dirty = 0;
1177 server.stat_numcommands = 0;
1178 server.stat_numconnections = 0;
1179 server.stat_expiredkeys = 0;
1180 server.stat_evictedkeys = 0;
1181 server.stat_starttime = time(NULL);
1182 server.stat_keyspace_misses = 0;
1183 server.stat_keyspace_hits = 0;
1184 server.stat_peak_memory = 0;
1185 server.stat_fork_time = 0;
1186 server.stat_rejected_conn = 0;
1187 memset(server.ops_sec_samples,0,sizeof(server.ops_sec_samples));
1188 server.ops_sec_idx = 0;
1189 server.ops_sec_last_sample_time = mstime();
1190 server.ops_sec_last_sample_ops = 0;
1191 server.unixtime = time(NULL);
1192 server.lastbgsave_status = REDIS_OK;
1193 server.stop_writes_on_bgsave_err = 1;
1194 aeCreateTimeEvent(server.el, 1, serverCron, NULL, NULL);
1195 if (server.ipfd > 0 && aeCreateFileEvent(server.el,server.ipfd,AE_READABLE,
1196 acceptTcpHandler,NULL) == AE_ERR) oom("creating file event");
1197 if (server.sofd > 0 && aeCreateFileEvent(server.el,server.sofd,AE_READABLE,
1198 acceptUnixHandler,NULL) == AE_ERR) oom("creating file event");
1199
1200 if (server.aof_state == REDIS_AOF_ON) {
1201 server.aof_fd = open(server.aof_filename,
1202 O_WRONLY|O_APPEND|O_CREAT,0644);
1203 if (server.aof_fd == -1) {
1204 redisLog(REDIS_WARNING, "Can't open the append-only file: %s",
1205 strerror(errno));
1206 exit(1);
1207 }
1208 }
1209
1210 /* 32 bit instances are limited to 4GB of address space, so if there is
1211 * no explicit limit in the user provided configuration we set a limit
1212 * at 3.5GB using maxmemory with 'noeviction' policy'. This saves
1213 * useless crashes of the Redis instance. */
1214 if (server.arch_bits == 32 && server.maxmemory == 0) {
1215 redisLog(REDIS_WARNING,"Warning: 32 bit instance detected but no memory limit set. Setting 3.5 GB maxmemory limit with 'noeviction' policy now.");
1216 server.maxmemory = 3584LL*(1024*1024); /* 3584 MB = 3.5 GB */
1217 server.maxmemory_policy = REDIS_MAXMEMORY_NO_EVICTION;
1218 }
1219
1220 scriptingInit();
1221 slowlogInit();
1222 bioInit();
1223 }
1224
1225 /* Populates the Redis Command Table starting from the hard coded list
1226 * we have on top of redis.c file. */
1227 void populateCommandTable(void) {
1228 int j;
1229 int numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1230
1231 for (j = 0; j < numcommands; j++) {
1232 struct redisCommand *c = redisCommandTable+j;
1233 char *f = c->sflags;
1234 int retval;
1235
1236 while(*f != '\0') {
1237 switch(*f) {
1238 case 'w': c->flags |= REDIS_CMD_WRITE; break;
1239 case 'r': c->flags |= REDIS_CMD_READONLY; break;
1240 case 'm': c->flags |= REDIS_CMD_DENYOOM; break;
1241 case 'a': c->flags |= REDIS_CMD_ADMIN; break;
1242 case 'p': c->flags |= REDIS_CMD_PUBSUB; break;
1243 case 'f': c->flags |= REDIS_CMD_FORCE_REPLICATION; break;
1244 case 's': c->flags |= REDIS_CMD_NOSCRIPT; break;
1245 case 'R': c->flags |= REDIS_CMD_RANDOM; break;
1246 case 'S': c->flags |= REDIS_CMD_SORT_FOR_SCRIPT; break;
1247 default: redisPanic("Unsupported command flag"); break;
1248 }
1249 f++;
1250 }
1251
1252 retval = dictAdd(server.commands, sdsnew(c->name), c);
1253 assert(retval == DICT_OK);
1254 }
1255 }
1256
1257 void resetCommandTableStats(void) {
1258 int numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1259 int j;
1260
1261 for (j = 0; j < numcommands; j++) {
1262 struct redisCommand *c = redisCommandTable+j;
1263
1264 c->microseconds = 0;
1265 c->calls = 0;
1266 }
1267 }
1268
1269 /* ========================== Redis OP Array API ============================ */
1270
1271 void redisOpArrayInit(redisOpArray *oa) {
1272 oa->ops = NULL;
1273 oa->numops = 0;
1274 }
1275
1276 int redisOpArrayAppend(redisOpArray *oa, struct redisCommand *cmd, int dbid,
1277 robj **argv, int argc, int target)
1278 {
1279 redisOp *op;
1280
1281 oa->ops = zrealloc(oa->ops,sizeof(redisOp)*(oa->numops+1));
1282 op = oa->ops+oa->numops;
1283 op->cmd = cmd;
1284 op->dbid = dbid;
1285 op->argv = argv;
1286 op->argc = argc;
1287 op->target = target;
1288 oa->numops++;
1289 return oa->numops;
1290 }
1291
1292 void redisOpArrayFree(redisOpArray *oa) {
1293 while(oa->numops) {
1294 int j;
1295 redisOp *op;
1296
1297 oa->numops--;
1298 op = oa->ops+oa->numops;
1299 for (j = 0; j < op->argc; j++)
1300 decrRefCount(op->argv[j]);
1301 zfree(op->argv);
1302 }
1303 zfree(oa->ops);
1304 }
1305
1306 /* ====================== Commands lookup and execution ===================== */
1307
1308 struct redisCommand *lookupCommand(sds name) {
1309 return dictFetchValue(server.commands, name);
1310 }
1311
1312 struct redisCommand *lookupCommandByCString(char *s) {
1313 struct redisCommand *cmd;
1314 sds name = sdsnew(s);
1315
1316 cmd = dictFetchValue(server.commands, name);
1317 sdsfree(name);
1318 return cmd;
1319 }
1320
1321 /* Propagate the specified command (in the context of the specified database id)
1322 * to AOF, Slaves and Monitors.
1323 *
1324 * flags are an xor between:
1325 * + REDIS_PROPAGATE_NONE (no propagation of command at all)
1326 * + REDIS_PROPAGATE_AOF (propagate into the AOF file if is enabled)
1327 * + REDIS_PROPAGATE_REPL (propagate into the replication link)
1328 */
1329 void propagate(struct redisCommand *cmd, int dbid, robj **argv, int argc,
1330 int flags)
1331 {
1332 if (server.aof_state != REDIS_AOF_OFF && flags & REDIS_PROPAGATE_AOF)
1333 feedAppendOnlyFile(cmd,dbid,argv,argc);
1334 if (flags & REDIS_PROPAGATE_REPL && listLength(server.slaves))
1335 replicationFeedSlaves(server.slaves,dbid,argv,argc);
1336 }
1337
1338 /* Used inside commands to schedule the propagation of additional commands
1339 * after the current command is propagated to AOF / Replication. */
1340 void alsoPropagate(struct redisCommand *cmd, int dbid, robj **argv, int argc,
1341 int target)
1342 {
1343 redisOpArrayAppend(&server.also_propagate,cmd,dbid,argv,argc,target);
1344 }
1345
1346 /* Call() is the core of Redis execution of a command */
1347 void call(redisClient *c, int flags) {
1348 long long dirty, start = ustime(), duration;
1349
1350 /* Sent the command to clients in MONITOR mode, only if the commands are
1351 * not geneated from reading an AOF. */
1352 if (listLength(server.monitors) && !server.loading)
1353 replicationFeedMonitors(c,server.monitors,c->db->id,c->argv,c->argc);
1354
1355 /* Call the command. */
1356 redisOpArrayInit(&server.also_propagate);
1357 dirty = server.dirty;
1358 c->cmd->proc(c);
1359 dirty = server.dirty-dirty;
1360 duration = ustime()-start;
1361
1362 /* When EVAL is called loading the AOF we don't want commands called
1363 * from Lua to go into the slowlog or to populate statistics. */
1364 if (server.loading && c->flags & REDIS_LUA_CLIENT)
1365 flags &= ~(REDIS_CALL_SLOWLOG | REDIS_CALL_STATS);
1366
1367 /* Log the command into the Slow log if needed, and populate the
1368 * per-command statistics that we show in INFO commandstats. */
1369 if (flags & REDIS_CALL_SLOWLOG)
1370 slowlogPushEntryIfNeeded(c->argv,c->argc,duration);
1371 if (flags & REDIS_CALL_STATS) {
1372 c->cmd->microseconds += duration;
1373 c->cmd->calls++;
1374 }
1375
1376 /* Propagate the command into the AOF and replication link */
1377 if (flags & REDIS_CALL_PROPAGATE) {
1378 int flags = REDIS_PROPAGATE_NONE;
1379
1380 if (c->cmd->flags & REDIS_CMD_FORCE_REPLICATION)
1381 flags |= REDIS_PROPAGATE_REPL;
1382 if (dirty)
1383 flags |= (REDIS_PROPAGATE_REPL | REDIS_PROPAGATE_AOF);
1384 if (flags != REDIS_PROPAGATE_NONE)
1385 propagate(c->cmd,c->db->id,c->argv,c->argc,flags);
1386 }
1387 /* Commands such as LPUSH or BRPOPLPUSH may propagate an additional
1388 * PUSH command. */
1389 if (server.also_propagate.numops) {
1390 int j;
1391 redisOp *rop;
1392
1393 for (j = 0; j < server.also_propagate.numops; j++) {
1394 rop = &server.also_propagate.ops[j];
1395 propagate(rop->cmd, rop->dbid, rop->argv, rop->argc, rop->target);
1396 }
1397 redisOpArrayFree(&server.also_propagate);
1398 }
1399 server.stat_numcommands++;
1400 }
1401
1402 /* If this function gets called we already read a whole
1403 * command, argments are in the client argv/argc fields.
1404 * processCommand() execute the command or prepare the
1405 * server for a bulk read from the client.
1406 *
1407 * If 1 is returned the client is still alive and valid and
1408 * and other operations can be performed by the caller. Otherwise
1409 * if 0 is returned the client was destroied (i.e. after QUIT). */
1410 int processCommand(redisClient *c) {
1411 /* The QUIT command is handled separately. Normal command procs will
1412 * go through checking for replication and QUIT will cause trouble
1413 * when FORCE_REPLICATION is enabled and would be implemented in
1414 * a regular command proc. */
1415 if (!strcasecmp(c->argv[0]->ptr,"quit")) {
1416 addReply(c,shared.ok);
1417 c->flags |= REDIS_CLOSE_AFTER_REPLY;
1418 return REDIS_ERR;
1419 }
1420
1421 /* Now lookup the command and check ASAP about trivial error conditions
1422 * such as wrong arity, bad command name and so forth. */
1423 c->cmd = c->lastcmd = lookupCommand(c->argv[0]->ptr);
1424 if (!c->cmd) {
1425 addReplyErrorFormat(c,"unknown command '%s'",
1426 (char*)c->argv[0]->ptr);
1427 return REDIS_OK;
1428 } else if ((c->cmd->arity > 0 && c->cmd->arity != c->argc) ||
1429 (c->argc < -c->cmd->arity)) {
1430 addReplyErrorFormat(c,"wrong number of arguments for '%s' command",
1431 c->cmd->name);
1432 return REDIS_OK;
1433 }
1434
1435 /* Check if the user is authenticated */
1436 if (server.requirepass && !c->authenticated && c->cmd->proc != authCommand)
1437 {
1438 addReplyError(c,"operation not permitted");
1439 return REDIS_OK;
1440 }
1441
1442 /* Handle the maxmemory directive.
1443 *
1444 * First we try to free some memory if possible (if there are volatile
1445 * keys in the dataset). If there are not the only thing we can do
1446 * is returning an error. */
1447 if (server.maxmemory) {
1448 int retval = freeMemoryIfNeeded();
1449 if ((c->cmd->flags & REDIS_CMD_DENYOOM) && retval == REDIS_ERR) {
1450 addReply(c, shared.oomerr);
1451 return REDIS_OK;
1452 }
1453 }
1454
1455 /* Don't accept write commands if there are problems persisting on disk. */
1456 if (server.stop_writes_on_bgsave_err &&
1457 server.saveparamslen > 0
1458 && server.lastbgsave_status == REDIS_ERR &&
1459 c->cmd->flags & REDIS_CMD_WRITE)
1460 {
1461 addReply(c, shared.bgsaveerr);
1462 return REDIS_OK;
1463 }
1464
1465 /* Don't accept wirte commands if this is a read only slave. But
1466 * accept write commands if this is our master. */
1467 if (server.masterhost && server.repl_slave_ro &&
1468 !(c->flags & REDIS_MASTER) &&
1469 c->cmd->flags & REDIS_CMD_WRITE)
1470 {
1471 addReply(c, shared.roslaveerr);
1472 return REDIS_OK;
1473 }
1474
1475 /* Only allow SUBSCRIBE and UNSUBSCRIBE in the context of Pub/Sub */
1476 if ((dictSize(c->pubsub_channels) > 0 || listLength(c->pubsub_patterns) > 0)
1477 &&
1478 c->cmd->proc != subscribeCommand &&
1479 c->cmd->proc != unsubscribeCommand &&
1480 c->cmd->proc != psubscribeCommand &&
1481 c->cmd->proc != punsubscribeCommand) {
1482 addReplyError(c,"only (P)SUBSCRIBE / (P)UNSUBSCRIBE / QUIT allowed in this context");
1483 return REDIS_OK;
1484 }
1485
1486 /* Only allow INFO and SLAVEOF when slave-serve-stale-data is no and
1487 * we are a slave with a broken link with master. */
1488 if (server.masterhost && server.repl_state != REDIS_REPL_CONNECTED &&
1489 server.repl_serve_stale_data == 0 &&
1490 c->cmd->proc != infoCommand && c->cmd->proc != slaveofCommand)
1491 {
1492 addReplyError(c,
1493 "link with MASTER is down and slave-serve-stale-data is set to no");
1494 return REDIS_OK;
1495 }
1496
1497 /* Loading DB? Return an error if the command is not INFO */
1498 if (server.loading && c->cmd->proc != infoCommand) {
1499 addReply(c, shared.loadingerr);
1500 return REDIS_OK;
1501 }
1502
1503 /* Lua script too slow? Only allow SHUTDOWN NOSAVE and SCRIPT KILL. */
1504 if (server.lua_timedout &&
1505 !(c->cmd->proc != shutdownCommand &&
1506 c->argc == 2 &&
1507 tolower(((char*)c->argv[1]->ptr)[0]) == 'n') &&
1508 !(c->cmd->proc == scriptCommand &&
1509 c->argc == 2 &&
1510 tolower(((char*)c->argv[1]->ptr)[0]) == 'k'))
1511 {
1512 addReply(c, shared.slowscripterr);
1513 return REDIS_OK;
1514 }
1515
1516 /* Exec the command */
1517 if (c->flags & REDIS_MULTI &&
1518 c->cmd->proc != execCommand && c->cmd->proc != discardCommand &&
1519 c->cmd->proc != multiCommand && c->cmd->proc != watchCommand)
1520 {
1521 queueMultiCommand(c);
1522 addReply(c,shared.queued);
1523 } else {
1524 call(c,REDIS_CALL_FULL);
1525 }
1526 return REDIS_OK;
1527 }
1528
1529 /*================================== Shutdown =============================== */
1530
1531 int prepareForShutdown(int flags) {
1532 int save = flags & REDIS_SHUTDOWN_SAVE;
1533 int nosave = flags & REDIS_SHUTDOWN_NOSAVE;
1534
1535 redisLog(REDIS_WARNING,"User requested shutdown...");
1536 /* Kill the saving child if there is a background saving in progress.
1537 We want to avoid race conditions, for instance our saving child may
1538 overwrite the synchronous saving did by SHUTDOWN. */
1539 if (server.rdb_child_pid != -1) {
1540 redisLog(REDIS_WARNING,"There is a child saving an .rdb. Killing it!");
1541 kill(server.rdb_child_pid,SIGKILL);
1542 rdbRemoveTempFile(server.rdb_child_pid);
1543 }
1544 if (server.aof_state != REDIS_AOF_OFF) {
1545 /* Kill the AOF saving child as the AOF we already have may be longer
1546 * but contains the full dataset anyway. */
1547 if (server.aof_child_pid != -1) {
1548 redisLog(REDIS_WARNING,
1549 "There is a child rewriting the AOF. Killing it!");
1550 kill(server.aof_child_pid,SIGKILL);
1551 }
1552 /* Append only file: fsync() the AOF and exit */
1553 redisLog(REDIS_NOTICE,"Calling fsync() on the AOF file.");
1554 aof_fsync(server.aof_fd);
1555 }
1556 if ((server.saveparamslen > 0 && !nosave) || save) {
1557 redisLog(REDIS_NOTICE,"Saving the final RDB snapshot before exiting.");
1558 /* Snapshotting. Perform a SYNC SAVE and exit */
1559 if (rdbSave(server.rdb_filename) != REDIS_OK) {
1560 /* Ooops.. error saving! The best we can do is to continue
1561 * operating. Note that if there was a background saving process,
1562 * in the next cron() Redis will be notified that the background
1563 * saving aborted, handling special stuff like slaves pending for
1564 * synchronization... */
1565 redisLog(REDIS_WARNING,"Error trying to save the DB, can't exit.");
1566 return REDIS_ERR;
1567 }
1568 }
1569 if (server.daemonize) {
1570 redisLog(REDIS_NOTICE,"Removing the pid file.");
1571 unlink(server.pidfile);
1572 }
1573 /* Close the listening sockets. Apparently this allows faster restarts. */
1574 if (server.ipfd != -1) close(server.ipfd);
1575 if (server.sofd != -1) close(server.sofd);
1576 if (server.unixsocket) {
1577 redisLog(REDIS_NOTICE,"Removing the unix socket file.");
1578 unlink(server.unixsocket); /* don't care if this fails */
1579 }
1580
1581 redisLog(REDIS_WARNING,"Redis is now ready to exit, bye bye...");
1582 return REDIS_OK;
1583 }
1584
1585 /*================================== Commands =============================== */
1586
1587 void authCommand(redisClient *c) {
1588 if (!server.requirepass) {
1589 addReplyError(c,"Client sent AUTH, but no password is set");
1590 } else if (!strcmp(c->argv[1]->ptr, server.requirepass)) {
1591 c->authenticated = 1;
1592 addReply(c,shared.ok);
1593 } else {
1594 c->authenticated = 0;
1595 addReplyError(c,"invalid password");
1596 }
1597 }
1598
1599 void pingCommand(redisClient *c) {
1600 addReply(c,shared.pong);
1601 }
1602
1603 void echoCommand(redisClient *c) {
1604 addReplyBulk(c,c->argv[1]);
1605 }
1606
1607 void timeCommand(redisClient *c) {
1608 struct timeval tv;
1609
1610 /* gettimeofday() can only fail if &tv is a bad addresss so we
1611 * don't check for errors. */
1612 gettimeofday(&tv,NULL);
1613 addReplyMultiBulkLen(c,2);
1614 addReplyBulkLongLong(c,tv.tv_sec);
1615 addReplyBulkLongLong(c,tv.tv_usec);
1616 }
1617
/* Convert an amount of bytes into a human readable string in the form
 * of 100B, 2G, 100M, 4K, and so forth.
 *
 * 's' is the destination buffer, 'n' the amount of bytes. Amounts below
 * 1024 are printed as an integer followed by 'B'; larger ones are divided
 * by the matching power of 1024 and printed with two decimals followed by
 * K, M, G, T or P. Amounts of 1024 PB or more fall back to the plain byte
 * count, so 's' is always written.
 *
 * No bound is checked on 's': the longest possible output is 21 characters
 * plus the terminator, so the caller must provide at least 22 bytes. */
void bytesToHuman(char *s, unsigned long long n) {
    double d;

    if (n < 1024) {
        /* Bytes */
        sprintf(s,"%lluB",n);
    } else if (n < (1024ULL*1024)) {
        d = (double)n/(1024);
        sprintf(s,"%.2fK",d);
    } else if (n < (1024ULL*1024*1024)) {
        d = (double)n/(1024*1024);
        sprintf(s,"%.2fM",d);
    } else if (n < (1024ULL*1024*1024*1024)) {
        d = (double)n/(1024ULL*1024*1024);
        sprintf(s,"%.2fG",d);
    } else if (n < (1024ULL*1024*1024*1024*1024)) {
        d = (double)n/(1024ULL*1024*1024*1024);
        sprintf(s,"%.2fT",d);
    } else if (n < (1024ULL*1024*1024*1024*1024*1024)) {
        d = (double)n/(1024ULL*1024*1024*1024*1024);
        sprintf(s,"%.2fP",d);
    } else {
        /* Too big for the units above: never leave 's' unwritten. */
        sprintf(s,"%lluB",n);
    }
}
1638
1639 /* Create the string returned by the INFO command. This is decoupled
1640 * by the INFO command itself as we need to report the same information
1641 * on memory corruption problems. */
1642 sds genRedisInfoString(char *section) {
1643 sds info = sdsempty();
1644 time_t uptime = time(NULL)-server.stat_starttime;
1645 int j, numcommands;
1646 struct rusage self_ru, c_ru;
1647 unsigned long lol, bib;
1648 int allsections = 0, defsections = 0;
1649 int sections = 0;
1650
1651 if (section) {
1652 allsections = strcasecmp(section,"all") == 0;
1653 defsections = strcasecmp(section,"default") == 0;
1654 }
1655
1656 getrusage(RUSAGE_SELF, &self_ru);
1657 getrusage(RUSAGE_CHILDREN, &c_ru);
1658 getClientsMaxBuffers(&lol,&bib);
1659
1660 /* Server */
1661 if (allsections || defsections || !strcasecmp(section,"server")) {
1662 if (sections++) info = sdscat(info,"\r\n");
1663 info = sdscatprintf(info,
1664 "# Server\r\n"
1665 "redis_version:%s\r\n"
1666 "redis_git_sha1:%s\r\n"
1667 "redis_git_dirty:%d\r\n"
1668 "arch_bits:%d\r\n"
1669 "multiplexing_api:%s\r\n"
1670 "gcc_version:%d.%d.%d\r\n"
1671 "process_id:%ld\r\n"
1672 "run_id:%s\r\n"
1673 "tcp_port:%d\r\n"
1674 "uptime_in_seconds:%ld\r\n"
1675 "uptime_in_days:%ld\r\n"
1676 "lru_clock:%ld\r\n",
1677 REDIS_VERSION,
1678 redisGitSHA1(),
1679 strtol(redisGitDirty(),NULL,10) > 0,
1680 server.arch_bits,
1681 aeGetApiName(),
1682 #ifdef __GNUC__
1683 __GNUC__,__GNUC_MINOR__,__GNUC_PATCHLEVEL__,
1684 #else
1685 0,0,0,
1686 #endif
1687 (long) getpid(),
1688 server.runid,
1689 server.port,
1690 uptime,
1691 uptime/(3600*24),
1692 (unsigned long) server.lruclock);
1693 }
1694
1695 /* Clients */
1696 if (allsections || defsections || !strcasecmp(section,"clients")) {
1697 if (sections++) info = sdscat(info,"\r\n");
1698 info = sdscatprintf(info,
1699 "# Clients\r\n"
1700 "connected_clients:%lu\r\n"
1701 "client_longest_output_list:%lu\r\n"
1702 "client_biggest_input_buf:%lu\r\n"
1703 "blocked_clients:%d\r\n",
1704 listLength(server.clients)-listLength(server.slaves),
1705 lol, bib,
1706 server.bpop_blocked_clients);
1707 }
1708
1709 /* Memory */
1710 if (allsections || defsections || !strcasecmp(section,"memory")) {
1711 char hmem[64];
1712 char peak_hmem[64];
1713
1714 bytesToHuman(hmem,zmalloc_used_memory());
1715 bytesToHuman(peak_hmem,server.stat_peak_memory);
1716 if (sections++) info = sdscat(info,"\r\n");
1717 info = sdscatprintf(info,
1718 "# Memory\r\n"
1719 "used_memory:%zu\r\n"
1720 "used_memory_human:%s\r\n"
1721 "used_memory_rss:%zu\r\n"
1722 "used_memory_peak:%zu\r\n"
1723 "used_memory_peak_human:%s\r\n"
1724 "used_memory_lua:%lld\r\n"
1725 "mem_fragmentation_ratio:%.2f\r\n"
1726 "mem_allocator:%s\r\n",
1727 zmalloc_used_memory(),
1728 hmem,
1729 zmalloc_get_rss(),
1730 server.stat_peak_memory,
1731 peak_hmem,
1732 ((long long)lua_gc(server.lua,LUA_GCCOUNT,0))*1024LL,
1733 zmalloc_get_fragmentation_ratio(),
1734 ZMALLOC_LIB
1735 );
1736 }
1737
1738 /* Persistence */
1739 if (allsections || defsections || !strcasecmp(section,"persistence")) {
1740 if (sections++) info = sdscat(info,"\r\n");
1741 info = sdscatprintf(info,
1742 "# Persistence\r\n"
1743 "loading:%d\r\n"
1744 "aof_enabled:%d\r\n"
1745 "changes_since_last_save:%lld\r\n"
1746 "bgsave_in_progress:%d\r\n"
1747 "last_save_time:%ld\r\n"
1748 "last_bgsave_status:%s\r\n"
1749 "bgrewriteaof_in_progress:%d\r\n",
1750 server.loading,
1751 server.aof_state != REDIS_AOF_OFF,
1752 server.dirty,
1753 server.rdb_child_pid != -1,
1754 server.lastsave,
1755 server.lastbgsave_status == REDIS_OK ? "ok" : "err",
1756 server.aof_child_pid != -1);
1757
1758 if (server.aof_state != REDIS_AOF_OFF) {
1759 info = sdscatprintf(info,
1760 "aof_current_size:%lld\r\n"
1761 "aof_base_size:%lld\r\n"
1762 "aof_pending_rewrite:%d\r\n"
1763 "aof_buffer_length:%zu\r\n"
1764 "aof_pending_bio_fsync:%llu\r\n"
1765 "aof_delayed_fsync:%lu\r\n",
1766 (long long) server.aof_current_size,
1767 (long long) server.aof_rewrite_base_size,
1768 server.aof_rewrite_scheduled,
1769 sdslen(server.aof_buf),
1770 bioPendingJobsOfType(REDIS_BIO_AOF_FSYNC),
1771 server.aof_delayed_fsync);
1772 }
1773
1774 if (server.loading) {
1775 double perc;
1776 time_t eta, elapsed;
1777 off_t remaining_bytes = server.loading_total_bytes-
1778 server.loading_loaded_bytes;
1779
1780 perc = ((double)server.loading_loaded_bytes /
1781 server.loading_total_bytes) * 100;
1782
1783 elapsed = time(NULL)-server.loading_start_time;
1784 if (elapsed == 0) {
1785 eta = 1; /* A fake 1 second figure if we don't have
1786 enough info */
1787 } else {
1788 eta = (elapsed*remaining_bytes)/server.loading_loaded_bytes;
1789 }
1790
1791 info = sdscatprintf(info,
1792 "loading_start_time:%ld\r\n"
1793 "loading_total_bytes:%llu\r\n"
1794 "loading_loaded_bytes:%llu\r\n"
1795 "loading_loaded_perc:%.2f\r\n"
1796 "loading_eta_seconds:%ld\r\n"
1797 ,(unsigned long) server.loading_start_time,
1798 (unsigned long long) server.loading_total_bytes,
1799 (unsigned long long) server.loading_loaded_bytes,
1800 perc,
1801 eta
1802 );
1803 }
1804 }
1805
1806 /* Stats */
1807 if (allsections || defsections || !strcasecmp(section,"stats")) {
1808 if (sections++) info = sdscat(info,"\r\n");
1809 info = sdscatprintf(info,
1810 "# Stats\r\n"
1811 "total_connections_received:%lld\r\n"
1812 "total_commands_processed:%lld\r\n"
1813 "instantaneous_ops_per_sec:%lld\r\n"
1814 "rejected_connections:%lld\r\n"
1815 "expired_keys:%lld\r\n"
1816 "evicted_keys:%lld\r\n"
1817 "keyspace_hits:%lld\r\n"
1818 "keyspace_misses:%lld\r\n"
1819 "pubsub_channels:%ld\r\n"
1820 "pubsub_patterns:%lu\r\n"
1821 "latest_fork_usec:%lld\r\n",
1822 server.stat_numconnections,
1823 server.stat_numcommands,
1824 getOperationsPerSecond(),
1825 server.stat_rejected_conn,
1826 server.stat_expiredkeys,
1827 server.stat_evictedkeys,
1828 server.stat_keyspace_hits,
1829 server.stat_keyspace_misses,
1830 dictSize(server.pubsub_channels),
1831 listLength(server.pubsub_patterns),
1832 server.stat_fork_time);
1833 }
1834
1835 /* Replication */
1836 if (allsections || defsections || !strcasecmp(section,"replication")) {
1837 if (sections++) info = sdscat(info,"\r\n");
1838 info = sdscatprintf(info,
1839 "# Replication\r\n"
1840 "role:%s\r\n",
1841 server.masterhost == NULL ? "master" : "slave");
1842 if (server.masterhost) {
1843 info = sdscatprintf(info,
1844 "master_host:%s\r\n"
1845 "master_port:%d\r\n"
1846 "master_link_status:%s\r\n"
1847 "master_last_io_seconds_ago:%d\r\n"
1848 "master_sync_in_progress:%d\r\n"
1849 ,server.masterhost,
1850 server.masterport,
1851 (server.repl_state == REDIS_REPL_CONNECTED) ?
1852 "up" : "down",
1853 server.master ?
1854 ((int)(time(NULL)-server.master->lastinteraction)) : -1,
1855 server.repl_state == REDIS_REPL_TRANSFER
1856 );
1857
1858 if (server.repl_state == REDIS_REPL_TRANSFER) {
1859 info = sdscatprintf(info,
1860 "master_sync_left_bytes:%ld\r\n"
1861 "master_sync_last_io_seconds_ago:%d\r\n"
1862 ,(long)server.repl_transfer_left,
1863 (int)(time(NULL)-server.repl_transfer_lastio)
1864 );
1865 }
1866
1867 if (server.repl_state != REDIS_REPL_CONNECTED) {
1868 info = sdscatprintf(info,
1869 "master_link_down_since_seconds:%ld\r\n",
1870 (long)time(NULL)-server.repl_down_since);
1871 }
1872 }
1873 info = sdscatprintf(info,
1874 "connected_slaves:%lu\r\n",
1875 listLength(server.slaves));
1876 if (listLength(server.slaves)) {
1877 int slaveid = 0;
1878 listNode *ln;
1879 listIter li;
1880
1881 listRewind(server.slaves,&li);
1882 while((ln = listNext(&li))) {
1883 redisClient *slave = listNodeValue(ln);
1884 char *state = NULL;
1885 char ip[32];
1886 int port;
1887
1888 if (anetPeerToString(slave->fd,ip,&port) == -1) continue;
1889 switch(slave->replstate) {
1890 case REDIS_REPL_WAIT_BGSAVE_START:
1891 case REDIS_REPL_WAIT_BGSAVE_END:
1892 state = "wait_bgsave";
1893 break;
1894 case REDIS_REPL_SEND_BULK:
1895 state = "send_bulk";
1896 break;
1897 case REDIS_REPL_ONLINE:
1898 state = "online";
1899 break;
1900 }
1901 if (state == NULL) continue;
1902 info = sdscatprintf(info,"slave%d:%s,%d,%s\r\n",
1903 slaveid,ip,port,state);
1904 slaveid++;
1905 }
1906 }
1907 }
1908
1909 /* CPU */
1910 if (allsections || defsections || !strcasecmp(section,"cpu")) {
1911 if (sections++) info = sdscat(info,"\r\n");
1912 info = sdscatprintf(info,
1913 "# CPU\r\n"
1914 "used_cpu_sys:%.2f\r\n"
1915 "used_cpu_user:%.2f\r\n"
1916 "used_cpu_sys_children:%.2f\r\n"
1917 "used_cpu_user_children:%.2f\r\n",
1918 (float)self_ru.ru_stime.tv_sec+(float)self_ru.ru_stime.tv_usec/1000000,
1919 (float)self_ru.ru_utime.tv_sec+(float)self_ru.ru_utime.tv_usec/1000000,
1920 (float)c_ru.ru_stime.tv_sec+(float)c_ru.ru_stime.tv_usec/1000000,
1921 (float)c_ru.ru_utime.tv_sec+(float)c_ru.ru_utime.tv_usec/1000000);
1922 }
1923
1924 /* cmdtime */
1925 if (allsections || !strcasecmp(section,"commandstats")) {
1926 if (sections++) info = sdscat(info,"\r\n");
1927 info = sdscatprintf(info, "# Commandstats\r\n");
1928 numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1929 for (j = 0; j < numcommands; j++) {
1930 struct redisCommand *c = redisCommandTable+j;
1931
1932 if (!c->calls) continue;
1933 info = sdscatprintf(info,
1934 "cmdstat_%s:calls=%lld,usec=%lld,usec_per_call=%.2f\r\n",
1935 c->name, c->calls, c->microseconds,
1936 (c->calls == 0) ? 0 : ((float)c->microseconds/c->calls));
1937 }
1938 }
1939
1940 /* Key space */
1941 if (allsections || defsections || !strcasecmp(section,"keyspace")) {
1942 if (sections++) info = sdscat(info,"\r\n");
1943 info = sdscatprintf(info, "# Keyspace\r\n");
1944 for (j = 0; j < server.dbnum; j++) {
1945 long long keys, vkeys;
1946
1947 keys = dictSize(server.db[j].dict);
1948 vkeys = dictSize(server.db[j].expires);
1949 if (keys || vkeys) {
1950 info = sdscatprintf(info, "db%d:keys=%lld,expires=%lld\r\n",
1951 j, keys, vkeys);
1952 }
1953 }
1954 }
1955 return info;
1956 }
1957
1958 void infoCommand(redisClient *c) {
1959 char *section = c->argc == 2 ? c->argv[1]->ptr : "default";
1960
1961 if (c->argc > 2) {
1962 addReply(c,shared.syntaxerr);
1963 return;
1964 }
1965 sds info = genRedisInfoString(section);
1966 addReplySds(c,sdscatprintf(sdsempty(),"$%lu\r\n",
1967 (unsigned long)sdslen(info)));
1968 addReplySds(c,info);
1969 addReply(c,shared.crlf);
1970 }
1971
1972 void monitorCommand(redisClient *c) {
1973 /* ignore MONITOR if aleady slave or in monitor mode */
1974 if (c->flags & REDIS_SLAVE) return;
1975
1976 c->flags |= (REDIS_SLAVE|REDIS_MONITOR);
1977 c->slaveseldb = 0;
1978 listAddNodeTail(server.monitors,c);
1979 addReply(c,shared.ok);
1980 }
1981
1982 /* ============================ Maxmemory directive ======================== */
1983
1984 /* This function gets called when 'maxmemory' is set on the config file to limit
1985 * the max memory used by the server, before processing a command.
1986 *
1987 * The goal of the function is to free enough memory to keep Redis under the
1988 * configured memory limit.
1989 *
1990 * The function starts calculating how many bytes should be freed to keep
1991 * Redis under the limit, and enters a loop selecting the best keys to
1992 * evict accordingly to the configured policy.
1993 *
1994 * If all the bytes needed to return back under the limit were freed the
1995 * function returns REDIS_OK, otherwise REDIS_ERR is returned, and the caller
1996 * should block the execution of commands that will result in more memory
1997 * used by the server.
1998 */
1999 int freeMemoryIfNeeded(void) {
2000 size_t mem_used, mem_tofree, mem_freed;
2001 int slaves = listLength(server.slaves);
2002
2003 /* Remove the size of slaves output buffers and AOF buffer from the
2004 * count of used memory. */
2005 mem_used = zmalloc_used_memory();
2006 if (slaves) {
2007 listIter li;
2008 listNode *ln;
2009
2010 listRewind(server.slaves,&li);
2011 while((ln = listNext(&li))) {
2012 redisClient *slave = listNodeValue(ln);
2013 unsigned long obuf_bytes = getClientOutputBufferMemoryUsage(slave);
2014 if (obuf_bytes > mem_used)
2015 mem_used = 0;
2016 else
2017 mem_used -= obuf_bytes;
2018 }
2019 }
2020 if (server.aof_state != REDIS_AOF_OFF) {
2021 mem_used -= sdslen(server.aof_buf);
2022 mem_used -= sdslen(server.aof_rewrite_buf);
2023 }
2024
2025 /* Check if we are over the memory limit. */
2026 if (mem_used <= server.maxmemory) return REDIS_OK;
2027
2028 if (server.maxmemory_policy == REDIS_MAXMEMORY_NO_EVICTION)
2029 return REDIS_ERR; /* We need to free memory, but policy forbids. */
2030
2031 /* Compute how much memory we need to free. */
2032 mem_tofree = mem_used - server.maxmemory;
2033 mem_freed = 0;
2034 while (mem_freed < mem_tofree) {
2035 int j, k, keys_freed = 0;
2036
2037 for (j = 0; j < server.dbnum; j++) {
2038 long bestval = 0; /* just to prevent warning */
2039 sds bestkey = NULL;
2040 struct dictEntry *de;
2041 redisDb *db = server.db+j;
2042 dict *dict;
2043
2044 if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_LRU ||
2045 server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_RANDOM)
2046 {
2047 dict = server.db[j].dict;
2048 } else {
2049 dict = server.db[j].expires;
2050 }
2051 if (dictSize(dict) == 0) continue;
2052
2053 /* volatile-random and allkeys-random policy */
2054 if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_RANDOM ||
2055 server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_RANDOM)
2056 {
2057 de = dictGetRandomKey(dict);
2058 bestkey = dictGetKey(de);
2059 }
2060
2061 /* volatile-lru and allkeys-lru policy */
2062 else if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_LRU ||
2063 server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_LRU)
2064 {
2065 for (k = 0; k < server.maxmemory_samples; k++) {
2066 sds thiskey;
2067 long thisval;
2068 robj *o;
2069
2070 de = dictGetRandomKey(dict);
2071 thiskey = dictGetKey(de);
2072 /* When policy is volatile-lru we need an additonal lookup
2073 * to locate the real key, as dict is set to db->expires. */
2074 if (server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_LRU)
2075 de = dictFind(db->dict, thiskey);
2076 o = dictGetVal(de);
2077 thisval = estimateObjectIdleTime(o);
2078
2079 /* Higher idle time is better candidate for deletion */
2080 if (bestkey == NULL || thisval > bestval) {
2081 bestkey = thiskey;
2082 bestval = thisval;
2083 }
2084 }
2085 }
2086
2087 /* volatile-ttl */
2088 else if (server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_TTL) {
2089 for (k = 0; k < server.maxmemory_samples; k++) {
2090 sds thiskey;
2091 long thisval;
2092
2093 de = dictGetRandomKey(dict);
2094 thiskey = dictGetKey(de);
2095 thisval = (long) dictGetVal(de);
2096
2097 /* Expire sooner (minor expire unix timestamp) is better
2098 * candidate for deletion */
2099 if (bestkey == NULL || thisval < bestval) {
2100 bestkey = thiskey;
2101 bestval = thisval;
2102 }
2103 }
2104 }
2105
2106 /* Finally remove the selected key. */
2107 if (bestkey) {
2108 long long delta;
2109
2110 robj *keyobj = createStringObject(bestkey,sdslen(bestkey));
2111 propagateExpire(db,keyobj);
2112 /* We compute the amount of memory freed by dbDelete() alone.
2113 * It is possible that actually the memory needed to propagate
2114 * the DEL in AOF and replication link is greater than the one
2115 * we are freeing removing the key, but we can't account for
2116 * that otherwise we would never exit the loop.
2117 *
2118 * AOF and Output buffer memory will be freed eventually so
2119 * we only care about memory used by the key space. */
2120 delta = (long long) zmalloc_used_memory();
2121 dbDelete(db,keyobj);
2122 delta -= (long long) zmalloc_used_memory();
2123 mem_freed += delta;
2124 server.stat_evictedkeys++;
2125 decrRefCount(keyobj);
2126 keys_freed++;
2127
2128 /* When the memory to free starts to be big enough, we may
2129 * start spending so much time here that is impossible to
2130 * deliver data to the slaves fast enough, so we force the
2131 * transmission here inside the loop. */
2132 if (slaves) flushSlavesOutputBuffers();
2133 }
2134 }
2135 if (!keys_freed) return REDIS_ERR; /* nothing to free... */
2136 }
2137 return REDIS_OK;
2138 }
2139
2140 /* =================================== Main! ================================ */
2141
2142 #ifdef __linux__
/* Read /proc/sys/vm/overcommit_memory and return its content converted
 * with atoi(). Returns -1 when the file can't be opened or no line can be
 * read from it. */
int linuxOvercommitMemoryValue(void) {
    char line[64];
    int value = -1;
    FILE *fp = fopen("/proc/sys/vm/overcommit_memory","r");

    if (fp == NULL) return -1;

    if (fgets(line,sizeof(line),fp) != NULL)
        value = atoi(line);
    fclose(fp);

    return value;
}
2156
2157 void linuxOvercommitMemoryWarning(void) {
2158 if (linuxOvercommitMemoryValue() == 0) {
2159 redisLog(REDIS_WARNING,"WARNING overcommit_memory is set to 0! Background save may fail under low memory condition. To fix this issue add 'vm.overcommit_memory = 1' to /etc/sysctl.conf and then reboot or run the command 'sysctl vm.overcommit_memory=1' for this to take effect.");
2160 }
2161 }
2162 #endif /* __linux__ */
2163
2164 void createPidFile(void) {
2165 /* Try to write the pid file in a best-effort way. */
2166 FILE *fp = fopen(server.pidfile,"w");
2167 if (fp) {
2168 fprintf(fp,"%d\n",(int)getpid());
2169 fclose(fp);
2170 }
2171 }
2172
/* Detach the process from the invoking terminal: fork, let the parent
 * exit, start a new session in the child and redirect the standard
 * streams to /dev/null.
 *
 * If fork() fails the error is reported on stderr and the process exits
 * with status 1, instead of exiting with success while no daemon is
 * actually running. */
void daemonize(void) {
    int fd;
    pid_t pid = fork();

    if (pid == -1) {
        /* No child was created: exiting with 0 here would look like a
         * successful daemonization to whoever started us. */
        perror("Can't fork to daemonize");
        exit(1);
    }
    if (pid != 0) exit(0); /* parent exits */
    setsid(); /* create a new session */

    /* Every output goes to /dev/null. If Redis is daemonized but
     * the 'logfile' is set to 'stdout' in the configuration file
     * it will not log at all. */
    if ((fd = open("/dev/null", O_RDWR, 0)) != -1) {
        dup2(fd, STDIN_FILENO);
        dup2(fd, STDOUT_FILENO);
        dup2(fd, STDERR_FILENO);
        /* Don't close the descriptor if it is one of the standard ones. */
        if (fd > STDERR_FILENO) close(fd);
    }
}
2189
2190 void version() {
2191 printf("Redis server v=%s sha=%s:%d malloc=%s\n", REDIS_VERSION,
2192 redisGitSHA1(), atoi(redisGitDirty()) > 0, ZMALLOC_LIB);
2193 exit(0);
2194 }
2195
/* Print the command line help on stderr and terminate the process with
 * status 1. */
void usage() {
    static const char *lines[] = {
        "Usage: ./redis-server [/path/to/redis.conf] [options]\n",
        " ./redis-server - (read config from stdin)\n",
        " ./redis-server -v or --version\n",
        " ./redis-server -h or --help\n",
        " ./redis-server --test-memory <megabytes>\n\n",
        "Examples:\n",
        " ./redis-server (run the server with default conf)\n",
        " ./redis-server /etc/redis/6379.conf\n",
        " ./redis-server --port 7777\n",
        " ./redis-server --port 7777 --slaveof 127.0.0.1 8888\n",
        " ./redis-server /etc/myredis.conf --loglevel verbose\n"
    };
    size_t i;

    /* None of the lines contains a conversion specifier, so writing them
     * verbatim produces the same bytes as formatting them would. */
    for (i = 0; i < sizeof(lines)/sizeof(lines[0]); i++)
        fputs(lines[i],stderr);
    exit(1);
}
2210
2211 void redisAsciiArt(void) {
2212 #include "asciilogo.h"
2213 char *buf = zmalloc(1024*16);
2214
2215 snprintf(buf,1024*16,ascii_logo,
2216 REDIS_VERSION,
2217 redisGitSHA1(),
2218 strtol(redisGitDirty(),NULL,10) > 0,
2219 (sizeof(long) == 8) ? "64" : "32",
2220 "stand alone",
2221 server.port,
2222 (long) getpid()
2223 );
2224 redisLogRaw(REDIS_NOTICE|REDIS_LOG_RAW,buf);
2225 zfree(buf);
2226 }
2227
2228 static void sigtermHandler(int sig) {
2229 REDIS_NOTUSED(sig);
2230
2231 redisLog(REDIS_WARNING,"Received SIGTERM, scheduling shutdown...");
2232 server.shutdown_asap = 1;
2233 }
2234
2235 void setupSignalHandlers(void) {
2236 struct sigaction act;
2237
2238 /* When the SA_SIGINFO flag is set in sa_flags then sa_sigaction is used.
2239 * Otherwise, sa_handler is used. */
2240 sigemptyset(&act.sa_mask);
2241 act.sa_flags = SA_NODEFER | SA_ONSTACK | SA_RESETHAND;
2242 act.sa_handler = sigtermHandler;
2243 sigaction(SIGTERM, &act, NULL);
2244
2245 #ifdef HAVE_BACKTRACE
2246 sigemptyset(&act.sa_mask);
2247 act.sa_flags = SA_NODEFER | SA_ONSTACK | SA_RESETHAND | SA_SIGINFO;
2248 act.sa_sigaction = sigsegvHandler;
2249 sigaction(SIGSEGV, &act, NULL);
2250 sigaction(SIGBUS, &act, NULL);
2251 sigaction(SIGFPE, &act, NULL);
2252 sigaction(SIGILL, &act, NULL);
2253 #endif
2254 return;
2255 }
2256
2257 void memtest(size_t megabytes, int passes);
2258
2259 int main(int argc, char **argv) {
2260 long long start;
2261 struct timeval tv;
2262
2263 /* We need to initialize our libraries, and the server configuration. */
2264 zmalloc_enable_thread_safeness();
2265 srand(time(NULL)^getpid());
2266 gettimeofday(&tv,NULL);
2267 dictSetHashFunctionSeed(tv.tv_sec^tv.tv_usec^getpid());
2268 initServerConfig();
2269
2270 if (argc >= 2) {
2271 int j = 1; /* First option to parse in argv[] */
2272 sds options = sdsempty();
2273 char *configfile = NULL;
2274
2275 /* Handle special options --help and --version */
2276 if (strcmp(argv[1], "-v") == 0 ||
2277 strcmp(argv[1], "--version") == 0) version();
2278 if (strcmp(argv[1], "--help") == 0 ||
2279 strcmp(argv[1], "-h") == 0) usage();
2280 if (strcmp(argv[1], "--test-memory") == 0) {
2281 if (argc == 3) {
2282 memtest(atoi(argv[2]),50);
2283 exit(0);
2284 } else {
2285 fprintf(stderr,"Please specify the amount of memory to test in megabytes.\n");
2286 fprintf(stderr,"Example: ./redis-server --test-memory 4096\n\n");
2287 exit(1);
2288 }
2289 }
2290
2291 /* First argument is the config file name? */
2292 if (argv[j][0] != '-' || argv[j][1] != '-')
2293 configfile = argv[j++];
2294 /* All the other options are parsed and conceptually appended to the
2295 * configuration file. For instance --port 6380 will generate the
2296 * string "port 6380\n" to be parsed after the actual file name
2297 * is parsed, if any. */
2298 while(j != argc) {
2299 if (argv[j][0] == '-' && argv[j][1] == '-') {
2300 /* Option name */
2301 if (sdslen(options)) options = sdscat(options,"\n");
2302 options = sdscat(options,argv[j]+2);
2303 options = sdscat(options," ");
2304 } else {
2305 /* Option argument */
2306 options = sdscatrepr(options,argv[j],strlen(argv[j]));
2307 options = sdscat(options," ");
2308 }
2309 j++;
2310 }
2311 resetServerSaveParams();
2312 loadServerConfig(configfile,options);
2313 sdsfree(options);
2314 } else {
2315 redisLog(REDIS_WARNING,"Warning: no config file specified, using the default config. In order to specify a config file use 'redis-server /path/to/redis.conf'");
2316 }
2317 if (server.daemonize) daemonize();
2318 initServer();
2319 if (server.daemonize) createPidFile();
2320 redisAsciiArt();
2321 redisLog(REDIS_WARNING,"Server started, Redis version " REDIS_VERSION);
2322 #ifdef __linux__
2323 linuxOvercommitMemoryWarning();
2324 #endif
2325 start = ustime();
2326 if (server.aof_state == REDIS_AOF_ON) {
2327 if (loadAppendOnlyFile(server.aof_filename) == REDIS_OK)
2328 redisLog(REDIS_NOTICE,"DB loaded from append only file: %.3f seconds",(float)(ustime()-start)/1000000);
2329 } else {
2330 if (rdbLoad(server.rdb_filename) == REDIS_OK) {
2331 redisLog(REDIS_NOTICE,"DB loaded from disk: %.3f seconds",
2332 (float)(ustime()-start)/1000000);
2333 } else if (errno != ENOENT) {
2334 redisLog(REDIS_WARNING,"Fatal error loading the DB. Exiting.");
2335 exit(1);
2336 }
2337 }
2338 if (server.ipfd > 0)
2339 redisLog(REDIS_NOTICE,"The server is now ready to accept connections on port %d", server.port);
2340 if (server.sofd > 0)
2341 redisLog(REDIS_NOTICE,"The server is now ready to accept connections at %s", server.unixsocket);
2342 aeSetBeforeSleepProc(server.el,beforeSleep);
2343 aeMain(server.el);
2344 aeDeleteEventLoop(server.el);
2345 return 0;
2346 }
2347
2348 /* The End */