]> git.saurik.com Git - redis.git/blob - src/redis.c
SLAVEOF is not a write command.
[redis.git] / src / redis.c
1 /*
2 * Copyright (c) 2009-2010, Salvatore Sanfilippo <antirez at gmail dot com>
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are met:
7 *
8 * * Redistributions of source code must retain the above copyright notice,
9 * this list of conditions and the following disclaimer.
10 * * Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
13 * * Neither the name of Redis nor the names of its contributors may be used
14 * to endorse or promote products derived from this software without
15 * specific prior written permission.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
18 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
21 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
22 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
23 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
24 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
25 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
26 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
27 * POSSIBILITY OF SUCH DAMAGE.
28 */
29
30 #include "redis.h"
31 #include "slowlog.h"
32 #include "bio.h"
33
34 #include <time.h>
35 #include <signal.h>
36 #include <sys/wait.h>
37 #include <errno.h>
38 #include <assert.h>
39 #include <ctype.h>
40 #include <stdarg.h>
41 #include <arpa/inet.h>
42 #include <sys/stat.h>
43 #include <fcntl.h>
44 #include <sys/time.h>
45 #include <sys/resource.h>
46 #include <sys/uio.h>
47 #include <limits.h>
48 #include <float.h>
49 #include <math.h>
50 #include <sys/resource.h>
51
/* Our shared "common" objects */

/* Single instance of the shared objects container. Its members are declared
 * with struct sharedObjectsStruct, outside this part of the file. */
struct sharedObjectsStruct shared;

/* Global vars that are actually used as constants. The following double
 * values are used for double on-disk serialization, and are initialized
 * at runtime to avoid strange compiler optimizations. */

double R_Zero, R_PosInf, R_NegInf, R_Nan;

/*================================= Globals ================================= */

/* Global vars */
struct redisServer server; /* server global state */
/* Pointer to command entries.
 * NOTE(review): presumably set to redisCommandTable at startup -- confirm
 * where it is assigned. */
struct redisCommand *commandTable;
67
68 /* Our command table.
69 *
70 * Every entry is composed of the following fields:
71 *
72 * name: a string representing the command name.
73 * function: pointer to the C function implementing the command.
74 * arity: number of arguments, it is possible to use -N to say >= N
75 * sflags: command flags as string. See below for a table of flags.
76 * flags: flags as bitmask. Computed by Redis using the 'sflags' field.
77 * get_keys_proc: an optional function to get key arguments from a command.
78 * This is only used when the following three fields are not
79 * enough to specify what arguments are keys.
80 * first_key_index: first argument that is a key
81 * last_key_index: last argument that is a key
82 * key_step: step to get all the keys from first to last argument. For instance
83 * in MSET the step is two since arguments are key,val,key,val,...
84 * microseconds: microseconds of total execution time for this command.
85 * calls: total number of calls of this command.
86 *
87 * The flags, microseconds and calls fields are computed by Redis and should
88 * always be set to zero.
89 *
90 * Command flags are expressed using strings where every character represents
91 * a flag. Later the populateCommandTable() function will take care of
92 * populating the real 'flags' field using this characters.
93 *
94 * This is the meaning of the flags:
95 *
96 * w: write command (may modify the key space).
97 * r: read command (will never modify the key space).
98 * m: may increase memory usage once called. Don't allow if out of memory.
99 * a: admin command, like SAVE or SHUTDOWN.
100 * p: Pub/Sub related command.
101 * f: force replication of this command, regardless of server.dirty.
102 * s: command not allowed in scripts.
103 * R: random command. Command is not deterministic, that is, the same command
104 * with the same arguments, with the same key space, may have different
105 * results. For instance SPOP and RANDOMKEY are two random commands.
106 * S: Sort command output array if called from script, so that the output
107 * is deterministic.
108 */
109 struct redisCommand redisCommandTable[] = {
110 {"get",getCommand,2,"r",0,NULL,1,1,1,0,0},
111 {"set",setCommand,3,"wm",0,noPreloadGetKeys,1,1,1,0,0},
112 {"setnx",setnxCommand,3,"wm",0,noPreloadGetKeys,1,1,1,0,0},
113 {"setex",setexCommand,4,"wm",0,noPreloadGetKeys,1,1,1,0,0},
114 {"psetex",psetexCommand,4,"wm",0,noPreloadGetKeys,1,1,1,0,0},
115 {"append",appendCommand,3,"wm",0,NULL,1,1,1,0,0},
116 {"strlen",strlenCommand,2,"r",0,NULL,1,1,1,0,0},
117 {"del",delCommand,-2,"w",0,noPreloadGetKeys,1,-1,1,0,0},
118 {"exists",existsCommand,2,"r",0,NULL,1,1,1,0,0},
119 {"setbit",setbitCommand,4,"wm",0,NULL,1,1,1,0,0},
120 {"getbit",getbitCommand,3,"r",0,NULL,1,1,1,0,0},
121 {"setrange",setrangeCommand,4,"wm",0,NULL,1,1,1,0,0},
122 {"getrange",getrangeCommand,4,"r",0,NULL,1,1,1,0,0},
123 {"substr",getrangeCommand,4,"r",0,NULL,1,1,1,0,0},
124 {"incr",incrCommand,2,"wm",0,NULL,1,1,1,0,0},
125 {"decr",decrCommand,2,"wm",0,NULL,1,1,1,0,0},
126 {"mget",mgetCommand,-2,"r",0,NULL,1,-1,1,0,0},
127 {"rpush",rpushCommand,-3,"wm",0,NULL,1,1,1,0,0},
128 {"lpush",lpushCommand,-3,"wm",0,NULL,1,1,1,0,0},
129 {"rpushx",rpushxCommand,3,"wm",0,NULL,1,1,1,0,0},
130 {"lpushx",lpushxCommand,3,"wm",0,NULL,1,1,1,0,0},
131 {"linsert",linsertCommand,5,"wm",0,NULL,1,1,1,0,0},
132 {"rpop",rpopCommand,2,"w",0,NULL,1,1,1,0,0},
133 {"lpop",lpopCommand,2,"w",0,NULL,1,1,1,0,0},
134 {"brpop",brpopCommand,-3,"ws",0,NULL,1,1,1,0,0},
135 {"brpoplpush",brpoplpushCommand,4,"wms",0,NULL,1,2,1,0,0},
136 {"blpop",blpopCommand,-3,"ws",0,NULL,1,-2,1,0,0},
137 {"llen",llenCommand,2,"r",0,NULL,1,1,1,0,0},
138 {"lindex",lindexCommand,3,"r",0,NULL,1,1,1,0,0},
139 {"lset",lsetCommand,4,"wm",0,NULL,1,1,1,0,0},
140 {"lrange",lrangeCommand,4,"r",0,NULL,1,1,1,0,0},
141 {"ltrim",ltrimCommand,4,"w",0,NULL,1,1,1,0,0},
142 {"lrem",lremCommand,4,"w",0,NULL,1,1,1,0,0},
143 {"rpoplpush",rpoplpushCommand,3,"wm",0,NULL,1,2,1,0,0},
144 {"sadd",saddCommand,-3,"wm",0,NULL,1,1,1,0,0},
145 {"srem",sremCommand,-3,"w",0,NULL,1,1,1,0,0},
146 {"smove",smoveCommand,4,"w",0,NULL,1,2,1,0,0},
147 {"sismember",sismemberCommand,3,"r",0,NULL,1,1,1,0,0},
148 {"scard",scardCommand,2,"r",0,NULL,1,1,1,0,0},
149 {"spop",spopCommand,2,"wRs",0,NULL,1,1,1,0,0},
150 {"srandmember",srandmemberCommand,2,"rR",0,NULL,1,1,1,0,0},
151 {"sinter",sinterCommand,-2,"rS",0,NULL,1,-1,1,0,0},
152 {"sinterstore",sinterstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
153 {"sunion",sunionCommand,-2,"rS",0,NULL,1,-1,1,0,0},
154 {"sunionstore",sunionstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
155 {"sdiff",sdiffCommand,-2,"rS",0,NULL,1,-1,1,0,0},
156 {"sdiffstore",sdiffstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
157 {"smembers",sinterCommand,2,"rS",0,NULL,1,1,1,0,0},
158 {"zadd",zaddCommand,-4,"wm",0,NULL,1,1,1,0,0},
159 {"zincrby",zincrbyCommand,4,"wm",0,NULL,1,1,1,0,0},
160 {"zrem",zremCommand,-3,"w",0,NULL,1,1,1,0,0},
161 {"zremrangebyscore",zremrangebyscoreCommand,4,"w",0,NULL,1,1,1,0,0},
162 {"zremrangebyrank",zremrangebyrankCommand,4,"w",0,NULL,1,1,1,0,0},
163 {"zunionstore",zunionstoreCommand,-4,"wm",0,zunionInterGetKeys,0,0,0,0,0},
164 {"zinterstore",zinterstoreCommand,-4,"wm",0,zunionInterGetKeys,0,0,0,0,0},
165 {"zrange",zrangeCommand,-4,"r",0,NULL,1,1,1,0,0},
166 {"zrangebyscore",zrangebyscoreCommand,-4,"r",0,NULL,1,1,1,0,0},
167 {"zrevrangebyscore",zrevrangebyscoreCommand,-4,"r",0,NULL,1,1,1,0,0},
168 {"zcount",zcountCommand,4,"r",0,NULL,1,1,1,0,0},
169 {"zrevrange",zrevrangeCommand,-4,"r",0,NULL,1,1,1,0,0},
170 {"zcard",zcardCommand,2,"r",0,NULL,1,1,1,0,0},
171 {"zscore",zscoreCommand,3,"r",0,NULL,1,1,1,0,0},
172 {"zrank",zrankCommand,3,"r",0,NULL,1,1,1,0,0},
173 {"zrevrank",zrevrankCommand,3,"r",0,NULL,1,1,1,0,0},
174 {"hset",hsetCommand,4,"wm",0,NULL,1,1,1,0,0},
175 {"hsetnx",hsetnxCommand,4,"wm",0,NULL,1,1,1,0,0},
176 {"hget",hgetCommand,3,"r",0,NULL,1,1,1,0,0},
177 {"hmset",hmsetCommand,-4,"wm",0,NULL,1,1,1,0,0},
178 {"hmget",hmgetCommand,-3,"r",0,NULL,1,1,1,0,0},
179 {"hincrby",hincrbyCommand,4,"wm",0,NULL,1,1,1,0,0},
180 {"hincrbyfloat",hincrbyfloatCommand,4,"wm",0,NULL,1,1,1,0,0},
181 {"hdel",hdelCommand,-3,"w",0,NULL,1,1,1,0,0},
182 {"hlen",hlenCommand,2,"r",0,NULL,1,1,1,0,0},
183 {"hkeys",hkeysCommand,2,"rS",0,NULL,1,1,1,0,0},
184 {"hvals",hvalsCommand,2,"rS",0,NULL,1,1,1,0,0},
185 {"hgetall",hgetallCommand,2,"r",0,NULL,1,1,1,0,0},
186 {"hexists",hexistsCommand,3,"r",0,NULL,1,1,1,0,0},
187 {"incrby",incrbyCommand,3,"wm",0,NULL,1,1,1,0,0},
188 {"decrby",decrbyCommand,3,"wm",0,NULL,1,1,1,0,0},
189 {"incrbyfloat",incrbyfloatCommand,3,"wm",0,NULL,1,1,1,0,0},
190 {"getset",getsetCommand,3,"wm",0,NULL,1,1,1,0,0},
191 {"mset",msetCommand,-3,"wm",0,NULL,1,-1,2,0,0},
192 {"msetnx",msetnxCommand,-3,"wm",0,NULL,1,-1,2,0,0},
193 {"randomkey",randomkeyCommand,1,"rR",0,NULL,0,0,0,0,0},
194 {"select",selectCommand,2,"r",0,NULL,0,0,0,0,0},
195 {"move",moveCommand,3,"w",0,NULL,1,1,1,0,0},
196 {"rename",renameCommand,3,"w",0,renameGetKeys,1,2,1,0,0},
197 {"renamenx",renamenxCommand,3,"w",0,renameGetKeys,1,2,1,0,0},
198 {"expire",expireCommand,3,"w",0,NULL,1,1,1,0,0},
199 {"expireat",expireatCommand,3,"w",0,NULL,1,1,1,0,0},
200 {"pexpire",pexpireCommand,3,"w",0,NULL,1,1,1,0,0},
201 {"pexpireat",pexpireatCommand,3,"w",0,NULL,1,1,1,0,0},
202 {"keys",keysCommand,2,"rS",0,NULL,0,0,0,0,0},
203 {"dbsize",dbsizeCommand,1,"r",0,NULL,0,0,0,0,0},
204 {"auth",authCommand,2,"rs",0,NULL,0,0,0,0,0},
205 {"ping",pingCommand,1,"r",0,NULL,0,0,0,0,0},
206 {"echo",echoCommand,2,"r",0,NULL,0,0,0,0,0},
207 {"save",saveCommand,1,"ars",0,NULL,0,0,0,0,0},
208 {"bgsave",bgsaveCommand,1,"ar",0,NULL,0,0,0,0,0},
209 {"bgrewriteaof",bgrewriteaofCommand,1,"ar",0,NULL,0,0,0,0,0},
210 {"shutdown",shutdownCommand,-1,"ar",0,NULL,0,0,0,0,0},
211 {"lastsave",lastsaveCommand,1,"r",0,NULL,0,0,0,0,0},
212 {"type",typeCommand,2,"r",0,NULL,1,1,1,0,0},
213 {"multi",multiCommand,1,"rs",0,NULL,0,0,0,0,0},
214 {"exec",execCommand,1,"s",0,NULL,0,0,0,0,0},
215 {"discard",discardCommand,1,"rs",0,NULL,0,0,0,0,0},
216 {"sync",syncCommand,1,"ars",0,NULL,0,0,0,0,0},
217 {"flushdb",flushdbCommand,1,"w",0,NULL,0,0,0,0,0},
218 {"flushall",flushallCommand,1,"w",0,NULL,0,0,0,0,0},
219 {"sort",sortCommand,-2,"wmS",0,NULL,1,1,1,0,0},
220 {"info",infoCommand,-1,"r",0,NULL,0,0,0,0,0},
221 {"monitor",monitorCommand,1,"ars",0,NULL,0,0,0,0,0},
222 {"ttl",ttlCommand,2,"r",0,NULL,1,1,1,0,0},
223 {"pttl",pttlCommand,2,"r",0,NULL,1,1,1,0,0},
224 {"persist",persistCommand,2,"w",0,NULL,1,1,1,0,0},
225 {"slaveof",slaveofCommand,3,"as",0,NULL,0,0,0,0,0},
226 {"debug",debugCommand,-2,"as",0,NULL,0,0,0,0,0},
227 {"config",configCommand,-2,"ar",0,NULL,0,0,0,0,0},
228 {"subscribe",subscribeCommand,-2,"rps",0,NULL,0,0,0,0,0},
229 {"unsubscribe",unsubscribeCommand,-1,"rps",0,NULL,0,0,0,0,0},
230 {"psubscribe",psubscribeCommand,-2,"rps",0,NULL,0,0,0,0,0},
231 {"punsubscribe",punsubscribeCommand,-1,"rps",0,NULL,0,0,0,0,0},
232 {"publish",publishCommand,3,"pf",0,NULL,0,0,0,0,0},
233 {"watch",watchCommand,-2,"rs",0,noPreloadGetKeys,1,-1,1,0,0},
234 {"unwatch",unwatchCommand,1,"rs",0,NULL,0,0,0,0,0},
235 {"restore",restoreCommand,4,"awm",0,NULL,1,1,1,0,0},
236 {"migrate",migrateCommand,6,"aw",0,NULL,0,0,0,0,0},
237 {"dump",dumpCommand,2,"ar",0,NULL,1,1,1,0,0},
238 {"object",objectCommand,-2,"r",0,NULL,2,2,2,0,0},
239 {"client",clientCommand,-2,"ar",0,NULL,0,0,0,0,0},
240 {"eval",evalCommand,-3,"s",0,zunionInterGetKeys,0,0,0,0,0},
241 {"evalsha",evalShaCommand,-3,"s",0,zunionInterGetKeys,0,0,0,0,0},
242 {"slowlog",slowlogCommand,-2,"r",0,NULL,0,0,0,0,0},
243 {"script",scriptCommand,-2,"ras",0,NULL,0,0,0,0,0},
244 {"time",timeCommand,1,"rR",0,NULL,0,0,0,0,0}
245 };
246
247 /*============================ Utility functions ============================ */
248
249 /* Low level logging. To use only for very big messages, otherwise
250 * redisLog() is to prefer. */
251 void redisLogRaw(int level, const char *msg) {
252 const int syslogLevelMap[] = { LOG_DEBUG, LOG_INFO, LOG_NOTICE, LOG_WARNING };
253 const char *c = ".-*#";
254 FILE *fp;
255 char buf[64];
256 int rawmode = (level & REDIS_LOG_RAW);
257
258 level &= 0xff; /* clear flags */
259 if (level < server.verbosity) return;
260
261 fp = (server.logfile == NULL) ? stdout : fopen(server.logfile,"a");
262 if (!fp) return;
263
264 if (rawmode) {
265 fprintf(fp,"%s",msg);
266 } else {
267 int off;
268 struct timeval tv;
269
270 gettimeofday(&tv,NULL);
271 off = strftime(buf,sizeof(buf),"%d %b %H:%M:%S.",localtime(&tv.tv_sec));
272 snprintf(buf+off,sizeof(buf)-off,"%03d",(int)tv.tv_usec/1000);
273 fprintf(fp,"[%d] %s %c %s\n",(int)getpid(),buf,c[level],msg);
274 }
275 fflush(fp);
276
277 if (server.logfile) fclose(fp);
278
279 if (server.syslog_enabled) syslog(syslogLevelMap[level], "%s", msg);
280 }
281
282 /* Like redisLogRaw() but with printf-alike support. This is the funciton that
283 * is used across the code. The raw version is only used in order to dump
284 * the INFO output on crash. */
285 void redisLog(int level, const char *fmt, ...) {
286 va_list ap;
287 char msg[REDIS_MAX_LOGMSG_LEN];
288
289 if ((level&0xff) < server.verbosity) return;
290
291 va_start(ap, fmt);
292 vsnprintf(msg, sizeof(msg), fmt, ap);
293 va_end(ap);
294
295 redisLogRaw(level,msg);
296 }
297
298 /* Log a fixed message without printf-alike capabilities, in a way that is
299 * safe to call from a signal handler.
300 *
301 * We actually use this only for signals that are not fatal from the point
302 * of view of Redis. Signals that are going to kill the server anyway and
303 * where we need printf-alike features are served by redisLog(). */
304 void redisLogFromHandler(int level, const char *msg) {
305 int fd;
306 char buf[64];
307
308 if ((level&0xff) < server.verbosity ||
309 (server.logfile == NULL && server.daemonize)) return;
310 fd = server.logfile ?
311 open(server.logfile, O_APPEND|O_CREAT|O_WRONLY, 0644) :
312 STDOUT_FILENO;
313 if (fd == -1) return;
314 ll2string(buf,sizeof(buf),getpid());
315 write(fd,"[",1);
316 write(fd,buf,strlen(buf));
317 write(fd," | signal handler] (",20);
318 ll2string(buf,sizeof(buf),time(NULL));
319 write(fd,buf,strlen(buf));
320 write(fd,") ",2);
321 write(fd,msg,strlen(msg));
322 write(fd,"\n",1);
323 if (server.logfile) close(fd);
324 }
325
326 /* Redis generally does not try to recover from out of memory conditions
327 * when allocating objects or strings, it is not clear if it will be possible
328 * to report this condition to the client since the networking layer itself
329 * is based on heap allocation for send buffers, so we simply abort.
330 * At least the code will be simpler to read... */
331 void oom(const char *msg) {
332 redisLog(REDIS_WARNING, "%s: Out of memory\n",msg);
333 sleep(1);
334 abort();
335 }
336
/* Return the UNIX time in microseconds, as obtained from gettimeofday().
 * The seconds are widened to long long before scaling so the multiplication
 * cannot overflow a narrower time_t. */
long long ustime(void) {
    struct timeval now;

    gettimeofday(&now, NULL);
    return ((long long)now.tv_sec)*1000000 + now.tv_usec;
}
347
/* Return the UNIX time in milliseconds: ustime() scaled down by 1000
 * (integer division, the sub-millisecond part is dropped). */
long long mstime(void) {
    long long usec = ustime();

    return usec/1000;
}
352
353 /*====================== Hash table type implementation ==================== */
354
355 /* This is a hash table type that uses the SDS dynamic strings library as
356 * keys and redis objects as values (objects can hold SDS strings,
357 * lists, sets). */
358
/* Destructor callback that releases 'val' with zfree().
 * 'privdata' is part of the callback signature and is not used. */
void dictVanillaFree(void *privdata, void *val) {
    DICT_NOTUSED(privdata);

    zfree(val);
}
364
365 void dictListDestructor(void *privdata, void *val)
366 {
367 DICT_NOTUSED(privdata);
368 listRelease((list*)val);
369 }
370
371 int dictSdsKeyCompare(void *privdata, const void *key1,
372 const void *key2)
373 {
374 int l1,l2;
375 DICT_NOTUSED(privdata);
376
377 l1 = sdslen((sds)key1);
378 l2 = sdslen((sds)key2);
379 if (l1 != l2) return 0;
380 return memcmp(key1, key2, l1) == 0;
381 }
382
/* Case insensitive key comparison, used for the command lookup table.
 * Returns 1 when the keys match ignoring case, 0 otherwise.
 *
 * The keys are compared as C strings with strcasecmp(), so the comparison
 * stops at the first NUL byte. 'privdata' is not used. */
int dictSdsKeyCaseCompare(void *privdata, const void *key1,
        const void *key2)
{
    int diff;

    DICT_NOTUSED(privdata);
    diff = strcasecmp(key1, key2);
    return diff == 0;
}
391
/* Destructor callback for Redis objects: drops one reference from 'val'.
 * A NULL 'val' is ignored (the original note says values of swapped out
 * keys are set to NULL). 'privdata' is not used. */
void dictRedisObjectDestructor(void *privdata, void *val) {
    DICT_NOTUSED(privdata);

    if (val != NULL) decrRefCount(val);
}
399
/* Destructor callback for sds strings: 'val' is released with sdsfree().
 * 'privdata' is not used. */
void dictSdsDestructor(void *privdata, void *val) {
    DICT_NOTUSED(privdata);
    sdsfree(val);
}
406
407 int dictObjKeyCompare(void *privdata, const void *key1,
408 const void *key2)
409 {
410 const robj *o1 = key1, *o2 = key2;
411 return dictSdsKeyCompare(privdata,o1->ptr,o2->ptr);
412 }
413
414 unsigned int dictObjHash(const void *key) {
415 const robj *o = key;
416 return dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
417 }
418
/* Hash callback for sds keys: hashes all the bytes of the string
 * (case sensitive). */
unsigned int dictSdsHash(const void *key) {
    const unsigned char *bytes = (unsigned char*)key;

    return dictGenHashFunction(bytes, sdslen((char*)key));
}
422
/* Hash callback for sds keys using dictGenCaseHashFunction(); it is paired
 * with dictSdsKeyCaseCompare() in the command table dictionary type. */
unsigned int dictSdsCaseHash(const void *key) {
    const unsigned char *bytes = (unsigned char*)key;

    return dictGenCaseHashFunction(bytes, sdslen((char*)key));
}
426
427 int dictEncObjKeyCompare(void *privdata, const void *key1,
428 const void *key2)
429 {
430 robj *o1 = (robj*) key1, *o2 = (robj*) key2;
431 int cmp;
432
433 if (o1->encoding == REDIS_ENCODING_INT &&
434 o2->encoding == REDIS_ENCODING_INT)
435 return o1->ptr == o2->ptr;
436
437 o1 = getDecodedObject(o1);
438 o2 = getDecodedObject(o2);
439 cmp = dictSdsKeyCompare(privdata,o1->ptr,o2->ptr);
440 decrRefCount(o1);
441 decrRefCount(o2);
442 return cmp;
443 }
444
445 unsigned int dictEncObjHash(const void *key) {
446 robj *o = (robj*) key;
447
448 if (o->encoding == REDIS_ENCODING_RAW) {
449 return dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
450 } else {
451 if (o->encoding == REDIS_ENCODING_INT) {
452 char buf[32];
453 int len;
454
455 len = ll2string(buf,32,(long)o->ptr);
456 return dictGenHashFunction((unsigned char*)buf, len);
457 } else {
458 unsigned int hash;
459
460 o = getDecodedObject(o);
461 hash = dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
462 decrRefCount(o);
463 return hash;
464 }
465 }
466 }
467
/* Sets type hash table.
 * Keys are Redis objects, possibly encoded: they are hashed and compared
 * with the encoding-aware callbacks and released with decrRefCount() by the
 * key destructor. No value destructor is installed. */
dictType setDictType = {
    dictEncObjHash,            /* hash function */
    NULL,                      /* key dup */
    NULL,                      /* val dup */
    dictEncObjKeyCompare,      /* key compare */
    dictRedisObjectDestructor, /* key destructor */
    NULL                       /* val destructor */
};
477
/* Sorted sets hash (note: a skiplist is used in addition to the hash table).
 * Same callbacks as setDictType: keys are Redis objects released by the key
 * destructor, and no value destructor is installed. */
dictType zsetDictType = {
    dictEncObjHash,            /* hash function */
    NULL,                      /* key dup */
    NULL,                      /* val dup */
    dictEncObjKeyCompare,      /* key compare */
    dictRedisObjectDestructor, /* key destructor */
    NULL                       /* val destructor */
};
487
/* Db->dict, keys are sds strings, vals are Redis objects.
 * The dictionary owns both: keys are released with sdsfree() and values
 * with decrRefCount() through the two destructors below. */
dictType dbDictType = {
    dictSdsHash,               /* hash function */
    NULL,                      /* key dup */
    NULL,                      /* val dup */
    dictSdsKeyCompare,         /* key compare */
    dictSdsDestructor,         /* key destructor */
    dictRedisObjectDestructor  /* val destructor */
};
497
/* Db->expires.
 * Keys are sds strings. No destructor is installed, so this dictionary
 * frees neither its keys nor its values.
 * NOTE(review): presumably the key strings are shared with Db->dict, which
 * would explain the missing key destructor -- confirm against the callers. */
dictType keyptrDictType = {
    dictSdsHash,               /* hash function */
    NULL,                      /* key dup */
    NULL,                      /* val dup */
    dictSdsKeyCompare,         /* key compare */
    NULL,                      /* key destructor */
    NULL                       /* val destructor */
};
507
/* Command table. sds string -> command struct pointer.
 * Hashing and comparison are case insensitive. Keys are released with
 * sdsfree(); the values have no destructor, so the dictionary never frees
 * the command structures it points to. */
dictType commandTableDictType = {
    dictSdsCaseHash,           /* hash function */
    NULL,                      /* key dup */
    NULL,                      /* val dup */
    dictSdsKeyCaseCompare,     /* key compare */
    dictSdsDestructor,         /* key destructor */
    NULL                       /* val destructor */
};
517
/* Hash type hash table (note that small hashes are represented with zipmaps).
 * Both keys and values are Redis objects, each released with decrRefCount()
 * by its destructor. */
dictType hashDictType = {
    dictEncObjHash,             /* hash function */
    NULL,                       /* key dup */
    NULL,                       /* val dup */
    dictEncObjKeyCompare,       /* key compare */
    dictRedisObjectDestructor,  /* key destructor */
    dictRedisObjectDestructor   /* val destructor */
};
527
/* Keylist hash table type has unencoded redis objects as keys and
 * lists as values. It's used for blocking operations (BLPOP) and to
 * map swapped keys to a list of clients waiting for these keys to be loaded.
 * Keys are released with decrRefCount(), values with listRelease(). */
dictType keylistDictType = {
    dictObjHash,                /* hash function */
    NULL,                       /* key dup */
    NULL,                       /* val dup */
    dictObjKeyCompare,          /* key compare */
    dictRedisObjectDestructor,  /* key destructor */
    dictListDestructor          /* val destructor */
};
539
540 int htNeedsResize(dict *dict) {
541 long long size, used;
542
543 size = dictSlots(dict);
544 used = dictSize(dict);
545 return (size && used && size > DICT_HT_INITIAL_SIZE &&
546 (used*100/size < REDIS_HT_MINFILL));
547 }
548
549 /* If the percentage of used slots in the HT reaches REDIS_HT_MINFILL
550 * we resize the hash table to save memory */
551 void tryResizeHashTables(void) {
552 int j;
553
554 for (j = 0; j < server.dbnum; j++) {
555 if (htNeedsResize(server.db[j].dict))
556 dictResize(server.db[j].dict);
557 if (htNeedsResize(server.db[j].expires))
558 dictResize(server.db[j].expires);
559 }
560 }
561
562 /* Our hash table implementation performs rehashing incrementally while
563 * we write/read from the hash table. Still if the server is idle, the hash
564 * table will use two tables for a long time. So we try to use 1 millisecond
565 * of CPU time at every serverCron() loop in order to rehash some key. */
566 void incrementallyRehash(void) {
567 int j;
568
569 for (j = 0; j < server.dbnum; j++) {
570 if (dictIsRehashing(server.db[j].dict)) {
571 dictRehashMilliseconds(server.db[j].dict,1);
572 break; /* already used our millisecond for this loop... */
573 }
574 }
575 }
576
577 /* This function is called once a background process of some kind terminates,
578 * as we want to avoid resizing the hash tables when there is a child in order
579 * to play well with copy-on-write (otherwise when a resize happens lots of
580 * memory pages are copied). The goal of this function is to update the ability
581 * for dict.c to resize the hash tables accordingly to the fact we have o not
582 * running childs. */
583 void updateDictResizePolicy(void) {
584 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1)
585 dictEnableResize();
586 else
587 dictDisableResize();
588 }
589
590 /* ======================= Cron: called every 100 ms ======================== */
591
592 /* Try to expire a few timed out keys. The algorithm used is adaptive and
593 * will use few CPU cycles if there are few expiring keys, otherwise
594 * it will get more aggressive to avoid that too much memory is used by
595 * keys that can be removed from the keyspace. */
596 void activeExpireCycle(void) {
597 int j;
598
599 for (j = 0; j < server.dbnum; j++) {
600 int expired;
601 redisDb *db = server.db+j;
602
603 /* Continue to expire if at the end of the cycle more than 25%
604 * of the keys were expired. */
605 do {
606 long num = dictSize(db->expires);
607 long long now = mstime();
608
609 expired = 0;
610 if (num > REDIS_EXPIRELOOKUPS_PER_CRON)
611 num = REDIS_EXPIRELOOKUPS_PER_CRON;
612 while (num--) {
613 dictEntry *de;
614 long long t;
615
616 if ((de = dictGetRandomKey(db->expires)) == NULL) break;
617 t = dictGetSignedIntegerVal(de);
618 if (now > t) {
619 sds key = dictGetKey(de);
620 robj *keyobj = createStringObject(key,sdslen(key));
621
622 propagateExpire(db,keyobj);
623 dbDelete(db,keyobj);
624 decrRefCount(keyobj);
625 expired++;
626 server.stat_expiredkeys++;
627 }
628 }
629 } while (expired > REDIS_EXPIRELOOKUPS_PER_CRON/4);
630 }
631 }
632
633 void updateLRUClock(void) {
634 server.lruclock = (server.unixtime/REDIS_LRU_CLOCK_RESOLUTION) &
635 REDIS_LRU_CLOCK_MAX;
636 }
637
638
639 /* Add a sample to the operations per second array of samples. */
640 void trackOperationsPerSecond(void) {
641 long long t = mstime() - server.ops_sec_last_sample_time;
642 long long ops = server.stat_numcommands - server.ops_sec_last_sample_ops;
643 long long ops_sec;
644
645 ops_sec = t > 0 ? (ops*1000/t) : 0;
646
647 server.ops_sec_samples[server.ops_sec_idx] = ops_sec;
648 server.ops_sec_idx = (server.ops_sec_idx+1) % REDIS_OPS_SEC_SAMPLES;
649 server.ops_sec_last_sample_time = mstime();
650 server.ops_sec_last_sample_ops = server.stat_numcommands;
651 }
652
653 /* Return the mean of all the samples. */
654 long long getOperationsPerSecond(void) {
655 int j;
656 long long sum = 0;
657
658 for (j = 0; j < REDIS_OPS_SEC_SAMPLES; j++)
659 sum += server.ops_sec_samples[j];
660 return sum / REDIS_OPS_SEC_SAMPLES;
661 }
662
663 /* Check for timeouts. Returns non-zero if the client was terminated */
664 int clientsCronHandleTimeout(redisClient *c) {
665 time_t now = server.unixtime;
666
667 if (server.maxidletime &&
668 !(c->flags & REDIS_SLAVE) && /* no timeout for slaves */
669 !(c->flags & REDIS_MASTER) && /* no timeout for masters */
670 !(c->flags & REDIS_BLOCKED) && /* no timeout for BLPOP */
671 dictSize(c->pubsub_channels) == 0 && /* no timeout for pubsub */
672 listLength(c->pubsub_patterns) == 0 &&
673 (now - c->lastinteraction > server.maxidletime))
674 {
675 redisLog(REDIS_VERBOSE,"Closing idle client");
676 freeClient(c);
677 return 1;
678 } else if (c->flags & REDIS_BLOCKED) {
679 if (c->bpop.timeout != 0 && c->bpop.timeout < now) {
680 addReply(c,shared.nullmultibulk);
681 unblockClientWaitingData(c);
682 }
683 }
684 return 0;
685 }
686
687 /* The client query buffer is an sds.c string that can end with a lot of
688 * free space not used, this function reclaims space if needed.
689 *
690 * The funciton always returns 0 as it never terminates the client. */
691 int clientsCronResizeQueryBuffer(redisClient *c) {
692 size_t querybuf_size = sdsAllocSize(c->querybuf);
693 time_t idletime = server.unixtime - c->lastinteraction;
694
695 /* There are two conditions to resize the query buffer:
696 * 1) Query buffer is > BIG_ARG and too big for latest peak.
697 * 2) Client is inactive and the buffer is bigger than 1k. */
698 if (((querybuf_size > REDIS_MBULK_BIG_ARG) &&
699 (querybuf_size/(c->querybuf_peak+1)) > 2) ||
700 (querybuf_size > 1024 && idletime > 2))
701 {
702 /* Only resize the query buffer if it is actually wasting space. */
703 if (sdsavail(c->querybuf) > 1024) {
704 c->querybuf = sdsRemoveFreeSpace(c->querybuf);
705 }
706 }
707 /* Reset the peak again to capture the peak memory usage in the next
708 * cycle. */
709 c->querybuf_peak = 0;
710 return 0;
711 }
712
713 void clientsCron(void) {
714 /* Make sure to process at least 1/100 of clients per call.
715 * Since this function is called 10 times per second we are sure that
716 * in the worst case we process all the clients in 10 seconds.
717 * In normal conditions (a reasonable number of clients) we process
718 * all the clients in a shorter time. */
719 int numclients = listLength(server.clients);
720 int iterations = numclients/100;
721
722 if (iterations < 50)
723 iterations = (numclients < 50) ? numclients : 50;
724 while(listLength(server.clients) && iterations--) {
725 redisClient *c;
726 listNode *head;
727
728 /* Rotate the list, take the current head, process.
729 * This way if the client must be removed from the list it's the
730 * first element and we don't incur into O(N) computation. */
731 listRotate(server.clients);
732 head = listFirst(server.clients);
733 c = listNodeValue(head);
734 /* The following functions do different service checks on the client.
735 * The protocol is that they return non-zero if the client was
736 * terminated. */
737 if (clientsCronHandleTimeout(c)) continue;
738 if (clientsCronResizeQueryBuffer(c)) continue;
739 }
740 }
741
742 int serverCron(struct aeEventLoop *eventLoop, long long id, void *clientData) {
743 int j, loops = server.cronloops;
744 REDIS_NOTUSED(eventLoop);
745 REDIS_NOTUSED(id);
746 REDIS_NOTUSED(clientData);
747
748 /* Software watchdog: deliver the SIGALRM that will reach the signal
749 * handler if we don't return here fast enough. */
750 if (server.watchdog_period) watchdogScheduleSignal(server.watchdog_period);
751
752 /* We take a cached value of the unix time in the global state because
753 * with virtual memory and aging there is to store the current time
754 * in objects at every object access, and accuracy is not needed.
755 * To access a global var is faster than calling time(NULL) */
756 server.unixtime = time(NULL);
757
758 trackOperationsPerSecond();
759
760 /* We have just 22 bits per object for LRU information.
761 * So we use an (eventually wrapping) LRU clock with 10 seconds resolution.
762 * 2^22 bits with 10 seconds resolution is more or less 1.5 years.
763 *
764 * Note that even if this will wrap after 1.5 years it's not a problem,
765 * everything will still work but just some object will appear younger
766 * to Redis. But for this to happen a given object should never be touched
767 * for 1.5 years.
768 *
769 * Note that you can change the resolution altering the
770 * REDIS_LRU_CLOCK_RESOLUTION define.
771 */
772 updateLRUClock();
773
774 /* Record the max memory used since the server was started. */
775 if (zmalloc_used_memory() > server.stat_peak_memory)
776 server.stat_peak_memory = zmalloc_used_memory();
777
778 /* We received a SIGTERM, shutting down here in a safe way, as it is
779 * not ok doing so inside the signal handler. */
780 if (server.shutdown_asap) {
781 if (prepareForShutdown(0) == REDIS_OK) exit(0);
782 redisLog(REDIS_WARNING,"SIGTERM received but errors trying to shut down the server, check the logs for more information");
783 }
784
785 /* Show some info about non-empty databases */
786 for (j = 0; j < server.dbnum; j++) {
787 long long size, used, vkeys;
788
789 size = dictSlots(server.db[j].dict);
790 used = dictSize(server.db[j].dict);
791 vkeys = dictSize(server.db[j].expires);
792 if (!(loops % 50) && (used || vkeys)) {
793 redisLog(REDIS_VERBOSE,"DB %d: %lld keys (%lld volatile) in %lld slots HT.",j,used,vkeys,size);
794 /* dictPrintStats(server.dict); */
795 }
796 }
797
798 /* We don't want to resize the hash tables while a background saving
799 * is in progress: the saving child is created using fork() that is
800 * implemented with a copy-on-write semantic in most modern systems, so
801 * if we resize the HT while there is the saving child at work actually
802 * a lot of memory movements in the parent will cause a lot of pages
803 * copied. */
804 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1) {
805 if (!(loops % 10)) tryResizeHashTables();
806 if (server.activerehashing) incrementallyRehash();
807 }
808
809 /* Show information about connected clients */
810 if (!(loops % 50)) {
811 redisLog(REDIS_VERBOSE,"%d clients connected (%d slaves), %zu bytes in use",
812 listLength(server.clients)-listLength(server.slaves),
813 listLength(server.slaves),
814 zmalloc_used_memory());
815 }
816
817 /* We need to do a few operations on clients asynchronously. */
818 clientsCron();
819
820 /* Start a scheduled AOF rewrite if this was requested by the user while
821 * a BGSAVE was in progress. */
822 if (server.rdb_child_pid == -1 && server.aof_child_pid == -1 &&
823 server.aof_rewrite_scheduled)
824 {
825 rewriteAppendOnlyFileBackground();
826 }
827
828 /* Check if a background saving or AOF rewrite in progress terminated. */
829 if (server.rdb_child_pid != -1 || server.aof_child_pid != -1) {
830 int statloc;
831 pid_t pid;
832
833 if ((pid = wait3(&statloc,WNOHANG,NULL)) != 0) {
834 int exitcode = WEXITSTATUS(statloc);
835 int bysignal = 0;
836
837 if (WIFSIGNALED(statloc)) bysignal = WTERMSIG(statloc);
838
839 if (pid == server.rdb_child_pid) {
840 backgroundSaveDoneHandler(exitcode,bysignal);
841 } else {
842 backgroundRewriteDoneHandler(exitcode,bysignal);
843 }
844 updateDictResizePolicy();
845 }
846 } else {
847 /* If there is not a background saving/rewrite in progress check if
848 * we have to save/rewrite now */
849 for (j = 0; j < server.saveparamslen; j++) {
850 struct saveparam *sp = server.saveparams+j;
851
852 if (server.dirty >= sp->changes &&
853 server.unixtime-server.lastsave > sp->seconds) {
854 redisLog(REDIS_NOTICE,"%d changes in %d seconds. Saving...",
855 sp->changes, sp->seconds);
856 rdbSaveBackground(server.rdb_filename);
857 break;
858 }
859 }
860
861 /* Trigger an AOF rewrite if needed */
862 if (server.rdb_child_pid == -1 &&
863 server.aof_child_pid == -1 &&
864 server.aof_rewrite_perc &&
865 server.aof_current_size > server.aof_rewrite_min_size)
866 {
867 long long base = server.aof_rewrite_base_size ?
868 server.aof_rewrite_base_size : 1;
869 long long growth = (server.aof_current_size*100/base) - 100;
870 if (growth >= server.aof_rewrite_perc) {
871 redisLog(REDIS_NOTICE,"Starting automatic rewriting of AOF on %lld%% growth",growth);
872 rewriteAppendOnlyFileBackground();
873 }
874 }
875 }
876
877
878 /* If we postponed an AOF buffer flush, let's try to do it every time the
879 * cron function is called. */
880 if (server.aof_flush_postponed_start) flushAppendOnlyFile(0);
881
882 /* Expire a few keys per cycle, only if this is a master.
883 * On slaves we wait for DEL operations synthesized by the master
884 * in order to guarantee a strict consistency. */
885 if (server.masterhost == NULL) activeExpireCycle();
886
887 /* Close clients that need to be closed asynchronous */
888 freeClientsInAsyncFreeQueue();
889
890 /* Replication cron function -- used to reconnect to master and
891 * to detect transfer failures. */
892 if (!(loops % 10)) replicationCron();
893
894 server.cronloops++;
895 return 100;
896 }
897
898 /* This function gets called every time Redis is entering the
899 * main loop of the event driven library, that is, before to sleep
900 * for ready file descriptors. */
901 void beforeSleep(struct aeEventLoop *eventLoop) {
902 REDIS_NOTUSED(eventLoop);
903 listNode *ln;
904 redisClient *c;
905
906 /* Try to process pending commands for clients that were just unblocked. */
907 while (listLength(server.unblocked_clients)) {
908 ln = listFirst(server.unblocked_clients);
909 redisAssert(ln != NULL);
910 c = ln->value;
911 listDelNode(server.unblocked_clients,ln);
912 c->flags &= ~REDIS_UNBLOCKED;
913
914 /* Process remaining data in the input buffer. */
915 if (c->querybuf && sdslen(c->querybuf) > 0) {
916 server.current_client = c;
917 processInputBuffer(c);
918 server.current_client = NULL;
919 }
920 }
921
922 /* Write the AOF buffer on disk */
923 flushAppendOnlyFile(0);
924 }
925
926 /* =========================== Server initialization ======================== */
927
928 void createSharedObjects(void) {
929 int j;
930
931 shared.crlf = createObject(REDIS_STRING,sdsnew("\r\n"));
932 shared.ok = createObject(REDIS_STRING,sdsnew("+OK\r\n"));
933 shared.err = createObject(REDIS_STRING,sdsnew("-ERR\r\n"));
934 shared.emptybulk = createObject(REDIS_STRING,sdsnew("$0\r\n\r\n"));
935 shared.czero = createObject(REDIS_STRING,sdsnew(":0\r\n"));
936 shared.cone = createObject(REDIS_STRING,sdsnew(":1\r\n"));
937 shared.cnegone = createObject(REDIS_STRING,sdsnew(":-1\r\n"));
938 shared.nullbulk = createObject(REDIS_STRING,sdsnew("$-1\r\n"));
939 shared.nullmultibulk = createObject(REDIS_STRING,sdsnew("*-1\r\n"));
940 shared.emptymultibulk = createObject(REDIS_STRING,sdsnew("*0\r\n"));
941 shared.pong = createObject(REDIS_STRING,sdsnew("+PONG\r\n"));
942 shared.queued = createObject(REDIS_STRING,sdsnew("+QUEUED\r\n"));
943 shared.wrongtypeerr = createObject(REDIS_STRING,sdsnew(
944 "-ERR Operation against a key holding the wrong kind of value\r\n"));
945 shared.nokeyerr = createObject(REDIS_STRING,sdsnew(
946 "-ERR no such key\r\n"));
947 shared.syntaxerr = createObject(REDIS_STRING,sdsnew(
948 "-ERR syntax error\r\n"));
949 shared.sameobjecterr = createObject(REDIS_STRING,sdsnew(
950 "-ERR source and destination objects are the same\r\n"));
951 shared.outofrangeerr = createObject(REDIS_STRING,sdsnew(
952 "-ERR index out of range\r\n"));
953 shared.noscripterr = createObject(REDIS_STRING,sdsnew(
954 "-NOSCRIPT No matching script. Please use EVAL.\r\n"));
955 shared.loadingerr = createObject(REDIS_STRING,sdsnew(
956 "-LOADING Redis is loading the dataset in memory\r\n"));
957 shared.slowscripterr = createObject(REDIS_STRING,sdsnew(
958 "-BUSY Redis is busy running a script. You can only call SCRIPT KILL or SHUTDOWN NOSAVE.\r\n"));
959 shared.bgsaveerr = createObject(REDIS_STRING,sdsnew(
960 "-MISCONF Redis is configured to save RDB snapshots, but is currently not able to persist on disk. Commands that may modify the data set are disabled. Please check Redis logs for details about the error.\r\n"));
961 shared.roslaveerr = createObject(REDIS_STRING,sdsnew(
962 "-READONLY You can't write against a read only slave.\r\n"));
963 shared.oomerr = createObject(REDIS_STRING,sdsnew(
964 "-OOM command not allowed when used memory > 'maxmemory'.\r\n"));
965 shared.space = createObject(REDIS_STRING,sdsnew(" "));
966 shared.colon = createObject(REDIS_STRING,sdsnew(":"));
967 shared.plus = createObject(REDIS_STRING,sdsnew("+"));
968
969 for (j = 0; j < REDIS_SHARED_SELECT_CMDS; j++) {
970 shared.select[j] = createObject(REDIS_STRING,
971 sdscatprintf(sdsempty(),"select %d\r\n", j));
972 }
973 shared.messagebulk = createStringObject("$7\r\nmessage\r\n",13);
974 shared.pmessagebulk = createStringObject("$8\r\npmessage\r\n",14);
975 shared.subscribebulk = createStringObject("$9\r\nsubscribe\r\n",15);
976 shared.unsubscribebulk = createStringObject("$11\r\nunsubscribe\r\n",18);
977 shared.psubscribebulk = createStringObject("$10\r\npsubscribe\r\n",17);
978 shared.punsubscribebulk = createStringObject("$12\r\npunsubscribe\r\n",19);
979 shared.del = createStringObject("DEL",3);
980 shared.rpop = createStringObject("RPOP",4);
981 shared.lpop = createStringObject("LPOP",4);
982 for (j = 0; j < REDIS_SHARED_INTEGERS; j++) {
983 shared.integers[j] = createObject(REDIS_STRING,(void*)(long)j);
984 shared.integers[j]->encoding = REDIS_ENCODING_INT;
985 }
986 for (j = 0; j < REDIS_SHARED_BULKHDR_LEN; j++) {
987 shared.mbulkhdr[j] = createObject(REDIS_STRING,
988 sdscatprintf(sdsempty(),"*%d\r\n",j));
989 shared.bulkhdr[j] = createObject(REDIS_STRING,
990 sdscatprintf(sdsempty(),"$%d\r\n",j));
991 }
992 }
993
994 void initServerConfig() {
995 getRandomHexChars(server.runid,REDIS_RUN_ID_SIZE);
996 server.runid[REDIS_RUN_ID_SIZE] = '\0';
997 server.arch_bits = (sizeof(long) == 8) ? 64 : 32;
998 server.port = REDIS_SERVERPORT;
999 server.bindaddr = NULL;
1000 server.unixsocket = NULL;
1001 server.unixsocketperm = 0;
1002 server.ipfd = -1;
1003 server.sofd = -1;
1004 server.dbnum = REDIS_DEFAULT_DBNUM;
1005 server.verbosity = REDIS_NOTICE;
1006 server.maxidletime = REDIS_MAXIDLETIME;
1007 server.client_max_querybuf_len = REDIS_MAX_QUERYBUF_LEN;
1008 server.saveparams = NULL;
1009 server.loading = 0;
1010 server.logfile = NULL; /* NULL = log on standard output */
1011 server.syslog_enabled = 0;
1012 server.syslog_ident = zstrdup("redis");
1013 server.syslog_facility = LOG_LOCAL0;
1014 server.daemonize = 0;
1015 server.aof_state = REDIS_AOF_OFF;
1016 server.aof_fsync = AOF_FSYNC_EVERYSEC;
1017 server.aof_no_fsync_on_rewrite = 0;
1018 server.aof_rewrite_perc = REDIS_AOF_REWRITE_PERC;
1019 server.aof_rewrite_min_size = REDIS_AOF_REWRITE_MIN_SIZE;
1020 server.aof_rewrite_base_size = 0;
1021 server.aof_rewrite_scheduled = 0;
1022 server.aof_last_fsync = time(NULL);
1023 server.aof_delayed_fsync = 0;
1024 server.aof_fd = -1;
1025 server.aof_selected_db = -1; /* Make sure the first time will not match */
1026 server.aof_flush_postponed_start = 0;
1027 server.pidfile = zstrdup("/var/run/redis.pid");
1028 server.rdb_filename = zstrdup("dump.rdb");
1029 server.aof_filename = zstrdup("appendonly.aof");
1030 server.requirepass = NULL;
1031 server.rdb_compression = 1;
1032 server.activerehashing = 1;
1033 server.maxclients = REDIS_MAX_CLIENTS;
1034 server.bpop_blocked_clients = 0;
1035 server.maxmemory = 0;
1036 server.maxmemory_policy = REDIS_MAXMEMORY_VOLATILE_LRU;
1037 server.maxmemory_samples = 3;
1038 server.hash_max_ziplist_entries = REDIS_HASH_MAX_ZIPLIST_ENTRIES;
1039 server.hash_max_ziplist_value = REDIS_HASH_MAX_ZIPLIST_VALUE;
1040 server.list_max_ziplist_entries = REDIS_LIST_MAX_ZIPLIST_ENTRIES;
1041 server.list_max_ziplist_value = REDIS_LIST_MAX_ZIPLIST_VALUE;
1042 server.set_max_intset_entries = REDIS_SET_MAX_INTSET_ENTRIES;
1043 server.zset_max_ziplist_entries = REDIS_ZSET_MAX_ZIPLIST_ENTRIES;
1044 server.zset_max_ziplist_value = REDIS_ZSET_MAX_ZIPLIST_VALUE;
1045 server.shutdown_asap = 0;
1046 server.repl_ping_slave_period = REDIS_REPL_PING_SLAVE_PERIOD;
1047 server.repl_timeout = REDIS_REPL_TIMEOUT;
1048 server.lua_caller = NULL;
1049 server.lua_time_limit = REDIS_LUA_TIME_LIMIT;
1050 server.lua_client = NULL;
1051 server.lua_timedout = 0;
1052
1053 updateLRUClock();
1054 resetServerSaveParams();
1055
1056 appendServerSaveParams(60*60,1); /* save after 1 hour and 1 change */
1057 appendServerSaveParams(300,100); /* save after 5 minutes and 100 changes */
1058 appendServerSaveParams(60,10000); /* save after 1 minute and 10000 changes */
1059 /* Replication related */
1060 server.masterauth = NULL;
1061 server.masterhost = NULL;
1062 server.masterport = 6379;
1063 server.master = NULL;
1064 server.repl_state = REDIS_REPL_NONE;
1065 server.repl_syncio_timeout = REDIS_REPL_SYNCIO_TIMEOUT;
1066 server.repl_serve_stale_data = 1;
1067 server.repl_slave_ro = 1;
1068 server.repl_down_since = -1;
1069
1070 /* Client output buffer limits */
1071 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].hard_limit_bytes = 0;
1072 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].soft_limit_bytes = 0;
1073 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_NORMAL].soft_limit_seconds = 0;
1074 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].hard_limit_bytes = 1024*1024*256;
1075 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].soft_limit_bytes = 1024*1024*64;
1076 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_SLAVE].soft_limit_seconds = 60;
1077 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].hard_limit_bytes = 1024*1024*32;
1078 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].soft_limit_bytes = 1024*1024*8;
1079 server.client_obuf_limits[REDIS_CLIENT_LIMIT_CLASS_PUBSUB].soft_limit_seconds = 60;
1080
1081 /* Double constants initialization */
1082 R_Zero = 0.0;
1083 R_PosInf = 1.0/R_Zero;
1084 R_NegInf = -1.0/R_Zero;
1085 R_Nan = R_Zero/R_Zero;
1086
1087 /* Command table -- we intiialize it here as it is part of the
1088 * initial configuration, since command names may be changed via
1089 * redis.conf using the rename-command directive. */
1090 server.commands = dictCreate(&commandTableDictType,NULL);
1091 populateCommandTable();
1092 server.delCommand = lookupCommandByCString("del");
1093 server.multiCommand = lookupCommandByCString("multi");
1094 server.lpushCommand = lookupCommandByCString("lpush");
1095
1096 /* Slow log */
1097 server.slowlog_log_slower_than = REDIS_SLOWLOG_LOG_SLOWER_THAN;
1098 server.slowlog_max_len = REDIS_SLOWLOG_MAX_LEN;
1099
1100 /* Debugging */
1101 server.assert_failed = "<no assertion failed>";
1102 server.assert_file = "<no file>";
1103 server.assert_line = 0;
1104 server.bug_report_start = 0;
1105 server.watchdog_period = 0;
1106 }
1107
1108 /* This function will try to raise the max number of open files accordingly to
1109 * the configured max number of clients. It will also account for 32 additional
1110 * file descriptors as we need a few more for persistence, listening
1111 * sockets, log files and so forth.
1112 *
1113 * If it will not be possible to set the limit accordingly to the configured
1114 * max number of clients, the function will do the reverse setting
1115 * server.maxclients to the value that we can actually handle. */
1116 void adjustOpenFilesLimit(void) {
1117 rlim_t maxfiles = server.maxclients+32;
1118 struct rlimit limit;
1119
1120 if (maxfiles < 1024) maxfiles = 1024;
1121 if (getrlimit(RLIMIT_NOFILE,&limit) == -1) {
1122 redisLog(REDIS_WARNING,"Unable to obtain the current NOFILE limit (%s), assuming 1024 and setting the max clients configuration accordingly.",
1123 strerror(errno));
1124 server.maxclients = 1024-32;
1125 } else {
1126 rlim_t oldlimit = limit.rlim_cur;
1127
1128 /* Set the max number of files if the current limit is not enough
1129 * for our needs. */
1130 if (oldlimit < maxfiles) {
1131 rlim_t f;
1132
1133 f = maxfiles;
1134 while(f > oldlimit) {
1135 limit.rlim_cur = f;
1136 limit.rlim_max = f;
1137 if (setrlimit(RLIMIT_NOFILE,&limit) != -1) break;
1138 f -= 128;
1139 }
1140 if (f < oldlimit) f = oldlimit;
1141 if (f != maxfiles) {
1142 server.maxclients = f-32;
1143 redisLog(REDIS_WARNING,"Unable to set the max number of files limit to %d (%s), setting the max clients configuration to %d.",
1144 (int) maxfiles, strerror(errno), (int) server.maxclients);
1145 } else {
1146 redisLog(REDIS_NOTICE,"Max number of open files set to %d",
1147 (int) maxfiles);
1148 }
1149 }
1150 }
1151 }
1152
1153 void initServer() {
1154 int j;
1155
1156 signal(SIGHUP, SIG_IGN);
1157 signal(SIGPIPE, SIG_IGN);
1158 setupSignalHandlers();
1159
1160 if (server.syslog_enabled) {
1161 openlog(server.syslog_ident, LOG_PID | LOG_NDELAY | LOG_NOWAIT,
1162 server.syslog_facility);
1163 }
1164
1165 server.current_client = NULL;
1166 server.clients = listCreate();
1167 server.clients_to_close = listCreate();
1168 server.slaves = listCreate();
1169 server.monitors = listCreate();
1170 server.unblocked_clients = listCreate();
1171
1172 createSharedObjects();
1173 adjustOpenFilesLimit();
1174 server.el = aeCreateEventLoop(server.maxclients+1024);
1175 server.db = zmalloc(sizeof(redisDb)*server.dbnum);
1176
1177 if (server.port != 0) {
1178 server.ipfd = anetTcpServer(server.neterr,server.port,server.bindaddr);
1179 if (server.ipfd == ANET_ERR) {
1180 redisLog(REDIS_WARNING, "Opening port %d: %s",
1181 server.port, server.neterr);
1182 exit(1);
1183 }
1184 }
1185 if (server.unixsocket != NULL) {
1186 unlink(server.unixsocket); /* don't care if this fails */
1187 server.sofd = anetUnixServer(server.neterr,server.unixsocket,server.unixsocketperm);
1188 if (server.sofd == ANET_ERR) {
1189 redisLog(REDIS_WARNING, "Opening socket: %s", server.neterr);
1190 exit(1);
1191 }
1192 }
1193 if (server.ipfd < 0 && server.sofd < 0) {
1194 redisLog(REDIS_WARNING, "Configured to not listen anywhere, exiting.");
1195 exit(1);
1196 }
1197 for (j = 0; j < server.dbnum; j++) {
1198 server.db[j].dict = dictCreate(&dbDictType,NULL);
1199 server.db[j].expires = dictCreate(&keyptrDictType,NULL);
1200 server.db[j].blocking_keys = dictCreate(&keylistDictType,NULL);
1201 server.db[j].watched_keys = dictCreate(&keylistDictType,NULL);
1202 server.db[j].id = j;
1203 }
1204 server.pubsub_channels = dictCreate(&keylistDictType,NULL);
1205 server.pubsub_patterns = listCreate();
1206 listSetFreeMethod(server.pubsub_patterns,freePubsubPattern);
1207 listSetMatchMethod(server.pubsub_patterns,listMatchPubsubPattern);
1208 server.cronloops = 0;
1209 server.rdb_child_pid = -1;
1210 server.aof_child_pid = -1;
1211 server.aof_rewrite_buf = sdsempty();
1212 server.aof_buf = sdsempty();
1213 server.lastsave = time(NULL);
1214 server.dirty = 0;
1215 server.stat_numcommands = 0;
1216 server.stat_numconnections = 0;
1217 server.stat_expiredkeys = 0;
1218 server.stat_evictedkeys = 0;
1219 server.stat_starttime = time(NULL);
1220 server.stat_keyspace_misses = 0;
1221 server.stat_keyspace_hits = 0;
1222 server.stat_peak_memory = 0;
1223 server.stat_fork_time = 0;
1224 server.stat_rejected_conn = 0;
1225 memset(server.ops_sec_samples,0,sizeof(server.ops_sec_samples));
1226 server.ops_sec_idx = 0;
1227 server.ops_sec_last_sample_time = mstime();
1228 server.ops_sec_last_sample_ops = 0;
1229 server.unixtime = time(NULL);
1230 server.lastbgsave_status = REDIS_OK;
1231 server.stop_writes_on_bgsave_err = 1;
1232 aeCreateTimeEvent(server.el, 1, serverCron, NULL, NULL);
1233 if (server.ipfd > 0 && aeCreateFileEvent(server.el,server.ipfd,AE_READABLE,
1234 acceptTcpHandler,NULL) == AE_ERR) oom("creating file event");
1235 if (server.sofd > 0 && aeCreateFileEvent(server.el,server.sofd,AE_READABLE,
1236 acceptUnixHandler,NULL) == AE_ERR) oom("creating file event");
1237
1238 if (server.aof_state == REDIS_AOF_ON) {
1239 server.aof_fd = open(server.aof_filename,
1240 O_WRONLY|O_APPEND|O_CREAT,0644);
1241 if (server.aof_fd == -1) {
1242 redisLog(REDIS_WARNING, "Can't open the append-only file: %s",
1243 strerror(errno));
1244 exit(1);
1245 }
1246 }
1247
1248 /* 32 bit instances are limited to 4GB of address space, so if there is
1249 * no explicit limit in the user provided configuration we set a limit
1250 * at 3.5GB using maxmemory with 'noeviction' policy'. This saves
1251 * useless crashes of the Redis instance. */
1252 if (server.arch_bits == 32 && server.maxmemory == 0) {
1253 redisLog(REDIS_WARNING,"Warning: 32 bit instance detected but no memory limit set. Setting 3.5 GB maxmemory limit with 'noeviction' policy now.");
1254 server.maxmemory = 3584LL*(1024*1024); /* 3584 MB = 3.5 GB */
1255 server.maxmemory_policy = REDIS_MAXMEMORY_NO_EVICTION;
1256 }
1257
1258 scriptingInit();
1259 slowlogInit();
1260 bioInit();
1261 }
1262
1263 /* Populates the Redis Command Table starting from the hard coded list
1264 * we have on top of redis.c file. */
1265 void populateCommandTable(void) {
1266 int j;
1267 int numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1268
1269 for (j = 0; j < numcommands; j++) {
1270 struct redisCommand *c = redisCommandTable+j;
1271 char *f = c->sflags;
1272 int retval;
1273
1274 while(*f != '\0') {
1275 switch(*f) {
1276 case 'w': c->flags |= REDIS_CMD_WRITE; break;
1277 case 'r': c->flags |= REDIS_CMD_READONLY; break;
1278 case 'm': c->flags |= REDIS_CMD_DENYOOM; break;
1279 case 'a': c->flags |= REDIS_CMD_ADMIN; break;
1280 case 'p': c->flags |= REDIS_CMD_PUBSUB; break;
1281 case 'f': c->flags |= REDIS_CMD_FORCE_REPLICATION; break;
1282 case 's': c->flags |= REDIS_CMD_NOSCRIPT; break;
1283 case 'R': c->flags |= REDIS_CMD_RANDOM; break;
1284 case 'S': c->flags |= REDIS_CMD_SORT_FOR_SCRIPT; break;
1285 default: redisPanic("Unsupported command flag"); break;
1286 }
1287 f++;
1288 }
1289
1290 retval = dictAdd(server.commands, sdsnew(c->name), c);
1291 assert(retval == DICT_OK);
1292 }
1293 }
1294
1295 void resetCommandTableStats(void) {
1296 int numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1297 int j;
1298
1299 for (j = 0; j < numcommands; j++) {
1300 struct redisCommand *c = redisCommandTable+j;
1301
1302 c->microseconds = 0;
1303 c->calls = 0;
1304 }
1305 }
1306
1307 /* ========================== Redis OP Array API ============================ */
1308
1309 void redisOpArrayInit(redisOpArray *oa) {
1310 oa->ops = NULL;
1311 oa->numops = 0;
1312 }
1313
1314 int redisOpArrayAppend(redisOpArray *oa, struct redisCommand *cmd, int dbid,
1315 robj **argv, int argc, int target)
1316 {
1317 redisOp *op;
1318
1319 oa->ops = zrealloc(oa->ops,sizeof(redisOp)*(oa->numops+1));
1320 op = oa->ops+oa->numops;
1321 op->cmd = cmd;
1322 op->dbid = dbid;
1323 op->argv = argv;
1324 op->argc = argc;
1325 op->target = target;
1326 oa->numops++;
1327 return oa->numops;
1328 }
1329
1330 void redisOpArrayFree(redisOpArray *oa) {
1331 while(oa->numops) {
1332 int j;
1333 redisOp *op;
1334
1335 oa->numops--;
1336 op = oa->ops+oa->numops;
1337 for (j = 0; j < op->argc; j++)
1338 decrRefCount(op->argv[j]);
1339 zfree(op->argv);
1340 }
1341 zfree(oa->ops);
1342 }
1343
1344 /* ====================== Commands lookup and execution ===================== */
1345
1346 struct redisCommand *lookupCommand(sds name) {
1347 return dictFetchValue(server.commands, name);
1348 }
1349
1350 struct redisCommand *lookupCommandByCString(char *s) {
1351 struct redisCommand *cmd;
1352 sds name = sdsnew(s);
1353
1354 cmd = dictFetchValue(server.commands, name);
1355 sdsfree(name);
1356 return cmd;
1357 }
1358
1359 /* Propagate the specified command (in the context of the specified database id)
1360 * to AOF, Slaves and Monitors.
1361 *
1362 * flags are an xor between:
1363 * + REDIS_PROPAGATE_NONE (no propagation of command at all)
1364 * + REDIS_PROPAGATE_AOF (propagate into the AOF file if is enabled)
1365 * + REDIS_PROPAGATE_REPL (propagate into the replication link)
1366 */
1367 void propagate(struct redisCommand *cmd, int dbid, robj **argv, int argc,
1368 int flags)
1369 {
1370 if (server.aof_state != REDIS_AOF_OFF && flags & REDIS_PROPAGATE_AOF)
1371 feedAppendOnlyFile(cmd,dbid,argv,argc);
1372 if (flags & REDIS_PROPAGATE_REPL && listLength(server.slaves))
1373 replicationFeedSlaves(server.slaves,dbid,argv,argc);
1374 }
1375
1376 /* Used inside commands to schedule the propagation of additional commands
1377 * after the current command is propagated to AOF / Replication. */
1378 void alsoPropagate(struct redisCommand *cmd, int dbid, robj **argv, int argc,
1379 int target)
1380 {
1381 redisOpArrayAppend(&server.also_propagate,cmd,dbid,argv,argc,target);
1382 }
1383
1384 /* Call() is the core of Redis execution of a command */
1385 void call(redisClient *c, int flags) {
1386 long long dirty, start = ustime(), duration;
1387
1388 /* Sent the command to clients in MONITOR mode, only if the commands are
1389 * not geneated from reading an AOF. */
1390 if (listLength(server.monitors) && !server.loading)
1391 replicationFeedMonitors(c,server.monitors,c->db->id,c->argv,c->argc);
1392
1393 /* Call the command. */
1394 redisOpArrayInit(&server.also_propagate);
1395 dirty = server.dirty;
1396 c->cmd->proc(c);
1397 dirty = server.dirty-dirty;
1398 duration = ustime()-start;
1399
1400 /* When EVAL is called loading the AOF we don't want commands called
1401 * from Lua to go into the slowlog or to populate statistics. */
1402 if (server.loading && c->flags & REDIS_LUA_CLIENT)
1403 flags &= ~(REDIS_CALL_SLOWLOG | REDIS_CALL_STATS);
1404
1405 /* Log the command into the Slow log if needed, and populate the
1406 * per-command statistics that we show in INFO commandstats. */
1407 if (flags & REDIS_CALL_SLOWLOG)
1408 slowlogPushEntryIfNeeded(c->argv,c->argc,duration);
1409 if (flags & REDIS_CALL_STATS) {
1410 c->cmd->microseconds += duration;
1411 c->cmd->calls++;
1412 }
1413
1414 /* Propagate the command into the AOF and replication link */
1415 if (flags & REDIS_CALL_PROPAGATE) {
1416 int flags = REDIS_PROPAGATE_NONE;
1417
1418 if (c->cmd->flags & REDIS_CMD_FORCE_REPLICATION)
1419 flags |= REDIS_PROPAGATE_REPL;
1420 if (dirty)
1421 flags |= (REDIS_PROPAGATE_REPL | REDIS_PROPAGATE_AOF);
1422 if (flags != REDIS_PROPAGATE_NONE)
1423 propagate(c->cmd,c->db->id,c->argv,c->argc,flags);
1424 }
1425 /* Commands such as LPUSH or BRPOPLPUSH may propagate an additional
1426 * PUSH command. */
1427 if (server.also_propagate.numops) {
1428 int j;
1429 redisOp *rop;
1430
1431 for (j = 0; j < server.also_propagate.numops; j++) {
1432 rop = &server.also_propagate.ops[j];
1433 propagate(rop->cmd, rop->dbid, rop->argv, rop->argc, rop->target);
1434 }
1435 redisOpArrayFree(&server.also_propagate);
1436 }
1437 server.stat_numcommands++;
1438 }
1439
1440 /* If this function gets called we already read a whole
1441 * command, argments are in the client argv/argc fields.
1442 * processCommand() execute the command or prepare the
1443 * server for a bulk read from the client.
1444 *
1445 * If 1 is returned the client is still alive and valid and
1446 * and other operations can be performed by the caller. Otherwise
1447 * if 0 is returned the client was destroied (i.e. after QUIT). */
1448 int processCommand(redisClient *c) {
1449 /* The QUIT command is handled separately. Normal command procs will
1450 * go through checking for replication and QUIT will cause trouble
1451 * when FORCE_REPLICATION is enabled and would be implemented in
1452 * a regular command proc. */
1453 if (!strcasecmp(c->argv[0]->ptr,"quit")) {
1454 addReply(c,shared.ok);
1455 c->flags |= REDIS_CLOSE_AFTER_REPLY;
1456 return REDIS_ERR;
1457 }
1458
1459 /* Now lookup the command and check ASAP about trivial error conditions
1460 * such as wrong arity, bad command name and so forth. */
1461 c->cmd = c->lastcmd = lookupCommand(c->argv[0]->ptr);
1462 if (!c->cmd) {
1463 addReplyErrorFormat(c,"unknown command '%s'",
1464 (char*)c->argv[0]->ptr);
1465 return REDIS_OK;
1466 } else if ((c->cmd->arity > 0 && c->cmd->arity != c->argc) ||
1467 (c->argc < -c->cmd->arity)) {
1468 addReplyErrorFormat(c,"wrong number of arguments for '%s' command",
1469 c->cmd->name);
1470 return REDIS_OK;
1471 }
1472
1473 /* Check if the user is authenticated */
1474 if (server.requirepass && !c->authenticated && c->cmd->proc != authCommand)
1475 {
1476 addReplyError(c,"operation not permitted");
1477 return REDIS_OK;
1478 }
1479
1480 /* Handle the maxmemory directive.
1481 *
1482 * First we try to free some memory if possible (if there are volatile
1483 * keys in the dataset). If there are not the only thing we can do
1484 * is returning an error. */
1485 if (server.maxmemory) {
1486 int retval = freeMemoryIfNeeded();
1487 if ((c->cmd->flags & REDIS_CMD_DENYOOM) && retval == REDIS_ERR) {
1488 addReply(c, shared.oomerr);
1489 return REDIS_OK;
1490 }
1491 }
1492
1493 /* Don't accept write commands if there are problems persisting on disk. */
1494 if (server.stop_writes_on_bgsave_err &&
1495 server.saveparamslen > 0
1496 && server.lastbgsave_status == REDIS_ERR &&
1497 c->cmd->flags & REDIS_CMD_WRITE)
1498 {
1499 addReply(c, shared.bgsaveerr);
1500 return REDIS_OK;
1501 }
1502
1503 /* Don't accept wirte commands if this is a read only slave. But
1504 * accept write commands if this is our master. */
1505 if (server.masterhost && server.repl_slave_ro &&
1506 !(c->flags & REDIS_MASTER) &&
1507 c->cmd->flags & REDIS_CMD_WRITE)
1508 {
1509 addReply(c, shared.roslaveerr);
1510 return REDIS_OK;
1511 }
1512
1513 /* Only allow SUBSCRIBE and UNSUBSCRIBE in the context of Pub/Sub */
1514 if ((dictSize(c->pubsub_channels) > 0 || listLength(c->pubsub_patterns) > 0)
1515 &&
1516 c->cmd->proc != subscribeCommand &&
1517 c->cmd->proc != unsubscribeCommand &&
1518 c->cmd->proc != psubscribeCommand &&
1519 c->cmd->proc != punsubscribeCommand) {
1520 addReplyError(c,"only (P)SUBSCRIBE / (P)UNSUBSCRIBE / QUIT allowed in this context");
1521 return REDIS_OK;
1522 }
1523
1524 /* Only allow INFO and SLAVEOF when slave-serve-stale-data is no and
1525 * we are a slave with a broken link with master. */
1526 if (server.masterhost && server.repl_state != REDIS_REPL_CONNECTED &&
1527 server.repl_serve_stale_data == 0 &&
1528 c->cmd->proc != infoCommand && c->cmd->proc != slaveofCommand)
1529 {
1530 addReplyError(c,
1531 "link with MASTER is down and slave-serve-stale-data is set to no");
1532 return REDIS_OK;
1533 }
1534
1535 /* Loading DB? Return an error if the command is not INFO */
1536 if (server.loading && c->cmd->proc != infoCommand) {
1537 addReply(c, shared.loadingerr);
1538 return REDIS_OK;
1539 }
1540
1541 /* Lua script too slow? Only allow SHUTDOWN NOSAVE and SCRIPT KILL. */
1542 if (server.lua_timedout &&
1543 !(c->cmd->proc != shutdownCommand &&
1544 c->argc == 2 &&
1545 tolower(((char*)c->argv[1]->ptr)[0]) == 'n') &&
1546 !(c->cmd->proc == scriptCommand &&
1547 c->argc == 2 &&
1548 tolower(((char*)c->argv[1]->ptr)[0]) == 'k'))
1549 {
1550 addReply(c, shared.slowscripterr);
1551 return REDIS_OK;
1552 }
1553
1554 /* Exec the command */
1555 if (c->flags & REDIS_MULTI &&
1556 c->cmd->proc != execCommand && c->cmd->proc != discardCommand &&
1557 c->cmd->proc != multiCommand && c->cmd->proc != watchCommand)
1558 {
1559 queueMultiCommand(c);
1560 addReply(c,shared.queued);
1561 } else {
1562 call(c,REDIS_CALL_FULL);
1563 }
1564 return REDIS_OK;
1565 }
1566
1567 /*================================== Shutdown =============================== */
1568
1569 int prepareForShutdown(int flags) {
1570 int save = flags & REDIS_SHUTDOWN_SAVE;
1571 int nosave = flags & REDIS_SHUTDOWN_NOSAVE;
1572
1573 redisLog(REDIS_WARNING,"User requested shutdown...");
1574 /* Kill the saving child if there is a background saving in progress.
1575 We want to avoid race conditions, for instance our saving child may
1576 overwrite the synchronous saving did by SHUTDOWN. */
1577 if (server.rdb_child_pid != -1) {
1578 redisLog(REDIS_WARNING,"There is a child saving an .rdb. Killing it!");
1579 kill(server.rdb_child_pid,SIGKILL);
1580 rdbRemoveTempFile(server.rdb_child_pid);
1581 }
1582 if (server.aof_state != REDIS_AOF_OFF) {
1583 /* Kill the AOF saving child as the AOF we already have may be longer
1584 * but contains the full dataset anyway. */
1585 if (server.aof_child_pid != -1) {
1586 redisLog(REDIS_WARNING,
1587 "There is a child rewriting the AOF. Killing it!");
1588 kill(server.aof_child_pid,SIGKILL);
1589 }
1590 /* Append only file: fsync() the AOF and exit */
1591 redisLog(REDIS_NOTICE,"Calling fsync() on the AOF file.");
1592 aof_fsync(server.aof_fd);
1593 }
1594 if ((server.saveparamslen > 0 && !nosave) || save) {
1595 redisLog(REDIS_NOTICE,"Saving the final RDB snapshot before exiting.");
1596 /* Snapshotting. Perform a SYNC SAVE and exit */
1597 if (rdbSave(server.rdb_filename) != REDIS_OK) {
1598 /* Ooops.. error saving! The best we can do is to continue
1599 * operating. Note that if there was a background saving process,
1600 * in the next cron() Redis will be notified that the background
1601 * saving aborted, handling special stuff like slaves pending for
1602 * synchronization... */
1603 redisLog(REDIS_WARNING,"Error trying to save the DB, can't exit.");
1604 return REDIS_ERR;
1605 }
1606 }
1607 if (server.daemonize) {
1608 redisLog(REDIS_NOTICE,"Removing the pid file.");
1609 unlink(server.pidfile);
1610 }
1611 /* Close the listening sockets. Apparently this allows faster restarts. */
1612 if (server.ipfd != -1) close(server.ipfd);
1613 if (server.sofd != -1) close(server.sofd);
1614 if (server.unixsocket) {
1615 redisLog(REDIS_NOTICE,"Removing the unix socket file.");
1616 unlink(server.unixsocket); /* don't care if this fails */
1617 }
1618
1619 redisLog(REDIS_WARNING,"Redis is now ready to exit, bye bye...");
1620 return REDIS_OK;
1621 }
1622
1623 /*================================== Commands =============================== */
1624
1625 void authCommand(redisClient *c) {
1626 if (!server.requirepass) {
1627 addReplyError(c,"Client sent AUTH, but no password is set");
1628 } else if (!strcmp(c->argv[1]->ptr, server.requirepass)) {
1629 c->authenticated = 1;
1630 addReply(c,shared.ok);
1631 } else {
1632 c->authenticated = 0;
1633 addReplyError(c,"invalid password");
1634 }
1635 }
1636
1637 void pingCommand(redisClient *c) {
1638 addReply(c,shared.pong);
1639 }
1640
1641 void echoCommand(redisClient *c) {
1642 addReplyBulk(c,c->argv[1]);
1643 }
1644
1645 void timeCommand(redisClient *c) {
1646 struct timeval tv;
1647
1648 /* gettimeofday() can only fail if &tv is a bad addresss so we
1649 * don't check for errors. */
1650 gettimeofday(&tv,NULL);
1651 addReplyMultiBulkLen(c,2);
1652 addReplyBulkLongLong(c,tv.tv_sec);
1653 addReplyBulkLongLong(c,tv.tv_usec);
1654 }
1655
/* Convert an amount of bytes into a human readable string in the form
 * of 100B, 4.00K, 100.00M, 2.00G, 1.50T, 3.00P, and so forth.
 *
 * 's' is the destination buffer, provided by the caller, and 'n' is the
 * number of bytes. Values below 1024 are printed as an integer followed
 * by 'B'; larger values are divided by the biggest power of 1024 that
 * fits and printed with two decimals. Values of 1024 petabytes or more
 * fall back to the plain byte count, so 's' is always written. The
 * longest possible output is 21 characters plus the terminator. */
void bytesToHuman(char *s, unsigned long long n) {
    double d;

    if (n < 1024) {
        /* Bytes */
        sprintf(s,"%lluB",n);
    } else if (n < (1024*1024)) {
        d = (double)n/(1024);
        sprintf(s,"%.2fK",d);
    } else if (n < (1024LL*1024*1024)) {
        d = (double)n/(1024*1024);
        sprintf(s,"%.2fM",d);
    } else if (n < (1024LL*1024*1024*1024)) {
        d = (double)n/(1024LL*1024*1024);
        sprintf(s,"%.2fG",d);
    } else if (n < (1024LL*1024*1024*1024*1024)) {
        d = (double)n/(1024LL*1024*1024*1024);
        sprintf(s,"%.2fT",d);
    } else if (n < (1024LL*1024*1024*1024*1024*1024)) {
        d = (double)n/(1024LL*1024*1024*1024*1024);
        sprintf(s,"%.2fP",d);
    } else {
        /* Too big for the units above: print the raw number of bytes
         * instead of leaving the buffer untouched. */
        sprintf(s,"%lluB",n);
    }
}
1676
1677 /* Create the string returned by the INFO command. This is decoupled
1678 * by the INFO command itself as we need to report the same information
1679 * on memory corruption problems. */
1680 sds genRedisInfoString(char *section) {
1681 sds info = sdsempty();
1682 time_t uptime = server.unixtime-server.stat_starttime;
1683 int j, numcommands;
1684 struct rusage self_ru, c_ru;
1685 unsigned long lol, bib;
1686 int allsections = 0, defsections = 0;
1687 int sections = 0;
1688
1689 if (section) {
1690 allsections = strcasecmp(section,"all") == 0;
1691 defsections = strcasecmp(section,"default") == 0;
1692 }
1693
1694 getrusage(RUSAGE_SELF, &self_ru);
1695 getrusage(RUSAGE_CHILDREN, &c_ru);
1696 getClientsMaxBuffers(&lol,&bib);
1697
1698 /* Server */
1699 if (allsections || defsections || !strcasecmp(section,"server")) {
1700 if (sections++) info = sdscat(info,"\r\n");
1701 info = sdscatprintf(info,
1702 "# Server\r\n"
1703 "redis_version:%s\r\n"
1704 "redis_git_sha1:%s\r\n"
1705 "redis_git_dirty:%d\r\n"
1706 "arch_bits:%d\r\n"
1707 "multiplexing_api:%s\r\n"
1708 "gcc_version:%d.%d.%d\r\n"
1709 "process_id:%ld\r\n"
1710 "run_id:%s\r\n"
1711 "tcp_port:%d\r\n"
1712 "uptime_in_seconds:%ld\r\n"
1713 "uptime_in_days:%ld\r\n"
1714 "lru_clock:%ld\r\n",
1715 REDIS_VERSION,
1716 redisGitSHA1(),
1717 strtol(redisGitDirty(),NULL,10) > 0,
1718 server.arch_bits,
1719 aeGetApiName(),
1720 #ifdef __GNUC__
1721 __GNUC__,__GNUC_MINOR__,__GNUC_PATCHLEVEL__,
1722 #else
1723 0,0,0,
1724 #endif
1725 (long) getpid(),
1726 server.runid,
1727 server.port,
1728 uptime,
1729 uptime/(3600*24),
1730 (unsigned long) server.lruclock);
1731 }
1732
1733 /* Clients */
1734 if (allsections || defsections || !strcasecmp(section,"clients")) {
1735 if (sections++) info = sdscat(info,"\r\n");
1736 info = sdscatprintf(info,
1737 "# Clients\r\n"
1738 "connected_clients:%lu\r\n"
1739 "client_longest_output_list:%lu\r\n"
1740 "client_biggest_input_buf:%lu\r\n"
1741 "blocked_clients:%d\r\n",
1742 listLength(server.clients)-listLength(server.slaves),
1743 lol, bib,
1744 server.bpop_blocked_clients);
1745 }
1746
1747 /* Memory */
1748 if (allsections || defsections || !strcasecmp(section,"memory")) {
1749 char hmem[64];
1750 char peak_hmem[64];
1751
1752 bytesToHuman(hmem,zmalloc_used_memory());
1753 bytesToHuman(peak_hmem,server.stat_peak_memory);
1754 if (sections++) info = sdscat(info,"\r\n");
1755 info = sdscatprintf(info,
1756 "# Memory\r\n"
1757 "used_memory:%zu\r\n"
1758 "used_memory_human:%s\r\n"
1759 "used_memory_rss:%zu\r\n"
1760 "used_memory_peak:%zu\r\n"
1761 "used_memory_peak_human:%s\r\n"
1762 "used_memory_lua:%lld\r\n"
1763 "mem_fragmentation_ratio:%.2f\r\n"
1764 "mem_allocator:%s\r\n",
1765 zmalloc_used_memory(),
1766 hmem,
1767 zmalloc_get_rss(),
1768 server.stat_peak_memory,
1769 peak_hmem,
1770 ((long long)lua_gc(server.lua,LUA_GCCOUNT,0))*1024LL,
1771 zmalloc_get_fragmentation_ratio(),
1772 ZMALLOC_LIB
1773 );
1774 }
1775
1776 /* Persistence */
1777 if (allsections || defsections || !strcasecmp(section,"persistence")) {
1778 if (sections++) info = sdscat(info,"\r\n");
1779 info = sdscatprintf(info,
1780 "# Persistence\r\n"
1781 "loading:%d\r\n"
1782 "aof_enabled:%d\r\n"
1783 "changes_since_last_save:%lld\r\n"
1784 "bgsave_in_progress:%d\r\n"
1785 "last_save_time:%ld\r\n"
1786 "last_bgsave_status:%s\r\n"
1787 "bgrewriteaof_in_progress:%d\r\n",
1788 server.loading,
1789 server.aof_state != REDIS_AOF_OFF,
1790 server.dirty,
1791 server.rdb_child_pid != -1,
1792 server.lastsave,
1793 server.lastbgsave_status == REDIS_OK ? "ok" : "err",
1794 server.aof_child_pid != -1);
1795
1796 if (server.aof_state != REDIS_AOF_OFF) {
1797 info = sdscatprintf(info,
1798 "aof_current_size:%lld\r\n"
1799 "aof_base_size:%lld\r\n"
1800 "aof_pending_rewrite:%d\r\n"
1801 "aof_buffer_length:%zu\r\n"
1802 "aof_pending_bio_fsync:%llu\r\n"
1803 "aof_delayed_fsync:%lu\r\n",
1804 (long long) server.aof_current_size,
1805 (long long) server.aof_rewrite_base_size,
1806 server.aof_rewrite_scheduled,
1807 sdslen(server.aof_buf),
1808 bioPendingJobsOfType(REDIS_BIO_AOF_FSYNC),
1809 server.aof_delayed_fsync);
1810 }
1811
1812 if (server.loading) {
1813 double perc;
1814 time_t eta, elapsed;
1815 off_t remaining_bytes = server.loading_total_bytes-
1816 server.loading_loaded_bytes;
1817
1818 perc = ((double)server.loading_loaded_bytes /
1819 server.loading_total_bytes) * 100;
1820
1821 elapsed = server.unixtime-server.loading_start_time;
1822 if (elapsed == 0) {
1823 eta = 1; /* A fake 1 second figure if we don't have
1824 enough info */
1825 } else {
1826 eta = (elapsed*remaining_bytes)/server.loading_loaded_bytes;
1827 }
1828
1829 info = sdscatprintf(info,
1830 "loading_start_time:%ld\r\n"
1831 "loading_total_bytes:%llu\r\n"
1832 "loading_loaded_bytes:%llu\r\n"
1833 "loading_loaded_perc:%.2f\r\n"
1834 "loading_eta_seconds:%ld\r\n"
1835 ,(unsigned long) server.loading_start_time,
1836 (unsigned long long) server.loading_total_bytes,
1837 (unsigned long long) server.loading_loaded_bytes,
1838 perc,
1839 eta
1840 );
1841 }
1842 }
1843
1844 /* Stats */
1845 if (allsections || defsections || !strcasecmp(section,"stats")) {
1846 if (sections++) info = sdscat(info,"\r\n");
1847 info = sdscatprintf(info,
1848 "# Stats\r\n"
1849 "total_connections_received:%lld\r\n"
1850 "total_commands_processed:%lld\r\n"
1851 "instantaneous_ops_per_sec:%lld\r\n"
1852 "rejected_connections:%lld\r\n"
1853 "expired_keys:%lld\r\n"
1854 "evicted_keys:%lld\r\n"
1855 "keyspace_hits:%lld\r\n"
1856 "keyspace_misses:%lld\r\n"
1857 "pubsub_channels:%ld\r\n"
1858 "pubsub_patterns:%lu\r\n"
1859 "latest_fork_usec:%lld\r\n",
1860 server.stat_numconnections,
1861 server.stat_numcommands,
1862 getOperationsPerSecond(),
1863 server.stat_rejected_conn,
1864 server.stat_expiredkeys,
1865 server.stat_evictedkeys,
1866 server.stat_keyspace_hits,
1867 server.stat_keyspace_misses,
1868 dictSize(server.pubsub_channels),
1869 listLength(server.pubsub_patterns),
1870 server.stat_fork_time);
1871 }
1872
1873 /* Replication */
1874 if (allsections || defsections || !strcasecmp(section,"replication")) {
1875 if (sections++) info = sdscat(info,"\r\n");
1876 info = sdscatprintf(info,
1877 "# Replication\r\n"
1878 "role:%s\r\n",
1879 server.masterhost == NULL ? "master" : "slave");
1880 if (server.masterhost) {
1881 info = sdscatprintf(info,
1882 "master_host:%s\r\n"
1883 "master_port:%d\r\n"
1884 "master_link_status:%s\r\n"
1885 "master_last_io_seconds_ago:%d\r\n"
1886 "master_sync_in_progress:%d\r\n"
1887 ,server.masterhost,
1888 server.masterport,
1889 (server.repl_state == REDIS_REPL_CONNECTED) ?
1890 "up" : "down",
1891 server.master ?
1892 ((int)(server.unixtime-server.master->lastinteraction)) : -1,
1893 server.repl_state == REDIS_REPL_TRANSFER
1894 );
1895
1896 if (server.repl_state == REDIS_REPL_TRANSFER) {
1897 info = sdscatprintf(info,
1898 "master_sync_left_bytes:%ld\r\n"
1899 "master_sync_last_io_seconds_ago:%d\r\n"
1900 ,(long)server.repl_transfer_left,
1901 (int)(server.unixtime-server.repl_transfer_lastio)
1902 );
1903 }
1904
1905 if (server.repl_state != REDIS_REPL_CONNECTED) {
1906 info = sdscatprintf(info,
1907 "master_link_down_since_seconds:%ld\r\n",
1908 (long)server.unixtime-server.repl_down_since);
1909 }
1910 }
1911 info = sdscatprintf(info,
1912 "connected_slaves:%lu\r\n",
1913 listLength(server.slaves));
1914 if (listLength(server.slaves)) {
1915 int slaveid = 0;
1916 listNode *ln;
1917 listIter li;
1918
1919 listRewind(server.slaves,&li);
1920 while((ln = listNext(&li))) {
1921 redisClient *slave = listNodeValue(ln);
1922 char *state = NULL;
1923 char ip[32];
1924 int port;
1925
1926 if (anetPeerToString(slave->fd,ip,&port) == -1) continue;
1927 switch(slave->replstate) {
1928 case REDIS_REPL_WAIT_BGSAVE_START:
1929 case REDIS_REPL_WAIT_BGSAVE_END:
1930 state = "wait_bgsave";
1931 break;
1932 case REDIS_REPL_SEND_BULK:
1933 state = "send_bulk";
1934 break;
1935 case REDIS_REPL_ONLINE:
1936 state = "online";
1937 break;
1938 }
1939 if (state == NULL) continue;
1940 info = sdscatprintf(info,"slave%d:%s,%d,%s\r\n",
1941 slaveid,ip,port,state);
1942 slaveid++;
1943 }
1944 }
1945 }
1946
1947 /* CPU */
1948 if (allsections || defsections || !strcasecmp(section,"cpu")) {
1949 if (sections++) info = sdscat(info,"\r\n");
1950 info = sdscatprintf(info,
1951 "# CPU\r\n"
1952 "used_cpu_sys:%.2f\r\n"
1953 "used_cpu_user:%.2f\r\n"
1954 "used_cpu_sys_children:%.2f\r\n"
1955 "used_cpu_user_children:%.2f\r\n",
1956 (float)self_ru.ru_stime.tv_sec+(float)self_ru.ru_stime.tv_usec/1000000,
1957 (float)self_ru.ru_utime.tv_sec+(float)self_ru.ru_utime.tv_usec/1000000,
1958 (float)c_ru.ru_stime.tv_sec+(float)c_ru.ru_stime.tv_usec/1000000,
1959 (float)c_ru.ru_utime.tv_sec+(float)c_ru.ru_utime.tv_usec/1000000);
1960 }
1961
1962 /* cmdtime */
1963 if (allsections || !strcasecmp(section,"commandstats")) {
1964 if (sections++) info = sdscat(info,"\r\n");
1965 info = sdscatprintf(info, "# Commandstats\r\n");
1966 numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
1967 for (j = 0; j < numcommands; j++) {
1968 struct redisCommand *c = redisCommandTable+j;
1969
1970 if (!c->calls) continue;
1971 info = sdscatprintf(info,
1972 "cmdstat_%s:calls=%lld,usec=%lld,usec_per_call=%.2f\r\n",
1973 c->name, c->calls, c->microseconds,
1974 (c->calls == 0) ? 0 : ((float)c->microseconds/c->calls));
1975 }
1976 }
1977
1978 /* Key space */
1979 if (allsections || defsections || !strcasecmp(section,"keyspace")) {
1980 if (sections++) info = sdscat(info,"\r\n");
1981 info = sdscatprintf(info, "# Keyspace\r\n");
1982 for (j = 0; j < server.dbnum; j++) {
1983 long long keys, vkeys;
1984
1985 keys = dictSize(server.db[j].dict);
1986 vkeys = dictSize(server.db[j].expires);
1987 if (keys || vkeys) {
1988 info = sdscatprintf(info, "db%d:keys=%lld,expires=%lld\r\n",
1989 j, keys, vkeys);
1990 }
1991 }
1992 }
1993 return info;
1994 }
1995
1996 void infoCommand(redisClient *c) {
1997 char *section = c->argc == 2 ? c->argv[1]->ptr : "default";
1998
1999 if (c->argc > 2) {
2000 addReply(c,shared.syntaxerr);
2001 return;
2002 }
2003 sds info = genRedisInfoString(section);
2004 addReplySds(c,sdscatprintf(sdsempty(),"$%lu\r\n",
2005 (unsigned long)sdslen(info)));
2006 addReplySds(c,info);
2007 addReply(c,shared.crlf);
2008 }
2009
2010 void monitorCommand(redisClient *c) {
2011 /* ignore MONITOR if aleady slave or in monitor mode */
2012 if (c->flags & REDIS_SLAVE) return;
2013
2014 c->flags |= (REDIS_SLAVE|REDIS_MONITOR);
2015 c->slaveseldb = 0;
2016 listAddNodeTail(server.monitors,c);
2017 addReply(c,shared.ok);
2018 }
2019
2020 /* ============================ Maxmemory directive ======================== */
2021
2022 /* This function gets called when 'maxmemory' is set on the config file to limit
2023 * the max memory used by the server, before processing a command.
2024 *
2025 * The goal of the function is to free enough memory to keep Redis under the
2026 * configured memory limit.
2027 *
2028 * The function starts calculating how many bytes should be freed to keep
2029 * Redis under the limit, and enters a loop selecting the best keys to
2030 * evict accordingly to the configured policy.
2031 *
2032 * If all the bytes needed to return back under the limit were freed the
2033 * function returns REDIS_OK, otherwise REDIS_ERR is returned, and the caller
2034 * should block the execution of commands that will result in more memory
2035 * used by the server.
2036 */
2037 int freeMemoryIfNeeded(void) {
2038 size_t mem_used, mem_tofree, mem_freed;
2039 int slaves = listLength(server.slaves);
2040
2041 /* Remove the size of slaves output buffers and AOF buffer from the
2042 * count of used memory. */
2043 mem_used = zmalloc_used_memory();
2044 if (slaves) {
2045 listIter li;
2046 listNode *ln;
2047
2048 listRewind(server.slaves,&li);
2049 while((ln = listNext(&li))) {
2050 redisClient *slave = listNodeValue(ln);
2051 unsigned long obuf_bytes = getClientOutputBufferMemoryUsage(slave);
2052 if (obuf_bytes > mem_used)
2053 mem_used = 0;
2054 else
2055 mem_used -= obuf_bytes;
2056 }
2057 }
2058 if (server.aof_state != REDIS_AOF_OFF) {
2059 mem_used -= sdslen(server.aof_buf);
2060 mem_used -= sdslen(server.aof_rewrite_buf);
2061 }
2062
2063 /* Check if we are over the memory limit. */
2064 if (mem_used <= server.maxmemory) return REDIS_OK;
2065
2066 if (server.maxmemory_policy == REDIS_MAXMEMORY_NO_EVICTION)
2067 return REDIS_ERR; /* We need to free memory, but policy forbids. */
2068
2069 /* Compute how much memory we need to free. */
2070 mem_tofree = mem_used - server.maxmemory;
2071 mem_freed = 0;
2072 while (mem_freed < mem_tofree) {
2073 int j, k, keys_freed = 0;
2074
2075 for (j = 0; j < server.dbnum; j++) {
2076 long bestval = 0; /* just to prevent warning */
2077 sds bestkey = NULL;
2078 struct dictEntry *de;
2079 redisDb *db = server.db+j;
2080 dict *dict;
2081
2082 if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_LRU ||
2083 server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_RANDOM)
2084 {
2085 dict = server.db[j].dict;
2086 } else {
2087 dict = server.db[j].expires;
2088 }
2089 if (dictSize(dict) == 0) continue;
2090
2091 /* volatile-random and allkeys-random policy */
2092 if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_RANDOM ||
2093 server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_RANDOM)
2094 {
2095 de = dictGetRandomKey(dict);
2096 bestkey = dictGetKey(de);
2097 }
2098
2099 /* volatile-lru and allkeys-lru policy */
2100 else if (server.maxmemory_policy == REDIS_MAXMEMORY_ALLKEYS_LRU ||
2101 server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_LRU)
2102 {
2103 for (k = 0; k < server.maxmemory_samples; k++) {
2104 sds thiskey;
2105 long thisval;
2106 robj *o;
2107
2108 de = dictGetRandomKey(dict);
2109 thiskey = dictGetKey(de);
2110 /* When policy is volatile-lru we need an additonal lookup
2111 * to locate the real key, as dict is set to db->expires. */
2112 if (server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_LRU)
2113 de = dictFind(db->dict, thiskey);
2114 o = dictGetVal(de);
2115 thisval = estimateObjectIdleTime(o);
2116
2117 /* Higher idle time is better candidate for deletion */
2118 if (bestkey == NULL || thisval > bestval) {
2119 bestkey = thiskey;
2120 bestval = thisval;
2121 }
2122 }
2123 }
2124
2125 /* volatile-ttl */
2126 else if (server.maxmemory_policy == REDIS_MAXMEMORY_VOLATILE_TTL) {
2127 for (k = 0; k < server.maxmemory_samples; k++) {
2128 sds thiskey;
2129 long thisval;
2130
2131 de = dictGetRandomKey(dict);
2132 thiskey = dictGetKey(de);
2133 thisval = (long) dictGetVal(de);
2134
2135 /* Expire sooner (minor expire unix timestamp) is better
2136 * candidate for deletion */
2137 if (bestkey == NULL || thisval < bestval) {
2138 bestkey = thiskey;
2139 bestval = thisval;
2140 }
2141 }
2142 }
2143
2144 /* Finally remove the selected key. */
2145 if (bestkey) {
2146 long long delta;
2147
2148 robj *keyobj = createStringObject(bestkey,sdslen(bestkey));
2149 propagateExpire(db,keyobj);
2150 /* We compute the amount of memory freed by dbDelete() alone.
2151 * It is possible that actually the memory needed to propagate
2152 * the DEL in AOF and replication link is greater than the one
2153 * we are freeing removing the key, but we can't account for
2154 * that otherwise we would never exit the loop.
2155 *
2156 * AOF and Output buffer memory will be freed eventually so
2157 * we only care about memory used by the key space. */
2158 delta = (long long) zmalloc_used_memory();
2159 dbDelete(db,keyobj);
2160 delta -= (long long) zmalloc_used_memory();
2161 mem_freed += delta;
2162 server.stat_evictedkeys++;
2163 decrRefCount(keyobj);
2164 keys_freed++;
2165
2166 /* When the memory to free starts to be big enough, we may
2167 * start spending so much time here that is impossible to
2168 * deliver data to the slaves fast enough, so we force the
2169 * transmission here inside the loop. */
2170 if (slaves) flushSlavesOutputBuffers();
2171 }
2172 }
2173 if (!keys_freed) return REDIS_ERR; /* nothing to free... */
2174 }
2175 return REDIS_OK;
2176 }
2177
2178 /* =================================== Main! ================================ */
2179
2180 #ifdef __linux__
/* Read /proc/sys/vm/overcommit_memory and return its content converted
 * with atoi(). Returns -1 if the file can't be opened or no line can be
 * read from it. */
int linuxOvercommitMemoryValue(void) {
    char line[64];
    int value = -1;
    FILE *fp = fopen("/proc/sys/vm/overcommit_memory","r");

    if (fp == NULL) return -1;
    if (fgets(line,sizeof(line),fp) != NULL) value = atoi(line);
    fclose(fp);
    return value;
}
2194
2195 void linuxOvercommitMemoryWarning(void) {
2196 if (linuxOvercommitMemoryValue() == 0) {
2197 redisLog(REDIS_WARNING,"WARNING overcommit_memory is set to 0! Background save may fail under low memory condition. To fix this issue add 'vm.overcommit_memory = 1' to /etc/sysctl.conf and then reboot or run the command 'sysctl vm.overcommit_memory=1' for this to take effect.");
2198 }
2199 }
2200 #endif /* __linux__ */
2201
2202 void createPidFile(void) {
2203 /* Try to write the pid file in a best-effort way. */
2204 FILE *fp = fopen(server.pidfile,"w");
2205 if (fp) {
2206 fprintf(fp,"%d\n",(int)getpid());
2207 fclose(fp);
2208 }
2209 }
2210
/* Detach the process from the controlling terminal: fork, let the parent
 * exit, start a new session in the child and point stdin, stdout and
 * stderr to /dev/null.
 *
 * If fork() fails the error is reported on stderr and the process exits
 * with status 1, so that whoever launched the server does not mistake a
 * failed start for a successful one. */
void daemonize(void) {
    int fd;
    pid_t pid = fork();

    if (pid == -1) {
        fprintf(stderr,"Can't daemonize, fork() failed: %s\n",
            strerror(errno));
        exit(1);
    }
    if (pid != 0) exit(0); /* parent exits */
    setsid(); /* create a new session */

    /* Every output goes to /dev/null. If Redis is daemonized but
     * the 'logfile' is set to 'stdout' in the configuration file
     * it will not log at all. */
    if ((fd = open("/dev/null", O_RDWR, 0)) != -1) {
        dup2(fd, STDIN_FILENO);
        dup2(fd, STDOUT_FILENO);
        dup2(fd, STDERR_FILENO);
        /* Don't close the descriptor if it is one of the standard ones
         * we have just set up. */
        if (fd > STDERR_FILENO) close(fd);
    }
}
2227
2228 void version() {
2229 printf("Redis server v=%s sha=%s:%d malloc=%s\n", REDIS_VERSION,
2230 redisGitSHA1(), atoi(redisGitDirty()) > 0, ZMALLOC_LIB);
2231 exit(0);
2232 }
2233
/* Print the command line help on stderr and exit with status 1. */
void usage() {
    static const char *const help_lines[] = {
        "Usage: ./redis-server [/path/to/redis.conf] [options]\n",
        " ./redis-server - (read config from stdin)\n",
        " ./redis-server -v or --version\n",
        " ./redis-server -h or --help\n",
        " ./redis-server --test-memory <megabytes>\n\n",
        "Examples:\n",
        " ./redis-server (run the server with default conf)\n",
        " ./redis-server /etc/redis/6379.conf\n",
        " ./redis-server --port 7777\n",
        " ./redis-server --port 7777 --slaveof 127.0.0.1 8888\n",
        " ./redis-server /etc/myredis.conf --loglevel verbose\n"
    };
    size_t i;

    /* None of the lines contains a conversion specification, so writing
     * them verbatim produces the same bytes as formatting them. */
    for (i = 0; i < sizeof(help_lines)/sizeof(help_lines[0]); i++)
        fputs(help_lines[i],stderr);
    exit(1);
}
2248
2249 void redisAsciiArt(void) {
2250 #include "asciilogo.h"
2251 char *buf = zmalloc(1024*16);
2252
2253 snprintf(buf,1024*16,ascii_logo,
2254 REDIS_VERSION,
2255 redisGitSHA1(),
2256 strtol(redisGitDirty(),NULL,10) > 0,
2257 (sizeof(long) == 8) ? "64" : "32",
2258 "stand alone",
2259 server.port,
2260 (long) getpid()
2261 );
2262 redisLogRaw(REDIS_NOTICE|REDIS_LOG_RAW,buf);
2263 zfree(buf);
2264 }
2265
2266 static void sigtermHandler(int sig) {
2267 REDIS_NOTUSED(sig);
2268
2269 redisLogFromHandler(REDIS_WARNING,"Received SIGTERM, scheduling shutdown...");
2270 server.shutdown_asap = 1;
2271 }
2272
2273 void setupSignalHandlers(void) {
2274 struct sigaction act;
2275
2276 /* When the SA_SIGINFO flag is set in sa_flags then sa_sigaction is used.
2277 * Otherwise, sa_handler is used. */
2278 sigemptyset(&act.sa_mask);
2279 act.sa_flags = SA_NODEFER | SA_ONSTACK | SA_RESETHAND;
2280 act.sa_handler = sigtermHandler;
2281 sigaction(SIGTERM, &act, NULL);
2282
2283 #ifdef HAVE_BACKTRACE
2284 sigemptyset(&act.sa_mask);
2285 act.sa_flags = SA_NODEFER | SA_ONSTACK | SA_RESETHAND | SA_SIGINFO;
2286 act.sa_sigaction = sigsegvHandler;
2287 sigaction(SIGSEGV, &act, NULL);
2288 sigaction(SIGBUS, &act, NULL);
2289 sigaction(SIGFPE, &act, NULL);
2290 sigaction(SIGILL, &act, NULL);
2291 #endif
2292 return;
2293 }
2294
2295 void memtest(size_t megabytes, int passes);
2296
2297 int main(int argc, char **argv) {
2298 long long start;
2299 struct timeval tv;
2300
2301 /* We need to initialize our libraries, and the server configuration. */
2302 zmalloc_enable_thread_safeness();
2303 srand(time(NULL)^getpid());
2304 gettimeofday(&tv,NULL);
2305 dictSetHashFunctionSeed(tv.tv_sec^tv.tv_usec^getpid());
2306 initServerConfig();
2307
2308 if (argc >= 2) {
2309 int j = 1; /* First option to parse in argv[] */
2310 sds options = sdsempty();
2311 char *configfile = NULL;
2312
2313 /* Handle special options --help and --version */
2314 if (strcmp(argv[1], "-v") == 0 ||
2315 strcmp(argv[1], "--version") == 0) version();
2316 if (strcmp(argv[1], "--help") == 0 ||
2317 strcmp(argv[1], "-h") == 0) usage();
2318 if (strcmp(argv[1], "--test-memory") == 0) {
2319 if (argc == 3) {
2320 memtest(atoi(argv[2]),50);
2321 exit(0);
2322 } else {
2323 fprintf(stderr,"Please specify the amount of memory to test in megabytes.\n");
2324 fprintf(stderr,"Example: ./redis-server --test-memory 4096\n\n");
2325 exit(1);
2326 }
2327 }
2328
2329 /* First argument is the config file name? */
2330 if (argv[j][0] != '-' || argv[j][1] != '-')
2331 configfile = argv[j++];
2332 /* All the other options are parsed and conceptually appended to the
2333 * configuration file. For instance --port 6380 will generate the
2334 * string "port 6380\n" to be parsed after the actual file name
2335 * is parsed, if any. */
2336 while(j != argc) {
2337 if (argv[j][0] == '-' && argv[j][1] == '-') {
2338 /* Option name */
2339 if (sdslen(options)) options = sdscat(options,"\n");
2340 options = sdscat(options,argv[j]+2);
2341 options = sdscat(options," ");
2342 } else {
2343 /* Option argument */
2344 options = sdscatrepr(options,argv[j],strlen(argv[j]));
2345 options = sdscat(options," ");
2346 }
2347 j++;
2348 }
2349 resetServerSaveParams();
2350 loadServerConfig(configfile,options);
2351 sdsfree(options);
2352 } else {
2353 redisLog(REDIS_WARNING,"Warning: no config file specified, using the default config. In order to specify a config file use 'redis-server /path/to/redis.conf'");
2354 }
2355 if (server.daemonize) daemonize();
2356 initServer();
2357 if (server.daemonize) createPidFile();
2358 redisAsciiArt();
2359 redisLog(REDIS_WARNING,"Server started, Redis version " REDIS_VERSION);
2360 #ifdef __linux__
2361 linuxOvercommitMemoryWarning();
2362 #endif
2363 start = ustime();
2364 if (server.aof_state == REDIS_AOF_ON) {
2365 if (loadAppendOnlyFile(server.aof_filename) == REDIS_OK)
2366 redisLog(REDIS_NOTICE,"DB loaded from append only file: %.3f seconds",(float)(ustime()-start)/1000000);
2367 } else {
2368 if (rdbLoad(server.rdb_filename) == REDIS_OK) {
2369 redisLog(REDIS_NOTICE,"DB loaded from disk: %.3f seconds",
2370 (float)(ustime()-start)/1000000);
2371 } else if (errno != ENOENT) {
2372 redisLog(REDIS_WARNING,"Fatal error loading the DB. Exiting.");
2373 exit(1);
2374 }
2375 }
2376 if (server.ipfd > 0)
2377 redisLog(REDIS_NOTICE,"The server is now ready to accept connections on port %d", server.port);
2378 if (server.sofd > 0)
2379 redisLog(REDIS_NOTICE,"The server is now ready to accept connections at %s", server.unixsocket);
2380 aeSetBeforeSleepProc(server.el,beforeSleep);
2381 aeMain(server.el);
2382 aeDeleteEventLoop(server.el);
2383 return 0;
2384 }
2385
2386 /* The End */