2 * Copyright (c) 2006-2009, Salvatore Sanfilippo <antirez at gmail dot com>
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are met:
8 * * Redistributions of source code must retain the above copyright notice,
9 * this list of conditions and the following disclaimer.
10 * * Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
13 * * Neither the name of Redis nor the names of its contributors may be used
14 * to endorse or promote products derived from this software without
15 * specific prior written permission.
17 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
18 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
21 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
22 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
23 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
24 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
25 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
26 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
27 * POSSIBILITY OF SUCH DAMAGE.
30 #define REDIS_VERSION "1.050"
40 #define __USE_POSIX199309
46 #endif /* HAVE_BACKTRACE */
54 #include <arpa/inet.h>
58 #include <sys/resource.h>
64 #include "solarisfixes.h"
68 #include "ae.h" /* Event driven programming library */
69 #include "sds.h" /* Dynamic safe strings */
70 #include "anet.h" /* Networking the easy way */
71 #include "dict.h" /* Hash tables */
72 #include "adlist.h" /* Linked lists */
73 #include "zmalloc.h" /* total memory usage aware version of malloc/free */
74 #include "lzf.h" /* LZF compression library */
75 #include "pqsort.h" /* Partial qsort for SORT+LIMIT */
81 /* Static server configuration */
82 #define REDIS_SERVERPORT 6379 /* TCP port */
83 #define REDIS_MAXIDLETIME (60*5) /* default client timeout */
84 #define REDIS_IOBUF_LEN 1024
85 #define REDIS_LOADBUF_LEN 1024
86 #define REDIS_STATIC_ARGS 4
87 #define REDIS_DEFAULT_DBNUM 16
88 #define REDIS_CONFIGLINE_MAX 1024
89 #define REDIS_OBJFREELIST_MAX 1000000 /* Max number of objects to cache */
90 #define REDIS_MAX_SYNC_TIME 60 /* Slave can't take more to sync */
91 #define REDIS_EXPIRELOOKUPS_PER_CRON 100 /* try to expire 100 keys/second */
92 #define REDIS_MAX_WRITE_PER_EVENT (1024*64)
93 #define REDIS_REQUEST_MAX_SIZE (1024*1024*256) /* max bytes in inline command */
95 /* If more then REDIS_WRITEV_THRESHOLD write packets are pending use writev */
96 #define REDIS_WRITEV_THRESHOLD 3
97 /* Max number of iovecs used for each writev call */
98 #define REDIS_WRITEV_IOVEC_COUNT 256
100 /* Hash table parameters */
101 #define REDIS_HT_MINFILL 10 /* Minimal hash table fill 10% */
104 #define REDIS_CMD_BULK 1 /* Bulk write command */
105 #define REDIS_CMD_INLINE 2 /* Inline command */
106 /* REDIS_CMD_DENYOOM reserves a longer comment: all the commands marked with
107 this flags will return an error when the 'maxmemory' option is set in the
108 config file and the server is using more than maxmemory bytes of memory.
109 In short this commands are denied on low memory conditions. */
110 #define REDIS_CMD_DENYOOM 4
113 #define REDIS_STRING 0
119 /* Objects encoding */
120 #define REDIS_ENCODING_RAW 0 /* Raw representation */
121 #define REDIS_ENCODING_INT 1 /* Encoded as integer */
123 /* Object types only used for dumping to disk */
124 #define REDIS_EXPIRETIME 253
125 #define REDIS_SELECTDB 254
126 #define REDIS_EOF 255
128 /* Defines related to the dump file format. To store 32 bits lengths for short
129 * keys requires a lot of space, so we check the most significant 2 bits of
130 * the first byte to interpreter the length:
132 * 00|000000 => if the two MSB are 00 the len is the 6 bits of this byte
133 * 01|000000 00000000 => 01, the len is 14 byes, 6 bits + 8 bits of next byte
134 * 10|000000 [32 bit integer] => if it's 01, a full 32 bit len will follow
135 * 11|000000 this means: specially encoded object will follow. The six bits
136 * number specify the kind of object that follows.
137 * See the REDIS_RDB_ENC_* defines.
139 * Lenghts up to 63 are stored using a single byte, most DB keys, and may
140 * values, will fit inside. */
141 #define REDIS_RDB_6BITLEN 0
142 #define REDIS_RDB_14BITLEN 1
143 #define REDIS_RDB_32BITLEN 2
144 #define REDIS_RDB_ENCVAL 3
145 #define REDIS_RDB_LENERR UINT_MAX
147 /* When a length of a string object stored on disk has the first two bits
148 * set, the remaining two bits specify a special encoding for the object
149 * accordingly to the following defines: */
150 #define REDIS_RDB_ENC_INT8 0 /* 8 bit signed integer */
151 #define REDIS_RDB_ENC_INT16 1 /* 16 bit signed integer */
152 #define REDIS_RDB_ENC_INT32 2 /* 32 bit signed integer */
153 #define REDIS_RDB_ENC_LZF 3 /* string compressed with FASTLZ */
156 #define REDIS_CLOSE 1 /* This client connection should be closed ASAP */
157 #define REDIS_SLAVE 2 /* This client is a slave server */
158 #define REDIS_MASTER 4 /* This client is a master server */
159 #define REDIS_MONITOR 8 /* This client is a slave monitor, see MONITOR */
161 /* Slave replication state - slave side */
162 #define REDIS_REPL_NONE 0 /* No active replication */
163 #define REDIS_REPL_CONNECT 1 /* Must connect to master */
164 #define REDIS_REPL_CONNECTED 2 /* Connected to master */
166 /* Slave replication state - from the point of view of master
167 * Note that in SEND_BULK and ONLINE state the slave receives new updates
168 * in its output queue. In the WAIT_BGSAVE state instead the server is waiting
169 * to start the next background saving in order to send updates to it. */
170 #define REDIS_REPL_WAIT_BGSAVE_START 3 /* master waits bgsave to start feeding it */
171 #define REDIS_REPL_WAIT_BGSAVE_END 4 /* master waits bgsave to start bulk DB transmission */
172 #define REDIS_REPL_SEND_BULK 5 /* master is sending the bulk DB */
173 #define REDIS_REPL_ONLINE 6 /* bulk DB already transmitted, receive updates */
175 /* List related stuff */
179 /* Sort operations */
180 #define REDIS_SORT_GET 0
181 #define REDIS_SORT_ASC 1
182 #define REDIS_SORT_DESC 2
183 #define REDIS_SORTKEY_MAX 1024
186 #define REDIS_DEBUG 0
187 #define REDIS_NOTICE 1
188 #define REDIS_WARNING 2
190 /* Anti-warning macro... */
191 #define REDIS_NOTUSED(V) ((void) V)
193 #define ZSKIPLIST_MAXLEVEL 32 /* Should be enough for 2^32 elements */
194 #define ZSKIPLIST_P 0.25 /* Skiplist P = 1/4 */
196 /* Append only defines */
197 #define APPENDFSYNC_NO 0
198 #define APPENDFSYNC_ALWAYS 1
199 #define APPENDFSYNC_EVERYSEC 2
201 /*================================= Data types ============================== */
203 /* A redis object, that is a type able to hold a string / list / set */
204 typedef struct redisObject
{
207 unsigned char encoding
;
208 unsigned char notused
[2];
212 typedef struct redisDb
{
218 /* With multiplexing we need to take per-clinet state.
219 * Clients are taken in a liked list. */
220 typedef struct redisClient
{
225 robj
**argv
, **mbargv
;
227 int bulklen
; /* bulk read len. -1 if not in bulk read mode */
228 int multibulk
; /* multi bulk command format active */
231 time_t lastinteraction
; /* time of the last interaction, used for timeout */
232 int flags
; /* REDIS_CLOSE | REDIS_SLAVE | REDIS_MONITOR */
233 int slaveseldb
; /* slave selected db, if this client is a slave */
234 int authenticated
; /* when requirepass is non-NULL */
235 int replstate
; /* replication state if this is a slave */
236 int repldbfd
; /* replication DB file descriptor */
237 long repldboff
; /* replication DB file offset */
238 off_t repldbsize
; /* replication DB file size */
246 /* Global server state structure */
252 unsigned int sharingpoolsize
;
253 long long dirty
; /* changes to DB from the last save */
255 list
*slaves
, *monitors
;
256 char neterr
[ANET_ERR_LEN
];
258 int cronloops
; /* number of times the cron function run */
259 list
*objfreelist
; /* A list of freed objects to avoid malloc() */
260 time_t lastsave
; /* Unix time of last save succeeede */
261 size_t usedmemory
; /* Used memory in megabytes */
262 /* Fields used only for stats */
263 time_t stat_starttime
; /* server start time */
264 long long stat_numcommands
; /* number of processed commands */
265 long long stat_numconnections
; /* number of connections received */
278 int bgsaveinprogress
;
279 pid_t bgsavechildpid
;
280 struct saveparam
*saveparams
;
285 char *appendfilename
;
288 /* Replication related */
293 redisClient
*master
; /* client that is master for this slave */
295 unsigned int maxclients
;
296 unsigned long maxmemory
;
297 /* Sort parameters - qsort_r() is only available under BSD so we
298 * have to take this state global, in order to pass it to sortCompare() */
304 typedef void redisCommandProc(redisClient
*c
);
305 struct redisCommand
{
307 redisCommandProc
*proc
;
312 struct redisFunctionSym
{
314 unsigned long pointer
;
317 typedef struct _redisSortObject
{
325 typedef struct _redisSortOperation
{
328 } redisSortOperation
;
330 /* ZSETs use a specialized version of Skiplists */
332 typedef struct zskiplistNode
{
333 struct zskiplistNode
**forward
;
334 struct zskiplistNode
*backward
;
339 typedef struct zskiplist
{
340 struct zskiplistNode
*header
, *tail
;
341 unsigned long length
;
345 typedef struct zset
{
350 /* Our shared "common" objects */
352 struct sharedObjectsStruct
{
353 robj
*crlf
, *ok
, *err
, *emptybulk
, *czero
, *cone
, *pong
, *space
,
354 *colon
, *nullbulk
, *nullmultibulk
,
355 *emptymultibulk
, *wrongtypeerr
, *nokeyerr
, *syntaxerr
, *sameobjecterr
,
356 *outofrangeerr
, *plus
,
357 *select0
, *select1
, *select2
, *select3
, *select4
,
358 *select5
, *select6
, *select7
, *select8
, *select9
;
361 /* Global vars that are actally used as constants. The following double
362 * values are used for double on-disk serialization, and are initialized
363 * at runtime to avoid strange compiler optimizations. */
365 static double R_Zero
, R_PosInf
, R_NegInf
, R_Nan
;
367 /*================================ Prototypes =============================== */
369 static void freeStringObject(robj
*o
);
370 static void freeListObject(robj
*o
);
371 static void freeSetObject(robj
*o
);
372 static void decrRefCount(void *o
);
373 static robj
*createObject(int type
, void *ptr
);
374 static void freeClient(redisClient
*c
);
375 static int rdbLoad(char *filename
);
376 static void addReply(redisClient
*c
, robj
*obj
);
377 static void addReplySds(redisClient
*c
, sds s
);
378 static void incrRefCount(robj
*o
);
379 static int rdbSaveBackground(char *filename
);
380 static robj
*createStringObject(char *ptr
, size_t len
);
381 static void replicationFeedSlaves(list
*slaves
, struct redisCommand
*cmd
, int dictid
, robj
**argv
, int argc
);
382 static void feedAppendOnlyFile(struct redisCommand
*cmd
, int dictid
, robj
**argv
, int argc
);
383 static int syncWithMaster(void);
384 static robj
*tryObjectSharing(robj
*o
);
385 static int tryObjectEncoding(robj
*o
);
386 static robj
*getDecodedObject(const robj
*o
);
387 static int removeExpire(redisDb
*db
, robj
*key
);
388 static int expireIfNeeded(redisDb
*db
, robj
*key
);
389 static int deleteIfVolatile(redisDb
*db
, robj
*key
);
390 static int deleteKey(redisDb
*db
, robj
*key
);
391 static time_t getExpire(redisDb
*db
, robj
*key
);
392 static int setExpire(redisDb
*db
, robj
*key
, time_t when
);
393 static void updateSlavesWaitingBgsave(int bgsaveerr
);
394 static void freeMemoryIfNeeded(void);
395 static int processCommand(redisClient
*c
);
396 static void setupSigSegvAction(void);
397 static void rdbRemoveTempFile(pid_t childpid
);
398 static size_t stringObjectLen(robj
*o
);
399 static void processInputBuffer(redisClient
*c
);
400 static zskiplist
*zslCreate(void);
401 static void zslFree(zskiplist
*zsl
);
402 static void zslInsert(zskiplist
*zsl
, double score
, robj
*obj
);
403 static void sendReplyToClientWritev(aeEventLoop
*el
, int fd
, void *privdata
, int mask
);
405 static void authCommand(redisClient
*c
);
406 static void pingCommand(redisClient
*c
);
407 static void echoCommand(redisClient
*c
);
408 static void setCommand(redisClient
*c
);
409 static void setnxCommand(redisClient
*c
);
410 static void getCommand(redisClient
*c
);
411 static void delCommand(redisClient
*c
);
412 static void existsCommand(redisClient
*c
);
413 static void incrCommand(redisClient
*c
);
414 static void decrCommand(redisClient
*c
);
415 static void incrbyCommand(redisClient
*c
);
416 static void decrbyCommand(redisClient
*c
);
417 static void selectCommand(redisClient
*c
);
418 static void randomkeyCommand(redisClient
*c
);
419 static void keysCommand(redisClient
*c
);
420 static void dbsizeCommand(redisClient
*c
);
421 static void lastsaveCommand(redisClient
*c
);
422 static void saveCommand(redisClient
*c
);
423 static void bgsaveCommand(redisClient
*c
);
424 static void shutdownCommand(redisClient
*c
);
425 static void moveCommand(redisClient
*c
);
426 static void renameCommand(redisClient
*c
);
427 static void renamenxCommand(redisClient
*c
);
428 static void lpushCommand(redisClient
*c
);
429 static void rpushCommand(redisClient
*c
);
430 static void lpopCommand(redisClient
*c
);
431 static void rpopCommand(redisClient
*c
);
432 static void llenCommand(redisClient
*c
);
433 static void lindexCommand(redisClient
*c
);
434 static void lrangeCommand(redisClient
*c
);
435 static void ltrimCommand(redisClient
*c
);
436 static void typeCommand(redisClient
*c
);
437 static void lsetCommand(redisClient
*c
);
438 static void saddCommand(redisClient
*c
);
439 static void sremCommand(redisClient
*c
);
440 static void smoveCommand(redisClient
*c
);
441 static void sismemberCommand(redisClient
*c
);
442 static void scardCommand(redisClient
*c
);
443 static void spopCommand(redisClient
*c
);
444 static void srandmemberCommand(redisClient
*c
);
445 static void sinterCommand(redisClient
*c
);
446 static void sinterstoreCommand(redisClient
*c
);
447 static void sunionCommand(redisClient
*c
);
448 static void sunionstoreCommand(redisClient
*c
);
449 static void sdiffCommand(redisClient
*c
);
450 static void sdiffstoreCommand(redisClient
*c
);
451 static void syncCommand(redisClient
*c
);
452 static void flushdbCommand(redisClient
*c
);
453 static void flushallCommand(redisClient
*c
);
454 static void sortCommand(redisClient
*c
);
455 static void lremCommand(redisClient
*c
);
456 static void rpoplpushcommand(redisClient
*c
);
457 static void infoCommand(redisClient
*c
);
458 static void mgetCommand(redisClient
*c
);
459 static void monitorCommand(redisClient
*c
);
460 static void expireCommand(redisClient
*c
);
461 static void expireatCommand(redisClient
*c
);
462 static void getsetCommand(redisClient
*c
);
463 static void ttlCommand(redisClient
*c
);
464 static void slaveofCommand(redisClient
*c
);
465 static void debugCommand(redisClient
*c
);
466 static void msetCommand(redisClient
*c
);
467 static void msetnxCommand(redisClient
*c
);
468 static void zaddCommand(redisClient
*c
);
469 static void zrangeCommand(redisClient
*c
);
470 static void zrangebyscoreCommand(redisClient
*c
);
471 static void zrevrangeCommand(redisClient
*c
);
472 static void zcardCommand(redisClient
*c
);
473 static void zremCommand(redisClient
*c
);
474 static void zscoreCommand(redisClient
*c
);
475 static void zremrangebyscoreCommand(redisClient
*c
);
477 /*================================= Globals ================================= */
480 static struct redisServer server
; /* server global state */
481 static struct redisCommand cmdTable
[] = {
482 {"get",getCommand
,2,REDIS_CMD_INLINE
},
483 {"set",setCommand
,3,REDIS_CMD_BULK
|REDIS_CMD_DENYOOM
},
484 {"setnx",setnxCommand
,3,REDIS_CMD_BULK
|REDIS_CMD_DENYOOM
},
485 {"del",delCommand
,-2,REDIS_CMD_INLINE
},
486 {"exists",existsCommand
,2,REDIS_CMD_INLINE
},
487 {"incr",incrCommand
,2,REDIS_CMD_INLINE
|REDIS_CMD_DENYOOM
},
488 {"decr",decrCommand
,2,REDIS_CMD_INLINE
|REDIS_CMD_DENYOOM
},
489 {"mget",mgetCommand
,-2,REDIS_CMD_INLINE
},
490 {"rpush",rpushCommand
,3,REDIS_CMD_BULK
|REDIS_CMD_DENYOOM
},
491 {"lpush",lpushCommand
,3,REDIS_CMD_BULK
|REDIS_CMD_DENYOOM
},
492 {"rpop",rpopCommand
,2,REDIS_CMD_INLINE
},
493 {"lpop",lpopCommand
,2,REDIS_CMD_INLINE
},
494 {"llen",llenCommand
,2,REDIS_CMD_INLINE
},
495 {"lindex",lindexCommand
,3,REDIS_CMD_INLINE
},
496 {"lset",lsetCommand
,4,REDIS_CMD_BULK
|REDIS_CMD_DENYOOM
},
497 {"lrange",lrangeCommand
,4,REDIS_CMD_INLINE
},
498 {"ltrim",ltrimCommand
,4,REDIS_CMD_INLINE
},
499 {"lrem",lremCommand
,4,REDIS_CMD_BULK
},
500 {"rpoplpush",rpoplpushcommand
,3,REDIS_CMD_BULK
},
501 {"sadd",saddCommand
,3,REDIS_CMD_BULK
|REDIS_CMD_DENYOOM
},
502 {"srem",sremCommand
,3,REDIS_CMD_BULK
},
503 {"smove",smoveCommand
,4,REDIS_CMD_BULK
},
504 {"sismember",sismemberCommand
,3,REDIS_CMD_BULK
},
505 {"scard",scardCommand
,2,REDIS_CMD_INLINE
},
506 {"spop",spopCommand
,2,REDIS_CMD_INLINE
},
507 {"srandmember",srandmemberCommand
,2,REDIS_CMD_INLINE
},
508 {"sinter",sinterCommand
,-2,REDIS_CMD_INLINE
|REDIS_CMD_DENYOOM
},
509 {"sinterstore",sinterstoreCommand
,-3,REDIS_CMD_INLINE
|REDIS_CMD_DENYOOM
},
510 {"sunion",sunionCommand
,-2,REDIS_CMD_INLINE
|REDIS_CMD_DENYOOM
},
511 {"sunionstore",sunionstoreCommand
,-3,REDIS_CMD_INLINE
|REDIS_CMD_DENYOOM
},
512 {"sdiff",sdiffCommand
,-2,REDIS_CMD_INLINE
|REDIS_CMD_DENYOOM
},
513 {"sdiffstore",sdiffstoreCommand
,-3,REDIS_CMD_INLINE
|REDIS_CMD_DENYOOM
},
514 {"smembers",sinterCommand
,2,REDIS_CMD_INLINE
},
515 {"zadd",zaddCommand
,4,REDIS_CMD_BULK
|REDIS_CMD_DENYOOM
},
516 {"zrem",zremCommand
,3,REDIS_CMD_BULK
},
517 {"zremrangebyscore",zremrangebyscoreCommand
,4,REDIS_CMD_INLINE
},
518 {"zrange",zrangeCommand
,4,REDIS_CMD_INLINE
},
519 {"zrangebyscore",zrangebyscoreCommand
,4,REDIS_CMD_INLINE
},
520 {"zrevrange",zrevrangeCommand
,4,REDIS_CMD_INLINE
},
521 {"zcard",zcardCommand
,2,REDIS_CMD_INLINE
},
522 {"zscore",zscoreCommand
,3,REDIS_CMD_BULK
|REDIS_CMD_DENYOOM
},
523 {"incrby",incrbyCommand
,3,REDIS_CMD_INLINE
|REDIS_CMD_DENYOOM
},
524 {"decrby",decrbyCommand
,3,REDIS_CMD_INLINE
|REDIS_CMD_DENYOOM
},
525 {"getset",getsetCommand
,3,REDIS_CMD_BULK
|REDIS_CMD_DENYOOM
},
526 {"mset",msetCommand
,-3,REDIS_CMD_BULK
|REDIS_CMD_DENYOOM
},
527 {"msetnx",msetnxCommand
,-3,REDIS_CMD_BULK
|REDIS_CMD_DENYOOM
},
528 {"randomkey",randomkeyCommand
,1,REDIS_CMD_INLINE
},
529 {"select",selectCommand
,2,REDIS_CMD_INLINE
},
530 {"move",moveCommand
,3,REDIS_CMD_INLINE
},
531 {"rename",renameCommand
,3,REDIS_CMD_INLINE
},
532 {"renamenx",renamenxCommand
,3,REDIS_CMD_INLINE
},
533 {"expire",expireCommand
,3,REDIS_CMD_INLINE
},
534 {"expireat",expireatCommand
,3,REDIS_CMD_INLINE
},
535 {"keys",keysCommand
,2,REDIS_CMD_INLINE
},
536 {"dbsize",dbsizeCommand
,1,REDIS_CMD_INLINE
},
537 {"auth",authCommand
,2,REDIS_CMD_INLINE
},
538 {"ping",pingCommand
,1,REDIS_CMD_INLINE
},
539 {"echo",echoCommand
,2,REDIS_CMD_BULK
},
540 {"save",saveCommand
,1,REDIS_CMD_INLINE
},
541 {"bgsave",bgsaveCommand
,1,REDIS_CMD_INLINE
},
542 {"shutdown",shutdownCommand
,1,REDIS_CMD_INLINE
},
543 {"lastsave",lastsaveCommand
,1,REDIS_CMD_INLINE
},
544 {"type",typeCommand
,2,REDIS_CMD_INLINE
},
545 {"sync",syncCommand
,1,REDIS_CMD_INLINE
},
546 {"flushdb",flushdbCommand
,1,REDIS_CMD_INLINE
},
547 {"flushall",flushallCommand
,1,REDIS_CMD_INLINE
},
548 {"sort",sortCommand
,-2,REDIS_CMD_INLINE
|REDIS_CMD_DENYOOM
},
549 {"info",infoCommand
,1,REDIS_CMD_INLINE
},
550 {"monitor",monitorCommand
,1,REDIS_CMD_INLINE
},
551 {"ttl",ttlCommand
,2,REDIS_CMD_INLINE
},
552 {"slaveof",slaveofCommand
,3,REDIS_CMD_INLINE
},
553 {"debug",debugCommand
,-2,REDIS_CMD_INLINE
},
557 /*============================ Utility functions ============================ */
559 /* Glob-style pattern matching. */
560 int stringmatchlen(const char *pattern
, int patternLen
,
561 const char *string
, int stringLen
, int nocase
)
566 while (pattern
[1] == '*') {
571 return 1; /* match */
573 if (stringmatchlen(pattern
+1, patternLen
-1,
574 string
, stringLen
, nocase
))
575 return 1; /* match */
579 return 0; /* no match */
583 return 0; /* no match */
593 not = pattern
[0] == '^';
600 if (pattern
[0] == '\\') {
603 if (pattern
[0] == string
[0])
605 } else if (pattern
[0] == ']') {
607 } else if (patternLen
== 0) {
611 } else if (pattern
[1] == '-' && patternLen
>= 3) {
612 int start
= pattern
[0];
613 int end
= pattern
[2];
621 start
= tolower(start
);
627 if (c
>= start
&& c
<= end
)
631 if (pattern
[0] == string
[0])
634 if (tolower((int)pattern
[0]) == tolower((int)string
[0]))
644 return 0; /* no match */
650 if (patternLen
>= 2) {
657 if (pattern
[0] != string
[0])
658 return 0; /* no match */
660 if (tolower((int)pattern
[0]) != tolower((int)string
[0]))
661 return 0; /* no match */
669 if (stringLen
== 0) {
670 while(*pattern
== '*') {
677 if (patternLen
== 0 && stringLen
== 0)
682 static void redisLog(int level
, const char *fmt
, ...) {
686 fp
= (server
.logfile
== NULL
) ? stdout
: fopen(server
.logfile
,"a");
690 if (level
>= server
.verbosity
) {
696 strftime(buf
,64,"%d %b %H:%M:%S",localtime(&now
));
697 fprintf(fp
,"%s %c ",buf
,c
[level
]);
698 vfprintf(fp
, fmt
, ap
);
704 if (server
.logfile
) fclose(fp
);
707 /*====================== Hash table type implementation ==================== */
709 /* This is an hash table type that uses the SDS dynamic strings libary as
710 * keys and radis objects as values (objects can hold SDS strings,
713 static void dictVanillaFree(void *privdata
, void *val
)
715 DICT_NOTUSED(privdata
);
719 static int sdsDictKeyCompare(void *privdata
, const void *key1
,
723 DICT_NOTUSED(privdata
);
725 l1
= sdslen((sds
)key1
);
726 l2
= sdslen((sds
)key2
);
727 if (l1
!= l2
) return 0;
728 return memcmp(key1
, key2
, l1
) == 0;
731 static void dictRedisObjectDestructor(void *privdata
, void *val
)
733 DICT_NOTUSED(privdata
);
738 static int dictObjKeyCompare(void *privdata
, const void *key1
,
741 const robj
*o1
= key1
, *o2
= key2
;
742 return sdsDictKeyCompare(privdata
,o1
->ptr
,o2
->ptr
);
745 static unsigned int dictObjHash(const void *key
) {
747 return dictGenHashFunction(o
->ptr
, sdslen((sds
)o
->ptr
));
750 static int dictEncObjKeyCompare(void *privdata
, const void *key1
,
753 const robj
*o1
= key1
, *o2
= key2
;
755 if (o1
->encoding
== REDIS_ENCODING_RAW
&&
756 o2
->encoding
== REDIS_ENCODING_RAW
)
757 return sdsDictKeyCompare(privdata
,o1
->ptr
,o2
->ptr
);
762 dec1
= o1
->encoding
!= REDIS_ENCODING_RAW
?
763 getDecodedObject(o1
) : (robj
*)o1
;
764 dec2
= o2
->encoding
!= REDIS_ENCODING_RAW
?
765 getDecodedObject(o2
) : (robj
*)o2
;
766 cmp
= sdsDictKeyCompare(privdata
,dec1
->ptr
,dec2
->ptr
);
767 if (dec1
!= o1
) decrRefCount(dec1
);
768 if (dec2
!= o2
) decrRefCount(dec2
);
773 static unsigned int dictEncObjHash(const void *key
) {
776 if (o
->encoding
== REDIS_ENCODING_RAW
)
777 return dictGenHashFunction(o
->ptr
, sdslen((sds
)o
->ptr
));
779 robj
*dec
= getDecodedObject(o
);
780 unsigned int hash
= dictGenHashFunction(dec
->ptr
, sdslen((sds
)dec
->ptr
));
786 static dictType setDictType
= {
787 dictEncObjHash
, /* hash function */
790 dictEncObjKeyCompare
, /* key compare */
791 dictRedisObjectDestructor
, /* key destructor */
792 NULL
/* val destructor */
795 static dictType zsetDictType
= {
796 dictEncObjHash
, /* hash function */
799 dictEncObjKeyCompare
, /* key compare */
800 dictRedisObjectDestructor
, /* key destructor */
801 dictVanillaFree
/* val destructor */
804 static dictType hashDictType
= {
805 dictObjHash
, /* hash function */
808 dictObjKeyCompare
, /* key compare */
809 dictRedisObjectDestructor
, /* key destructor */
810 dictRedisObjectDestructor
/* val destructor */
813 /* ========================= Random utility functions ======================= */
815 /* Redis generally does not try to recover from out of memory conditions
816 * when allocating objects or strings, it is not clear if it will be possible
817 * to report this condition to the client since the networking layer itself
818 * is based on heap allocation for send buffers, so we simply abort.
819 * At least the code will be simpler to read... */
820 static void oom(const char *msg
) {
821 fprintf(stderr
, "%s: Out of memory\n",msg
);
827 /* ====================== Redis server networking stuff ===================== */
828 static void closeTimedoutClients(void) {
831 time_t now
= time(NULL
);
833 listRewind(server
.clients
);
834 while ((ln
= listYield(server
.clients
)) != NULL
) {
835 c
= listNodeValue(ln
);
836 if (!(c
->flags
& REDIS_SLAVE
) && /* no timeout for slaves */
837 !(c
->flags
& REDIS_MASTER
) && /* no timeout for masters */
838 (now
- c
->lastinteraction
> server
.maxidletime
)) {
839 redisLog(REDIS_DEBUG
,"Closing idle client");
845 static int htNeedsResize(dict
*dict
) {
846 long long size
, used
;
848 size
= dictSlots(dict
);
849 used
= dictSize(dict
);
850 return (size
&& used
&& size
> DICT_HT_INITIAL_SIZE
&&
851 (used
*100/size
< REDIS_HT_MINFILL
));
854 /* If the percentage of used slots in the HT reaches REDIS_HT_MINFILL
855 * we resize the hash table to save memory */
856 static void tryResizeHashTables(void) {
859 for (j
= 0; j
< server
.dbnum
; j
++) {
860 if (htNeedsResize(server
.db
[j
].dict
)) {
861 redisLog(REDIS_DEBUG
,"The hash table %d is too sparse, resize it...",j
);
862 dictResize(server
.db
[j
].dict
);
863 redisLog(REDIS_DEBUG
,"Hash table %d resized.",j
);
865 if (htNeedsResize(server
.db
[j
].expires
))
866 dictResize(server
.db
[j
].expires
);
870 static int serverCron(struct aeEventLoop
*eventLoop
, long long id
, void *clientData
) {
871 int j
, loops
= server
.cronloops
++;
872 REDIS_NOTUSED(eventLoop
);
874 REDIS_NOTUSED(clientData
);
876 /* Update the global state with the amount of used memory */
877 server
.usedmemory
= zmalloc_used_memory();
879 /* Show some info about non-empty databases */
880 for (j
= 0; j
< server
.dbnum
; j
++) {
881 long long size
, used
, vkeys
;
883 size
= dictSlots(server
.db
[j
].dict
);
884 used
= dictSize(server
.db
[j
].dict
);
885 vkeys
= dictSize(server
.db
[j
].expires
);
886 if (!(loops
% 5) && (used
|| vkeys
)) {
887 redisLog(REDIS_DEBUG
,"DB %d: %lld keys (%lld volatile) in %lld slots HT.",j
,used
,vkeys
,size
);
888 /* dictPrintStats(server.dict); */
892 /* We don't want to resize the hash tables while a bacground saving
893 * is in progress: the saving child is created using fork() that is
894 * implemented with a copy-on-write semantic in most modern systems, so
895 * if we resize the HT while there is the saving child at work actually
896 * a lot of memory movements in the parent will cause a lot of pages
898 if (!server
.bgsaveinprogress
) tryResizeHashTables();
900 /* Show information about connected clients */
902 redisLog(REDIS_DEBUG
,"%d clients connected (%d slaves), %zu bytes in use, %d shared objects",
903 listLength(server
.clients
)-listLength(server
.slaves
),
904 listLength(server
.slaves
),
906 dictSize(server
.sharingpool
));
909 /* Close connections of timedout clients */
910 if (server
.maxidletime
&& !(loops
% 10))
911 closeTimedoutClients();
913 /* Check if a background saving in progress terminated */
914 if (server
.bgsaveinprogress
) {
916 if (wait3(&statloc
,WNOHANG
,NULL
)) {
917 int exitcode
= WEXITSTATUS(statloc
);
918 int bysignal
= WIFSIGNALED(statloc
);
920 if (!bysignal
&& exitcode
== 0) {
921 redisLog(REDIS_NOTICE
,
922 "Background saving terminated with success");
924 server
.lastsave
= time(NULL
);
925 } else if (!bysignal
&& exitcode
!= 0) {
926 redisLog(REDIS_WARNING
, "Background saving error");
928 redisLog(REDIS_WARNING
,
929 "Background saving terminated by signal");
930 rdbRemoveTempFile(server
.bgsavechildpid
);
932 server
.bgsaveinprogress
= 0;
933 server
.bgsavechildpid
= -1;
934 updateSlavesWaitingBgsave(exitcode
== 0 ? REDIS_OK
: REDIS_ERR
);
937 /* If there is not a background saving in progress check if
938 * we have to save now */
939 time_t now
= time(NULL
);
940 for (j
= 0; j
< server
.saveparamslen
; j
++) {
941 struct saveparam
*sp
= server
.saveparams
+j
;
943 if (server
.dirty
>= sp
->changes
&&
944 now
-server
.lastsave
> sp
->seconds
) {
945 redisLog(REDIS_NOTICE
,"%d changes in %d seconds. Saving...",
946 sp
->changes
, sp
->seconds
);
947 rdbSaveBackground(server
.dbfilename
);
953 /* Try to expire a few timed out keys. The algorithm used is adaptive and
954 * will use few CPU cycles if there are few expiring keys, otherwise
955 * it will get more aggressive to avoid that too much memory is used by
956 * keys that can be removed from the keyspace. */
957 for (j
= 0; j
< server
.dbnum
; j
++) {
959 redisDb
*db
= server
.db
+j
;
961 /* Continue to expire if at the end of the cycle more than 25%
962 * of the keys were expired. */
964 int num
= dictSize(db
->expires
);
965 time_t now
= time(NULL
);
968 if (num
> REDIS_EXPIRELOOKUPS_PER_CRON
)
969 num
= REDIS_EXPIRELOOKUPS_PER_CRON
;
974 if ((de
= dictGetRandomKey(db
->expires
)) == NULL
) break;
975 t
= (time_t) dictGetEntryVal(de
);
977 deleteKey(db
,dictGetEntryKey(de
));
981 } while (expired
> REDIS_EXPIRELOOKUPS_PER_CRON
/4);
984 /* Check if we should connect to a MASTER */
985 if (server
.replstate
== REDIS_REPL_CONNECT
) {
986 redisLog(REDIS_NOTICE
,"Connecting to MASTER...");
987 if (syncWithMaster() == REDIS_OK
) {
988 redisLog(REDIS_NOTICE
,"MASTER <-> SLAVE sync succeeded");
994 static void createSharedObjects(void) {
995 shared
.crlf
= createObject(REDIS_STRING
,sdsnew("\r\n"));
996 shared
.ok
= createObject(REDIS_STRING
,sdsnew("+OK\r\n"));
997 shared
.err
= createObject(REDIS_STRING
,sdsnew("-ERR\r\n"));
998 shared
.emptybulk
= createObject(REDIS_STRING
,sdsnew("$0\r\n\r\n"));
999 shared
.czero
= createObject(REDIS_STRING
,sdsnew(":0\r\n"));
1000 shared
.cone
= createObject(REDIS_STRING
,sdsnew(":1\r\n"));
1001 shared
.nullbulk
= createObject(REDIS_STRING
,sdsnew("$-1\r\n"));
1002 shared
.nullmultibulk
= createObject(REDIS_STRING
,sdsnew("*-1\r\n"));
1003 shared
.emptymultibulk
= createObject(REDIS_STRING
,sdsnew("*0\r\n"));
1005 shared
.pong
= createObject(REDIS_STRING
,sdsnew("+PONG\r\n"));
1006 shared
.wrongtypeerr
= createObject(REDIS_STRING
,sdsnew(
1007 "-ERR Operation against a key holding the wrong kind of value\r\n"));
1008 shared
.nokeyerr
= createObject(REDIS_STRING
,sdsnew(
1009 "-ERR no such key\r\n"));
1010 shared
.syntaxerr
= createObject(REDIS_STRING
,sdsnew(
1011 "-ERR syntax error\r\n"));
1012 shared
.sameobjecterr
= createObject(REDIS_STRING
,sdsnew(
1013 "-ERR source and destination objects are the same\r\n"));
1014 shared
.outofrangeerr
= createObject(REDIS_STRING
,sdsnew(
1015 "-ERR index out of range\r\n"));
1016 shared
.space
= createObject(REDIS_STRING
,sdsnew(" "));
1017 shared
.colon
= createObject(REDIS_STRING
,sdsnew(":"));
1018 shared
.plus
= createObject(REDIS_STRING
,sdsnew("+"));
1019 shared
.select0
= createStringObject("select 0\r\n",10);
1020 shared
.select1
= createStringObject("select 1\r\n",10);
1021 shared
.select2
= createStringObject("select 2\r\n",10);
1022 shared
.select3
= createStringObject("select 3\r\n",10);
1023 shared
.select4
= createStringObject("select 4\r\n",10);
1024 shared
.select5
= createStringObject("select 5\r\n",10);
1025 shared
.select6
= createStringObject("select 6\r\n",10);
1026 shared
.select7
= createStringObject("select 7\r\n",10);
1027 shared
.select8
= createStringObject("select 8\r\n",10);
1028 shared
.select9
= createStringObject("select 9\r\n",10);
1031 static void appendServerSaveParams(time_t seconds
, int changes
) {
1032 server
.saveparams
= zrealloc(server
.saveparams
,sizeof(struct saveparam
)*(server
.saveparamslen
+1));
1033 server
.saveparams
[server
.saveparamslen
].seconds
= seconds
;
1034 server
.saveparams
[server
.saveparamslen
].changes
= changes
;
1035 server
.saveparamslen
++;
1038 static void resetServerSaveParams() {
1039 zfree(server
.saveparams
);
1040 server
.saveparams
= NULL
;
1041 server
.saveparamslen
= 0;
1044 static void initServerConfig() {
1045 server
.dbnum
= REDIS_DEFAULT_DBNUM
;
1046 server
.port
= REDIS_SERVERPORT
;
1047 server
.verbosity
= REDIS_DEBUG
;
1048 server
.maxidletime
= REDIS_MAXIDLETIME
;
1049 server
.saveparams
= NULL
;
1050 server
.logfile
= NULL
; /* NULL = log on standard output */
1051 server
.bindaddr
= NULL
;
1052 server
.glueoutputbuf
= 1;
1053 server
.daemonize
= 0;
1054 server
.appendonly
= 0;
1055 server
.appendfsync
= APPENDFSYNC_ALWAYS
;
1056 server
.lastfsync
= time(NULL
);
1057 server
.appendfd
= -1;
1058 server
.appendseldb
= -1; /* Make sure the first time will not match */
1059 server
.pidfile
= "/var/run/redis.pid";
1060 server
.dbfilename
= "dump.rdb";
1061 server
.appendfilename
= "appendonly.log";
1062 server
.requirepass
= NULL
;
1063 server
.shareobjects
= 0;
1064 server
.sharingpoolsize
= 1024;
1065 server
.maxclients
= 0;
1066 server
.maxmemory
= 0;
1067 resetServerSaveParams();
1069 appendServerSaveParams(60*60,1); /* save after 1 hour and 1 change */
1070 appendServerSaveParams(300,100); /* save after 5 minutes and 100 changes */
1071 appendServerSaveParams(60,10000); /* save after 1 minute and 10000 changes */
1072 /* Replication related */
1074 server
.masterauth
= NULL
;
1075 server
.masterhost
= NULL
;
1076 server
.masterport
= 6379;
1077 server
.master
= NULL
;
1078 server
.replstate
= REDIS_REPL_NONE
;
1080 /* Double constants initialization */
1082 R_PosInf
= 1.0/R_Zero
;
1083 R_NegInf
= -1.0/R_Zero
;
1084 R_Nan
= R_Zero
/R_Zero
;
1087 static void initServer() {
1090 signal(SIGHUP
, SIG_IGN
);
1091 signal(SIGPIPE
, SIG_IGN
);
1092 setupSigSegvAction();
1094 server
.clients
= listCreate();
1095 server
.slaves
= listCreate();
1096 server
.monitors
= listCreate();
1097 server
.objfreelist
= listCreate();
1098 createSharedObjects();
1099 server
.el
= aeCreateEventLoop();
1100 server
.db
= zmalloc(sizeof(redisDb
)*server
.dbnum
);
1101 server
.sharingpool
= dictCreate(&setDictType
,NULL
);
1102 server
.fd
= anetTcpServer(server
.neterr
, server
.port
, server
.bindaddr
);
1103 if (server
.fd
== -1) {
1104 redisLog(REDIS_WARNING
, "Opening TCP port: %s", server
.neterr
);
1107 for (j
= 0; j
< server
.dbnum
; j
++) {
1108 server
.db
[j
].dict
= dictCreate(&hashDictType
,NULL
);
1109 server
.db
[j
].expires
= dictCreate(&setDictType
,NULL
);
1110 server
.db
[j
].id
= j
;
1112 server
.cronloops
= 0;
1113 server
.bgsaveinprogress
= 0;
1114 server
.bgsavechildpid
= -1;
1115 server
.lastsave
= time(NULL
);
1117 server
.usedmemory
= 0;
1118 server
.stat_numcommands
= 0;
1119 server
.stat_numconnections
= 0;
1120 server
.stat_starttime
= time(NULL
);
1121 aeCreateTimeEvent(server
.el
, 1, serverCron
, NULL
, NULL
);
1123 if (server
.appendonly
) {
1124 server
.appendfd
= open(server
.appendfilename
,O_WRONLY
|O_APPEND
|O_CREAT
,0644);
1125 if (server
.appendfd
== -1) {
1126 redisLog(REDIS_WARNING
, "Can't open the append-only file: %s",
1133 /* Empty the whole database */
1134 static long long emptyDb() {
1136 long long removed
= 0;
1138 for (j
= 0; j
< server
.dbnum
; j
++) {
1139 removed
+= dictSize(server
.db
[j
].dict
);
1140 dictEmpty(server
.db
[j
].dict
);
1141 dictEmpty(server
.db
[j
].expires
);
1146 static int yesnotoi(char *s
) {
1147 if (!strcasecmp(s
,"yes")) return 1;
1148 else if (!strcasecmp(s
,"no")) return 0;
1152 /* I agree, this is a very rudimental way to load a configuration...
1153 will improve later if the config gets more complex */
1154 static void loadServerConfig(char *filename
) {
1156 char buf
[REDIS_CONFIGLINE_MAX
+1], *err
= NULL
;
1160 if (filename
[0] == '-' && filename
[1] == '\0')
1163 if ((fp
= fopen(filename
,"r")) == NULL
) {
1164 redisLog(REDIS_WARNING
,"Fatal error, can't open config file");
1169 while(fgets(buf
,REDIS_CONFIGLINE_MAX
+1,fp
) != NULL
) {
1175 line
= sdstrim(line
," \t\r\n");
1177 /* Skip comments and blank lines*/
1178 if (line
[0] == '#' || line
[0] == '\0') {
1183 /* Split into arguments */
1184 argv
= sdssplitlen(line
,sdslen(line
)," ",1,&argc
);
1185 sdstolower(argv
[0]);
1187 /* Execute config directives */
1188 if (!strcasecmp(argv
[0],"timeout") && argc
== 2) {
1189 server
.maxidletime
= atoi(argv
[1]);
1190 if (server
.maxidletime
< 0) {
1191 err
= "Invalid timeout value"; goto loaderr
;
1193 } else if (!strcasecmp(argv
[0],"port") && argc
== 2) {
1194 server
.port
= atoi(argv
[1]);
1195 if (server
.port
< 1 || server
.port
> 65535) {
1196 err
= "Invalid port"; goto loaderr
;
1198 } else if (!strcasecmp(argv
[0],"bind") && argc
== 2) {
1199 server
.bindaddr
= zstrdup(argv
[1]);
1200 } else if (!strcasecmp(argv
[0],"save") && argc
== 3) {
1201 int seconds
= atoi(argv
[1]);
1202 int changes
= atoi(argv
[2]);
1203 if (seconds
< 1 || changes
< 0) {
1204 err
= "Invalid save parameters"; goto loaderr
;
1206 appendServerSaveParams(seconds
,changes
);
1207 } else if (!strcasecmp(argv
[0],"dir") && argc
== 2) {
1208 if (chdir(argv
[1]) == -1) {
1209 redisLog(REDIS_WARNING
,"Can't chdir to '%s': %s",
1210 argv
[1], strerror(errno
));
1213 } else if (!strcasecmp(argv
[0],"loglevel") && argc
== 2) {
1214 if (!strcasecmp(argv
[1],"debug")) server
.verbosity
= REDIS_DEBUG
;
1215 else if (!strcasecmp(argv
[1],"notice")) server
.verbosity
= REDIS_NOTICE
;
1216 else if (!strcasecmp(argv
[1],"warning")) server
.verbosity
= REDIS_WARNING
;
1218 err
= "Invalid log level. Must be one of debug, notice, warning";
1221 } else if (!strcasecmp(argv
[0],"logfile") && argc
== 2) {
1224 server
.logfile
= zstrdup(argv
[1]);
1225 if (!strcasecmp(server
.logfile
,"stdout")) {
1226 zfree(server
.logfile
);
1227 server
.logfile
= NULL
;
1229 if (server
.logfile
) {
1230 /* Test if we are able to open the file. The server will not
1231 * be able to abort just for this problem later... */
1232 logfp
= fopen(server
.logfile
,"a");
1233 if (logfp
== NULL
) {
1234 err
= sdscatprintf(sdsempty(),
1235 "Can't open the log file: %s", strerror(errno
));
1240 } else if (!strcasecmp(argv
[0],"databases") && argc
== 2) {
1241 server
.dbnum
= atoi(argv
[1]);
1242 if (server
.dbnum
< 1) {
1243 err
= "Invalid number of databases"; goto loaderr
;
1245 } else if (!strcasecmp(argv
[0],"maxclients") && argc
== 2) {
1246 server
.maxclients
= atoi(argv
[1]);
1247 } else if (!strcasecmp(argv
[0],"maxmemory") && argc
== 2) {
1248 server
.maxmemory
= strtoll(argv
[1], NULL
, 10);
1249 } else if (!strcasecmp(argv
[0],"slaveof") && argc
== 3) {
1250 server
.masterhost
= sdsnew(argv
[1]);
1251 server
.masterport
= atoi(argv
[2]);
1252 server
.replstate
= REDIS_REPL_CONNECT
;
1253 } else if (!strcasecmp(argv
[0],"masterauth") && argc
== 2) {
1254 server
.masterauth
= zstrdup(argv
[1]);
1255 } else if (!strcasecmp(argv
[0],"glueoutputbuf") && argc
== 2) {
1256 if ((server
.glueoutputbuf
= yesnotoi(argv
[1])) == -1) {
1257 err
= "argument must be 'yes' or 'no'"; goto loaderr
;
1259 } else if (!strcasecmp(argv
[0],"shareobjects") && argc
== 2) {
1260 if ((server
.shareobjects
= yesnotoi(argv
[1])) == -1) {
1261 err
= "argument must be 'yes' or 'no'"; goto loaderr
;
1263 } else if (!strcasecmp(argv
[0],"shareobjectspoolsize") && argc
== 2) {
1264 server
.sharingpoolsize
= atoi(argv
[1]);
1265 if (server
.sharingpoolsize
< 1) {
1266 err
= "invalid object sharing pool size"; goto loaderr
;
1268 } else if (!strcasecmp(argv
[0],"daemonize") && argc
== 2) {
1269 if ((server
.daemonize
= yesnotoi(argv
[1])) == -1) {
1270 err
= "argument must be 'yes' or 'no'"; goto loaderr
;
1272 } else if (!strcasecmp(argv
[0],"appendonly") && argc
== 2) {
1273 if ((server
.appendonly
= yesnotoi(argv
[1])) == -1) {
1274 err
= "argument must be 'yes' or 'no'"; goto loaderr
;
1276 } else if (!strcasecmp(argv
[0],"appendfsync") && argc
== 2) {
1277 if (!strcasecmp(argv
[1],"no")) {
1278 server
.appendfsync
= APPENDFSYNC_NO
;
1279 } else if (!strcasecmp(argv
[1],"always")) {
1280 server
.appendfsync
= APPENDFSYNC_ALWAYS
;
1281 } else if (!strcasecmp(argv
[1],"everysec")) {
1282 server
.appendfsync
= APPENDFSYNC_EVERYSEC
;
1284 err
= "argument must be 'no', 'always' or 'everysec'";
1287 } else if (!strcasecmp(argv
[0],"requirepass") && argc
== 2) {
1288 server
.requirepass
= zstrdup(argv
[1]);
1289 } else if (!strcasecmp(argv
[0],"pidfile") && argc
== 2) {
1290 server
.pidfile
= zstrdup(argv
[1]);
1291 } else if (!strcasecmp(argv
[0],"dbfilename") && argc
== 2) {
1292 server
.dbfilename
= zstrdup(argv
[1]);
1294 err
= "Bad directive or wrong number of arguments"; goto loaderr
;
1296 for (j
= 0; j
< argc
; j
++)
1301 if (fp
!= stdin
) fclose(fp
);
1305 fprintf(stderr
, "\n*** FATAL CONFIG FILE ERROR ***\n");
1306 fprintf(stderr
, "Reading the configuration file, at line %d\n", linenum
);
1307 fprintf(stderr
, ">>> '%s'\n", line
);
1308 fprintf(stderr
, "%s\n", err
);
1312 static void freeClientArgv(redisClient
*c
) {
1315 for (j
= 0; j
< c
->argc
; j
++)
1316 decrRefCount(c
->argv
[j
]);
1317 for (j
= 0; j
< c
->mbargc
; j
++)
1318 decrRefCount(c
->mbargv
[j
]);
1323 static void freeClient(redisClient
*c
) {
1326 aeDeleteFileEvent(server
.el
,c
->fd
,AE_READABLE
);
1327 aeDeleteFileEvent(server
.el
,c
->fd
,AE_WRITABLE
);
1328 sdsfree(c
->querybuf
);
1329 listRelease(c
->reply
);
1332 ln
= listSearchKey(server
.clients
,c
);
1334 listDelNode(server
.clients
,ln
);
1335 if (c
->flags
& REDIS_SLAVE
) {
1336 if (c
->replstate
== REDIS_REPL_SEND_BULK
&& c
->repldbfd
!= -1)
1338 list
*l
= (c
->flags
& REDIS_MONITOR
) ? server
.monitors
: server
.slaves
;
1339 ln
= listSearchKey(l
,c
);
1343 if (c
->flags
& REDIS_MASTER
) {
1344 server
.master
= NULL
;
1345 server
.replstate
= REDIS_REPL_CONNECT
;
1352 #define GLUEREPLY_UP_TO (1024)
1353 static void glueReplyBuffersIfNeeded(redisClient
*c
) {
1358 listRewind(c
->reply
);
1359 while((ln
= listYield(c
->reply
))) {
1361 totlen
+= sdslen(o
->ptr
);
1362 /* This optimization makes more sense if we don't have to copy
1364 if (totlen
> GLUEREPLY_UP_TO
) return;
1367 char buf
[GLUEREPLY_UP_TO
];
1370 listRewind(c
->reply
);
1371 while((ln
= listYield(c
->reply
))) {
1373 memcpy(buf
+copylen
,o
->ptr
,sdslen(o
->ptr
));
1374 copylen
+= sdslen(o
->ptr
);
1375 listDelNode(c
->reply
,ln
);
1377 /* Now the output buffer is empty, add the new single element */
1378 o
= createObject(REDIS_STRING
,sdsnewlen(buf
,totlen
));
1379 listAddNodeTail(c
->reply
,o
);
1383 static void sendReplyToClient(aeEventLoop
*el
, int fd
, void *privdata
, int mask
) {
1384 redisClient
*c
= privdata
;
1385 int nwritten
= 0, totwritten
= 0, objlen
;
1388 REDIS_NOTUSED(mask
);
1390 if (server
.glueoutputbuf
&& listLength(c
->reply
) > 1)
1391 glueReplyBuffersIfNeeded(c
);
1393 /* Use writev() if we have enough buffers to send */
1395 if (listLength(c
->reply
) > REDIS_WRITEV_THRESHOLD
&&
1396 !(c
->flags
& REDIS_MASTER
))
1398 sendReplyToClientWritev(el
, fd
, privdata
, mask
);
1403 while(listLength(c
->reply
)) {
1404 o
= listNodeValue(listFirst(c
->reply
));
1405 objlen
= sdslen(o
->ptr
);
1408 listDelNode(c
->reply
,listFirst(c
->reply
));
1412 if (c
->flags
& REDIS_MASTER
) {
1413 /* Don't reply to a master */
1414 nwritten
= objlen
- c
->sentlen
;
1416 nwritten
= write(fd
, ((char*)o
->ptr
)+c
->sentlen
, objlen
- c
->sentlen
);
1417 if (nwritten
<= 0) break;
1419 c
->sentlen
+= nwritten
;
1420 totwritten
+= nwritten
;
1421 /* If we fully sent the object on head go to the next one */
1422 if (c
->sentlen
== objlen
) {
1423 listDelNode(c
->reply
,listFirst(c
->reply
));
1426 /* Note that we avoid to send more thank REDIS_MAX_WRITE_PER_EVENT
1427 * bytes, in a single threaded server it's a good idea to serve
1428 * other clients as well, even if a very large request comes from
1429 * super fast link that is always able to accept data (in real world
1430 * scenario think about 'KEYS *' against the loopback interfae) */
1431 if (totwritten
> REDIS_MAX_WRITE_PER_EVENT
) break;
1433 if (nwritten
== -1) {
1434 if (errno
== EAGAIN
) {
1437 redisLog(REDIS_DEBUG
,
1438 "Error writing to client: %s", strerror(errno
));
1443 if (totwritten
> 0) c
->lastinteraction
= time(NULL
);
1444 if (listLength(c
->reply
) == 0) {
1446 aeDeleteFileEvent(server
.el
,c
->fd
,AE_WRITABLE
);
1450 static void sendReplyToClientWritev(aeEventLoop
*el
, int fd
, void *privdata
, int mask
)
1452 redisClient
*c
= privdata
;
1453 int nwritten
= 0, totwritten
= 0, objlen
, willwrite
;
1455 struct iovec iov
[REDIS_WRITEV_IOVEC_COUNT
];
1456 int offset
, ion
= 0;
1458 REDIS_NOTUSED(mask
);
1461 while (listLength(c
->reply
)) {
1462 offset
= c
->sentlen
;
1466 /* fill-in the iov[] array */
1467 for(node
= listFirst(c
->reply
); node
; node
= listNextNode(node
)) {
1468 o
= listNodeValue(node
);
1469 objlen
= sdslen(o
->ptr
);
1471 if (totwritten
+ objlen
- offset
> REDIS_MAX_WRITE_PER_EVENT
)
1474 if(ion
== REDIS_WRITEV_IOVEC_COUNT
)
1475 break; /* no more iovecs */
1477 iov
[ion
].iov_base
= ((char*)o
->ptr
) + offset
;
1478 iov
[ion
].iov_len
= objlen
- offset
;
1479 willwrite
+= objlen
- offset
;
1480 offset
= 0; /* just for the first item */
1487 /* write all collected blocks at once */
1488 if((nwritten
= writev(fd
, iov
, ion
)) < 0) {
1489 if (errno
!= EAGAIN
) {
1490 redisLog(REDIS_DEBUG
,
1491 "Error writing to client: %s", strerror(errno
));
1498 totwritten
+= nwritten
;
1499 offset
= c
->sentlen
;
1501 /* remove written robjs from c->reply */
1502 while (nwritten
&& listLength(c
->reply
)) {
1503 o
= listNodeValue(listFirst(c
->reply
));
1504 objlen
= sdslen(o
->ptr
);
1506 if(nwritten
>= objlen
- offset
) {
1507 listDelNode(c
->reply
, listFirst(c
->reply
));
1508 nwritten
-= objlen
- offset
;
1512 c
->sentlen
+= nwritten
;
1520 c
->lastinteraction
= time(NULL
);
1522 if (listLength(c
->reply
) == 0) {
1524 aeDeleteFileEvent(server
.el
,c
->fd
,AE_WRITABLE
);
1528 static struct redisCommand
*lookupCommand(char *name
) {
1530 while(cmdTable
[j
].name
!= NULL
) {
1531 if (!strcasecmp(name
,cmdTable
[j
].name
)) return &cmdTable
[j
];
1537 /* resetClient prepare the client to process the next command */
1538 static void resetClient(redisClient
*c
) {
1544 /* If this function gets called we already read a whole
1545 * command, argments are in the client argv/argc fields.
1546 * processCommand() execute the command or prepare the
1547 * server for a bulk read from the client.
1549 * If 1 is returned the client is still alive and valid and
1550 * and other operations can be performed by the caller. Otherwise
1551 * if 0 is returned the client was destroied (i.e. after QUIT). */
1552 static int processCommand(redisClient
*c
) {
1553 struct redisCommand
*cmd
;
1556 /* Free some memory if needed (maxmemory setting) */
1557 if (server
.maxmemory
) freeMemoryIfNeeded();
1559 /* Handle the multi bulk command type. This is an alternative protocol
1560 * supported by Redis in order to receive commands that are composed of
1561 * multiple binary-safe "bulk" arguments. The latency of processing is
1562 * a bit higher but this allows things like multi-sets, so if this
1563 * protocol is used only for MSET and similar commands this is a big win. */
1564 if (c
->multibulk
== 0 && c
->argc
== 1 && ((char*)(c
->argv
[0]->ptr
))[0] == '*') {
1565 c
->multibulk
= atoi(((char*)c
->argv
[0]->ptr
)+1);
1566 if (c
->multibulk
<= 0) {
1570 decrRefCount(c
->argv
[c
->argc
-1]);
1574 } else if (c
->multibulk
) {
1575 if (c
->bulklen
== -1) {
1576 if (((char*)c
->argv
[0]->ptr
)[0] != '$') {
1577 addReplySds(c
,sdsnew("-ERR multi bulk protocol error\r\n"));
1581 int bulklen
= atoi(((char*)c
->argv
[0]->ptr
)+1);
1582 decrRefCount(c
->argv
[0]);
1583 if (bulklen
< 0 || bulklen
> 1024*1024*1024) {
1585 addReplySds(c
,sdsnew("-ERR invalid bulk write count\r\n"));
1590 c
->bulklen
= bulklen
+2; /* add two bytes for CR+LF */
1594 c
->mbargv
= zrealloc(c
->mbargv
,(sizeof(robj
*))*(c
->mbargc
+1));
1595 c
->mbargv
[c
->mbargc
] = c
->argv
[0];
1599 if (c
->multibulk
== 0) {
1603 /* Here we need to swap the multi-bulk argc/argv with the
1604 * normal argc/argv of the client structure. */
1606 c
->argv
= c
->mbargv
;
1607 c
->mbargv
= auxargv
;
1610 c
->argc
= c
->mbargc
;
1611 c
->mbargc
= auxargc
;
1613 /* We need to set bulklen to something different than -1
1614 * in order for the code below to process the command without
1615 * to try to read the last argument of a bulk command as
1616 * a special argument. */
1618 /* continue below and process the command */
1625 /* -- end of multi bulk commands processing -- */
1627 /* The QUIT command is handled as a special case. Normal command
1628 * procs are unable to close the client connection safely */
1629 if (!strcasecmp(c
->argv
[0]->ptr
,"quit")) {
1633 cmd
= lookupCommand(c
->argv
[0]->ptr
);
1635 addReplySds(c
,sdsnew("-ERR unknown command\r\n"));
1638 } else if ((cmd
->arity
> 0 && cmd
->arity
!= c
->argc
) ||
1639 (c
->argc
< -cmd
->arity
)) {
1640 addReplySds(c
,sdsnew("-ERR wrong number of arguments\r\n"));
1643 } else if (server
.maxmemory
&& cmd
->flags
& REDIS_CMD_DENYOOM
&& zmalloc_used_memory() > server
.maxmemory
) {
1644 addReplySds(c
,sdsnew("-ERR command not allowed when used memory > 'maxmemory'\r\n"));
1647 } else if (cmd
->flags
& REDIS_CMD_BULK
&& c
->bulklen
== -1) {
1648 int bulklen
= atoi(c
->argv
[c
->argc
-1]->ptr
);
1650 decrRefCount(c
->argv
[c
->argc
-1]);
1651 if (bulklen
< 0 || bulklen
> 1024*1024*1024) {
1653 addReplySds(c
,sdsnew("-ERR invalid bulk write count\r\n"));
1658 c
->bulklen
= bulklen
+2; /* add two bytes for CR+LF */
1659 /* It is possible that the bulk read is already in the
1660 * buffer. Check this condition and handle it accordingly.
1661 * This is just a fast path, alternative to call processInputBuffer().
1662 * It's a good idea since the code is small and this condition
1663 * happens most of the times. */
1664 if ((signed)sdslen(c
->querybuf
) >= c
->bulklen
) {
1665 c
->argv
[c
->argc
] = createStringObject(c
->querybuf
,c
->bulklen
-2);
1667 c
->querybuf
= sdsrange(c
->querybuf
,c
->bulklen
,-1);
1672 /* Let's try to share objects on the command arguments vector */
1673 if (server
.shareobjects
) {
1675 for(j
= 1; j
< c
->argc
; j
++)
1676 c
->argv
[j
] = tryObjectSharing(c
->argv
[j
]);
1678 /* Let's try to encode the bulk object to save space. */
1679 if (cmd
->flags
& REDIS_CMD_BULK
)
1680 tryObjectEncoding(c
->argv
[c
->argc
-1]);
1682 /* Check if the user is authenticated */
1683 if (server
.requirepass
&& !c
->authenticated
&& cmd
->proc
!= authCommand
) {
1684 addReplySds(c
,sdsnew("-ERR operation not permitted\r\n"));
1689 /* Exec the command */
1690 dirty
= server
.dirty
;
1692 if (server
.appendonly
&& server
.dirty
-dirty
)
1693 feedAppendOnlyFile(cmd
,c
->db
->id
,c
->argv
,c
->argc
);
1694 if (server
.dirty
-dirty
&& listLength(server
.slaves
))
1695 replicationFeedSlaves(server
.slaves
,cmd
,c
->db
->id
,c
->argv
,c
->argc
);
1696 if (listLength(server
.monitors
))
1697 replicationFeedSlaves(server
.monitors
,cmd
,c
->db
->id
,c
->argv
,c
->argc
);
1698 server
.stat_numcommands
++;
1700 /* Prepare the client for the next command */
1701 if (c
->flags
& REDIS_CLOSE
) {
1709 static void replicationFeedSlaves(list
*slaves
, struct redisCommand
*cmd
, int dictid
, robj
**argv
, int argc
) {
1713 /* (args*2)+1 is enough room for args, spaces, newlines */
1714 robj
*static_outv
[REDIS_STATIC_ARGS
*2+1];
1716 if (argc
<= REDIS_STATIC_ARGS
) {
1719 outv
= zmalloc(sizeof(robj
*)*(argc
*2+1));
1722 for (j
= 0; j
< argc
; j
++) {
1723 if (j
!= 0) outv
[outc
++] = shared
.space
;
1724 if ((cmd
->flags
& REDIS_CMD_BULK
) && j
== argc
-1) {
1727 lenobj
= createObject(REDIS_STRING
,
1728 sdscatprintf(sdsempty(),"%d\r\n",
1729 stringObjectLen(argv
[j
])));
1730 lenobj
->refcount
= 0;
1731 outv
[outc
++] = lenobj
;
1733 outv
[outc
++] = argv
[j
];
1735 outv
[outc
++] = shared
.crlf
;
1737 /* Increment all the refcounts at start and decrement at end in order to
1738 * be sure to free objects if there is no slave in a replication state
1739 * able to be feed with commands */
1740 for (j
= 0; j
< outc
; j
++) incrRefCount(outv
[j
]);
1742 while((ln
= listYield(slaves
))) {
1743 redisClient
*slave
= ln
->value
;
1745 /* Don't feed slaves that are still waiting for BGSAVE to start */
1746 if (slave
->replstate
== REDIS_REPL_WAIT_BGSAVE_START
) continue;
1748 /* Feed all the other slaves, MONITORs and so on */
1749 if (slave
->slaveseldb
!= dictid
) {
1753 case 0: selectcmd
= shared
.select0
; break;
1754 case 1: selectcmd
= shared
.select1
; break;
1755 case 2: selectcmd
= shared
.select2
; break;
1756 case 3: selectcmd
= shared
.select3
; break;
1757 case 4: selectcmd
= shared
.select4
; break;
1758 case 5: selectcmd
= shared
.select5
; break;
1759 case 6: selectcmd
= shared
.select6
; break;
1760 case 7: selectcmd
= shared
.select7
; break;
1761 case 8: selectcmd
= shared
.select8
; break;
1762 case 9: selectcmd
= shared
.select9
; break;
1764 selectcmd
= createObject(REDIS_STRING
,
1765 sdscatprintf(sdsempty(),"select %d\r\n",dictid
));
1766 selectcmd
->refcount
= 0;
1769 addReply(slave
,selectcmd
);
1770 slave
->slaveseldb
= dictid
;
1772 for (j
= 0; j
< outc
; j
++) addReply(slave
,outv
[j
]);
1774 for (j
= 0; j
< outc
; j
++) decrRefCount(outv
[j
]);
1775 if (outv
!= static_outv
) zfree(outv
);
1778 static void processInputBuffer(redisClient
*c
) {
1780 if (c
->bulklen
== -1) {
1781 /* Read the first line of the query */
1782 char *p
= strchr(c
->querybuf
,'\n');
1789 query
= c
->querybuf
;
1790 c
->querybuf
= sdsempty();
1791 querylen
= 1+(p
-(query
));
1792 if (sdslen(query
) > querylen
) {
1793 /* leave data after the first line of the query in the buffer */
1794 c
->querybuf
= sdscatlen(c
->querybuf
,query
+querylen
,sdslen(query
)-querylen
);
1796 *p
= '\0'; /* remove "\n" */
1797 if (*(p
-1) == '\r') *(p
-1) = '\0'; /* and "\r" if any */
1798 sdsupdatelen(query
);
1800 /* Now we can split the query in arguments */
1801 if (sdslen(query
) == 0) {
1802 /* Ignore empty query */
1806 argv
= sdssplitlen(query
,sdslen(query
)," ",1,&argc
);
1809 if (c
->argv
) zfree(c
->argv
);
1810 c
->argv
= zmalloc(sizeof(robj
*)*argc
);
1812 for (j
= 0; j
< argc
; j
++) {
1813 if (sdslen(argv
[j
])) {
1814 c
->argv
[c
->argc
] = createObject(REDIS_STRING
,argv
[j
]);
1821 /* Execute the command. If the client is still valid
1822 * after processCommand() return and there is something
1823 * on the query buffer try to process the next command. */
1824 if (c
->argc
&& processCommand(c
) && sdslen(c
->querybuf
)) goto again
;
1826 } else if (sdslen(c
->querybuf
) >= REDIS_REQUEST_MAX_SIZE
) {
1827 redisLog(REDIS_DEBUG
, "Client protocol error");
1832 /* Bulk read handling. Note that if we are at this point
1833 the client already sent a command terminated with a newline,
1834 we are reading the bulk data that is actually the last
1835 argument of the command. */
1836 int qbl
= sdslen(c
->querybuf
);
1838 if (c
->bulklen
<= qbl
) {
1839 /* Copy everything but the final CRLF as final argument */
1840 c
->argv
[c
->argc
] = createStringObject(c
->querybuf
,c
->bulklen
-2);
1842 c
->querybuf
= sdsrange(c
->querybuf
,c
->bulklen
,-1);
1843 /* Process the command. If the client is still valid after
1844 * the processing and there is more data in the buffer
1845 * try to parse it. */
1846 if (processCommand(c
) && sdslen(c
->querybuf
)) goto again
;
1852 static void readQueryFromClient(aeEventLoop
*el
, int fd
, void *privdata
, int mask
) {
1853 redisClient
*c
= (redisClient
*) privdata
;
1854 char buf
[REDIS_IOBUF_LEN
];
1857 REDIS_NOTUSED(mask
);
1859 nread
= read(fd
, buf
, REDIS_IOBUF_LEN
);
1861 if (errno
== EAGAIN
) {
1864 redisLog(REDIS_DEBUG
, "Reading from client: %s",strerror(errno
));
1868 } else if (nread
== 0) {
1869 redisLog(REDIS_DEBUG
, "Client closed connection");
1874 c
->querybuf
= sdscatlen(c
->querybuf
, buf
, nread
);
1875 c
->lastinteraction
= time(NULL
);
1879 processInputBuffer(c
);
1882 static int selectDb(redisClient
*c
, int id
) {
1883 if (id
< 0 || id
>= server
.dbnum
)
1885 c
->db
= &server
.db
[id
];
1889 static void *dupClientReplyValue(void *o
) {
1890 incrRefCount((robj
*)o
);
1894 static redisClient
*createClient(int fd
) {
1895 redisClient
*c
= zmalloc(sizeof(*c
));
1897 anetNonBlock(NULL
,fd
);
1898 anetTcpNoDelay(NULL
,fd
);
1899 if (!c
) return NULL
;
1902 c
->querybuf
= sdsempty();
1911 c
->lastinteraction
= time(NULL
);
1912 c
->authenticated
= 0;
1913 c
->replstate
= REDIS_REPL_NONE
;
1914 c
->reply
= listCreate();
1915 listSetFreeMethod(c
->reply
,decrRefCount
);
1916 listSetDupMethod(c
->reply
,dupClientReplyValue
);
1917 if (aeCreateFileEvent(server
.el
, c
->fd
, AE_READABLE
,
1918 readQueryFromClient
, c
, NULL
) == AE_ERR
) {
1922 listAddNodeTail(server
.clients
,c
);
1926 static void addReply(redisClient
*c
, robj
*obj
) {
1927 if (listLength(c
->reply
) == 0 &&
1928 (c
->replstate
== REDIS_REPL_NONE
||
1929 c
->replstate
== REDIS_REPL_ONLINE
) &&
1930 aeCreateFileEvent(server
.el
, c
->fd
, AE_WRITABLE
,
1931 sendReplyToClient
, c
, NULL
) == AE_ERR
) return;
1932 if (obj
->encoding
!= REDIS_ENCODING_RAW
) {
1933 obj
= getDecodedObject(obj
);
1937 listAddNodeTail(c
->reply
,obj
);
1940 static void addReplySds(redisClient
*c
, sds s
) {
1941 robj
*o
= createObject(REDIS_STRING
,s
);
1946 static void addReplyBulkLen(redisClient
*c
, robj
*obj
) {
1949 if (obj
->encoding
== REDIS_ENCODING_RAW
) {
1950 len
= sdslen(obj
->ptr
);
1952 long n
= (long)obj
->ptr
;
1959 while((n
= n
/10) != 0) {
1963 addReplySds(c
,sdscatprintf(sdsempty(),"$%d\r\n",len
));
1966 static void acceptHandler(aeEventLoop
*el
, int fd
, void *privdata
, int mask
) {
1971 REDIS_NOTUSED(mask
);
1972 REDIS_NOTUSED(privdata
);
1974 cfd
= anetAccept(server
.neterr
, fd
, cip
, &cport
);
1975 if (cfd
== AE_ERR
) {
1976 redisLog(REDIS_DEBUG
,"Accepting client connection: %s", server
.neterr
);
1979 redisLog(REDIS_DEBUG
,"Accepted %s:%d", cip
, cport
);
1980 if ((c
= createClient(cfd
)) == NULL
) {
1981 redisLog(REDIS_WARNING
,"Error allocating resoures for the client");
1982 close(cfd
); /* May be already closed, just ingore errors */
1985 /* If maxclient directive is set and this is one client more... close the
1986 * connection. Note that we create the client instead to check before
1987 * for this condition, since now the socket is already set in nonblocking
1988 * mode and we can send an error for free using the Kernel I/O */
1989 if (server
.maxclients
&& listLength(server
.clients
) > server
.maxclients
) {
1990 char *err
= "-ERR max number of clients reached\r\n";
1992 /* That's a best effort error message, don't check write errors */
1993 if (write(c
->fd
,err
,strlen(err
)) == -1) {
1994 /* Nothing to do, Just to avoid the warning... */
1999 server
.stat_numconnections
++;
2002 /* ======================= Redis objects implementation ===================== */
2004 static robj
*createObject(int type
, void *ptr
) {
2007 if (listLength(server
.objfreelist
)) {
2008 listNode
*head
= listFirst(server
.objfreelist
);
2009 o
= listNodeValue(head
);
2010 listDelNode(server
.objfreelist
,head
);
2012 o
= zmalloc(sizeof(*o
));
2015 o
->encoding
= REDIS_ENCODING_RAW
;
2021 static robj
*createStringObject(char *ptr
, size_t len
) {
2022 return createObject(REDIS_STRING
,sdsnewlen(ptr
,len
));
2025 static robj
*createListObject(void) {
2026 list
*l
= listCreate();
2028 listSetFreeMethod(l
,decrRefCount
);
2029 return createObject(REDIS_LIST
,l
);
2032 static robj
*createSetObject(void) {
2033 dict
*d
= dictCreate(&setDictType
,NULL
);
2034 return createObject(REDIS_SET
,d
);
2037 static robj
*createZsetObject(void) {
2038 zset
*zs
= zmalloc(sizeof(*zs
));
2040 zs
->dict
= dictCreate(&zsetDictType
,NULL
);
2041 zs
->zsl
= zslCreate();
2042 return createObject(REDIS_ZSET
,zs
);
2045 static void freeStringObject(robj
*o
) {
2046 if (o
->encoding
== REDIS_ENCODING_RAW
) {
2051 static void freeListObject(robj
*o
) {
2052 listRelease((list
*) o
->ptr
);
2055 static void freeSetObject(robj
*o
) {
2056 dictRelease((dict
*) o
->ptr
);
2059 static void freeZsetObject(robj
*o
) {
2062 dictRelease(zs
->dict
);
2067 static void freeHashObject(robj
*o
) {
2068 dictRelease((dict
*) o
->ptr
);
2071 static void incrRefCount(robj
*o
) {
2073 #ifdef DEBUG_REFCOUNT
2074 if (o
->type
== REDIS_STRING
)
2075 printf("Increment '%s'(%p), now is: %d\n",o
->ptr
,o
,o
->refcount
);
2079 static void decrRefCount(void *obj
) {
2082 #ifdef DEBUG_REFCOUNT
2083 if (o
->type
== REDIS_STRING
)
2084 printf("Decrement '%s'(%p), now is: %d\n",o
->ptr
,o
,o
->refcount
-1);
2086 if (--(o
->refcount
) == 0) {
2088 case REDIS_STRING
: freeStringObject(o
); break;
2089 case REDIS_LIST
: freeListObject(o
); break;
2090 case REDIS_SET
: freeSetObject(o
); break;
2091 case REDIS_ZSET
: freeZsetObject(o
); break;
2092 case REDIS_HASH
: freeHashObject(o
); break;
2093 default: assert(0 != 0); break;
2095 if (listLength(server
.objfreelist
) > REDIS_OBJFREELIST_MAX
||
2096 !listAddNodeHead(server
.objfreelist
,o
))
2101 static robj
*lookupKey(redisDb
*db
, robj
*key
) {
2102 dictEntry
*de
= dictFind(db
->dict
,key
);
2103 return de
? dictGetEntryVal(de
) : NULL
;
2106 static robj
*lookupKeyRead(redisDb
*db
, robj
*key
) {
2107 expireIfNeeded(db
,key
);
2108 return lookupKey(db
,key
);
2111 static robj
*lookupKeyWrite(redisDb
*db
, robj
*key
) {
2112 deleteIfVolatile(db
,key
);
2113 return lookupKey(db
,key
);
2116 static int deleteKey(redisDb
*db
, robj
*key
) {
2119 /* We need to protect key from destruction: after the first dictDelete()
2120 * it may happen that 'key' is no longer valid if we don't increment
2121 * it's count. This may happen when we get the object reference directly
2122 * from the hash table with dictRandomKey() or dict iterators */
2124 if (dictSize(db
->expires
)) dictDelete(db
->expires
,key
);
2125 retval
= dictDelete(db
->dict
,key
);
2128 return retval
== DICT_OK
;
2131 /* Try to share an object against the shared objects pool */
2132 static robj
*tryObjectSharing(robj
*o
) {
2133 struct dictEntry
*de
;
2136 if (o
== NULL
|| server
.shareobjects
== 0) return o
;
2138 assert(o
->type
== REDIS_STRING
);
2139 de
= dictFind(server
.sharingpool
,o
);
2141 robj
*shared
= dictGetEntryKey(de
);
2143 c
= ((unsigned long) dictGetEntryVal(de
))+1;
2144 dictGetEntryVal(de
) = (void*) c
;
2145 incrRefCount(shared
);
2149 /* Here we are using a stream algorihtm: Every time an object is
2150 * shared we increment its count, everytime there is a miss we
2151 * recrement the counter of a random object. If this object reaches
2152 * zero we remove the object and put the current object instead. */
2153 if (dictSize(server
.sharingpool
) >=
2154 server
.sharingpoolsize
) {
2155 de
= dictGetRandomKey(server
.sharingpool
);
2157 c
= ((unsigned long) dictGetEntryVal(de
))-1;
2158 dictGetEntryVal(de
) = (void*) c
;
2160 dictDelete(server
.sharingpool
,de
->key
);
2163 c
= 0; /* If the pool is empty we want to add this object */
2168 retval
= dictAdd(server
.sharingpool
,o
,(void*)1);
2169 assert(retval
== DICT_OK
);
2176 /* Check if the nul-terminated string 's' can be represented by a long
2177 * (that is, is a number that fits into long without any other space or
2178 * character before or after the digits).
2180 * If so, the function returns REDIS_OK and *longval is set to the value
2181 * of the number. Otherwise REDIS_ERR is returned */
2182 static int isStringRepresentableAsLong(sds s
, long *longval
) {
2183 char buf
[32], *endptr
;
2187 value
= strtol(s
, &endptr
, 10);
2188 if (endptr
[0] != '\0') return REDIS_ERR
;
2189 slen
= snprintf(buf
,32,"%ld",value
);
2191 /* If the number converted back into a string is not identical
2192 * then it's not possible to encode the string as integer */
2193 if (sdslen(s
) != (unsigned)slen
|| memcmp(buf
,s
,slen
)) return REDIS_ERR
;
2194 if (longval
) *longval
= value
;
2198 /* Try to encode a string object in order to save space */
2199 static int tryObjectEncoding(robj
*o
) {
2203 if (o
->encoding
!= REDIS_ENCODING_RAW
)
2204 return REDIS_ERR
; /* Already encoded */
2206 /* It's not save to encode shared objects: shared objects can be shared
2207 * everywhere in the "object space" of Redis. Encoded objects can only
2208 * appear as "values" (and not, for instance, as keys) */
2209 if (o
->refcount
> 1) return REDIS_ERR
;
2211 /* Currently we try to encode only strings */
2212 assert(o
->type
== REDIS_STRING
);
2214 /* Check if we can represent this string as a long integer */
2215 if (isStringRepresentableAsLong(s
,&value
) == REDIS_ERR
) return REDIS_ERR
;
2217 /* Ok, this object can be encoded */
2218 o
->encoding
= REDIS_ENCODING_INT
;
2220 o
->ptr
= (void*) value
;
2224 /* Get a decoded version of an encoded object (returned as a new object) */
2225 static robj
*getDecodedObject(const robj
*o
) {
2228 assert(o
->encoding
!= REDIS_ENCODING_RAW
);
2229 if (o
->type
== REDIS_STRING
&& o
->encoding
== REDIS_ENCODING_INT
) {
2232 snprintf(buf
,32,"%ld",(long)o
->ptr
);
2233 dec
= createStringObject(buf
,strlen(buf
));
2240 /* Compare two string objects via strcmp() or alike.
2241 * Note that the objects may be integer-encoded. In such a case we
2242 * use snprintf() to get a string representation of the numbers on the stack
2243 * and compare the strings, it's much faster than calling getDecodedObject(). */
2244 static int compareStringObjects(robj
*a
, robj
*b
) {
2245 assert(a
->type
== REDIS_STRING
&& b
->type
== REDIS_STRING
);
2246 char bufa
[128], bufb
[128], *astr
, *bstr
;
2249 if (a
== b
) return 0;
2250 if (a
->encoding
!= REDIS_ENCODING_RAW
) {
2251 snprintf(bufa
,sizeof(bufa
),"%ld",(long) a
->ptr
);
2257 if (b
->encoding
!= REDIS_ENCODING_RAW
) {
2258 snprintf(bufb
,sizeof(bufb
),"%ld",(long) b
->ptr
);
2264 return bothsds
? sdscmp(astr
,bstr
) : strcmp(astr
,bstr
);
2267 static size_t stringObjectLen(robj
*o
) {
2268 assert(o
->type
== REDIS_STRING
);
2269 if (o
->encoding
== REDIS_ENCODING_RAW
) {
2270 return sdslen(o
->ptr
);
2274 return snprintf(buf
,32,"%ld",(long)o
->ptr
);
2278 /*============================ DB saving/loading ============================ */
2280 static int rdbSaveType(FILE *fp
, unsigned char type
) {
2281 if (fwrite(&type
,1,1,fp
) == 0) return -1;
2285 static int rdbSaveTime(FILE *fp
, time_t t
) {
2286 int32_t t32
= (int32_t) t
;
2287 if (fwrite(&t32
,4,1,fp
) == 0) return -1;
2291 /* check rdbLoadLen() comments for more info */
2292 static int rdbSaveLen(FILE *fp
, uint32_t len
) {
2293 unsigned char buf
[2];
2296 /* Save a 6 bit len */
2297 buf
[0] = (len
&0xFF)|(REDIS_RDB_6BITLEN
<<6);
2298 if (fwrite(buf
,1,1,fp
) == 0) return -1;
2299 } else if (len
< (1<<14)) {
2300 /* Save a 14 bit len */
2301 buf
[0] = ((len
>>8)&0xFF)|(REDIS_RDB_14BITLEN
<<6);
2303 if (fwrite(buf
,2,1,fp
) == 0) return -1;
2305 /* Save a 32 bit len */
2306 buf
[0] = (REDIS_RDB_32BITLEN
<<6);
2307 if (fwrite(buf
,1,1,fp
) == 0) return -1;
2309 if (fwrite(&len
,4,1,fp
) == 0) return -1;
2314 /* String objects in the form "2391" "-100" without any space and with a
2315 * range of values that can fit in an 8, 16 or 32 bit signed value can be
2316 * encoded as integers to save space */
2317 static int rdbTryIntegerEncoding(sds s
, unsigned char *enc
) {
2319 char *endptr
, buf
[32];
2321 /* Check if it's possible to encode this value as a number */
2322 value
= strtoll(s
, &endptr
, 10);
2323 if (endptr
[0] != '\0') return 0;
2324 snprintf(buf
,32,"%lld",value
);
2326 /* If the number converted back into a string is not identical
2327 * then it's not possible to encode the string as integer */
2328 if (strlen(buf
) != sdslen(s
) || memcmp(buf
,s
,sdslen(s
))) return 0;
2330 /* Finally check if it fits in our ranges */
2331 if (value
>= -(1<<7) && value
<= (1<<7)-1) {
2332 enc
[0] = (REDIS_RDB_ENCVAL
<<6)|REDIS_RDB_ENC_INT8
;
2333 enc
[1] = value
&0xFF;
2335 } else if (value
>= -(1<<15) && value
<= (1<<15)-1) {
2336 enc
[0] = (REDIS_RDB_ENCVAL
<<6)|REDIS_RDB_ENC_INT16
;
2337 enc
[1] = value
&0xFF;
2338 enc
[2] = (value
>>8)&0xFF;
2340 } else if (value
>= -((long long)1<<31) && value
<= ((long long)1<<31)-1) {
2341 enc
[0] = (REDIS_RDB_ENCVAL
<<6)|REDIS_RDB_ENC_INT32
;
2342 enc
[1] = value
&0xFF;
2343 enc
[2] = (value
>>8)&0xFF;
2344 enc
[3] = (value
>>16)&0xFF;
2345 enc
[4] = (value
>>24)&0xFF;
2352 static int rdbSaveLzfStringObject(FILE *fp
, robj
*obj
) {
2353 unsigned int comprlen
, outlen
;
2357 /* We require at least four bytes compression for this to be worth it */
2358 outlen
= sdslen(obj
->ptr
)-4;
2359 if (outlen
<= 0) return 0;
2360 if ((out
= zmalloc(outlen
+1)) == NULL
) return 0;
2361 comprlen
= lzf_compress(obj
->ptr
, sdslen(obj
->ptr
), out
, outlen
);
2362 if (comprlen
== 0) {
2366 /* Data compressed! Let's save it on disk */
2367 byte
= (REDIS_RDB_ENCVAL
<<6)|REDIS_RDB_ENC_LZF
;
2368 if (fwrite(&byte
,1,1,fp
) == 0) goto writeerr
;
2369 if (rdbSaveLen(fp
,comprlen
) == -1) goto writeerr
;
2370 if (rdbSaveLen(fp
,sdslen(obj
->ptr
)) == -1) goto writeerr
;
2371 if (fwrite(out
,comprlen
,1,fp
) == 0) goto writeerr
;
2380 /* Save a string objet as [len][data] on disk. If the object is a string
2381 * representation of an integer value we try to safe it in a special form */
2382 static int rdbSaveStringObjectRaw(FILE *fp
, robj
*obj
) {
2386 len
= sdslen(obj
->ptr
);
2388 /* Try integer encoding */
2390 unsigned char buf
[5];
2391 if ((enclen
= rdbTryIntegerEncoding(obj
->ptr
,buf
)) > 0) {
2392 if (fwrite(buf
,enclen
,1,fp
) == 0) return -1;
2397 /* Try LZF compression - under 20 bytes it's unable to compress even
2398 * aaaaaaaaaaaaaaaaaa so skip it */
2402 retval
= rdbSaveLzfStringObject(fp
,obj
);
2403 if (retval
== -1) return -1;
2404 if (retval
> 0) return 0;
2405 /* retval == 0 means data can't be compressed, save the old way */
2408 /* Store verbatim */
2409 if (rdbSaveLen(fp
,len
) == -1) return -1;
2410 if (len
&& fwrite(obj
->ptr
,len
,1,fp
) == 0) return -1;
2414 /* Like rdbSaveStringObjectRaw() but handle encoded objects */
2415 static int rdbSaveStringObject(FILE *fp
, robj
*obj
) {
2419 if (obj
->encoding
!= REDIS_ENCODING_RAW
) {
2420 dec
= getDecodedObject(obj
);
2421 retval
= rdbSaveStringObjectRaw(fp
,dec
);
2425 return rdbSaveStringObjectRaw(fp
,obj
);
2429 /* Save a double value. Doubles are saved as strings prefixed by an unsigned
2430 * 8 bit integer specifing the length of the representation.
2431 * This 8 bit integer has special values in order to specify the following
2437 static int rdbSaveDoubleValue(FILE *fp
, double val
) {
2438 unsigned char buf
[128];
2444 } else if (!isfinite(val
)) {
2446 buf
[0] = (val
< 0) ? 255 : 254;
2448 snprintf((char*)buf
+1,sizeof(buf
)-1,"%.17g",val
);
2449 buf
[0] = strlen((char*)buf
);
2452 if (fwrite(buf
,len
,1,fp
) == 0) return -1;
2456 /* Save the DB on disk. Return REDIS_ERR on error, REDIS_OK on success */
2457 static int rdbSave(char *filename
) {
2458 dictIterator
*di
= NULL
;
2463 time_t now
= time(NULL
);
2465 snprintf(tmpfile
,256,"temp-%d.rdb", (int) getpid());
2466 fp
= fopen(tmpfile
,"w");
2468 redisLog(REDIS_WARNING
, "Failed saving the DB: %s", strerror(errno
));
2471 if (fwrite("REDIS0001",9,1,fp
) == 0) goto werr
;
2472 for (j
= 0; j
< server
.dbnum
; j
++) {
2473 redisDb
*db
= server
.db
+j
;
2475 if (dictSize(d
) == 0) continue;
2476 di
= dictGetIterator(d
);
2482 /* Write the SELECT DB opcode */
2483 if (rdbSaveType(fp
,REDIS_SELECTDB
) == -1) goto werr
;
2484 if (rdbSaveLen(fp
,j
) == -1) goto werr
;
2486 /* Iterate this DB writing every entry */
2487 while((de
= dictNext(di
)) != NULL
) {
2488 robj
*key
= dictGetEntryKey(de
);
2489 robj
*o
= dictGetEntryVal(de
);
2490 time_t expiretime
= getExpire(db
,key
);
2492 /* Save the expire time */
2493 if (expiretime
!= -1) {
2494 /* If this key is already expired skip it */
2495 if (expiretime
< now
) continue;
2496 if (rdbSaveType(fp
,REDIS_EXPIRETIME
) == -1) goto werr
;
2497 if (rdbSaveTime(fp
,expiretime
) == -1) goto werr
;
2499 /* Save the key and associated value */
2500 if (rdbSaveType(fp
,o
->type
) == -1) goto werr
;
2501 if (rdbSaveStringObject(fp
,key
) == -1) goto werr
;
2502 if (o
->type
== REDIS_STRING
) {
2503 /* Save a string value */
2504 if (rdbSaveStringObject(fp
,o
) == -1) goto werr
;
2505 } else if (o
->type
== REDIS_LIST
) {
2506 /* Save a list value */
2507 list
*list
= o
->ptr
;
2511 if (rdbSaveLen(fp
,listLength(list
)) == -1) goto werr
;
2512 while((ln
= listYield(list
))) {
2513 robj
*eleobj
= listNodeValue(ln
);
2515 if (rdbSaveStringObject(fp
,eleobj
) == -1) goto werr
;
2517 } else if (o
->type
== REDIS_SET
) {
2518 /* Save a set value */
2520 dictIterator
*di
= dictGetIterator(set
);
2523 if (rdbSaveLen(fp
,dictSize(set
)) == -1) goto werr
;
2524 while((de
= dictNext(di
)) != NULL
) {
2525 robj
*eleobj
= dictGetEntryKey(de
);
2527 if (rdbSaveStringObject(fp
,eleobj
) == -1) goto werr
;
2529 dictReleaseIterator(di
);
2530 } else if (o
->type
== REDIS_ZSET
) {
2531 /* Save a set value */
2533 dictIterator
*di
= dictGetIterator(zs
->dict
);
2536 if (rdbSaveLen(fp
,dictSize(zs
->dict
)) == -1) goto werr
;
2537 while((de
= dictNext(di
)) != NULL
) {
2538 robj
*eleobj
= dictGetEntryKey(de
);
2539 double *score
= dictGetEntryVal(de
);
2541 if (rdbSaveStringObject(fp
,eleobj
) == -1) goto werr
;
2542 if (rdbSaveDoubleValue(fp
,*score
) == -1) goto werr
;
2544 dictReleaseIterator(di
);
2549 dictReleaseIterator(di
);
2552 if (rdbSaveType(fp
,REDIS_EOF
) == -1) goto werr
;
2554 /* Make sure data will not remain on the OS's output buffers */
2559 /* Use RENAME to make sure the DB file is changed atomically only
2560 * if the generate DB file is ok. */
2561 if (rename(tmpfile
,filename
) == -1) {
2562 redisLog(REDIS_WARNING
,"Error moving temp DB file on the final destination: %s", strerror(errno
));
2566 redisLog(REDIS_NOTICE
,"DB saved on disk");
2568 server
.lastsave
= time(NULL
);
2574 redisLog(REDIS_WARNING
,"Write error saving DB on disk: %s", strerror(errno
));
2575 if (di
) dictReleaseIterator(di
);
2579 static int rdbSaveBackground(char *filename
) {
2582 if (server
.bgsaveinprogress
) return REDIS_ERR
;
2583 if ((childpid
= fork()) == 0) {
2586 if (rdbSave(filename
) == REDIS_OK
) {
2593 if (childpid
== -1) {
2594 redisLog(REDIS_WARNING
,"Can't save in background: fork: %s",
2598 redisLog(REDIS_NOTICE
,"Background saving started by pid %d",childpid
);
2599 server
.bgsaveinprogress
= 1;
2600 server
.bgsavechildpid
= childpid
;
2603 return REDIS_OK
; /* unreached */
2606 static void rdbRemoveTempFile(pid_t childpid
) {
2609 snprintf(tmpfile
,256,"temp-%d.rdb", (int) childpid
);
2613 static int rdbLoadType(FILE *fp
) {
2615 if (fread(&type
,1,1,fp
) == 0) return -1;
2619 static time_t rdbLoadTime(FILE *fp
) {
2621 if (fread(&t32
,4,1,fp
) == 0) return -1;
2622 return (time_t) t32
;
2625 /* Load an encoded length from the DB, see the REDIS_RDB_* defines on the top
2626 * of this file for a description of how this are stored on disk.
2628 * isencoded is set to 1 if the readed length is not actually a length but
2629 * an "encoding type", check the above comments for more info */
2630 static uint32_t rdbLoadLen(FILE *fp
, int rdbver
, int *isencoded
) {
2631 unsigned char buf
[2];
2634 if (isencoded
) *isencoded
= 0;
2636 if (fread(&len
,4,1,fp
) == 0) return REDIS_RDB_LENERR
;
2641 if (fread(buf
,1,1,fp
) == 0) return REDIS_RDB_LENERR
;
2642 type
= (buf
[0]&0xC0)>>6;
2643 if (type
== REDIS_RDB_6BITLEN
) {
2644 /* Read a 6 bit len */
2646 } else if (type
== REDIS_RDB_ENCVAL
) {
2647 /* Read a 6 bit len encoding type */
2648 if (isencoded
) *isencoded
= 1;
2650 } else if (type
== REDIS_RDB_14BITLEN
) {
2651 /* Read a 14 bit len */
2652 if (fread(buf
+1,1,1,fp
) == 0) return REDIS_RDB_LENERR
;
2653 return ((buf
[0]&0x3F)<<8)|buf
[1];
2655 /* Read a 32 bit len */
2656 if (fread(&len
,4,1,fp
) == 0) return REDIS_RDB_LENERR
;
2662 static robj
*rdbLoadIntegerObject(FILE *fp
, int enctype
) {
2663 unsigned char enc
[4];
2666 if (enctype
== REDIS_RDB_ENC_INT8
) {
2667 if (fread(enc
,1,1,fp
) == 0) return NULL
;
2668 val
= (signed char)enc
[0];
2669 } else if (enctype
== REDIS_RDB_ENC_INT16
) {
2671 if (fread(enc
,2,1,fp
) == 0) return NULL
;
2672 v
= enc
[0]|(enc
[1]<<8);
2674 } else if (enctype
== REDIS_RDB_ENC_INT32
) {
2676 if (fread(enc
,4,1,fp
) == 0) return NULL
;
2677 v
= enc
[0]|(enc
[1]<<8)|(enc
[2]<<16)|(enc
[3]<<24);
2680 val
= 0; /* anti-warning */
2683 return createObject(REDIS_STRING
,sdscatprintf(sdsempty(),"%lld",val
));
2686 static robj
*rdbLoadLzfStringObject(FILE*fp
, int rdbver
) {
2687 unsigned int len
, clen
;
2688 unsigned char *c
= NULL
;
2691 if ((clen
= rdbLoadLen(fp
,rdbver
,NULL
)) == REDIS_RDB_LENERR
) return NULL
;
2692 if ((len
= rdbLoadLen(fp
,rdbver
,NULL
)) == REDIS_RDB_LENERR
) return NULL
;
2693 if ((c
= zmalloc(clen
)) == NULL
) goto err
;
2694 if ((val
= sdsnewlen(NULL
,len
)) == NULL
) goto err
;
2695 if (fread(c
,clen
,1,fp
) == 0) goto err
;
2696 if (lzf_decompress(c
,clen
,val
,len
) == 0) goto err
;
2698 return createObject(REDIS_STRING
,val
);
2705 static robj
*rdbLoadStringObject(FILE*fp
, int rdbver
) {
2710 len
= rdbLoadLen(fp
,rdbver
,&isencoded
);
2713 case REDIS_RDB_ENC_INT8
:
2714 case REDIS_RDB_ENC_INT16
:
2715 case REDIS_RDB_ENC_INT32
:
2716 return tryObjectSharing(rdbLoadIntegerObject(fp
,len
));
2717 case REDIS_RDB_ENC_LZF
:
2718 return tryObjectSharing(rdbLoadLzfStringObject(fp
,rdbver
));
2724 if (len
== REDIS_RDB_LENERR
) return NULL
;
2725 val
= sdsnewlen(NULL
,len
);
2726 if (len
&& fread(val
,len
,1,fp
) == 0) {
2730 return tryObjectSharing(createObject(REDIS_STRING
,val
));
2733 /* For information about double serialization check rdbSaveDoubleValue() */
2734 static int rdbLoadDoubleValue(FILE *fp
, double *val
) {
2738 if (fread(&len
,1,1,fp
) == 0) return -1;
2740 case 255: *val
= R_NegInf
; return 0;
2741 case 254: *val
= R_PosInf
; return 0;
2742 case 253: *val
= R_Nan
; return 0;
2744 if (fread(buf
,len
,1,fp
) == 0) return -1;
2745 sscanf(buf
, "%lg", val
);
2750 static int rdbLoad(char *filename
) {
2752 robj
*keyobj
= NULL
;
2754 int type
, retval
, rdbver
;
2755 dict
*d
= server
.db
[0].dict
;
2756 redisDb
*db
= server
.db
+0;
2758 time_t expiretime
= -1, now
= time(NULL
);
2760 fp
= fopen(filename
,"r");
2761 if (!fp
) return REDIS_ERR
;
2762 if (fread(buf
,9,1,fp
) == 0) goto eoferr
;
2764 if (memcmp(buf
,"REDIS",5) != 0) {
2766 redisLog(REDIS_WARNING
,"Wrong signature trying to load DB from file");
2769 rdbver
= atoi(buf
+5);
2772 redisLog(REDIS_WARNING
,"Can't handle RDB format version %d",rdbver
);
2779 if ((type
= rdbLoadType(fp
)) == -1) goto eoferr
;
2780 if (type
== REDIS_EXPIRETIME
) {
2781 if ((expiretime
= rdbLoadTime(fp
)) == -1) goto eoferr
;
2782 /* We read the time so we need to read the object type again */
2783 if ((type
= rdbLoadType(fp
)) == -1) goto eoferr
;
2785 if (type
== REDIS_EOF
) break;
2786 /* Handle SELECT DB opcode as a special case */
2787 if (type
== REDIS_SELECTDB
) {
2788 if ((dbid
= rdbLoadLen(fp
,rdbver
,NULL
)) == REDIS_RDB_LENERR
)
2790 if (dbid
>= (unsigned)server
.dbnum
) {
2791 redisLog(REDIS_WARNING
,"FATAL: Data file was created with a Redis server configured to handle more than %d databases. Exiting\n", server
.dbnum
);
2794 db
= server
.db
+dbid
;
2799 if ((keyobj
= rdbLoadStringObject(fp
,rdbver
)) == NULL
) goto eoferr
;
2801 if (type
== REDIS_STRING
) {
2802 /* Read string value */
2803 if ((o
= rdbLoadStringObject(fp
,rdbver
)) == NULL
) goto eoferr
;
2804 tryObjectEncoding(o
);
2805 } else if (type
== REDIS_LIST
|| type
== REDIS_SET
) {
2806 /* Read list/set value */
2809 if ((listlen
= rdbLoadLen(fp
,rdbver
,NULL
)) == REDIS_RDB_LENERR
)
2811 o
= (type
== REDIS_LIST
) ? createListObject() : createSetObject();
2812 /* Load every single element of the list/set */
2816 if ((ele
= rdbLoadStringObject(fp
,rdbver
)) == NULL
) goto eoferr
;
2817 tryObjectEncoding(ele
);
2818 if (type
== REDIS_LIST
) {
2819 listAddNodeTail((list
*)o
->ptr
,ele
);
2821 dictAdd((dict
*)o
->ptr
,ele
,NULL
);
2824 } else if (type
== REDIS_ZSET
) {
2825 /* Read list/set value */
2829 if ((zsetlen
= rdbLoadLen(fp
,rdbver
,NULL
)) == REDIS_RDB_LENERR
)
2831 o
= createZsetObject();
2833 /* Load every single element of the list/set */
2836 double *score
= zmalloc(sizeof(double));
2838 if ((ele
= rdbLoadStringObject(fp
,rdbver
)) == NULL
) goto eoferr
;
2839 tryObjectEncoding(ele
);
2840 if (rdbLoadDoubleValue(fp
,score
) == -1) goto eoferr
;
2841 dictAdd(zs
->dict
,ele
,score
);
2842 zslInsert(zs
->zsl
,*score
,ele
);
2843 incrRefCount(ele
); /* added to skiplist */
2848 /* Add the new object in the hash table */
2849 retval
= dictAdd(d
,keyobj
,o
);
2850 if (retval
== DICT_ERR
) {
2851 redisLog(REDIS_WARNING
,"Loading DB, duplicated key (%s) found! Unrecoverable error, exiting now.", keyobj
->ptr
);
2854 /* Set the expire time if needed */
2855 if (expiretime
!= -1) {
2856 setExpire(db
,keyobj
,expiretime
);
2857 /* Delete this key if already expired */
2858 if (expiretime
< now
) deleteKey(db
,keyobj
);
2866 eoferr
: /* unexpected end of file is handled here with a fatal exit */
2867 if (keyobj
) decrRefCount(keyobj
);
2868 redisLog(REDIS_WARNING
,"Short read or OOM loading DB. Unrecoverable error, aborting now.");
2870 return REDIS_ERR
; /* Just to avoid warning */
2873 /*================================== Commands =============================== */
2875 static void authCommand(redisClient
*c
) {
2876 if (!server
.requirepass
|| !strcmp(c
->argv
[1]->ptr
, server
.requirepass
)) {
2877 c
->authenticated
= 1;
2878 addReply(c
,shared
.ok
);
2880 c
->authenticated
= 0;
2881 addReplySds(c
,sdscatprintf(sdsempty(),"-ERR invalid password\r\n"));
2885 static void pingCommand(redisClient
*c
) {
2886 addReply(c
,shared
.pong
);
2889 static void echoCommand(redisClient
*c
) {
2890 addReplyBulkLen(c
,c
->argv
[1]);
2891 addReply(c
,c
->argv
[1]);
2892 addReply(c
,shared
.crlf
);
2895 /*=================================== Strings =============================== */
2897 static void setGenericCommand(redisClient
*c
, int nx
) {
2900 retval
= dictAdd(c
->db
->dict
,c
->argv
[1],c
->argv
[2]);
2901 if (retval
== DICT_ERR
) {
2903 dictReplace(c
->db
->dict
,c
->argv
[1],c
->argv
[2]);
2904 incrRefCount(c
->argv
[2]);
2906 addReply(c
,shared
.czero
);
2910 incrRefCount(c
->argv
[1]);
2911 incrRefCount(c
->argv
[2]);
2914 removeExpire(c
->db
,c
->argv
[1]);
2915 addReply(c
, nx
? shared
.cone
: shared
.ok
);
2918 static void setCommand(redisClient
*c
) {
2919 setGenericCommand(c
,0);
2922 static void setnxCommand(redisClient
*c
) {
2923 setGenericCommand(c
,1);
2926 static void getCommand(redisClient
*c
) {
2927 robj
*o
= lookupKeyRead(c
->db
,c
->argv
[1]);
2930 addReply(c
,shared
.nullbulk
);
2932 if (o
->type
!= REDIS_STRING
) {
2933 addReply(c
,shared
.wrongtypeerr
);
2935 addReplyBulkLen(c
,o
);
2937 addReply(c
,shared
.crlf
);
2942 static void getsetCommand(redisClient
*c
) {
2944 if (dictAdd(c
->db
->dict
,c
->argv
[1],c
->argv
[2]) == DICT_ERR
) {
2945 dictReplace(c
->db
->dict
,c
->argv
[1],c
->argv
[2]);
2947 incrRefCount(c
->argv
[1]);
2949 incrRefCount(c
->argv
[2]);
2951 removeExpire(c
->db
,c
->argv
[1]);
2954 static void mgetCommand(redisClient
*c
) {
2957 addReplySds(c
,sdscatprintf(sdsempty(),"*%d\r\n",c
->argc
-1));
2958 for (j
= 1; j
< c
->argc
; j
++) {
2959 robj
*o
= lookupKeyRead(c
->db
,c
->argv
[j
]);
2961 addReply(c
,shared
.nullbulk
);
2963 if (o
->type
!= REDIS_STRING
) {
2964 addReply(c
,shared
.nullbulk
);
2966 addReplyBulkLen(c
,o
);
2968 addReply(c
,shared
.crlf
);
2974 static void incrDecrCommand(redisClient
*c
, long long incr
) {
2979 o
= lookupKeyWrite(c
->db
,c
->argv
[1]);
2983 if (o
->type
!= REDIS_STRING
) {
2988 if (o
->encoding
== REDIS_ENCODING_RAW
)
2989 value
= strtoll(o
->ptr
, &eptr
, 10);
2990 else if (o
->encoding
== REDIS_ENCODING_INT
)
2991 value
= (long)o
->ptr
;
2998 o
= createObject(REDIS_STRING
,sdscatprintf(sdsempty(),"%lld",value
));
2999 tryObjectEncoding(o
);
3000 retval
= dictAdd(c
->db
->dict
,c
->argv
[1],o
);
3001 if (retval
== DICT_ERR
) {
3002 dictReplace(c
->db
->dict
,c
->argv
[1],o
);
3003 removeExpire(c
->db
,c
->argv
[1]);
3005 incrRefCount(c
->argv
[1]);
3008 addReply(c
,shared
.colon
);
3010 addReply(c
,shared
.crlf
);
3013 static void incrCommand(redisClient
*c
) {
3014 incrDecrCommand(c
,1);
3017 static void decrCommand(redisClient
*c
) {
3018 incrDecrCommand(c
,-1);
3021 static void incrbyCommand(redisClient
*c
) {
3022 long long incr
= strtoll(c
->argv
[2]->ptr
, NULL
, 10);
3023 incrDecrCommand(c
,incr
);
3026 static void decrbyCommand(redisClient
*c
) {
3027 long long incr
= strtoll(c
->argv
[2]->ptr
, NULL
, 10);
3028 incrDecrCommand(c
,-incr
);
3031 /* ========================= Type agnostic commands ========================= */
3033 static void delCommand(redisClient
*c
) {
3036 for (j
= 1; j
< c
->argc
; j
++) {
3037 if (deleteKey(c
->db
,c
->argv
[j
])) {
3044 addReply(c
,shared
.czero
);
3047 addReply(c
,shared
.cone
);
3050 addReplySds(c
,sdscatprintf(sdsempty(),":%d\r\n",deleted
));
3055 static void existsCommand(redisClient
*c
) {
3056 addReply(c
,lookupKeyRead(c
->db
,c
->argv
[1]) ? shared
.cone
: shared
.czero
);
3059 static void selectCommand(redisClient
*c
) {
3060 int id
= atoi(c
->argv
[1]->ptr
);
3062 if (selectDb(c
,id
) == REDIS_ERR
) {
3063 addReplySds(c
,sdsnew("-ERR invalid DB index\r\n"));
3065 addReply(c
,shared
.ok
);
3069 static void randomkeyCommand(redisClient
*c
) {
3073 de
= dictGetRandomKey(c
->db
->dict
);
3074 if (!de
|| expireIfNeeded(c
->db
,dictGetEntryKey(de
)) == 0) break;
3077 addReply(c
,shared
.plus
);
3078 addReply(c
,shared
.crlf
);
3080 addReply(c
,shared
.plus
);
3081 addReply(c
,dictGetEntryKey(de
));
3082 addReply(c
,shared
.crlf
);
3086 static void keysCommand(redisClient
*c
) {
3089 sds pattern
= c
->argv
[1]->ptr
;
3090 int plen
= sdslen(pattern
);
3091 int numkeys
= 0, keyslen
= 0;
3092 robj
*lenobj
= createObject(REDIS_STRING
,NULL
);
3094 di
= dictGetIterator(c
->db
->dict
);
3096 decrRefCount(lenobj
);
3097 while((de
= dictNext(di
)) != NULL
) {
3098 robj
*keyobj
= dictGetEntryKey(de
);
3100 sds key
= keyobj
->ptr
;
3101 if ((pattern
[0] == '*' && pattern
[1] == '\0') ||
3102 stringmatchlen(pattern
,plen
,key
,sdslen(key
),0)) {
3103 if (expireIfNeeded(c
->db
,keyobj
) == 0) {
3105 addReply(c
,shared
.space
);
3108 keyslen
+= sdslen(key
);
3112 dictReleaseIterator(di
);
3113 lenobj
->ptr
= sdscatprintf(sdsempty(),"$%lu\r\n",keyslen
+(numkeys
? (numkeys
-1) : 0));
3114 addReply(c
,shared
.crlf
);
3117 static void dbsizeCommand(redisClient
*c
) {
3119 sdscatprintf(sdsempty(),":%lu\r\n",dictSize(c
->db
->dict
)));
3122 static void lastsaveCommand(redisClient
*c
) {
3124 sdscatprintf(sdsempty(),":%lu\r\n",server
.lastsave
));
3127 static void typeCommand(redisClient
*c
) {
3131 o
= lookupKeyRead(c
->db
,c
->argv
[1]);
3136 case REDIS_STRING
: type
= "+string"; break;
3137 case REDIS_LIST
: type
= "+list"; break;
3138 case REDIS_SET
: type
= "+set"; break;
3139 case REDIS_ZSET
: type
= "+zset"; break;
3140 default: type
= "unknown"; break;
3143 addReplySds(c
,sdsnew(type
));
3144 addReply(c
,shared
.crlf
);
3147 static void saveCommand(redisClient
*c
) {
3148 if (server
.bgsaveinprogress
) {
3149 addReplySds(c
,sdsnew("-ERR background save in progress\r\n"));
3152 if (rdbSave(server
.dbfilename
) == REDIS_OK
) {
3153 addReply(c
,shared
.ok
);
3155 addReply(c
,shared
.err
);
3159 static void bgsaveCommand(redisClient
*c
) {
3160 if (server
.bgsaveinprogress
) {
3161 addReplySds(c
,sdsnew("-ERR background save already in progress\r\n"));
3164 if (rdbSaveBackground(server
.dbfilename
) == REDIS_OK
) {
3165 addReply(c
,shared
.ok
);
3167 addReply(c
,shared
.err
);
3171 static void shutdownCommand(redisClient
*c
) {
3172 redisLog(REDIS_WARNING
,"User requested shutdown, saving DB...");
3173 /* Kill the saving child if there is a background saving in progress.
3174 We want to avoid race conditions, for instance our saving child may
3175 overwrite the synchronous saving did by SHUTDOWN. */
3176 if (server
.bgsaveinprogress
) {
3177 redisLog(REDIS_WARNING
,"There is a live saving child. Killing it!");
3178 kill(server
.bgsavechildpid
,SIGKILL
);
3179 rdbRemoveTempFile(server
.bgsavechildpid
);
3182 if (rdbSave(server
.dbfilename
) == REDIS_OK
) {
3183 if (server
.daemonize
)
3184 unlink(server
.pidfile
);
3185 redisLog(REDIS_WARNING
,"%zu bytes used at exit",zmalloc_used_memory());
3186 redisLog(REDIS_WARNING
,"Server exit now, bye bye...");
3189 /* Ooops.. error saving! The best we can do is to continue operating.
3190 * Note that if there was a background saving process, in the next
3191 * cron() Redis will be notified that the background saving aborted,
3192 * handling special stuff like slaves pending for synchronization... */
3193 redisLog(REDIS_WARNING
,"Error trying to save the DB, can't exit");
3194 addReplySds(c
,sdsnew("-ERR can't quit, problems saving the DB\r\n"));
3198 static void renameGenericCommand(redisClient
*c
, int nx
) {
3201 /* To use the same key as src and dst is probably an error */
3202 if (sdscmp(c
->argv
[1]->ptr
,c
->argv
[2]->ptr
) == 0) {
3203 addReply(c
,shared
.sameobjecterr
);
3207 o
= lookupKeyWrite(c
->db
,c
->argv
[1]);
3209 addReply(c
,shared
.nokeyerr
);
3213 deleteIfVolatile(c
->db
,c
->argv
[2]);
3214 if (dictAdd(c
->db
->dict
,c
->argv
[2],o
) == DICT_ERR
) {
3217 addReply(c
,shared
.czero
);
3220 dictReplace(c
->db
->dict
,c
->argv
[2],o
);
3222 incrRefCount(c
->argv
[2]);
3224 deleteKey(c
->db
,c
->argv
[1]);
3226 addReply(c
,nx
? shared
.cone
: shared
.ok
);
3229 static void renameCommand(redisClient
*c
) {
3230 renameGenericCommand(c
,0);
3233 static void renamenxCommand(redisClient
*c
) {
3234 renameGenericCommand(c
,1);
3237 static void moveCommand(redisClient
*c
) {
3242 /* Obtain source and target DB pointers */
3245 if (selectDb(c
,atoi(c
->argv
[2]->ptr
)) == REDIS_ERR
) {
3246 addReply(c
,shared
.outofrangeerr
);
3250 selectDb(c
,srcid
); /* Back to the source DB */
3252 /* If the user is moving using as target the same
3253 * DB as the source DB it is probably an error. */
3255 addReply(c
,shared
.sameobjecterr
);
3259 /* Check if the element exists and get a reference */
3260 o
= lookupKeyWrite(c
->db
,c
->argv
[1]);
3262 addReply(c
,shared
.czero
);
3266 /* Try to add the element to the target DB */
3267 deleteIfVolatile(dst
,c
->argv
[1]);
3268 if (dictAdd(dst
->dict
,c
->argv
[1],o
) == DICT_ERR
) {
3269 addReply(c
,shared
.czero
);
3272 incrRefCount(c
->argv
[1]);
3275 /* OK! key moved, free the entry in the source DB */
3276 deleteKey(src
,c
->argv
[1]);
3278 addReply(c
,shared
.cone
);
3281 /* =================================== Lists ================================ */
3282 static void pushGenericCommand(redisClient
*c
, int where
) {
3286 lobj
= lookupKeyWrite(c
->db
,c
->argv
[1]);
3288 lobj
= createListObject();
3290 if (where
== REDIS_HEAD
) {
3291 listAddNodeHead(list
,c
->argv
[2]);
3293 listAddNodeTail(list
,c
->argv
[2]);
3295 dictAdd(c
->db
->dict
,c
->argv
[1],lobj
);
3296 incrRefCount(c
->argv
[1]);
3297 incrRefCount(c
->argv
[2]);
3299 if (lobj
->type
!= REDIS_LIST
) {
3300 addReply(c
,shared
.wrongtypeerr
);
3304 if (where
== REDIS_HEAD
) {
3305 listAddNodeHead(list
,c
->argv
[2]);
3307 listAddNodeTail(list
,c
->argv
[2]);
3309 incrRefCount(c
->argv
[2]);
3312 addReply(c
,shared
.ok
);
3315 static void lpushCommand(redisClient
*c
) {
3316 pushGenericCommand(c
,REDIS_HEAD
);
3319 static void rpushCommand(redisClient
*c
) {
3320 pushGenericCommand(c
,REDIS_TAIL
);
3323 static void llenCommand(redisClient
*c
) {
3327 o
= lookupKeyRead(c
->db
,c
->argv
[1]);
3329 addReply(c
,shared
.czero
);
3332 if (o
->type
!= REDIS_LIST
) {
3333 addReply(c
,shared
.wrongtypeerr
);
3336 addReplySds(c
,sdscatprintf(sdsempty(),":%d\r\n",listLength(l
)));
3341 static void lindexCommand(redisClient
*c
) {
3343 int index
= atoi(c
->argv
[2]->ptr
);
3345 o
= lookupKeyRead(c
->db
,c
->argv
[1]);
3347 addReply(c
,shared
.nullbulk
);
3349 if (o
->type
!= REDIS_LIST
) {
3350 addReply(c
,shared
.wrongtypeerr
);
3352 list
*list
= o
->ptr
;
3355 ln
= listIndex(list
, index
);
3357 addReply(c
,shared
.nullbulk
);
3359 robj
*ele
= listNodeValue(ln
);
3360 addReplyBulkLen(c
,ele
);
3362 addReply(c
,shared
.crlf
);
3368 static void lsetCommand(redisClient
*c
) {
3370 int index
= atoi(c
->argv
[2]->ptr
);
3372 o
= lookupKeyWrite(c
->db
,c
->argv
[1]);
3374 addReply(c
,shared
.nokeyerr
);
3376 if (o
->type
!= REDIS_LIST
) {
3377 addReply(c
,shared
.wrongtypeerr
);
3379 list
*list
= o
->ptr
;
3382 ln
= listIndex(list
, index
);
3384 addReply(c
,shared
.outofrangeerr
);
3386 robj
*ele
= listNodeValue(ln
);
3389 listNodeValue(ln
) = c
->argv
[3];
3390 incrRefCount(c
->argv
[3]);
3391 addReply(c
,shared
.ok
);
3398 static void popGenericCommand(redisClient
*c
, int where
) {
3401 o
= lookupKeyWrite(c
->db
,c
->argv
[1]);
3403 addReply(c
,shared
.nullbulk
);
3405 if (o
->type
!= REDIS_LIST
) {
3406 addReply(c
,shared
.wrongtypeerr
);
3408 list
*list
= o
->ptr
;
3411 if (where
== REDIS_HEAD
)
3412 ln
= listFirst(list
);
3414 ln
= listLast(list
);
3417 addReply(c
,shared
.nullbulk
);
3419 robj
*ele
= listNodeValue(ln
);
3420 addReplyBulkLen(c
,ele
);
3422 addReply(c
,shared
.crlf
);
3423 listDelNode(list
,ln
);
3430 static void lpopCommand(redisClient
*c
) {
3431 popGenericCommand(c
,REDIS_HEAD
);
3434 static void rpopCommand(redisClient
*c
) {
3435 popGenericCommand(c
,REDIS_TAIL
);
3438 static void lrangeCommand(redisClient
*c
) {
3440 int start
= atoi(c
->argv
[2]->ptr
);
3441 int end
= atoi(c
->argv
[3]->ptr
);
3443 o
= lookupKeyRead(c
->db
,c
->argv
[1]);
3445 addReply(c
,shared
.nullmultibulk
);
3447 if (o
->type
!= REDIS_LIST
) {
3448 addReply(c
,shared
.wrongtypeerr
);
3450 list
*list
= o
->ptr
;
3452 int llen
= listLength(list
);
3456 /* convert negative indexes */
3457 if (start
< 0) start
= llen
+start
;
3458 if (end
< 0) end
= llen
+end
;
3459 if (start
< 0) start
= 0;
3460 if (end
< 0) end
= 0;
3462 /* indexes sanity checks */
3463 if (start
> end
|| start
>= llen
) {
3464 /* Out of range start or start > end result in empty list */
3465 addReply(c
,shared
.emptymultibulk
);
3468 if (end
>= llen
) end
= llen
-1;
3469 rangelen
= (end
-start
)+1;
3471 /* Return the result in form of a multi-bulk reply */
3472 ln
= listIndex(list
, start
);
3473 addReplySds(c
,sdscatprintf(sdsempty(),"*%d\r\n",rangelen
));
3474 for (j
= 0; j
< rangelen
; j
++) {
3475 ele
= listNodeValue(ln
);
3476 addReplyBulkLen(c
,ele
);
3478 addReply(c
,shared
.crlf
);
3485 static void ltrimCommand(redisClient
*c
) {
3487 int start
= atoi(c
->argv
[2]->ptr
);
3488 int end
= atoi(c
->argv
[3]->ptr
);
3490 o
= lookupKeyWrite(c
->db
,c
->argv
[1]);
3492 addReply(c
,shared
.nokeyerr
);
3494 if (o
->type
!= REDIS_LIST
) {
3495 addReply(c
,shared
.wrongtypeerr
);
3497 list
*list
= o
->ptr
;
3499 int llen
= listLength(list
);
3500 int j
, ltrim
, rtrim
;
3502 /* convert negative indexes */
3503 if (start
< 0) start
= llen
+start
;
3504 if (end
< 0) end
= llen
+end
;
3505 if (start
< 0) start
= 0;
3506 if (end
< 0) end
= 0;
3508 /* indexes sanity checks */
3509 if (start
> end
|| start
>= llen
) {
3510 /* Out of range start or start > end result in empty list */
3514 if (end
>= llen
) end
= llen
-1;
3519 /* Remove list elements to perform the trim */
3520 for (j
= 0; j
< ltrim
; j
++) {
3521 ln
= listFirst(list
);
3522 listDelNode(list
,ln
);
3524 for (j
= 0; j
< rtrim
; j
++) {
3525 ln
= listLast(list
);
3526 listDelNode(list
,ln
);
3529 addReply(c
,shared
.ok
);
3534 static void lremCommand(redisClient
*c
) {
3537 o
= lookupKeyWrite(c
->db
,c
->argv
[1]);
3539 addReply(c
,shared
.czero
);
3541 if (o
->type
!= REDIS_LIST
) {
3542 addReply(c
,shared
.wrongtypeerr
);
3544 list
*list
= o
->ptr
;
3545 listNode
*ln
, *next
;
3546 int toremove
= atoi(c
->argv
[2]->ptr
);
3551 toremove
= -toremove
;
3554 ln
= fromtail
? list
->tail
: list
->head
;
3556 robj
*ele
= listNodeValue(ln
);
3558 next
= fromtail
? ln
->prev
: ln
->next
;
3559 if (compareStringObjects(ele
,c
->argv
[3]) == 0) {
3560 listDelNode(list
,ln
);
3563 if (toremove
&& removed
== toremove
) break;
3567 addReplySds(c
,sdscatprintf(sdsempty(),":%d\r\n",removed
));
3572 /* This is the semantic of this command:
3573 * RPOPLPUSH srclist dstlist:
3574 * IF LLEN(srclist) > 0
3575 * element = RPOP srclist
3576 * LPUSH dstlist element
3583 * The idea is to be able to get an element from a list in a reliable way
3584 * since the element is not just returned but pushed against another list
3585 * as well. This command was originally proposed by Ezra Zygmuntowicz.
3587 static void rpoplpushcommand(redisClient
*c
) {
3590 sobj
= lookupKeyWrite(c
->db
,c
->argv
[1]);
3592 addReply(c
,shared
.nullbulk
);
3594 if (sobj
->type
!= REDIS_LIST
) {
3595 addReply(c
,shared
.wrongtypeerr
);
3597 list
*srclist
= sobj
->ptr
;
3598 listNode
*ln
= listLast(srclist
);
3601 addReply(c
,shared
.nullbulk
);
3603 robj
*dobj
= lookupKeyWrite(c
->db
,c
->argv
[2]);
3604 robj
*ele
= listNodeValue(ln
);
3609 /* Create the list if the key does not exist */
3610 dobj
= createListObject();
3611 dictAdd(c
->db
->dict
,c
->argv
[2],dobj
);
3612 incrRefCount(c
->argv
[2]);
3613 } else if (dobj
->type
!= REDIS_LIST
) {
3614 addReply(c
,shared
.wrongtypeerr
);
3617 /* Add the element to the target list */
3618 dstlist
= dobj
->ptr
;
3619 listAddNodeHead(dstlist
,ele
);
3622 /* Send the element to the client as reply as well */
3623 addReplyBulkLen(c
,ele
);
3625 addReply(c
,shared
.crlf
);
3627 /* Finally remove the element from the source list */
3628 listDelNode(srclist
,ln
);
3636 /* ==================================== Sets ================================ */
3638 static void saddCommand(redisClient
*c
) {
3641 set
= lookupKeyWrite(c
->db
,c
->argv
[1]);
3643 set
= createSetObject();
3644 dictAdd(c
->db
->dict
,c
->argv
[1],set
);
3645 incrRefCount(c
->argv
[1]);
3647 if (set
->type
!= REDIS_SET
) {
3648 addReply(c
,shared
.wrongtypeerr
);
3652 if (dictAdd(set
->ptr
,c
->argv
[2],NULL
) == DICT_OK
) {
3653 incrRefCount(c
->argv
[2]);
3655 addReply(c
,shared
.cone
);
3657 addReply(c
,shared
.czero
);
3661 static void sremCommand(redisClient
*c
) {
3664 set
= lookupKeyWrite(c
->db
,c
->argv
[1]);
3666 addReply(c
,shared
.czero
);
3668 if (set
->type
!= REDIS_SET
) {
3669 addReply(c
,shared
.wrongtypeerr
);
3672 if (dictDelete(set
->ptr
,c
->argv
[2]) == DICT_OK
) {
3674 if (htNeedsResize(set
->ptr
)) dictResize(set
->ptr
);
3675 addReply(c
,shared
.cone
);
3677 addReply(c
,shared
.czero
);
3682 static void smoveCommand(redisClient
*c
) {
3683 robj
*srcset
, *dstset
;
3685 srcset
= lookupKeyWrite(c
->db
,c
->argv
[1]);
3686 dstset
= lookupKeyWrite(c
->db
,c
->argv
[2]);
3688 /* If the source key does not exist return 0, if it's of the wrong type
3690 if (srcset
== NULL
|| srcset
->type
!= REDIS_SET
) {
3691 addReply(c
, srcset
? shared
.wrongtypeerr
: shared
.czero
);
3694 /* Error if the destination key is not a set as well */
3695 if (dstset
&& dstset
->type
!= REDIS_SET
) {
3696 addReply(c
,shared
.wrongtypeerr
);
3699 /* Remove the element from the source set */
3700 if (dictDelete(srcset
->ptr
,c
->argv
[3]) == DICT_ERR
) {
3701 /* Key not found in the src set! return zero */
3702 addReply(c
,shared
.czero
);
3706 /* Add the element to the destination set */
3708 dstset
= createSetObject();
3709 dictAdd(c
->db
->dict
,c
->argv
[2],dstset
);
3710 incrRefCount(c
->argv
[2]);
3712 if (dictAdd(dstset
->ptr
,c
->argv
[3],NULL
) == DICT_OK
)
3713 incrRefCount(c
->argv
[3]);
3714 addReply(c
,shared
.cone
);
3717 static void sismemberCommand(redisClient
*c
) {
3720 set
= lookupKeyRead(c
->db
,c
->argv
[1]);
3722 addReply(c
,shared
.czero
);
3724 if (set
->type
!= REDIS_SET
) {
3725 addReply(c
,shared
.wrongtypeerr
);
3728 if (dictFind(set
->ptr
,c
->argv
[2]))
3729 addReply(c
,shared
.cone
);
3731 addReply(c
,shared
.czero
);
3735 static void scardCommand(redisClient
*c
) {
3739 o
= lookupKeyRead(c
->db
,c
->argv
[1]);
3741 addReply(c
,shared
.czero
);
3744 if (o
->type
!= REDIS_SET
) {
3745 addReply(c
,shared
.wrongtypeerr
);
3748 addReplySds(c
,sdscatprintf(sdsempty(),":%d\r\n",
3754 static void spopCommand(redisClient
*c
) {
3758 set
= lookupKeyWrite(c
->db
,c
->argv
[1]);
3760 addReply(c
,shared
.nullbulk
);
3762 if (set
->type
!= REDIS_SET
) {
3763 addReply(c
,shared
.wrongtypeerr
);
3766 de
= dictGetRandomKey(set
->ptr
);
3768 addReply(c
,shared
.nullbulk
);
3770 robj
*ele
= dictGetEntryKey(de
);
3772 addReplyBulkLen(c
,ele
);
3774 addReply(c
,shared
.crlf
);
3775 dictDelete(set
->ptr
,ele
);
3776 if (htNeedsResize(set
->ptr
)) dictResize(set
->ptr
);
3782 static void srandmemberCommand(redisClient
*c
) {
3786 set
= lookupKeyRead(c
->db
,c
->argv
[1]);
3788 addReply(c
,shared
.nullbulk
);
3790 if (set
->type
!= REDIS_SET
) {
3791 addReply(c
,shared
.wrongtypeerr
);
3794 de
= dictGetRandomKey(set
->ptr
);
3796 addReply(c
,shared
.nullbulk
);
3798 robj
*ele
= dictGetEntryKey(de
);
3800 addReplyBulkLen(c
,ele
);
3802 addReply(c
,shared
.crlf
);
3807 static int qsortCompareSetsByCardinality(const void *s1
, const void *s2
) {
3808 dict
**d1
= (void*) s1
, **d2
= (void*) s2
;
3810 return dictSize(*d1
)-dictSize(*d2
);
3813 static void sinterGenericCommand(redisClient
*c
, robj
**setskeys
, int setsnum
, robj
*dstkey
) {
3814 dict
**dv
= zmalloc(sizeof(dict
*)*setsnum
);
3817 robj
*lenobj
= NULL
, *dstset
= NULL
;
3818 int j
, cardinality
= 0;
3820 for (j
= 0; j
< setsnum
; j
++) {
3824 lookupKeyWrite(c
->db
,setskeys
[j
]) :
3825 lookupKeyRead(c
->db
,setskeys
[j
]);
3829 deleteKey(c
->db
,dstkey
);
3830 addReply(c
,shared
.ok
);
3832 addReply(c
,shared
.nullmultibulk
);
3836 if (setobj
->type
!= REDIS_SET
) {
3838 addReply(c
,shared
.wrongtypeerr
);
3841 dv
[j
] = setobj
->ptr
;
3843 /* Sort sets from the smallest to largest, this will improve our
3844 * algorithm's performace */
3845 qsort(dv
,setsnum
,sizeof(dict
*),qsortCompareSetsByCardinality
);
3847 /* The first thing we should output is the total number of elements...
3848 * since this is a multi-bulk write, but at this stage we don't know
3849 * the intersection set size, so we use a trick, append an empty object
3850 * to the output list and save the pointer to later modify it with the
3853 lenobj
= createObject(REDIS_STRING
,NULL
);
3855 decrRefCount(lenobj
);
3857 /* If we have a target key where to store the resulting set
3858 * create this key with an empty set inside */
3859 dstset
= createSetObject();
3862 /* Iterate all the elements of the first (smallest) set, and test
3863 * the element against all the other sets, if at least one set does
3864 * not include the element it is discarded */
3865 di
= dictGetIterator(dv
[0]);
3867 while((de
= dictNext(di
)) != NULL
) {
3870 for (j
= 1; j
< setsnum
; j
++)
3871 if (dictFind(dv
[j
],dictGetEntryKey(de
)) == NULL
) break;
3873 continue; /* at least one set does not contain the member */
3874 ele
= dictGetEntryKey(de
);
3876 addReplyBulkLen(c
,ele
);
3878 addReply(c
,shared
.crlf
);
3881 dictAdd(dstset
->ptr
,ele
,NULL
);
3885 dictReleaseIterator(di
);
3888 /* Store the resulting set into the target */
3889 deleteKey(c
->db
,dstkey
);
3890 dictAdd(c
->db
->dict
,dstkey
,dstset
);
3891 incrRefCount(dstkey
);
3895 lenobj
->ptr
= sdscatprintf(sdsempty(),"*%d\r\n",cardinality
);
3897 addReplySds(c
,sdscatprintf(sdsempty(),":%d\r\n",
3898 dictSize((dict
*)dstset
->ptr
)));
3904 static void sinterCommand(redisClient
*c
) {
3905 sinterGenericCommand(c
,c
->argv
+1,c
->argc
-1,NULL
);
3908 static void sinterstoreCommand(redisClient
*c
) {
3909 sinterGenericCommand(c
,c
->argv
+2,c
->argc
-2,c
->argv
[1]);
3912 #define REDIS_OP_UNION 0
3913 #define REDIS_OP_DIFF 1
3915 static void sunionDiffGenericCommand(redisClient
*c
, robj
**setskeys
, int setsnum
, robj
*dstkey
, int op
) {
3916 dict
**dv
= zmalloc(sizeof(dict
*)*setsnum
);
3919 robj
*dstset
= NULL
;
3920 int j
, cardinality
= 0;
3922 for (j
= 0; j
< setsnum
; j
++) {
3926 lookupKeyWrite(c
->db
,setskeys
[j
]) :
3927 lookupKeyRead(c
->db
,setskeys
[j
]);
3932 if (setobj
->type
!= REDIS_SET
) {
3934 addReply(c
,shared
.wrongtypeerr
);
3937 dv
[j
] = setobj
->ptr
;
3940 /* We need a temp set object to store our union. If the dstkey
3941 * is not NULL (that is, we are inside an SUNIONSTORE operation) then
3942 * this set object will be the resulting object to set into the target key*/
3943 dstset
= createSetObject();
3945 /* Iterate all the elements of all the sets, add every element a single
3946 * time to the result set */
3947 for (j
= 0; j
< setsnum
; j
++) {
3948 if (op
== REDIS_OP_DIFF
&& j
== 0 && !dv
[j
]) break; /* result set is empty */
3949 if (!dv
[j
]) continue; /* non existing keys are like empty sets */
3951 di
= dictGetIterator(dv
[j
]);
3953 while((de
= dictNext(di
)) != NULL
) {
3956 /* dictAdd will not add the same element multiple times */
3957 ele
= dictGetEntryKey(de
);
3958 if (op
== REDIS_OP_UNION
|| j
== 0) {
3959 if (dictAdd(dstset
->ptr
,ele
,NULL
) == DICT_OK
) {
3963 } else if (op
== REDIS_OP_DIFF
) {
3964 if (dictDelete(dstset
->ptr
,ele
) == DICT_OK
) {
3969 dictReleaseIterator(di
);
3971 if (op
== REDIS_OP_DIFF
&& cardinality
== 0) break; /* result set is empty */
3974 /* Output the content of the resulting set, if not in STORE mode */
3976 addReplySds(c
,sdscatprintf(sdsempty(),"*%d\r\n",cardinality
));
3977 di
= dictGetIterator(dstset
->ptr
);
3978 while((de
= dictNext(di
)) != NULL
) {
3981 ele
= dictGetEntryKey(de
);
3982 addReplyBulkLen(c
,ele
);
3984 addReply(c
,shared
.crlf
);
3986 dictReleaseIterator(di
);
3988 /* If we have a target key where to store the resulting set
3989 * create this key with the result set inside */
3990 deleteKey(c
->db
,dstkey
);
3991 dictAdd(c
->db
->dict
,dstkey
,dstset
);
3992 incrRefCount(dstkey
);
3997 decrRefCount(dstset
);
3999 addReplySds(c
,sdscatprintf(sdsempty(),":%d\r\n",
4000 dictSize((dict
*)dstset
->ptr
)));
4006 static void sunionCommand(redisClient
*c
) {
4007 sunionDiffGenericCommand(c
,c
->argv
+1,c
->argc
-1,NULL
,REDIS_OP_UNION
);
4010 static void sunionstoreCommand(redisClient
*c
) {
4011 sunionDiffGenericCommand(c
,c
->argv
+2,c
->argc
-2,c
->argv
[1],REDIS_OP_UNION
);
4014 static void sdiffCommand(redisClient
*c
) {
4015 sunionDiffGenericCommand(c
,c
->argv
+1,c
->argc
-1,NULL
,REDIS_OP_DIFF
);
4018 static void sdiffstoreCommand(redisClient
*c
) {
4019 sunionDiffGenericCommand(c
,c
->argv
+2,c
->argc
-2,c
->argv
[1],REDIS_OP_DIFF
);
4022 /* ==================================== ZSets =============================== */
4024 /* ZSETs are ordered sets using two data structures to hold the same elements
4025 * in order to get O(log(N)) INSERT and REMOVE operations into a sorted
4028 * The elements are added to an hash table mapping Redis objects to scores.
4029 * At the same time the elements are added to a skip list mapping scores
4030 * to Redis objects (so objects are sorted by scores in this "view"). */
4032 /* This skiplist implementation is almost a C translation of the original
4033 * algorithm described by William Pugh in "Skip Lists: A Probabilistic
4034 * Alternative to Balanced Trees", modified in three ways:
4035 * a) this implementation allows for repeated values.
4036 * b) the comparison is not just by key (our 'score') but by satellite data.
4037 * c) there is a back pointer, so it's a doubly linked list with the back
4038 * pointers being only at "level 1". This allows to traverse the list
4039 * from tail to head, useful for ZREVRANGE. */
4041 static zskiplistNode
*zslCreateNode(int level
, double score
, robj
*obj
) {
4042 zskiplistNode
*zn
= zmalloc(sizeof(*zn
));
4044 zn
->forward
= zmalloc(sizeof(zskiplistNode
*) * level
);
4050 static zskiplist
*zslCreate(void) {
4054 zsl
= zmalloc(sizeof(*zsl
));
4057 zsl
->header
= zslCreateNode(ZSKIPLIST_MAXLEVEL
,0,NULL
);
4058 for (j
= 0; j
< ZSKIPLIST_MAXLEVEL
; j
++)
4059 zsl
->header
->forward
[j
] = NULL
;
4060 zsl
->header
->backward
= NULL
;
4065 static void zslFreeNode(zskiplistNode
*node
) {
4066 decrRefCount(node
->obj
);
4067 zfree(node
->forward
);
4071 static void zslFree(zskiplist
*zsl
) {
4072 zskiplistNode
*node
= zsl
->header
->forward
[0], *next
;
4074 zfree(zsl
->header
->forward
);
4077 next
= node
->forward
[0];
4084 static int zslRandomLevel(void) {
4086 while ((random()&0xFFFF) < (ZSKIPLIST_P
* 0xFFFF))
4091 static void zslInsert(zskiplist
*zsl
, double score
, robj
*obj
) {
4092 zskiplistNode
*update
[ZSKIPLIST_MAXLEVEL
], *x
;
4096 for (i
= zsl
->level
-1; i
>= 0; i
--) {
4097 while (x
->forward
[i
] &&
4098 (x
->forward
[i
]->score
< score
||
4099 (x
->forward
[i
]->score
== score
&&
4100 compareStringObjects(x
->forward
[i
]->obj
,obj
) < 0)))
4104 /* we assume the key is not already inside, since we allow duplicated
4105 * scores, and the re-insertion of score and redis object should never
4106 * happpen since the caller of zslInsert() should test in the hash table
4107 * if the element is already inside or not. */
4108 level
= zslRandomLevel();
4109 if (level
> zsl
->level
) {
4110 for (i
= zsl
->level
; i
< level
; i
++)
4111 update
[i
] = zsl
->header
;
4114 x
= zslCreateNode(level
,score
,obj
);
4115 for (i
= 0; i
< level
; i
++) {
4116 x
->forward
[i
] = update
[i
]->forward
[i
];
4117 update
[i
]->forward
[i
] = x
;
4119 x
->backward
= (update
[0] == zsl
->header
) ? NULL
: update
[0];
4121 x
->forward
[0]->backward
= x
;
4127 /* Delete an element with matching score/object from the skiplist. */
4128 static int zslDelete(zskiplist
*zsl
, double score
, robj
*obj
) {
4129 zskiplistNode
*update
[ZSKIPLIST_MAXLEVEL
], *x
;
4133 for (i
= zsl
->level
-1; i
>= 0; i
--) {
4134 while (x
->forward
[i
] &&
4135 (x
->forward
[i
]->score
< score
||
4136 (x
->forward
[i
]->score
== score
&&
4137 compareStringObjects(x
->forward
[i
]->obj
,obj
) < 0)))
4141 /* We may have multiple elements with the same score, what we need
4142 * is to find the element with both the right score and object. */
4144 if (x
&& score
== x
->score
&& compareStringObjects(x
->obj
,obj
) == 0) {
4145 for (i
= 0; i
< zsl
->level
; i
++) {
4146 if (update
[i
]->forward
[i
] != x
) break;
4147 update
[i
]->forward
[i
] = x
->forward
[i
];
4149 if (x
->forward
[0]) {
4150 x
->forward
[0]->backward
= (x
->backward
== zsl
->header
) ?
4153 zsl
->tail
= x
->backward
;
4156 while(zsl
->level
> 1 && zsl
->header
->forward
[zsl
->level
-1] == NULL
)
4161 return 0; /* not found */
4163 return 0; /* not found */
4166 /* Delete all the elements with score between min and max from the skiplist.
4167 * Min and mx are inclusive, so a score >= min || score <= max is deleted.
4168 * Note that this function takes the reference to the hash table view of the
4169 * sorted set, in order to remove the elements from the hash table too. */
4170 static unsigned long zslDeleteRange(zskiplist
*zsl
, double min
, double max
, dict
*dict
) {
4171 zskiplistNode
*update
[ZSKIPLIST_MAXLEVEL
], *x
;
4172 unsigned long removed
= 0;
4176 for (i
= zsl
->level
-1; i
>= 0; i
--) {
4177 while (x
->forward
[i
] && x
->forward
[i
]->score
< min
)
4181 /* We may have multiple elements with the same score, what we need
4182 * is to find the element with both the right score and object. */
4184 while (x
&& x
->score
<= max
) {
4185 zskiplistNode
*next
;
4187 for (i
= 0; i
< zsl
->level
; i
++) {
4188 if (update
[i
]->forward
[i
] != x
) break;
4189 update
[i
]->forward
[i
] = x
->forward
[i
];
4191 if (x
->forward
[0]) {
4192 x
->forward
[0]->backward
= (x
->backward
== zsl
->header
) ?
4195 zsl
->tail
= x
->backward
;
4197 next
= x
->forward
[0];
4198 dictDelete(dict
,x
->obj
);
4200 while(zsl
->level
> 1 && zsl
->header
->forward
[zsl
->level
-1] == NULL
)
4206 return removed
; /* not found */
4209 /* Find the first node having a score equal or greater than the specified one.
4210 * Returns NULL if there is no match. */
4211 static zskiplistNode
*zslFirstWithScore(zskiplist
*zsl
, double score
) {
4216 for (i
= zsl
->level
-1; i
>= 0; i
--) {
4217 while (x
->forward
[i
] && x
->forward
[i
]->score
< score
)
4220 /* We may have multiple elements with the same score, what we need
4221 * is to find the element with both the right score and object. */
4222 return x
->forward
[0];
4225 /* The actual Z-commands implementations */
4227 static void zaddCommand(redisClient
*c
) {
4232 zsetobj
= lookupKeyWrite(c
->db
,c
->argv
[1]);
4233 if (zsetobj
== NULL
) {
4234 zsetobj
= createZsetObject();
4235 dictAdd(c
->db
->dict
,c
->argv
[1],zsetobj
);
4236 incrRefCount(c
->argv
[1]);
4238 if (zsetobj
->type
!= REDIS_ZSET
) {
4239 addReply(c
,shared
.wrongtypeerr
);
4243 score
= zmalloc(sizeof(double));
4244 *score
= strtod(c
->argv
[2]->ptr
,NULL
);
4246 if (dictAdd(zs
->dict
,c
->argv
[3],score
) == DICT_OK
) {
4247 /* case 1: New element */
4248 incrRefCount(c
->argv
[3]); /* added to hash */
4249 zslInsert(zs
->zsl
,*score
,c
->argv
[3]);
4250 incrRefCount(c
->argv
[3]); /* added to skiplist */
4252 addReply(c
,shared
.cone
);
4257 /* case 2: Score update operation */
4258 de
= dictFind(zs
->dict
,c
->argv
[3]);
4260 oldscore
= dictGetEntryVal(de
);
4261 if (*score
!= *oldscore
) {
4264 deleted
= zslDelete(zs
->zsl
,*oldscore
,c
->argv
[3]);
4265 assert(deleted
!= 0);
4266 zslInsert(zs
->zsl
,*score
,c
->argv
[3]);
4267 incrRefCount(c
->argv
[3]);
4268 dictReplace(zs
->dict
,c
->argv
[3],score
);
4273 addReply(c
,shared
.czero
);
4277 static void zremCommand(redisClient
*c
) {
4281 zsetobj
= lookupKeyWrite(c
->db
,c
->argv
[1]);
4282 if (zsetobj
== NULL
) {
4283 addReply(c
,shared
.czero
);
4289 if (zsetobj
->type
!= REDIS_ZSET
) {
4290 addReply(c
,shared
.wrongtypeerr
);
4294 de
= dictFind(zs
->dict
,c
->argv
[2]);
4296 addReply(c
,shared
.czero
);
4299 /* Delete from the skiplist */
4300 oldscore
= dictGetEntryVal(de
);
4301 deleted
= zslDelete(zs
->zsl
,*oldscore
,c
->argv
[2]);
4302 assert(deleted
!= 0);
4304 /* Delete from the hash table */
4305 dictDelete(zs
->dict
,c
->argv
[2]);
4306 if (htNeedsResize(zs
->dict
)) dictResize(zs
->dict
);
4308 addReply(c
,shared
.cone
);
4312 static void zremrangebyscoreCommand(redisClient
*c
) {
4313 double min
= strtod(c
->argv
[2]->ptr
,NULL
);
4314 double max
= strtod(c
->argv
[3]->ptr
,NULL
);
4318 zsetobj
= lookupKeyWrite(c
->db
,c
->argv
[1]);
4319 if (zsetobj
== NULL
) {
4320 addReply(c
,shared
.czero
);
4324 if (zsetobj
->type
!= REDIS_ZSET
) {
4325 addReply(c
,shared
.wrongtypeerr
);
4329 deleted
= zslDeleteRange(zs
->zsl
,min
,max
,zs
->dict
);
4330 if (htNeedsResize(zs
->dict
)) dictResize(zs
->dict
);
4331 server
.dirty
+= deleted
;
4332 addReplySds(c
,sdscatprintf(sdsempty(),":%lu\r\n",deleted
));
4336 static void zrangeGenericCommand(redisClient
*c
, int reverse
) {
4338 int start
= atoi(c
->argv
[2]->ptr
);
4339 int end
= atoi(c
->argv
[3]->ptr
);
4341 o
= lookupKeyRead(c
->db
,c
->argv
[1]);
4343 addReply(c
,shared
.nullmultibulk
);
4345 if (o
->type
!= REDIS_ZSET
) {
4346 addReply(c
,shared
.wrongtypeerr
);
4348 zset
*zsetobj
= o
->ptr
;
4349 zskiplist
*zsl
= zsetobj
->zsl
;
4352 int llen
= zsl
->length
;
4356 /* convert negative indexes */
4357 if (start
< 0) start
= llen
+start
;
4358 if (end
< 0) end
= llen
+end
;
4359 if (start
< 0) start
= 0;
4360 if (end
< 0) end
= 0;
4362 /* indexes sanity checks */
4363 if (start
> end
|| start
>= llen
) {
4364 /* Out of range start or start > end result in empty list */
4365 addReply(c
,shared
.emptymultibulk
);
4368 if (end
>= llen
) end
= llen
-1;
4369 rangelen
= (end
-start
)+1;
4371 /* Return the result in form of a multi-bulk reply */
4377 ln
= zsl
->header
->forward
[0];
4379 ln
= ln
->forward
[0];
4382 addReplySds(c
,sdscatprintf(sdsempty(),"*%d\r\n",rangelen
));
4383 for (j
= 0; j
< rangelen
; j
++) {
4385 addReplyBulkLen(c
,ele
);
4387 addReply(c
,shared
.crlf
);
4388 ln
= reverse
? ln
->backward
: ln
->forward
[0];
4394 static void zrangeCommand(redisClient
*c
) {
4395 zrangeGenericCommand(c
,0);
4398 static void zrevrangeCommand(redisClient
*c
) {
4399 zrangeGenericCommand(c
,1);
4402 static void zrangebyscoreCommand(redisClient
*c
) {
4404 double min
= strtod(c
->argv
[2]->ptr
,NULL
);
4405 double max
= strtod(c
->argv
[3]->ptr
,NULL
);
4407 o
= lookupKeyRead(c
->db
,c
->argv
[1]);
4409 addReply(c
,shared
.nullmultibulk
);
4411 if (o
->type
!= REDIS_ZSET
) {
4412 addReply(c
,shared
.wrongtypeerr
);
4414 zset
*zsetobj
= o
->ptr
;
4415 zskiplist
*zsl
= zsetobj
->zsl
;
4418 unsigned int rangelen
= 0;
4420 /* Get the first node with the score >= min */
4421 ln
= zslFirstWithScore(zsl
,min
);
4423 /* No element matching the speciifed interval */
4424 addReply(c
,shared
.emptymultibulk
);
4428 /* We don't know in advance how many matching elements there
4429 * are in the list, so we push this object that will represent
4430 * the multi-bulk length in the output buffer, and will "fix"
4432 lenobj
= createObject(REDIS_STRING
,NULL
);
4435 while(ln
&& ln
->score
<= max
) {
4437 addReplyBulkLen(c
,ele
);
4439 addReply(c
,shared
.crlf
);
4440 ln
= ln
->forward
[0];
4443 lenobj
->ptr
= sdscatprintf(sdsempty(),"*%d\r\n",rangelen
);
4448 static void zcardCommand(redisClient
*c
) {
4452 o
= lookupKeyRead(c
->db
,c
->argv
[1]);
4454 addReply(c
,shared
.czero
);
4457 if (o
->type
!= REDIS_ZSET
) {
4458 addReply(c
,shared
.wrongtypeerr
);
4461 addReplySds(c
,sdscatprintf(sdsempty(),":%d\r\n",zs
->zsl
->length
));
4466 static void zscoreCommand(redisClient
*c
) {
4470 o
= lookupKeyRead(c
->db
,c
->argv
[1]);
4472 addReply(c
,shared
.nullbulk
);
4475 if (o
->type
!= REDIS_ZSET
) {
4476 addReply(c
,shared
.wrongtypeerr
);
4481 de
= dictFind(zs
->dict
,c
->argv
[2]);
4483 addReply(c
,shared
.nullbulk
);
4486 double *score
= dictGetEntryVal(de
);
4488 snprintf(buf
,sizeof(buf
),"%.17g",*score
);
4489 addReplySds(c
,sdscatprintf(sdsempty(),"$%d\r\n%s\r\n",
4496 /* ========================= Non type-specific commands ==================== */
4498 static void flushdbCommand(redisClient
*c
) {
4499 server
.dirty
+= dictSize(c
->db
->dict
);
4500 dictEmpty(c
->db
->dict
);
4501 dictEmpty(c
->db
->expires
);
4502 addReply(c
,shared
.ok
);
4505 static void flushallCommand(redisClient
*c
) {
4506 server
.dirty
+= emptyDb();
4507 addReply(c
,shared
.ok
);
4508 rdbSave(server
.dbfilename
);
4512 static redisSortOperation
*createSortOperation(int type
, robj
*pattern
) {
4513 redisSortOperation
*so
= zmalloc(sizeof(*so
));
4515 so
->pattern
= pattern
;
4519 /* Return the value associated to the key with a name obtained
4520 * substituting the first occurence of '*' in 'pattern' with 'subst' */
4521 static robj
*lookupKeyByPattern(redisDb
*db
, robj
*pattern
, robj
*subst
) {
4525 int prefixlen
, sublen
, postfixlen
;
4526 /* Expoit the internal sds representation to create a sds string allocated on the stack in order to make this function faster */
4530 char buf
[REDIS_SORTKEY_MAX
+1];
4533 if (subst
->encoding
== REDIS_ENCODING_RAW
)
4534 incrRefCount(subst
);
4536 subst
= getDecodedObject(subst
);
4539 spat
= pattern
->ptr
;
4541 if (sdslen(spat
)+sdslen(ssub
)-1 > REDIS_SORTKEY_MAX
) return NULL
;
4542 p
= strchr(spat
,'*');
4543 if (!p
) return NULL
;
4546 sublen
= sdslen(ssub
);
4547 postfixlen
= sdslen(spat
)-(prefixlen
+1);
4548 memcpy(keyname
.buf
,spat
,prefixlen
);
4549 memcpy(keyname
.buf
+prefixlen
,ssub
,sublen
);
4550 memcpy(keyname
.buf
+prefixlen
+sublen
,p
+1,postfixlen
);
4551 keyname
.buf
[prefixlen
+sublen
+postfixlen
] = '\0';
4552 keyname
.len
= prefixlen
+sublen
+postfixlen
;
4554 keyobj
.refcount
= 1;
4555 keyobj
.type
= REDIS_STRING
;
4556 keyobj
.ptr
= ((char*)&keyname
)+(sizeof(long)*2);
4558 decrRefCount(subst
);
4560 /* printf("lookup '%s' => %p\n", keyname.buf,de); */
4561 return lookupKeyRead(db
,&keyobj
);
4564 /* sortCompare() is used by qsort in sortCommand(). Given that qsort_r with
4565 * the additional parameter is not standard but a BSD-specific we have to
4566 * pass sorting parameters via the global 'server' structure */
4567 static int sortCompare(const void *s1
, const void *s2
) {
4568 const redisSortObject
*so1
= s1
, *so2
= s2
;
4571 if (!server
.sort_alpha
) {
4572 /* Numeric sorting. Here it's trivial as we precomputed scores */
4573 if (so1
->u
.score
> so2
->u
.score
) {
4575 } else if (so1
->u
.score
< so2
->u
.score
) {
4581 /* Alphanumeric sorting */
4582 if (server
.sort_bypattern
) {
4583 if (!so1
->u
.cmpobj
|| !so2
->u
.cmpobj
) {
4584 /* At least one compare object is NULL */
4585 if (so1
->u
.cmpobj
== so2
->u
.cmpobj
)
4587 else if (so1
->u
.cmpobj
== NULL
)
4592 /* We have both the objects, use strcoll */
4593 cmp
= strcoll(so1
->u
.cmpobj
->ptr
,so2
->u
.cmpobj
->ptr
);
4596 /* Compare elements directly */
4597 if (so1
->obj
->encoding
== REDIS_ENCODING_RAW
&&
4598 so2
->obj
->encoding
== REDIS_ENCODING_RAW
) {
4599 cmp
= strcoll(so1
->obj
->ptr
,so2
->obj
->ptr
);
4603 dec1
= so1
->obj
->encoding
== REDIS_ENCODING_RAW
?
4604 so1
->obj
: getDecodedObject(so1
->obj
);
4605 dec2
= so2
->obj
->encoding
== REDIS_ENCODING_RAW
?
4606 so2
->obj
: getDecodedObject(so2
->obj
);
4607 cmp
= strcoll(dec1
->ptr
,dec2
->ptr
);
4608 if (dec1
!= so1
->obj
) decrRefCount(dec1
);
4609 if (dec2
!= so2
->obj
) decrRefCount(dec2
);
4613 return server
.sort_desc
? -cmp
: cmp
;
4616 /* The SORT command is the most complex command in Redis. Warning: this code
4617 * is optimized for speed and a bit less for readability */
4618 static void sortCommand(redisClient
*c
) {
4621 int desc
= 0, alpha
= 0;
4622 int limit_start
= 0, limit_count
= -1, start
, end
;
4623 int j
, dontsort
= 0, vectorlen
;
4624 int getop
= 0; /* GET operation counter */
4625 robj
*sortval
, *sortby
= NULL
, *storekey
= NULL
;
4626 redisSortObject
*vector
; /* Resulting vector to sort */
4628 /* Lookup the key to sort. It must be of the right types */
4629 sortval
= lookupKeyRead(c
->db
,c
->argv
[1]);
4630 if (sortval
== NULL
) {
4631 addReply(c
,shared
.nokeyerr
);
4634 if (sortval
->type
!= REDIS_SET
&& sortval
->type
!= REDIS_LIST
) {
4635 addReply(c
,shared
.wrongtypeerr
);
4639 /* Create a list of operations to perform for every sorted element.
4640 * Operations can be GET/DEL/INCR/DECR */
4641 operations
= listCreate();
4642 listSetFreeMethod(operations
,zfree
);
4645 /* Now we need to protect sortval incrementing its count, in the future
4646 * SORT may have options able to overwrite/delete keys during the sorting
4647 * and the sorted key itself may get destroied */
4648 incrRefCount(sortval
);
4650 /* The SORT command has an SQL-alike syntax, parse it */
4651 while(j
< c
->argc
) {
4652 int leftargs
= c
->argc
-j
-1;
4653 if (!strcasecmp(c
->argv
[j
]->ptr
,"asc")) {
4655 } else if (!strcasecmp(c
->argv
[j
]->ptr
,"desc")) {
4657 } else if (!strcasecmp(c
->argv
[j
]->ptr
,"alpha")) {
4659 } else if (!strcasecmp(c
->argv
[j
]->ptr
,"limit") && leftargs
>= 2) {
4660 limit_start
= atoi(c
->argv
[j
+1]->ptr
);
4661 limit_count
= atoi(c
->argv
[j
+2]->ptr
);
4663 } else if (!strcasecmp(c
->argv
[j
]->ptr
,"store") && leftargs
>= 1) {
4664 storekey
= c
->argv
[j
+1];
4666 } else if (!strcasecmp(c
->argv
[j
]->ptr
,"by") && leftargs
>= 1) {
4667 sortby
= c
->argv
[j
+1];
4668 /* If the BY pattern does not contain '*', i.e. it is constant,
4669 * we don't need to sort nor to lookup the weight keys. */
4670 if (strchr(c
->argv
[j
+1]->ptr
,'*') == NULL
) dontsort
= 1;
4672 } else if (!strcasecmp(c
->argv
[j
]->ptr
,"get") && leftargs
>= 1) {
4673 listAddNodeTail(operations
,createSortOperation(
4674 REDIS_SORT_GET
,c
->argv
[j
+1]));
4678 decrRefCount(sortval
);
4679 listRelease(operations
);
4680 addReply(c
,shared
.syntaxerr
);
4686 /* Load the sorting vector with all the objects to sort */
4687 vectorlen
= (sortval
->type
== REDIS_LIST
) ?
4688 listLength((list
*)sortval
->ptr
) :
4689 dictSize((dict
*)sortval
->ptr
);
4690 vector
= zmalloc(sizeof(redisSortObject
)*vectorlen
);
4692 if (sortval
->type
== REDIS_LIST
) {
4693 list
*list
= sortval
->ptr
;
4697 while((ln
= listYield(list
))) {
4698 robj
*ele
= ln
->value
;
4699 vector
[j
].obj
= ele
;
4700 vector
[j
].u
.score
= 0;
4701 vector
[j
].u
.cmpobj
= NULL
;
4705 dict
*set
= sortval
->ptr
;
4709 di
= dictGetIterator(set
);
4710 while((setele
= dictNext(di
)) != NULL
) {
4711 vector
[j
].obj
= dictGetEntryKey(setele
);
4712 vector
[j
].u
.score
= 0;
4713 vector
[j
].u
.cmpobj
= NULL
;
4716 dictReleaseIterator(di
);
4718 assert(j
== vectorlen
);
4720 /* Now it's time to load the right scores in the sorting vector */
4721 if (dontsort
== 0) {
4722 for (j
= 0; j
< vectorlen
; j
++) {
4726 byval
= lookupKeyByPattern(c
->db
,sortby
,vector
[j
].obj
);
4727 if (!byval
|| byval
->type
!= REDIS_STRING
) continue;
4729 if (byval
->encoding
== REDIS_ENCODING_RAW
) {
4730 vector
[j
].u
.cmpobj
= byval
;
4731 incrRefCount(byval
);
4733 vector
[j
].u
.cmpobj
= getDecodedObject(byval
);
4736 if (byval
->encoding
== REDIS_ENCODING_RAW
) {
4737 vector
[j
].u
.score
= strtod(byval
->ptr
,NULL
);
4739 if (byval
->encoding
== REDIS_ENCODING_INT
) {
4740 vector
[j
].u
.score
= (long)byval
->ptr
;
4747 if (vector
[j
].obj
->encoding
== REDIS_ENCODING_RAW
)
4748 vector
[j
].u
.score
= strtod(vector
[j
].obj
->ptr
,NULL
);
4750 if (vector
[j
].obj
->encoding
== REDIS_ENCODING_INT
)
4751 vector
[j
].u
.score
= (long) vector
[j
].obj
->ptr
;
4760 /* We are ready to sort the vector... perform a bit of sanity check
4761 * on the LIMIT option too. We'll use a partial version of quicksort. */
4762 start
= (limit_start
< 0) ? 0 : limit_start
;
4763 end
= (limit_count
< 0) ? vectorlen
-1 : start
+limit_count
-1;
4764 if (start
>= vectorlen
) {
4765 start
= vectorlen
-1;
4768 if (end
>= vectorlen
) end
= vectorlen
-1;
4770 if (dontsort
== 0) {
4771 server
.sort_desc
= desc
;
4772 server
.sort_alpha
= alpha
;
4773 server
.sort_bypattern
= sortby
? 1 : 0;
4774 if (sortby
&& (start
!= 0 || end
!= vectorlen
-1))
4775 pqsort(vector
,vectorlen
,sizeof(redisSortObject
),sortCompare
, start
,end
);
4777 qsort(vector
,vectorlen
,sizeof(redisSortObject
),sortCompare
);
4780 /* Send command output to the output buffer, performing the specified
4781 * GET/DEL/INCR/DECR operations if any. */
4782 outputlen
= getop
? getop
*(end
-start
+1) : end
-start
+1;
4783 if (storekey
== NULL
) {
4784 /* STORE option not specified, sent the sorting result to client */
4785 addReplySds(c
,sdscatprintf(sdsempty(),"*%d\r\n",outputlen
));
4786 for (j
= start
; j
<= end
; j
++) {
4789 addReplyBulkLen(c
,vector
[j
].obj
);
4790 addReply(c
,vector
[j
].obj
);
4791 addReply(c
,shared
.crlf
);
4793 listRewind(operations
);
4794 while((ln
= listYield(operations
))) {
4795 redisSortOperation
*sop
= ln
->value
;
4796 robj
*val
= lookupKeyByPattern(c
->db
,sop
->pattern
,
4799 if (sop
->type
== REDIS_SORT_GET
) {
4800 if (!val
|| val
->type
!= REDIS_STRING
) {
4801 addReply(c
,shared
.nullbulk
);
4803 addReplyBulkLen(c
,val
);
4805 addReply(c
,shared
.crlf
);
4808 assert(sop
->type
== REDIS_SORT_GET
); /* always fails */
4813 robj
*listObject
= createListObject();
4814 list
*listPtr
= (list
*) listObject
->ptr
;
4816 /* STORE option specified, set the sorting result as a List object */
4817 for (j
= start
; j
<= end
; j
++) {
4820 listAddNodeTail(listPtr
,vector
[j
].obj
);
4821 incrRefCount(vector
[j
].obj
);
4823 listRewind(operations
);
4824 while((ln
= listYield(operations
))) {
4825 redisSortOperation
*sop
= ln
->value
;
4826 robj
*val
= lookupKeyByPattern(c
->db
,sop
->pattern
,
4829 if (sop
->type
== REDIS_SORT_GET
) {
4830 if (!val
|| val
->type
!= REDIS_STRING
) {
4831 listAddNodeTail(listPtr
,createStringObject("",0));
4833 listAddNodeTail(listPtr
,val
);
4837 assert(sop
->type
== REDIS_SORT_GET
); /* always fails */
4841 if (dictReplace(c
->db
->dict
,storekey
,listObject
)) {
4842 incrRefCount(storekey
);
4844 /* Note: we add 1 because the DB is dirty anyway since even if the
4845 * SORT result is empty a new key is set and maybe the old content
4847 server
.dirty
+= 1+outputlen
;
4848 addReplySds(c
,sdscatprintf(sdsempty(),":%d\r\n",outputlen
));
4852 decrRefCount(sortval
);
4853 listRelease(operations
);
4854 for (j
= 0; j
< vectorlen
; j
++) {
4855 if (sortby
&& alpha
&& vector
[j
].u
.cmpobj
)
4856 decrRefCount(vector
[j
].u
.cmpobj
);
4861 static void infoCommand(redisClient
*c
) {
4863 time_t uptime
= time(NULL
)-server
.stat_starttime
;
4866 info
= sdscatprintf(sdsempty(),
4867 "redis_version:%s\r\n"
4869 "uptime_in_seconds:%d\r\n"
4870 "uptime_in_days:%d\r\n"
4871 "connected_clients:%d\r\n"
4872 "connected_slaves:%d\r\n"
4873 "used_memory:%zu\r\n"
4874 "changes_since_last_save:%lld\r\n"
4875 "bgsave_in_progress:%d\r\n"
4876 "last_save_time:%d\r\n"
4877 "total_connections_received:%lld\r\n"
4878 "total_commands_processed:%lld\r\n"
4881 (sizeof(long) == 8) ? "64" : "32",
4884 listLength(server
.clients
)-listLength(server
.slaves
),
4885 listLength(server
.slaves
),
4888 server
.bgsaveinprogress
,
4890 server
.stat_numconnections
,
4891 server
.stat_numcommands
,
4892 server
.masterhost
== NULL
? "master" : "slave"
4894 if (server
.masterhost
) {
4895 info
= sdscatprintf(info
,
4896 "master_host:%s\r\n"
4897 "master_port:%d\r\n"
4898 "master_link_status:%s\r\n"
4899 "master_last_io_seconds_ago:%d\r\n"
4902 (server
.replstate
== REDIS_REPL_CONNECTED
) ?
4904 server
.master
? ((int)(time(NULL
)-server
.master
->lastinteraction
)) : -1
4907 for (j
= 0; j
< server
.dbnum
; j
++) {
4908 long long keys
, vkeys
;
4910 keys
= dictSize(server
.db
[j
].dict
);
4911 vkeys
= dictSize(server
.db
[j
].expires
);
4912 if (keys
|| vkeys
) {
4913 info
= sdscatprintf(info
, "db%d: keys=%lld,expires=%lld\r\n",
4917 addReplySds(c
,sdscatprintf(sdsempty(),"$%d\r\n",sdslen(info
)));
4918 addReplySds(c
,info
);
4919 addReply(c
,shared
.crlf
);
4922 static void monitorCommand(redisClient
*c
) {
4923 /* ignore MONITOR if aleady slave or in monitor mode */
4924 if (c
->flags
& REDIS_SLAVE
) return;
4926 c
->flags
|= (REDIS_SLAVE
|REDIS_MONITOR
);
4928 listAddNodeTail(server
.monitors
,c
);
4929 addReply(c
,shared
.ok
);
4932 /* ================================= Expire ================================= */
4933 static int removeExpire(redisDb
*db
, robj
*key
) {
4934 if (dictDelete(db
->expires
,key
) == DICT_OK
) {
4941 static int setExpire(redisDb
*db
, robj
*key
, time_t when
) {
4942 if (dictAdd(db
->expires
,key
,(void*)when
) == DICT_ERR
) {
4950 /* Return the expire time of the specified key, or -1 if no expire
4951 * is associated with this key (i.e. the key is non volatile) */
4952 static time_t getExpire(redisDb
*db
, robj
*key
) {
4955 /* No expire? return ASAP */
4956 if (dictSize(db
->expires
) == 0 ||
4957 (de
= dictFind(db
->expires
,key
)) == NULL
) return -1;
4959 return (time_t) dictGetEntryVal(de
);
4962 static int expireIfNeeded(redisDb
*db
, robj
*key
) {
4966 /* No expire? return ASAP */
4967 if (dictSize(db
->expires
) == 0 ||
4968 (de
= dictFind(db
->expires
,key
)) == NULL
) return 0;
4970 /* Lookup the expire */
4971 when
= (time_t) dictGetEntryVal(de
);
4972 if (time(NULL
) <= when
) return 0;
4974 /* Delete the key */
4975 dictDelete(db
->expires
,key
);
4976 return dictDelete(db
->dict
,key
) == DICT_OK
;
4979 static int deleteIfVolatile(redisDb
*db
, robj
*key
) {
4982 /* No expire? return ASAP */
4983 if (dictSize(db
->expires
) == 0 ||
4984 (de
= dictFind(db
->expires
,key
)) == NULL
) return 0;
4986 /* Delete the key */
4988 dictDelete(db
->expires
,key
);
4989 return dictDelete(db
->dict
,key
) == DICT_OK
;
4992 static void expireGenericCommand(redisClient
*c
, robj
*key
, time_t seconds
) {
4995 de
= dictFind(c
->db
->dict
,key
);
4997 addReply(c
,shared
.czero
);
5001 if (deleteKey(c
->db
,key
)) server
.dirty
++;
5002 addReply(c
, shared
.cone
);
5005 time_t when
= time(NULL
)+seconds
;
5006 if (setExpire(c
->db
,key
,when
)) {
5007 addReply(c
,shared
.cone
);
5010 addReply(c
,shared
.czero
);
5016 static void expireCommand(redisClient
*c
) {
5017 expireGenericCommand(c
,c
->argv
[1],strtol(c
->argv
[2]->ptr
,NULL
,10));
5020 static void expireatCommand(redisClient
*c
) {
5021 expireGenericCommand(c
,c
->argv
[1],strtol(c
->argv
[2]->ptr
,NULL
,10)-time(NULL
));
5024 static void ttlCommand(redisClient
*c
) {
5028 expire
= getExpire(c
->db
,c
->argv
[1]);
5030 ttl
= (int) (expire
-time(NULL
));
5031 if (ttl
< 0) ttl
= -1;
5033 addReplySds(c
,sdscatprintf(sdsempty(),":%d\r\n",ttl
));
5036 static void msetGenericCommand(redisClient
*c
, int nx
) {
5039 if ((c
->argc
% 2) == 0) {
5040 addReplySds(c
,sdsnew("-ERR wrong number of arguments\r\n"));
5043 /* Handle the NX flag. The MSETNX semantic is to return zero and don't
5044 * set nothing at all if at least one already key exists. */
5046 for (j
= 1; j
< c
->argc
; j
+= 2) {
5047 if (dictFind(c
->db
->dict
,c
->argv
[j
]) != NULL
) {
5048 addReply(c
, shared
.czero
);
5054 for (j
= 1; j
< c
->argc
; j
+= 2) {
5057 retval
= dictAdd(c
->db
->dict
,c
->argv
[j
],c
->argv
[j
+1]);
5058 if (retval
== DICT_ERR
) {
5059 dictReplace(c
->db
->dict
,c
->argv
[j
],c
->argv
[j
+1]);
5060 incrRefCount(c
->argv
[j
+1]);
5062 incrRefCount(c
->argv
[j
]);
5063 incrRefCount(c
->argv
[j
+1]);
5065 removeExpire(c
->db
,c
->argv
[j
]);
5067 server
.dirty
+= (c
->argc
-1)/2;
5068 addReply(c
, nx
? shared
.cone
: shared
.ok
);
5071 static void msetCommand(redisClient
*c
) {
5072 msetGenericCommand(c
,0);
5075 static void msetnxCommand(redisClient
*c
) {
5076 msetGenericCommand(c
,1);
5079 /* =============================== Replication ============================= */
5081 static int syncWrite(int fd
, char *ptr
, ssize_t size
, int timeout
) {
5082 ssize_t nwritten
, ret
= size
;
5083 time_t start
= time(NULL
);
5087 if (aeWait(fd
,AE_WRITABLE
,1000) & AE_WRITABLE
) {
5088 nwritten
= write(fd
,ptr
,size
);
5089 if (nwritten
== -1) return -1;
5093 if ((time(NULL
)-start
) > timeout
) {
5101 static int syncRead(int fd
, char *ptr
, ssize_t size
, int timeout
) {
5102 ssize_t nread
, totread
= 0;
5103 time_t start
= time(NULL
);
5107 if (aeWait(fd
,AE_READABLE
,1000) & AE_READABLE
) {
5108 nread
= read(fd
,ptr
,size
);
5109 if (nread
== -1) return -1;
5114 if ((time(NULL
)-start
) > timeout
) {
5122 static int syncReadLine(int fd
, char *ptr
, ssize_t size
, int timeout
) {
5129 if (syncRead(fd
,&c
,1,timeout
) == -1) return -1;
5132 if (nread
&& *(ptr
-1) == '\r') *(ptr
-1) = '\0';
5143 static void syncCommand(redisClient
*c
) {
5144 /* ignore SYNC if aleady slave or in monitor mode */
5145 if (c
->flags
& REDIS_SLAVE
) return;
5147 /* SYNC can't be issued when the server has pending data to send to
5148 * the client about already issued commands. We need a fresh reply
5149 * buffer registering the differences between the BGSAVE and the current
5150 * dataset, so that we can copy to other slaves if needed. */
5151 if (listLength(c
->reply
) != 0) {
5152 addReplySds(c
,sdsnew("-ERR SYNC is invalid with pending input\r\n"));
5156 redisLog(REDIS_NOTICE
,"Slave ask for synchronization");
5157 /* Here we need to check if there is a background saving operation
5158 * in progress, or if it is required to start one */
5159 if (server
.bgsaveinprogress
) {
5160 /* Ok a background save is in progress. Let's check if it is a good
5161 * one for replication, i.e. if there is another slave that is
5162 * registering differences since the server forked to save */
5166 listRewind(server
.slaves
);
5167 while((ln
= listYield(server
.slaves
))) {
5169 if (slave
->replstate
== REDIS_REPL_WAIT_BGSAVE_END
) break;
5172 /* Perfect, the server is already registering differences for
5173 * another slave. Set the right state, and copy the buffer. */
5174 listRelease(c
->reply
);
5175 c
->reply
= listDup(slave
->reply
);
5176 c
->replstate
= REDIS_REPL_WAIT_BGSAVE_END
;
5177 redisLog(REDIS_NOTICE
,"Waiting for end of BGSAVE for SYNC");
5179 /* No way, we need to wait for the next BGSAVE in order to
5180 * register differences */
5181 c
->replstate
= REDIS_REPL_WAIT_BGSAVE_START
;
5182 redisLog(REDIS_NOTICE
,"Waiting for next BGSAVE for SYNC");
5185 /* Ok we don't have a BGSAVE in progress, let's start one */
5186 redisLog(REDIS_NOTICE
,"Starting BGSAVE for SYNC");
5187 if (rdbSaveBackground(server
.dbfilename
) != REDIS_OK
) {
5188 redisLog(REDIS_NOTICE
,"Replication failed, can't BGSAVE");
5189 addReplySds(c
,sdsnew("-ERR Unalbe to perform background save\r\n"));
5192 c
->replstate
= REDIS_REPL_WAIT_BGSAVE_END
;
5195 c
->flags
|= REDIS_SLAVE
;
5197 listAddNodeTail(server
.slaves
,c
);
5201 static void sendBulkToSlave(aeEventLoop
*el
, int fd
, void *privdata
, int mask
) {
5202 redisClient
*slave
= privdata
;
5204 REDIS_NOTUSED(mask
);
5205 char buf
[REDIS_IOBUF_LEN
];
5206 ssize_t nwritten
, buflen
;
5208 if (slave
->repldboff
== 0) {
5209 /* Write the bulk write count before to transfer the DB. In theory here
5210 * we don't know how much room there is in the output buffer of the
5211 * socket, but in pratice SO_SNDLOWAT (the minimum count for output
5212 * operations) will never be smaller than the few bytes we need. */
5215 bulkcount
= sdscatprintf(sdsempty(),"$%lld\r\n",(unsigned long long)
5217 if (write(fd
,bulkcount
,sdslen(bulkcount
)) != (signed)sdslen(bulkcount
))
5225 lseek(slave
->repldbfd
,slave
->repldboff
,SEEK_SET
);
5226 buflen
= read(slave
->repldbfd
,buf
,REDIS_IOBUF_LEN
);
5228 redisLog(REDIS_WARNING
,"Read error sending DB to slave: %s",
5229 (buflen
== 0) ? "premature EOF" : strerror(errno
));
5233 if ((nwritten
= write(fd
,buf
,buflen
)) == -1) {
5234 redisLog(REDIS_DEBUG
,"Write error sending DB to slave: %s",
5239 slave
->repldboff
+= nwritten
;
5240 if (slave
->repldboff
== slave
->repldbsize
) {
5241 close(slave
->repldbfd
);
5242 slave
->repldbfd
= -1;
5243 aeDeleteFileEvent(server
.el
,slave
->fd
,AE_WRITABLE
);
5244 slave
->replstate
= REDIS_REPL_ONLINE
;
5245 if (aeCreateFileEvent(server
.el
, slave
->fd
, AE_WRITABLE
,
5246 sendReplyToClient
, slave
, NULL
) == AE_ERR
) {
5250 addReplySds(slave
,sdsempty());
5251 redisLog(REDIS_NOTICE
,"Synchronization with slave succeeded");
5255 /* This function is called at the end of every backgrond saving.
5256 * The argument bgsaveerr is REDIS_OK if the background saving succeeded
5257 * otherwise REDIS_ERR is passed to the function.
5259 * The goal of this function is to handle slaves waiting for a successful
5260 * background saving in order to perform non-blocking synchronization. */
5261 static void updateSlavesWaitingBgsave(int bgsaveerr
) {
5263 int startbgsave
= 0;
5265 listRewind(server
.slaves
);
5266 while((ln
= listYield(server
.slaves
))) {
5267 redisClient
*slave
= ln
->value
;
5269 if (slave
->replstate
== REDIS_REPL_WAIT_BGSAVE_START
) {
5271 slave
->replstate
= REDIS_REPL_WAIT_BGSAVE_END
;
5272 } else if (slave
->replstate
== REDIS_REPL_WAIT_BGSAVE_END
) {
5273 struct redis_stat buf
;
5275 if (bgsaveerr
!= REDIS_OK
) {
5277 redisLog(REDIS_WARNING
,"SYNC failed. BGSAVE child returned an error");
5280 if ((slave
->repldbfd
= open(server
.dbfilename
,O_RDONLY
)) == -1 ||
5281 redis_fstat(slave
->repldbfd
,&buf
) == -1) {
5283 redisLog(REDIS_WARNING
,"SYNC failed. Can't open/stat DB after BGSAVE: %s", strerror(errno
));
5286 slave
->repldboff
= 0;
5287 slave
->repldbsize
= buf
.st_size
;
5288 slave
->replstate
= REDIS_REPL_SEND_BULK
;
5289 aeDeleteFileEvent(server
.el
,slave
->fd
,AE_WRITABLE
);
5290 if (aeCreateFileEvent(server
.el
, slave
->fd
, AE_WRITABLE
, sendBulkToSlave
, slave
, NULL
) == AE_ERR
) {
5297 if (rdbSaveBackground(server
.dbfilename
) != REDIS_OK
) {
5298 listRewind(server
.slaves
);
5299 redisLog(REDIS_WARNING
,"SYNC failed. BGSAVE failed");
5300 while((ln
= listYield(server
.slaves
))) {
5301 redisClient
*slave
= ln
->value
;
5303 if (slave
->replstate
== REDIS_REPL_WAIT_BGSAVE_START
)
5310 static int syncWithMaster(void) {
5311 char buf
[1024], tmpfile
[256], authcmd
[1024];
5313 int fd
= anetTcpConnect(NULL
,server
.masterhost
,server
.masterport
);
5317 redisLog(REDIS_WARNING
,"Unable to connect to MASTER: %s",
5322 /* AUTH with the master if required. */
5323 if(server
.masterauth
) {
5324 snprintf(authcmd
, 1024, "AUTH %s\r\n", server
.masterauth
);
5325 if (syncWrite(fd
, authcmd
, strlen(server
.masterauth
)+7, 5) == -1) {
5327 redisLog(REDIS_WARNING
,"Unable to AUTH to MASTER: %s",
5331 /* Read the AUTH result. */
5332 if (syncReadLine(fd
,buf
,1024,3600) == -1) {
5334 redisLog(REDIS_WARNING
,"I/O error reading auth result from MASTER: %s",
5338 if (buf
[0] != '+') {
5340 redisLog(REDIS_WARNING
,"Cannot AUTH to MASTER, is the masterauth password correct?");
5345 /* Issue the SYNC command */
5346 if (syncWrite(fd
,"SYNC \r\n",7,5) == -1) {
5348 redisLog(REDIS_WARNING
,"I/O error writing to MASTER: %s",
5352 /* Read the bulk write count */
5353 if (syncReadLine(fd
,buf
,1024,3600) == -1) {
5355 redisLog(REDIS_WARNING
,"I/O error reading bulk count from MASTER: %s",
5359 if (buf
[0] != '$') {
5361 redisLog(REDIS_WARNING
,"Bad protocol from MASTER, the first byte is not '$', are you sure the host and port are right?");
5364 dumpsize
= atoi(buf
+1);
5365 redisLog(REDIS_NOTICE
,"Receiving %d bytes data dump from MASTER",dumpsize
);
5366 /* Read the bulk write data on a temp file */
5367 snprintf(tmpfile
,256,"temp-%d.%ld.rdb",(int)time(NULL
),(long int)random());
5368 dfd
= open(tmpfile
,O_CREAT
|O_WRONLY
,0644);
5371 redisLog(REDIS_WARNING
,"Opening the temp file needed for MASTER <-> SLAVE synchronization: %s",strerror(errno
));
5375 int nread
, nwritten
;
5377 nread
= read(fd
,buf
,(dumpsize
< 1024)?dumpsize
:1024);
5379 redisLog(REDIS_WARNING
,"I/O error trying to sync with MASTER: %s",
5385 nwritten
= write(dfd
,buf
,nread
);
5386 if (nwritten
== -1) {
5387 redisLog(REDIS_WARNING
,"Write error writing to the DB dump file needed for MASTER <-> SLAVE synchrnonization: %s", strerror(errno
));
5395 if (rename(tmpfile
,server
.dbfilename
) == -1) {
5396 redisLog(REDIS_WARNING
,"Failed trying to rename the temp DB into dump.rdb in MASTER <-> SLAVE synchronization: %s", strerror(errno
));
5402 if (rdbLoad(server
.dbfilename
) != REDIS_OK
) {
5403 redisLog(REDIS_WARNING
,"Failed trying to load the MASTER synchronization DB from disk");
5407 server
.master
= createClient(fd
);
5408 server
.master
->flags
|= REDIS_MASTER
;
5409 server
.replstate
= REDIS_REPL_CONNECTED
;
5413 static void slaveofCommand(redisClient
*c
) {
5414 if (!strcasecmp(c
->argv
[1]->ptr
,"no") &&
5415 !strcasecmp(c
->argv
[2]->ptr
,"one")) {
5416 if (server
.masterhost
) {
5417 sdsfree(server
.masterhost
);
5418 server
.masterhost
= NULL
;
5419 if (server
.master
) freeClient(server
.master
);
5420 server
.replstate
= REDIS_REPL_NONE
;
5421 redisLog(REDIS_NOTICE
,"MASTER MODE enabled (user request)");
5424 sdsfree(server
.masterhost
);
5425 server
.masterhost
= sdsdup(c
->argv
[1]->ptr
);
5426 server
.masterport
= atoi(c
->argv
[2]->ptr
);
5427 if (server
.master
) freeClient(server
.master
);
5428 server
.replstate
= REDIS_REPL_CONNECT
;
5429 redisLog(REDIS_NOTICE
,"SLAVE OF %s:%d enabled (user request)",
5430 server
.masterhost
, server
.masterport
);
5432 addReply(c
,shared
.ok
);
5435 /* ============================ Maxmemory directive ======================== */
5437 /* This function gets called when 'maxmemory' is set on the config file to limit
5438 * the max memory used by the server, and we are out of memory.
5439 * This function will try to, in order:
5441 * - Free objects from the free list
5442 * - Try to remove keys with an EXPIRE set
5444 * It is not possible to free enough memory to reach used-memory < maxmemory
5445 * the server will start refusing commands that will enlarge even more the
5448 static void freeMemoryIfNeeded(void) {
5449 while (server
.maxmemory
&& zmalloc_used_memory() > server
.maxmemory
) {
5450 if (listLength(server
.objfreelist
)) {
5453 listNode
*head
= listFirst(server
.objfreelist
);
5454 o
= listNodeValue(head
);
5455 listDelNode(server
.objfreelist
,head
);
5458 int j
, k
, freed
= 0;
5460 for (j
= 0; j
< server
.dbnum
; j
++) {
5462 robj
*minkey
= NULL
;
5463 struct dictEntry
*de
;
5465 if (dictSize(server
.db
[j
].expires
)) {
5467 /* From a sample of three keys drop the one nearest to
5468 * the natural expire */
5469 for (k
= 0; k
< 3; k
++) {
5472 de
= dictGetRandomKey(server
.db
[j
].expires
);
5473 t
= (time_t) dictGetEntryVal(de
);
5474 if (minttl
== -1 || t
< minttl
) {
5475 minkey
= dictGetEntryKey(de
);
5479 deleteKey(server
.db
+j
,minkey
);
5482 if (!freed
) return; /* nothing to free... */
5487 /* ============================== Append Only file ========================== */
5489 static void feedAppendOnlyFile(struct redisCommand
*cmd
, int dictid
, robj
**argv
, int argc
) {
5490 sds buf
= sdsempty();
5496 /* The DB this command was targetting is not the same as the last command
5497 * we appendend. To issue a SELECT command is needed. */
5498 if (dictid
!= server
.appendseldb
) {
5501 snprintf(seldb
,sizeof(seldb
),"%d",dictid
);
5502 buf
= sdscatprintf(buf
,"*2\r\n$6\r\nSELECT\r\n$%d\r\n%s\r\n",
5503 strlen(seldb
),seldb
);
5504 server
.appendseldb
= dictid
;
5507 /* "Fix" the argv vector if the command is EXPIRE. We want to translate
5508 * EXPIREs into EXPIREATs calls */
5509 if (cmd
->proc
== expireCommand
) {
5512 tmpargv
[0] = createStringObject("EXPIREAT",8);
5513 tmpargv
[1] = argv
[1];
5514 incrRefCount(argv
[1]);
5515 when
= time(NULL
)+strtol(argv
[2]->ptr
,NULL
,10);
5516 tmpargv
[2] = createObject(REDIS_STRING
,
5517 sdscatprintf(sdsempty(),"%ld",when
));
5521 /* Append the actual command */
5522 buf
= sdscatprintf(buf
,"*%d\r\n",argc
);
5523 for (j
= 0; j
< argc
; j
++) {
5526 if (o
->encoding
!= REDIS_ENCODING_RAW
)
5527 o
= getDecodedObject(o
);
5528 buf
= sdscatprintf(buf
,"$%d\r\n",sdslen(o
->ptr
));
5529 buf
= sdscatlen(buf
,o
->ptr
,sdslen(o
->ptr
));
5530 buf
= sdscatlen(buf
,"\r\n",2);
5535 /* Free the objects from the modified argv for EXPIREAT */
5536 if (cmd
->proc
== expireCommand
) {
5537 for (j
= 0; j
< 3; j
++)
5538 decrRefCount(argv
[j
]);
5541 /* We want to perform a single write. This should be guaranteed atomic
5542 * at least if the filesystem we are writing is a real physical one.
5543 * While this will save us against the server being killed I don't think
5544 * there is much to do about the whole server stopping for power problems
5546 nwritten
= write(server
.appendfd
,buf
,sdslen(buf
));
5547 if (nwritten
!= (signed)sdslen(buf
)) {
5548 /* Ooops, we are in troubles. The best thing to do for now is
5549 * to simply exit instead to give the illusion that everything is
5550 * working as expected. */
5551 if (nwritten
== -1) {
5552 redisLog(REDIS_WARNING
,"Exiting on error writing to the append-only file: %s",strerror(errno
));
5554 redisLog(REDIS_WARNING
,"Exiting on short write while writing to the append-only file: %s",strerror(errno
));
5559 if (server
.appendfsync
== APPENDFSYNC_ALWAYS
||
5560 (server
.appendfsync
== APPENDFSYNC_EVERYSEC
&&
5561 now
-server
.lastfsync
> 1))
5563 fsync(server
.appendfd
); /* Let's try to get this data on the disk */
5564 server
.lastfsync
= now
;
5568 /* In Redis commands are always executed in the context of a client, so in
5569 * order to load the append only file we need to create a fake client. */
5570 static struct redisClient
*createFakeClient(void) {
5571 struct redisClient
*c
= zmalloc(sizeof(*c
));
5575 c
->querybuf
= sdsempty();
5579 /* We set the fake client as a slave waiting for the synchronization
5580 * so that Redis will not try to send replies to this client. */
5581 c
->replstate
= REDIS_REPL_WAIT_BGSAVE_START
;
5582 c
->reply
= listCreate();
5583 listSetFreeMethod(c
->reply
,decrRefCount
);
5584 listSetDupMethod(c
->reply
,dupClientReplyValue
);
5588 static void freeFakeClient(struct redisClient
*c
) {
5589 sdsfree(c
->querybuf
);
5590 listRelease(c
->reply
);
5594 /* Replay the append log file. On error REDIS_OK is returned. On non fatal
5595 * error (the append only file is zero-length) REDIS_ERR is returned. On
5596 * fatal error an error message is logged and the program exists. */
5597 int loadAppendOnlyFile(char *filename
) {
5598 struct redisClient
*fakeClient
;
5599 FILE *fp
= fopen(filename
,"r");
5600 struct redis_stat sb
;
5602 if (redis_fstat(fileno(fp
),&sb
) != -1 && sb
.st_size
== 0)
5606 redisLog(REDIS_WARNING
,"Fatal error: can't open the append log file for reading: %s",strerror(errno
));
5610 fakeClient
= createFakeClient();
5617 struct redisCommand
*cmd
;
5619 if (fgets(buf
,sizeof(buf
),fp
) == NULL
) {
5625 if (buf
[0] != '*') goto fmterr
;
5627 argv
= zmalloc(sizeof(robj
*)*argc
);
5628 for (j
= 0; j
< argc
; j
++) {
5629 if (fgets(buf
,sizeof(buf
),fp
) == NULL
) goto readerr
;
5630 if (buf
[0] != '$') goto fmterr
;
5631 len
= strtol(buf
+1,NULL
,10);
5632 argsds
= sdsnewlen(NULL
,len
);
5633 if (fread(argsds
,len
,1,fp
) == 0) goto fmterr
;
5634 argv
[j
] = createObject(REDIS_STRING
,argsds
);
5635 if (fread(buf
,2,1,fp
) == 0) goto fmterr
; /* discard CRLF */
5638 /* Command lookup */
5639 cmd
= lookupCommand(argv
[0]->ptr
);
5641 redisLog(REDIS_WARNING
,"Unknown command '%s' reading the append only file", argv
[0]->ptr
);
5644 /* Try object sharing and encoding */
5645 if (server
.shareobjects
) {
5647 for(j
= 1; j
< argc
; j
++)
5648 argv
[j
] = tryObjectSharing(argv
[j
]);
5650 if (cmd
->flags
& REDIS_CMD_BULK
)
5651 tryObjectEncoding(argv
[argc
-1]);
5652 /* Run the command in the context of a fake client */
5653 fakeClient
->argc
= argc
;
5654 fakeClient
->argv
= argv
;
5655 cmd
->proc(fakeClient
);
5656 /* Discard the reply objects list from the fake client */
5657 while(listLength(fakeClient
->reply
))
5658 listDelNode(fakeClient
->reply
,listFirst(fakeClient
->reply
));
5659 /* Clean up, ready for the next command */
5660 for (j
= 0; j
< argc
; j
++) decrRefCount(argv
[j
]);
5664 freeFakeClient(fakeClient
);
5669 redisLog(REDIS_WARNING
,"Unexpected end of file reading the append only file");
5671 redisLog(REDIS_WARNING
,"Unrecoverable error reading the append only file: %s", strerror(errno
));
5675 redisLog(REDIS_WARNING
,"Bad file format reading the append only file");
5679 /* ================================= Debugging ============================== */
5681 static void debugCommand(redisClient
*c
) {
5682 if (!strcasecmp(c
->argv
[1]->ptr
,"segfault")) {
5684 } else if (!strcasecmp(c
->argv
[1]->ptr
,"object") && c
->argc
== 3) {
5685 dictEntry
*de
= dictFind(c
->db
->dict
,c
->argv
[2]);
5689 addReply(c
,shared
.nokeyerr
);
5692 key
= dictGetEntryKey(de
);
5693 val
= dictGetEntryVal(de
);
5694 addReplySds(c
,sdscatprintf(sdsempty(),
5695 "+Key at:%p refcount:%d, value at:%p refcount:%d encoding:%d\r\n",
5696 key
, key
->refcount
, val
, val
->refcount
, val
->encoding
));
5698 addReplySds(c
,sdsnew(
5699 "-ERR Syntax error, try DEBUG [SEGFAULT|OBJECT <key>]\r\n"));
5703 /* =================================== Main! ================================ */
5706 int linuxOvercommitMemoryValue(void) {
5707 FILE *fp
= fopen("/proc/sys/vm/overcommit_memory","r");
5711 if (fgets(buf
,64,fp
) == NULL
) {
5720 void linuxOvercommitMemoryWarning(void) {
5721 if (linuxOvercommitMemoryValue() == 0) {
5722 redisLog(REDIS_WARNING
,"WARNING overcommit_memory is set to 0! Background save may fail under low condition memory. To fix this issue add 'vm.overcommit_memory = 1' to /etc/sysctl.conf and then reboot or run the command 'sysctl vm.overcommit_memory=1' for this to take effect.");
5725 #endif /* __linux__ */
5727 static void daemonize(void) {
5731 if (fork() != 0) exit(0); /* parent exits */
5732 setsid(); /* create a new session */
5734 /* Every output goes to /dev/null. If Redis is daemonized but
5735 * the 'logfile' is set to 'stdout' in the configuration file
5736 * it will not log at all. */
5737 if ((fd
= open("/dev/null", O_RDWR
, 0)) != -1) {
5738 dup2(fd
, STDIN_FILENO
);
5739 dup2(fd
, STDOUT_FILENO
);
5740 dup2(fd
, STDERR_FILENO
);
5741 if (fd
> STDERR_FILENO
) close(fd
);
5743 /* Try to write the pid file */
5744 fp
= fopen(server
.pidfile
,"w");
5746 fprintf(fp
,"%d\n",getpid());
5751 int main(int argc
, char **argv
) {
5754 resetServerSaveParams();
5755 loadServerConfig(argv
[1]);
5756 } else if (argc
> 2) {
5757 fprintf(stderr
,"Usage: ./redis-server [/path/to/redis.conf]\n");
5760 redisLog(REDIS_WARNING
,"Warning: no config file specified, using the default config. In order to specify a config file use 'redis-server /path/to/redis.conf'");
5763 if (server
.daemonize
) daemonize();
5764 redisLog(REDIS_NOTICE
,"Server started, Redis version " REDIS_VERSION
);
5766 linuxOvercommitMemoryWarning();
5768 if (server
.appendonly
) {
5769 if (loadAppendOnlyFile(server
.appendfilename
) == REDIS_OK
)
5770 redisLog(REDIS_NOTICE
,"DB loaded from append only file");
5772 if (rdbLoad(server
.dbfilename
) == REDIS_OK
)
5773 redisLog(REDIS_NOTICE
,"DB loaded from disk");
5775 if (aeCreateFileEvent(server
.el
, server
.fd
, AE_READABLE
,
5776 acceptHandler
, NULL
, NULL
) == AE_ERR
) oom("creating file event");
5777 redisLog(REDIS_NOTICE
,"The server is now ready to accept connections on port %d", server
.port
);
5779 aeDeleteEventLoop(server
.el
);
5783 /* ============================= Backtrace support ========================= */
5785 #ifdef HAVE_BACKTRACE
5786 static char *findFuncName(void *pointer
, unsigned long *offset
);
5788 static void *getMcontextEip(ucontext_t
*uc
) {
5789 #if defined(__FreeBSD__)
5790 return (void*) uc
->uc_mcontext
.mc_eip
;
5791 #elif defined(__dietlibc__)
5792 return (void*) uc
->uc_mcontext
.eip
;
5793 #elif defined(__APPLE__) && !defined(MAC_OS_X_VERSION_10_6)
5794 return (void*) uc
->uc_mcontext
->__ss
.__eip
;
5795 #elif defined(__APPLE__) && defined(MAC_OS_X_VERSION_10_6)
5796 #if defined(_STRUCT_X86_THREAD_STATE64) && !defined(__i386__)
5797 return (void*) uc
->uc_mcontext
->__ss
.__rip
;
5799 return (void*) uc
->uc_mcontext
->__ss
.__eip
;
5801 #elif defined(__i386__) || defined(__X86_64__) /* Linux x86 */
5802 return (void*) uc
->uc_mcontext
.gregs
[REG_EIP
];
5803 #elif defined(__ia64__) /* Linux IA64 */
5804 return (void*) uc
->uc_mcontext
.sc_ip
;
5810 static void segvHandler(int sig
, siginfo_t
*info
, void *secret
) {
5812 char **messages
= NULL
;
5813 int i
, trace_size
= 0;
5814 unsigned long offset
=0;
5815 time_t uptime
= time(NULL
)-server
.stat_starttime
;
5816 ucontext_t
*uc
= (ucontext_t
*) secret
;
5817 REDIS_NOTUSED(info
);
5819 redisLog(REDIS_WARNING
,
5820 "======= Ooops! Redis %s got signal: -%d- =======", REDIS_VERSION
, sig
);
5821 redisLog(REDIS_WARNING
, "%s", sdscatprintf(sdsempty(),
5822 "redis_version:%s; "
5823 "uptime_in_seconds:%d; "
5824 "connected_clients:%d; "
5825 "connected_slaves:%d; "
5827 "changes_since_last_save:%lld; "
5828 "bgsave_in_progress:%d; "
5829 "last_save_time:%d; "
5830 "total_connections_received:%lld; "
5831 "total_commands_processed:%lld; "
5835 listLength(server
.clients
)-listLength(server
.slaves
),
5836 listLength(server
.slaves
),
5839 server
.bgsaveinprogress
,
5841 server
.stat_numconnections
,
5842 server
.stat_numcommands
,
5843 server
.masterhost
== NULL
? "master" : "slave"
5846 trace_size
= backtrace(trace
, 100);
5847 /* overwrite sigaction with caller's address */
5848 if (getMcontextEip(uc
) != NULL
) {
5849 trace
[1] = getMcontextEip(uc
);
5851 messages
= backtrace_symbols(trace
, trace_size
);
5853 for (i
=1; i
<trace_size
; ++i
) {
5854 char *fn
= findFuncName(trace
[i
], &offset
), *p
;
5856 p
= strchr(messages
[i
],'+');
5857 if (!fn
|| (p
&& ((unsigned long)strtol(p
+1,NULL
,10)) < offset
)) {
5858 redisLog(REDIS_WARNING
,"%s", messages
[i
]);
5860 redisLog(REDIS_WARNING
,"%d redis-server %p %s + %d", i
, trace
[i
], fn
, (unsigned int)offset
);
5867 static void setupSigSegvAction(void) {
5868 struct sigaction act
;
5870 sigemptyset (&act
.sa_mask
);
5871 /* When the SA_SIGINFO flag is set in sa_flags then sa_sigaction
5872 * is used. Otherwise, sa_handler is used */
5873 act
.sa_flags
= SA_NODEFER
| SA_ONSTACK
| SA_RESETHAND
| SA_SIGINFO
;
5874 act
.sa_sigaction
= segvHandler
;
5875 sigaction (SIGSEGV
, &act
, NULL
);
5876 sigaction (SIGBUS
, &act
, NULL
);
5877 sigaction (SIGFPE
, &act
, NULL
);
5878 sigaction (SIGILL
, &act
, NULL
);
5879 sigaction (SIGBUS
, &act
, NULL
);
5883 #include "staticsymbols.h"
5884 /* This function try to convert a pointer into a function name. It's used in
5885 * oreder to provide a backtrace under segmentation fault that's able to
5886 * display functions declared as static (otherwise the backtrace is useless). */
5887 static char *findFuncName(void *pointer
, unsigned long *offset
){
5889 unsigned long off
, minoff
= 0;
5891 /* Try to match against the Symbol with the smallest offset */
5892 for (i
=0; symsTable
[i
].pointer
; i
++) {
5893 unsigned long lp
= (unsigned long) pointer
;
5895 if (lp
!= (unsigned long)-1 && lp
>= symsTable
[i
].pointer
) {
5896 off
=lp
-symsTable
[i
].pointer
;
5897 if (ret
< 0 || off
< minoff
) {
5903 if (ret
== -1) return NULL
;
5905 return symsTable
[ret
].name
;
5907 #else /* HAVE_BACKTRACE */
5908 static void setupSigSegvAction(void) {
5910 #endif /* HAVE_BACKTRACE */