4 void *dupClientReplyValue(void *o
) {
5 incrRefCount((robj
*)o
);
9 int listMatchObjects(void *a
, void *b
) {
10 return equalStringObjects(a
,b
);
13 redisClient
*createClient(int fd
) {
16 /* Make sure to allocate a multiple of the page size to prevent wasting
17 * memory. A page size of 4096 is assumed here. We need to compensate
18 * for the zmalloc overhead of sizeof(size_t) bytes. */
19 size_t size
= 8192-sizeof(size_t);
20 redisAssert(size
> sizeof(redisClient
));
22 c
->buflen
= size
-sizeof(redisClient
);
25 anetNonBlock(NULL
,fd
);
26 anetTcpNoDelay(NULL
,fd
);
30 c
->querybuf
= sdsempty();
39 c
->lastinteraction
= time(NULL
);
41 c
->replstate
= REDIS_REPL_NONE
;
42 c
->reply
= listCreate();
43 listSetFreeMethod(c
->reply
,decrRefCount
);
44 listSetDupMethod(c
->reply
,dupClientReplyValue
);
45 c
->blocking_keys
= NULL
;
46 c
->blocking_keys_num
= 0;
47 c
->io_keys
= listCreate();
48 c
->watched_keys
= listCreate();
49 listSetFreeMethod(c
->io_keys
,decrRefCount
);
50 c
->pubsub_channels
= dictCreate(&setDictType
,NULL
);
51 c
->pubsub_patterns
= listCreate();
52 listSetFreeMethod(c
->pubsub_patterns
,decrRefCount
);
53 listSetMatchMethod(c
->pubsub_patterns
,listMatchObjects
);
54 if (aeCreateFileEvent(server
.el
, c
->fd
, AE_READABLE
,
55 readQueryFromClient
, c
) == AE_ERR
) {
59 listAddNodeTail(server
.clients
,c
);
60 initClientMultiState(c
);
64 int _ensureFileEvent(redisClient
*c
) {
65 if (c
->fd
<= 0) return REDIS_ERR
;
66 if (c
->bufpos
== 0 && listLength(c
->reply
) == 0 &&
67 (c
->replstate
== REDIS_REPL_NONE
||
68 c
->replstate
== REDIS_REPL_ONLINE
) &&
69 aeCreateFileEvent(server
.el
, c
->fd
, AE_WRITABLE
,
70 sendReplyToClient
, c
) == AE_ERR
) return REDIS_ERR
;
74 void _addReplyObjectToList(redisClient
*c
, robj
*obj
) {
75 redisAssert(obj
->type
== REDIS_STRING
&&
76 obj
->encoding
== REDIS_ENCODING_RAW
);
77 listAddNodeTail(c
->reply
,obj
);
80 void _ensureBufferInReplyList(redisClient
*c
) {
81 sds buffer
= sdsnewlen(NULL
,REDIS_REPLY_CHUNK_SIZE
);
82 sdsupdatelen(buffer
); /* sdsnewlen expects non-empty string */
83 listAddNodeTail(c
->reply
,createObject(REDIS_REPLY_NODE
,buffer
));
86 void _addReplyStringToBuffer(redisClient
*c
, char *s
, size_t len
) {
88 redisAssert(len
< REDIS_REPLY_CHUNK_THRESHOLD
);
89 if (listLength(c
->reply
) > 0) {
90 robj
*o
= listNodeValue(listLast(c
->reply
));
92 /* Make sure to append to a reply node with enough bytes available. */
93 if (o
->type
== REDIS_REPLY_NODE
) available
= sdsavail(o
->ptr
);
94 if (o
->type
!= REDIS_REPLY_NODE
|| len
> available
) {
95 _ensureBufferInReplyList(c
);
96 _addReplyStringToBuffer(c
,s
,len
);
98 o
->ptr
= sdscatlen(o
->ptr
,s
,len
);
101 available
= c
->buflen
-c
->bufpos
;
102 if (len
> available
) {
103 _ensureBufferInReplyList(c
);
104 _addReplyStringToBuffer(c
,s
,len
);
106 memcpy(c
->buf
+c
->bufpos
,s
,len
);
112 void addReply(redisClient
*c
, robj
*obj
) {
113 if (_ensureFileEvent(c
) != REDIS_OK
) return;
114 if (server
.vm_enabled
&& obj
->storage
!= REDIS_VM_MEMORY
) {
115 /* Returns a new object with refcount 1 */
116 obj
= dupStringObject(obj
);
118 /* This increments the refcount. */
119 obj
= getDecodedObject(obj
);
122 if (sdslen(obj
->ptr
) < REDIS_REPLY_CHUNK_THRESHOLD
) {
123 _addReplyStringToBuffer(c
,obj
->ptr
,sdslen(obj
->ptr
));
126 _addReplyObjectToList(c
,obj
);
130 void addReplySds(redisClient
*c
, sds s
) {
131 if (_ensureFileEvent(c
) != REDIS_OK
) return;
132 if (sdslen(s
) < REDIS_REPLY_CHUNK_THRESHOLD
) {
133 _addReplyStringToBuffer(c
,s
,sdslen(s
));
136 _addReplyObjectToList(c
,createObject(REDIS_STRING
,s
));
140 void addReplyString(redisClient
*c
, char *s
, size_t len
) {
141 if (_ensureFileEvent(c
) != REDIS_OK
) return;
142 if (len
< REDIS_REPLY_CHUNK_THRESHOLD
) {
143 _addReplyStringToBuffer(c
,s
,len
);
145 _addReplyObjectToList(c
,createStringObject(s
,len
));
149 /* Adds an empty object to the reply list that will contain the multi bulk
150 * length, which is not known when this function is called. */
151 void *addDeferredMultiBulkLength(redisClient
*c
) {
152 if (_ensureFileEvent(c
) != REDIS_OK
) return NULL
;
153 _addReplyObjectToList(c
,createObject(REDIS_STRING
,NULL
));
154 return listLast(c
->reply
);
157 /* Populate the length object and try glueing it to the next chunk. */
158 void setDeferredMultiBulkLength(redisClient
*c
, void *node
, long length
) {
159 listNode
*ln
= (listNode
*)node
;
162 /* Abort when *node is NULL (see addDeferredMultiBulkLength). */
163 if (node
== NULL
) return;
165 len
= listNodeValue(ln
);
166 len
->ptr
= sdscatprintf(sdsempty(),"*%ld\r\n",length
);
167 if (ln
->next
!= NULL
) {
168 next
= listNodeValue(ln
->next
);
169 /* Only glue when the next node is a reply chunk. */
170 if (next
->type
== REDIS_REPLY_NODE
) {
171 len
->ptr
= sdscatlen(len
->ptr
,next
->ptr
,sdslen(next
->ptr
));
172 listDelNode(c
->reply
,ln
->next
);
177 void addReplyDouble(redisClient
*c
, double d
) {
178 char dbuf
[128], sbuf
[128];
180 dlen
= snprintf(dbuf
,sizeof(dbuf
),"%.17g",d
);
181 slen
= snprintf(sbuf
,sizeof(sbuf
),"$%d\r\n%s\r\n",dlen
,dbuf
);
182 addReplyString(c
,sbuf
,slen
);
185 void _addReplyLongLong(redisClient
*c
, long long ll
, char prefix
) {
189 len
= ll2string(buf
+1,sizeof(buf
)-1,ll
);
192 addReplyString(c
,buf
,len
+3);
195 void addReplyLongLong(redisClient
*c
, long long ll
) {
196 _addReplyLongLong(c
,ll
,':');
199 void addReplyUlong(redisClient
*c
, unsigned long ul
) {
200 _addReplyLongLong(c
,(long long)ul
,':');
203 void addReplyBulkLen(redisClient
*c
, robj
*obj
) {
206 if (obj
->encoding
== REDIS_ENCODING_RAW
) {
207 len
= sdslen(obj
->ptr
);
209 long n
= (long)obj
->ptr
;
211 /* Compute how many bytes will take this integer as a radix 10 string */
217 while((n
= n
/10) != 0) {
221 _addReplyLongLong(c
,len
,'$');
224 void addReplyBulk(redisClient
*c
, robj
*obj
) {
225 addReplyBulkLen(c
,obj
);
227 addReply(c
,shared
.crlf
);
230 /* In the CONFIG command we need to add vanilla C string as bulk replies */
231 void addReplyBulkCString(redisClient
*c
, char *s
) {
233 addReply(c
,shared
.nullbulk
);
235 robj
*o
= createStringObject(s
,strlen(s
));
241 void acceptHandler(aeEventLoop
*el
, int fd
, void *privdata
, int mask
) {
247 REDIS_NOTUSED(privdata
);
249 cfd
= anetAccept(server
.neterr
, fd
, cip
, &cport
);
251 redisLog(REDIS_VERBOSE
,"Accepting client connection: %s", server
.neterr
);
254 redisLog(REDIS_VERBOSE
,"Accepted %s:%d", cip
, cport
);
255 if ((c
= createClient(cfd
)) == NULL
) {
256 redisLog(REDIS_WARNING
,"Error allocating resoures for the client");
257 close(cfd
); /* May be already closed, just ingore errors */
260 /* If maxclient directive is set and this is one client more... close the
261 * connection. Note that we create the client instead to check before
262 * for this condition, since now the socket is already set in nonblocking
263 * mode and we can send an error for free using the Kernel I/O */
264 if (server
.maxclients
&& listLength(server
.clients
) > server
.maxclients
) {
265 char *err
= "-ERR max number of clients reached\r\n";
267 /* That's a best effort error message, don't check write errors */
268 if (write(c
->fd
,err
,strlen(err
)) == -1) {
269 /* Nothing to do, Just to avoid the warning... */
274 server
.stat_numconnections
++;
277 static void freeClientArgv(redisClient
*c
) {
280 for (j
= 0; j
< c
->argc
; j
++)
281 decrRefCount(c
->argv
[j
]);
282 for (j
= 0; j
< c
->mbargc
; j
++)
283 decrRefCount(c
->mbargv
[j
]);
288 void freeClient(redisClient
*c
) {
291 /* Note that if the client we are freeing is blocked into a blocking
292 * call, we have to set querybuf to NULL *before* to call
293 * unblockClientWaitingData() to avoid processInputBuffer() will get
294 * called. Also it is important to remove the file events after
295 * this, because this call adds the READABLE event. */
296 sdsfree(c
->querybuf
);
298 if (c
->flags
& REDIS_BLOCKED
)
299 unblockClientWaitingData(c
);
301 /* UNWATCH all the keys */
303 listRelease(c
->watched_keys
);
304 /* Unsubscribe from all the pubsub channels */
305 pubsubUnsubscribeAllChannels(c
,0);
306 pubsubUnsubscribeAllPatterns(c
,0);
307 dictRelease(c
->pubsub_channels
);
308 listRelease(c
->pubsub_patterns
);
309 /* Obvious cleanup */
310 aeDeleteFileEvent(server
.el
,c
->fd
,AE_READABLE
);
311 aeDeleteFileEvent(server
.el
,c
->fd
,AE_WRITABLE
);
312 listRelease(c
->reply
);
315 /* Remove from the list of clients */
316 ln
= listSearchKey(server
.clients
,c
);
317 redisAssert(ln
!= NULL
);
318 listDelNode(server
.clients
,ln
);
319 /* Remove from the list of clients waiting for swapped keys, or ready
320 * to be restarted, but not yet woken up again. */
321 if (c
->flags
& REDIS_IO_WAIT
) {
322 redisAssert(server
.vm_enabled
);
323 if (listLength(c
->io_keys
) == 0) {
324 ln
= listSearchKey(server
.io_ready_clients
,c
);
326 /* When this client is waiting to be woken up (REDIS_IO_WAIT),
327 * it should be present in the list io_ready_clients */
328 redisAssert(ln
!= NULL
);
329 listDelNode(server
.io_ready_clients
,ln
);
331 while (listLength(c
->io_keys
)) {
332 ln
= listFirst(c
->io_keys
);
333 dontWaitForSwappedKey(c
,ln
->value
);
336 server
.vm_blocked_clients
--;
338 listRelease(c
->io_keys
);
339 /* Master/slave cleanup.
340 * Case 1: we lost the connection with a slave. */
341 if (c
->flags
& REDIS_SLAVE
) {
342 if (c
->replstate
== REDIS_REPL_SEND_BULK
&& c
->repldbfd
!= -1)
344 list
*l
= (c
->flags
& REDIS_MONITOR
) ? server
.monitors
: server
.slaves
;
345 ln
= listSearchKey(l
,c
);
346 redisAssert(ln
!= NULL
);
350 /* Case 2: we lost the connection with the master. */
351 if (c
->flags
& REDIS_MASTER
) {
352 server
.master
= NULL
;
353 server
.replstate
= REDIS_REPL_CONNECT
;
354 /* Since we lost the connection with the master, we should also
355 * close the connection with all our slaves if we have any, so
356 * when we'll resync with the master the other slaves will sync again
357 * with us as well. Note that also when the slave is not connected
358 * to the master it will keep refusing connections by other slaves. */
359 while (listLength(server
.slaves
)) {
360 ln
= listFirst(server
.slaves
);
361 freeClient((redisClient
*)ln
->value
);
367 freeClientMultiState(c
);
371 void sendReplyToClient(aeEventLoop
*el
, int fd
, void *privdata
, int mask
) {
372 redisClient
*c
= privdata
;
373 int nwritten
= 0, totwritten
= 0, objlen
;
378 /* Use writev() if we have enough buffers to send */
379 if (!server
.glueoutputbuf
&&
380 listLength(c
->reply
) > REDIS_WRITEV_THRESHOLD
&&
381 !(c
->flags
& REDIS_MASTER
))
383 sendReplyToClientWritev(el
, fd
, privdata
, mask
);
387 while(c
->bufpos
> 0 || listLength(c
->reply
)) {
389 if (c
->flags
& REDIS_MASTER
) {
390 /* Don't reply to a master */
391 nwritten
= c
->bufpos
- c
->sentlen
;
393 nwritten
= write(fd
,c
->buf
+c
->sentlen
,c
->bufpos
-c
->sentlen
);
394 if (nwritten
<= 0) break;
396 c
->sentlen
+= nwritten
;
397 totwritten
+= nwritten
;
399 /* If the buffer was sent, set bufpos to zero to continue with
400 * the remainder of the reply. */
401 if (c
->sentlen
== c
->bufpos
) {
406 o
= listNodeValue(listFirst(c
->reply
));
407 objlen
= sdslen(o
->ptr
);
410 listDelNode(c
->reply
,listFirst(c
->reply
));
414 if (c
->flags
& REDIS_MASTER
) {
415 /* Don't reply to a master */
416 nwritten
= objlen
- c
->sentlen
;
418 nwritten
= write(fd
, ((char*)o
->ptr
)+c
->sentlen
,objlen
-c
->sentlen
);
419 if (nwritten
<= 0) break;
421 c
->sentlen
+= nwritten
;
422 totwritten
+= nwritten
;
424 /* If we fully sent the object on head go to the next one */
425 if (c
->sentlen
== objlen
) {
426 listDelNode(c
->reply
,listFirst(c
->reply
));
430 /* Note that we avoid to send more thank REDIS_MAX_WRITE_PER_EVENT
431 * bytes, in a single threaded server it's a good idea to serve
432 * other clients as well, even if a very large request comes from
433 * super fast link that is always able to accept data (in real world
434 * scenario think about 'KEYS *' against the loopback interfae) */
435 if (totwritten
> REDIS_MAX_WRITE_PER_EVENT
) break;
437 if (nwritten
== -1) {
438 if (errno
== EAGAIN
) {
441 redisLog(REDIS_VERBOSE
,
442 "Error writing to client: %s", strerror(errno
));
447 if (totwritten
> 0) c
->lastinteraction
= time(NULL
);
448 if (listLength(c
->reply
) == 0) {
450 aeDeleteFileEvent(server
.el
,c
->fd
,AE_WRITABLE
);
454 void sendReplyToClientWritev(aeEventLoop
*el
, int fd
, void *privdata
, int mask
)
456 redisClient
*c
= privdata
;
457 int nwritten
= 0, totwritten
= 0, objlen
, willwrite
;
459 struct iovec iov
[REDIS_WRITEV_IOVEC_COUNT
];
465 while (listLength(c
->reply
)) {
470 /* fill-in the iov[] array */
471 for(node
= listFirst(c
->reply
); node
; node
= listNextNode(node
)) {
472 o
= listNodeValue(node
);
473 objlen
= sdslen(o
->ptr
);
475 if (totwritten
+ objlen
- offset
> REDIS_MAX_WRITE_PER_EVENT
)
478 if(ion
== REDIS_WRITEV_IOVEC_COUNT
)
479 break; /* no more iovecs */
481 iov
[ion
].iov_base
= ((char*)o
->ptr
) + offset
;
482 iov
[ion
].iov_len
= objlen
- offset
;
483 willwrite
+= objlen
- offset
;
484 offset
= 0; /* just for the first item */
491 /* write all collected blocks at once */
492 if((nwritten
= writev(fd
, iov
, ion
)) < 0) {
493 if (errno
!= EAGAIN
) {
494 redisLog(REDIS_VERBOSE
,
495 "Error writing to client: %s", strerror(errno
));
502 totwritten
+= nwritten
;
505 /* remove written robjs from c->reply */
506 while (nwritten
&& listLength(c
->reply
)) {
507 o
= listNodeValue(listFirst(c
->reply
));
508 objlen
= sdslen(o
->ptr
);
510 if(nwritten
>= objlen
- offset
) {
511 listDelNode(c
->reply
, listFirst(c
->reply
));
512 nwritten
-= objlen
- offset
;
516 c
->sentlen
+= nwritten
;
524 c
->lastinteraction
= time(NULL
);
526 if (listLength(c
->reply
) == 0) {
528 aeDeleteFileEvent(server
.el
,c
->fd
,AE_WRITABLE
);
532 /* resetClient prepare the client to process the next command */
533 void resetClient(redisClient
*c
) {
539 void closeTimedoutClients(void) {
542 time_t now
= time(NULL
);
545 listRewind(server
.clients
,&li
);
546 while ((ln
= listNext(&li
)) != NULL
) {
547 c
= listNodeValue(ln
);
548 if (server
.maxidletime
&&
549 !(c
->flags
& REDIS_SLAVE
) && /* no timeout for slaves */
550 !(c
->flags
& REDIS_MASTER
) && /* no timeout for masters */
551 !(c
->flags
& REDIS_BLOCKED
) && /* no timeout for BLPOP */
552 dictSize(c
->pubsub_channels
) == 0 && /* no timeout for pubsub */
553 listLength(c
->pubsub_patterns
) == 0 &&
554 (now
- c
->lastinteraction
> server
.maxidletime
))
556 redisLog(REDIS_VERBOSE
,"Closing idle client");
558 } else if (c
->flags
& REDIS_BLOCKED
) {
559 if (c
->blockingto
!= 0 && c
->blockingto
< now
) {
560 addReply(c
,shared
.nullmultibulk
);
561 unblockClientWaitingData(c
);
567 void processInputBuffer(redisClient
*c
) {
569 /* Before to process the input buffer, make sure the client is not
570 * waitig for a blocking operation such as BLPOP. Note that the first
571 * iteration the client is never blocked, otherwise the processInputBuffer
572 * would not be called at all, but after the execution of the first commands
573 * in the input buffer the client may be blocked, and the "goto again"
574 * will try to reiterate. The following line will make it return asap. */
575 if (c
->flags
& REDIS_BLOCKED
|| c
->flags
& REDIS_IO_WAIT
) return;
576 if (c
->bulklen
== -1) {
577 /* Read the first line of the query */
578 char *p
= strchr(c
->querybuf
,'\n');
586 c
->querybuf
= sdsempty();
587 querylen
= 1+(p
-(query
));
588 if (sdslen(query
) > querylen
) {
589 /* leave data after the first line of the query in the buffer */
590 c
->querybuf
= sdscatlen(c
->querybuf
,query
+querylen
,sdslen(query
)-querylen
);
592 *p
= '\0'; /* remove "\n" */
593 if (*(p
-1) == '\r') *(p
-1) = '\0'; /* and "\r" if any */
596 /* Now we can split the query in arguments */
597 argv
= sdssplitlen(query
,sdslen(query
)," ",1,&argc
);
600 if (c
->argv
) zfree(c
->argv
);
601 c
->argv
= zmalloc(sizeof(robj
*)*argc
);
603 for (j
= 0; j
< argc
; j
++) {
604 if (sdslen(argv
[j
])) {
605 c
->argv
[c
->argc
] = createObject(REDIS_STRING
,argv
[j
]);
613 /* Execute the command. If the client is still valid
614 * after processCommand() return and there is something
615 * on the query buffer try to process the next command. */
616 if (processCommand(c
) && sdslen(c
->querybuf
)) goto again
;
618 /* Nothing to process, argc == 0. Just process the query
619 * buffer if it's not empty or return to the caller */
620 if (sdslen(c
->querybuf
)) goto again
;
623 } else if (sdslen(c
->querybuf
) >= REDIS_REQUEST_MAX_SIZE
) {
624 redisLog(REDIS_VERBOSE
, "Client protocol error");
629 /* Bulk read handling. Note that if we are at this point
630 the client already sent a command terminated with a newline,
631 we are reading the bulk data that is actually the last
632 argument of the command. */
633 int qbl
= sdslen(c
->querybuf
);
635 if (c
->bulklen
<= qbl
) {
636 /* Copy everything but the final CRLF as final argument */
637 c
->argv
[c
->argc
] = createStringObject(c
->querybuf
,c
->bulklen
-2);
639 c
->querybuf
= sdsrange(c
->querybuf
,c
->bulklen
,-1);
640 /* Process the command. If the client is still valid after
641 * the processing and there is more data in the buffer
642 * try to parse it. */
643 if (processCommand(c
) && sdslen(c
->querybuf
)) goto again
;
649 void readQueryFromClient(aeEventLoop
*el
, int fd
, void *privdata
, int mask
) {
650 redisClient
*c
= (redisClient
*) privdata
;
651 char buf
[REDIS_IOBUF_LEN
];
656 nread
= read(fd
, buf
, REDIS_IOBUF_LEN
);
658 if (errno
== EAGAIN
) {
661 redisLog(REDIS_VERBOSE
, "Reading from client: %s",strerror(errno
));
665 } else if (nread
== 0) {
666 redisLog(REDIS_VERBOSE
, "Client closed connection");
671 c
->querybuf
= sdscatlen(c
->querybuf
, buf
, nread
);
672 c
->lastinteraction
= time(NULL
);
676 processInputBuffer(c
);