]> git.saurik.com Git - redis.git/blame - src/redis.h
Check other blocked clients when value could not be pushed
[redis.git] / src / redis.h
CommitLineData
e2641e09 1#ifndef __REDIS_H
2#define __REDIS_H
3
4#include "fmacros.h"
5#include "config.h"
6
7#if defined(__sun)
8#include "solarisfixes.h"
9#endif
10
11#include <stdio.h>
12#include <stdlib.h>
13#include <string.h>
14#include <time.h>
15#include <limits.h>
16#include <unistd.h>
17#include <errno.h>
3688d7f3 18#include <inttypes.h>
d06a5b23 19#include <pthread.h>
e2641e09 20
21#include "ae.h" /* Event driven programming library */
22#include "sds.h" /* Dynamic safe strings */
23#include "dict.h" /* Hash tables */
24#include "adlist.h" /* Linked lists */
25#include "zmalloc.h" /* total memory usage aware version of malloc/free */
26#include "anet.h" /* Networking the easy way */
27#include "zipmap.h" /* Compact string -> string data structure */
28#include "ziplist.h" /* Compact list data structure */
96ffb2fe 29#include "intset.h" /* Compact integer set structure */
e2641e09 30#include "version.h"
31
32/* Error codes */
33#define REDIS_OK 0
34#define REDIS_ERR -1
35
36/* Static server configuration */
37#define REDIS_SERVERPORT 6379 /* TCP port */
38#define REDIS_MAXIDLETIME (60*5) /* default client timeout */
39#define REDIS_IOBUF_LEN 1024
40#define REDIS_LOADBUF_LEN 1024
41#define REDIS_STATIC_ARGS 8
42#define REDIS_DEFAULT_DBNUM 16
43#define REDIS_CONFIGLINE_MAX 1024
e2641e09 44#define REDIS_MAX_SYNC_TIME 60 /* Slave can't take more to sync */
45#define REDIS_EXPIRELOOKUPS_PER_CRON 10 /* lookup 10 expires per loop */
46#define REDIS_MAX_WRITE_PER_EVENT (1024*64)
47#define REDIS_REQUEST_MAX_SIZE (1024*1024*256) /* max bytes in inline command */
48#define REDIS_SHARED_INTEGERS 10000
36c19d03 49#define REDIS_REPLY_CHUNK_BYTES (5*1500) /* 5 TCP packets with default MTU */
834ef78e 50
e2641e09 51/* If more than REDIS_WRITEV_THRESHOLD write packets are pending use writev */
52#define REDIS_WRITEV_THRESHOLD 3
53/* Max number of iovecs used for each writev call */
54#define REDIS_WRITEV_IOVEC_COUNT 256
55
56/* Hash table parameters */
57#define REDIS_HT_MINFILL 10 /* Minimal hash table fill 10% */
58
33aba595
PN
59/* Command flags:
60 * REDIS_CMD_DENYOOM:
61 * Commands marked with this flag will return an error when 'maxmemory' is
62 * set and the server is using more than 'maxmemory' bytes of memory.
63 * In short: commands with this flag are denied on low memory conditions.
64 * REDIS_CMD_FORCE_REPLICATION:
65 * Force replication even if dirty is 0. */
66#define REDIS_CMD_DENYOOM 4
67#define REDIS_CMD_FORCE_REPLICATION 8
e2641e09 68
69/* Object types */
70#define REDIS_STRING 0
71#define REDIS_LIST 1
72#define REDIS_SET 2
73#define REDIS_ZSET 3
74#define REDIS_HASH 4
75#define REDIS_VMPOINTER 8
76
77/* Objects encoding. Some kind of objects like Strings and Hashes can be
78 * internally represented in multiple ways. The 'encoding' field of the object
79 * is set to one of these values for this object. */
80#define REDIS_ENCODING_RAW 0 /* Raw representation */
81#define REDIS_ENCODING_INT 1 /* Encoded as integer */
82#define REDIS_ENCODING_HT 2 /* Encoded as hash table */
83#define REDIS_ENCODING_ZIPMAP 3 /* Encoded as zipmap */
84#define REDIS_ENCODING_LINKEDLIST 4 /* Encoded as regular linked list */
85#define REDIS_ENCODING_ZIPLIST 5 /* Encoded as ziplist */
96ffb2fe 86#define REDIS_ENCODING_INTSET 6 /* Encoded as intset */
e2641e09 87
88/* Object types only used for dumping to disk */
89#define REDIS_EXPIRETIME 253
90#define REDIS_SELECTDB 254
91#define REDIS_EOF 255
92
93/* Defines related to the dump file format. To store 32 bits lengths for short
94 * keys requires a lot of space, so we check the most significant 2 bits of
95 * the first byte to interpret the length:
96 *
97 * 00|000000 => if the two MSB are 00 the len is the 6 bits of this byte
98 * 01|000000 00000000 => 01, the len is 14 bits, 6 bits + 8 bits of next byte
99 * 10|000000 [32 bit integer] => if it's 10, a full 32 bit len will follow
100 * 11|000000 this means: specially encoded object will follow. The six bits
101 * number specify the kind of object that follows.
102 * See the REDIS_RDB_ENC_* defines.
103 *
104 * Lengths up to 63 are stored using a single byte, most DB keys, and many
105 * values, will fit inside. */
106#define REDIS_RDB_6BITLEN 0
107#define REDIS_RDB_14BITLEN 1
108#define REDIS_RDB_32BITLEN 2
109#define REDIS_RDB_ENCVAL 3
110#define REDIS_RDB_LENERR UINT_MAX
111
112/* When a length of a string object stored on disk has the first two bits
113 * set, the remaining six bits specify a special encoding for the object
114 * accordingly to the following defines: */
115#define REDIS_RDB_ENC_INT8 0 /* 8 bit signed integer */
116#define REDIS_RDB_ENC_INT16 1 /* 16 bit signed integer */
117#define REDIS_RDB_ENC_INT32 2 /* 32 bit signed integer */
118#define REDIS_RDB_ENC_LZF 3 /* string compressed with FASTLZ */
119
120/* Virtual memory object->where field. */
121#define REDIS_VM_MEMORY 0 /* The object is on memory */
122#define REDIS_VM_SWAPPED 1 /* The object is on disk */
123#define REDIS_VM_SWAPPING 2 /* Redis is swapping this object on disk */
124#define REDIS_VM_LOADING 3 /* Redis is loading this object from disk */
125
126/* Virtual memory static configuration stuff.
127 * Check vmFindContiguousPages() to know more about these magic numbers. */
128#define REDIS_VM_MAX_NEAR_PAGES 65536
129#define REDIS_VM_MAX_RANDOM_JUMP 4096
130#define REDIS_VM_MAX_THREADS 32
131#define REDIS_THREAD_STACK_SIZE (1024*1024*4)
132/* The following is the *percentage* of completed I/O jobs to process when the
133 * handler is called. While Virtual Memory I/O operations are performed by
134 * threads, these operations must be processed by the main thread when completed
135 * in order to take effect. */
136#define REDIS_MAX_COMPLETED_JOBS_PROCESSED 1
137
138/* Client flags */
139#define REDIS_SLAVE 1 /* This client is a slave server */
140#define REDIS_MASTER 2 /* This client is a master server */
141#define REDIS_MONITOR 4 /* This client is a slave monitor, see MONITOR */
142#define REDIS_MULTI 8 /* This client is in a MULTI context */
143#define REDIS_BLOCKED 16 /* The client is waiting in a blocking operation */
144#define REDIS_IO_WAIT 32 /* The client is waiting for Virtual Memory I/O */
145#define REDIS_DIRTY_CAS 64 /* Watched keys modified. EXEC will fail. */
5e78edb3 146#define REDIS_CLOSE_AFTER_REPLY 128 /* Close after writing entire reply. */
cd8788f2
PN
147
148/* Client request types */
149#define REDIS_REQ_INLINE 1
150#define REDIS_REQ_MULTIBULK 2
e2641e09 151
152/* Slave replication state - slave side */
153#define REDIS_REPL_NONE 0 /* No active replication */
154#define REDIS_REPL_CONNECT 1 /* Must connect to master */
62ec599c 155#define REDIS_REPL_TRANSFER 2 /* Receiving .rdb from master */
f4aa600b 156#define REDIS_REPL_CONNECTED 3 /* Connected to master */
e2641e09 157
158/* Slave replication state - from the point of view of master
159 * Note that in SEND_BULK and ONLINE state the slave receives new updates
160 * in its output queue. In the WAIT_BGSAVE state instead the server is waiting
161 * to start the next background saving in order to send updates to it. */
162#define REDIS_REPL_WAIT_BGSAVE_START 3 /* master waits bgsave to start feeding it */
163#define REDIS_REPL_WAIT_BGSAVE_END 4 /* master waits bgsave to start bulk DB transmission */
164#define REDIS_REPL_SEND_BULK 5 /* master is sending the bulk DB */
165#define REDIS_REPL_ONLINE 6 /* bulk DB already transmitted, receive updates */
166
167/* List related stuff */
168#define REDIS_HEAD 0
169#define REDIS_TAIL 1
170
171/* Sort operations */
172#define REDIS_SORT_GET 0
173#define REDIS_SORT_ASC 1
174#define REDIS_SORT_DESC 2
175#define REDIS_SORTKEY_MAX 1024
176
177/* Log levels */
178#define REDIS_DEBUG 0
179#define REDIS_VERBOSE 1
180#define REDIS_NOTICE 2
181#define REDIS_WARNING 3
182
183/* Anti-warning macro... */
184#define REDIS_NOTUSED(V) ((void) V)
185
186#define ZSKIPLIST_MAXLEVEL 32 /* Should be enough for 2^32 elements */
187#define ZSKIPLIST_P 0.25 /* Skiplist P = 1/4 */
188
189/* Append only defines */
190#define APPENDFSYNC_NO 0
191#define APPENDFSYNC_ALWAYS 1
192#define APPENDFSYNC_EVERYSEC 2
193
194/* Zip structure related defaults */
195#define REDIS_HASH_MAX_ZIPMAP_ENTRIES 64
196#define REDIS_HASH_MAX_ZIPMAP_VALUE 512
197#define REDIS_LIST_MAX_ZIPLIST_ENTRIES 1024
198#define REDIS_LIST_MAX_ZIPLIST_VALUE 32
96ffb2fe 199#define REDIS_SET_MAX_INTSET_ENTRIES 4096
e2641e09 200
201/* Sets operations codes */
202#define REDIS_OP_UNION 0
203#define REDIS_OP_DIFF 1
204#define REDIS_OP_INTER 2
205
165346ca 206/* Redis maxmemory strategies */
207#define REDIS_MAXMEMORY_VOLATILE_LRU 0
208#define REDIS_MAXMEMORY_VOLATILE_TTL 1
209#define REDIS_MAXMEMORY_VOLATILE_RANDOM 2
210#define REDIS_MAXMEMORY_ALLKEYS_LRU 3
211#define REDIS_MAXMEMORY_ALLKEYS_RANDOM 4
5402c426 212#define REDIS_MAXMEMORY_NO_EVICTION 5
165346ca 213
/* Assertion and panic helpers. The reporting functions can print the
 * stacktrace, so our assert is defined this way:
 *
 * redisAssert(_e) evaluates _e; when it is false it calls _redisAssert()
 * with the stringified expression, the file name and the line number, and
 * then terminates the process with _exit(1).
 *
 * redisPanic(_e) unconditionally calls _redisPanic() with the stringified
 * argument, the file name and the line number, and then terminates the
 * process with _exit(1).
 *
 * Both expansions are fully parenthesized so that the whole
 * "report, then exit" sequence stays together when the macro is used as an
 * operand (for instance as one arm of a conditional operator) and not only
 * as a stand-alone statement. */
#define redisAssert(_e) ((_e)?(void)0 : (_redisAssert(#_e,__FILE__,__LINE__),_exit(1)))
#define redisPanic(_e) (_redisPanic(#_e,__FILE__,__LINE__),_exit(1))
void _redisAssert(char *estr, char *file, int line);
void _redisPanic(char *msg, char *file, int line);
219
220/*-----------------------------------------------------------------------------
221 * Data types
222 *----------------------------------------------------------------------------*/
223
224/* A redis object, that is a type able to hold a string / list / set */
225
226/* The actual Redis Object */
ef59a8bc 227#define REDIS_LRU_CLOCK_MAX ((1<<21)-1) /* Max value of obj->lru */
165346ca 228#define REDIS_LRU_CLOCK_RESOLUTION 10 /* LRU clock resolution in seconds */
e2641e09 229typedef struct redisObject {
230 unsigned type:4; /* one of the "Object types" defines (REDIS_STRING, REDIS_LIST, ...) */
231 unsigned storage:2; /* REDIS_VM_MEMORY or REDIS_VM_SWAPPING */
232 unsigned encoding:4; /* one of the REDIS_ENCODING_* defines */
233 unsigned lru:22; /* lru time (relative to server.lruclock).
 * NOTE(review): the field is 22 bits wide while REDIS_LRU_CLOCK_MAX is
 * (1<<21)-1, i.e. 21 bits -- confirm which width is intended. */
234 int refcount; /* presumably managed via incrRefCount()/decrRefCount() -- TODO confirm */
235 void *ptr;
236 /* VM fields are only allocated if VM is active, otherwise the
237 * object allocation function will just allocate
238 * sizeof(redisObject) minus sizeof(redisObjectVM), so using
239 * Redis without VM active will not have any overhead.
 * NOTE(review): no VM-only fields and no redisObjectVM type are declared
 * in this structure as shown here; this comment looks stale -- confirm. */
240} robj;
241
242/* The VM pointer structure - identifies an object in the swap file.
243 *
244 * This object is stored in place of the value
245 * object in the main key->value hash table representing a database.
246 * Note that the first fields (type, storage) are the same as the redisObject
247 * structure so that vmPointer structures can be accessed even when cast
248 * as redisObject structures.
249 *
250 * This is useful as we don't know if a value object is or not on disk, but we
251 * are always able to read obj->storage to check this. For vmPointer
252 * structures "type" is set to REDIS_VMPOINTER (even if without this field
253 * is still possible to check the kind of object from the value of 'storage').*/
254typedef struct vmPointer {
255 unsigned type:4; /* set to REDIS_VMPOINTER for vmPointer structures */
256 unsigned storage:2; /* REDIS_VM_SWAPPED or REDIS_VM_LOADING */
257 unsigned notused:26; /* padding: 4+2+26 = 32 bits, same total as the redisObject bitfields (4+2+4+22) */
258 unsigned int vtype; /* type of the object stored in the swap file */
259 off_t page; /* the page at which the object is stored on disk */
260 off_t usedpages; /* number of pages used on disk */
261} vmpointer;
262
/* Macro used to initialize a Redis object allocated on the stack.
 * Note that this macro is kept near the structure definition to make sure
 * we'll update it when the structure is changed, to avoid bugs like
 * bug #85 introduced exactly in this way.
 *
 * _var is the robj variable itself (not a pointer to it); _ptr is stored in
 * its 'ptr' field. The object is set up as a REDIS_STRING with
 * REDIS_ENCODING_RAW encoding, refcount 1 and REDIS_VM_MEMORY storage.
 * The 'lru' field is left untouched.
 *
 * The expansion intentionally has no trailing semicolon: the caller's own
 * ';' completes the do/while(0), so "initStaticStringObject(o,p);" is
 * exactly one statement and can be used as the body of an unbraced
 * if/else. Both arguments are parenthesized in the expansion. */
#define initStaticStringObject(_var,_ptr) do { \
    (_var).refcount = 1; \
    (_var).type = REDIS_STRING; \
    (_var).encoding = REDIS_ENCODING_RAW; \
    (_var).ptr = (_ptr); \
    (_var).storage = REDIS_VM_MEMORY; \
} while(0)
274
275typedef struct redisDb {
276 dict *dict; /* The keyspace for this DB */
277 dict *expires; /* Timeout of keys with a timeout set */
278 dict *blocking_keys; /* Keys with clients waiting for data (BLPOP) */
279 dict *io_keys; /* Keys with clients waiting for VM I/O */
280 dict *watched_keys; /* WATCHED keys for MULTI/EXEC CAS */
281 int id;
282} redisDb;
283
284/* Client MULTI/EXEC state */
285typedef struct multiCmd {
286 robj **argv;
287 int argc;
288 struct redisCommand *cmd;
289} multiCmd;
290
291typedef struct multiState {
292 multiCmd *commands; /* Array of MULTI commands */
293 int count; /* Total number of MULTI commands */
294} multiState;
295
357a8417
DJMM
296typedef struct blockingState {
297 robj **keys; /* The key we are waiting to terminate a blocking
298 * operation such as BLPOP. Otherwise NULL. */
299 int count; /* Number of blocking keys */
300 time_t timeout; /* Blocking operation timeout. If UNIX current time
301 * is >= timeout then the operation timed out. */
302 robj *target; /* The key that should receive the element,
303 * for BRPOPLPUSH. */
304} blockingState;
305
e2641e09 306/* With multiplexing we need to take per-client state.
307 * Clients are taken in a linked list. */
308typedef struct redisClient {
309 int fd;
310 redisDb *db;
311 int dictid;
312 sds querybuf;
cd8788f2
PN
313 int argc;
314 robj **argv;
315 int reqtype;
316 int multibulklen; /* number of multi bulk arguments left to read */
317 long bulklen; /* length of bulk argument in multi bulk request */
e2641e09 318 list *reply;
319 int sentlen;
320 time_t lastinteraction; /* time of the last interaction, used for timeout */
321 int flags; /* REDIS_SLAVE | REDIS_MONITOR | REDIS_MULTI ... */
322 int slaveseldb; /* slave selected db, if this client is a slave */
323 int authenticated; /* when requirepass is non-NULL */
324 int replstate; /* replication state if this is a slave */
325 int repldbfd; /* replication DB file descriptor */
326 long repldboff; /* replication DB file offset */
327 off_t repldbsize; /* replication DB file size */
328 multiState mstate; /* MULTI/EXEC state */
e3c51c4b 329 blockingState bpop; /* blocking state */
e2641e09 330 list *io_keys; /* Keys this client is waiting to be loaded from the
331 * swap file in order to continue. */
332 list *watched_keys; /* Keys WATCHED for MULTI/EXEC CAS */
333 dict *pubsub_channels; /* channels a client is interested in (SUBSCRIBE) */
334 list *pubsub_patterns; /* patterns a client is interested in (SUBSCRIBE) */
834ef78e
PN
335
336 /* Response buffer */
337 int bufpos;
f3357792 338 char buf[REDIS_REPLY_CHUNK_BYTES];
e2641e09 339} redisClient;
340
341struct saveparam {
342 time_t seconds;
343 int changes;
344};
345
346struct sharedObjectsStruct {
347 robj *crlf, *ok, *err, *emptybulk, *czero, *cone, *cnegone, *pong, *space,
348 *colon, *nullbulk, *nullmultibulk, *queued,
349 *emptymultibulk, *wrongtypeerr, *nokeyerr, *syntaxerr, *sameobjecterr,
97e7f8ae 350 *outofrangeerr, *loadingerr, *plus,
e2641e09 351 *select0, *select1, *select2, *select3, *select4,
352 *select5, *select6, *select7, *select8, *select9,
353 *messagebulk, *pmessagebulk, *subscribebulk, *unsubscribebulk, *mbulk3,
354 *mbulk4, *psubscribebulk, *punsubscribebulk,
355 *integers[REDIS_SHARED_INTEGERS];
356};
357
358/* Global server state structure */
359struct redisServer {
0e5441d8 360 pthread_t mainthread;
e2641e09 361 int port;
a5639e7d 362 char *bindaddr;
5d10923f 363 char *unixsocket;
a5639e7d
PN
364 int ipfd;
365 int sofd;
e2641e09 366 redisDb *db;
367 long long dirty; /* changes to DB from the last save */
2f6b31c3 368 long long dirty_before_bgsave; /* used to restore dirty on failed BGSAVE */
e2641e09 369 list *clients;
1b1f47c9 370 dict *commands; /* Command table hash table */
97e7f8ae 371 /* RDB / AOF loading information */
372 int loading;
373 off_t loading_total_bytes;
374 off_t loading_loaded_bytes;
375 time_t loading_start_time;
4ebfc455 376 /* Fast pointers to often looked up command */
377 struct redisCommand *delCommand, *multiCommand;
e2641e09 378 list *slaves, *monitors;
379 char neterr[ANET_ERR_LEN];
380 aeEventLoop *el;
381 int cronloops; /* number of times the cron function run */
53eeeaff 382 time_t lastsave; /* Unix time of last successful save */
e2641e09 383 /* Fields used only for stats */
53eeeaff 384 time_t stat_starttime; /* server start time */
385 long long stat_numcommands; /* number of processed commands */
386 long long stat_numconnections; /* number of connections received */
387 long long stat_expiredkeys; /* number of expired keys */
388 long long stat_keyspace_hits; /* number of successful lookups of keys */
389 long long stat_keyspace_misses; /* number of failed lookups of keys */
e2641e09 390 /* Configuration */
391 int verbosity;
392 int glueoutputbuf;
393 int maxidletime;
394 int dbnum;
395 int daemonize;
396 int appendonly;
397 int appendfsync;
398 int no_appendfsync_on_rewrite;
399 int shutdown_asap;
400 time_t lastfsync;
401 int appendfd;
402 int appendseldb;
403 char *pidfile;
404 pid_t bgsavechildpid;
405 pid_t bgrewritechildpid;
406 sds bgrewritebuf; /* buffer taken by parent during append only rewrite */
407 sds aofbuf; /* AOF buffer, written before entering the event loop */
408 struct saveparam *saveparams;
409 int saveparamslen;
410 char *logfile;
e2641e09 411 char *dbfilename;
412 char *appendfilename;
413 char *requirepass;
414 int rdbcompression;
415 int activerehashing;
416 /* Replication related */
417 int isslave;
f4aa600b 418 /* Slave specific fields */
e2641e09 419 char *masterauth;
420 char *masterhost;
421 int masterport;
422 redisClient *master; /* client that is master for this slave */
f4aa600b 423 int replstate; /* replication status if the instance is a slave */
62ec599c 424 off_t repl_transfer_left; /* bytes left reading .rdb */
f4aa600b 425 int repl_transfer_s; /* slave -> master SYNC socket */
426 int repl_transfer_fd; /* slave -> master SYNC temp file descriptor */
427 char *repl_transfer_tmpfile; /* slave-> master SYNC temp file name */
428 time_t repl_transfer_lastio; /* unix time of the latest read, for timeout */
4ebfc455 429 int repl_serve_stale_data; /* Serve stale data when link is down? */
f4aa600b 430 /* Limits */
e2641e09 431 unsigned int maxclients;
432 unsigned long long maxmemory;
165346ca 433 int maxmemory_policy;
434 int maxmemory_samples;
f4aa600b 435 /* Blocked clients */
5fa95ad7 436 unsigned int bpop_blocked_clients;
e2641e09 437 unsigned int vm_blocked_clients;
438 /* Sort parameters - qsort_r() is only available under BSD so we
439 * have to take this state global, in order to pass it to sortCompare() */
440 int sort_desc;
441 int sort_alpha;
442 int sort_bypattern;
443 /* Virtual memory configuration */
444 int vm_enabled;
445 char *vm_swap_file;
446 off_t vm_page_size;
447 off_t vm_pages;
448 unsigned long long vm_max_memory;
449 /* Zip structure config */
450 size_t hash_max_zipmap_entries;
451 size_t hash_max_zipmap_value;
452 size_t list_max_ziplist_entries;
453 size_t list_max_ziplist_value;
96ffb2fe 454 size_t set_max_intset_entries;
e2641e09 455 /* Virtual memory state */
456 FILE *vm_fp;
457 int vm_fd;
458 off_t vm_next_page; /* Next probably empty page */
459 off_t vm_near_pages; /* Number of pages allocated sequentially */
460 unsigned char *vm_bitmap; /* Bitmap of free/used pages */
461 time_t unixtime; /* Unix time sampled every second. */
462 /* Virtual memory I/O threads stuff */
463 /* An I/O thread process an element taken from the io_jobs queue and
464 * put the result of the operation in the io_done list. While the
465 * job is being processed, it's put on io_processing queue.
 * NOTE(review): the lists declared below are named io_newjobs,
 * io_processing and io_processed; "io_jobs" / "io_done" here (and in the
 * io_mutex comment) look like older names -- confirm. */
466 list *io_newjobs; /* List of VM I/O jobs yet to be processed */
467 list *io_processing; /* List of VM I/O jobs being processed */
468 list *io_processed; /* List of VM I/O jobs already processed */
469 list *io_ready_clients; /* Clients ready to be unblocked. All keys loaded */
470 pthread_mutex_t io_mutex; /* lock to access io_jobs/io_done/io_thread_job */
e2641e09 471 pthread_mutex_t io_swapfile_mutex; /* So we can lseek + write */
472 pthread_attr_t io_threads_attr; /* attributes for threads creation */
473 int io_active_threads; /* Number of running I/O threads */
474 int vm_max_threads; /* Max number of I/O threads running at the same time */
475 /* Our main thread is blocked on the event loop, looking for sockets ready
476 * to be read or written, so when a threaded I/O operation is ready to be
477 * processed by the main thread, the I/O thread will use a unix pipe to
478 * awake the main thread. The following are the two pipe FDs. */
479 int io_ready_pipe_read;
480 int io_ready_pipe_write;
481 /* Virtual memory stats */
482 unsigned long long vm_stats_used_pages;
483 unsigned long long vm_stats_swapped_objects;
484 unsigned long long vm_stats_swapouts;
485 unsigned long long vm_stats_swapins;
486 /* Pubsub */
487 dict *pubsub_channels; /* Map channels to list of subscribed clients */
488 list *pubsub_patterns; /* A list of pubsub_patterns */
489 /* Misc */
e2641e09 490 unsigned lruclock:22; /* clock incrementing every minute, for LRU.
 * NOTE(review): REDIS_LRU_CLOCK_RESOLUTION is documented as 10 seconds,
 * which disagrees with "every minute" -- confirm the actual period. */
491 unsigned lruclock_padding:10;
492};
493
494typedef struct pubsubPattern {
495 redisClient *client;
496 robj *pattern;
497} pubsubPattern;
498
499typedef void redisCommandProc(redisClient *c);
500typedef void redisVmPreloadProc(redisClient *c, struct redisCommand *cmd, int argc, robj **argv);
501struct redisCommand {
502 char *name;
503 redisCommandProc *proc; /* function invoked with the client as its only argument */
504 int arity;
505 int flags; /* REDIS_CMD_* flags (REDIS_CMD_DENYOOM, REDIS_CMD_FORCE_REPLICATION) */
506 /* Use a function to determine which keys need to be loaded
507 * in the background prior to executing this command. Takes precedence
508 * over vm_firstkey and others, ignored when NULL */
509 redisVmPreloadProc *vm_preload_proc;
510 /* What keys should be loaded in background when calling this command? */
511 int vm_firstkey; /* The first argument that's a key (0 = no keys) */
512 int vm_lastkey; /* The last argument that's a key */
513 int vm_keystep; /* The step between first and last key */
514};
515
516struct redisFunctionSym {
517 char *name;
518 unsigned long pointer;
519};
520
521typedef struct _redisSortObject {
522 robj *obj;
523 union {
524 double score;
525 robj *cmpobj;
526 } u;
527} redisSortObject;
528
529typedef struct _redisSortOperation {
530 int type;
531 robj *pattern;
532} redisSortOperation;
533
534/* ZSETs use a specialized version of Skiplists */
e2641e09 535typedef struct zskiplistNode {
e2641e09 536 robj *obj;
2159782b
PN
537 double score;
538 struct zskiplistNode *backward;
539 struct zskiplistLevel {
540 struct zskiplistNode *forward;
541 unsigned int span;
542 } level[];
e2641e09 543} zskiplistNode;
544
545typedef struct zskiplist {
546 struct zskiplistNode *header, *tail;
547 unsigned long length;
548 int level;
549} zskiplist;
550
551typedef struct zset {
552 dict *dict;
553 zskiplist *zsl;
554} zset;
555
556/* VM threaded I/O request message */
557#define REDIS_IOJOB_LOAD 0 /* Load from disk to memory */
558#define REDIS_IOJOB_PREPARE_SWAP 1 /* Compute needed pages */
559#define REDIS_IOJOB_DO_SWAP 2 /* Swap from memory to disk */
560typedef struct iojob {
561 int type; /* Request type, REDIS_IOJOB_* */
562 redisDb *db;/* Redis database */
563 robj *key; /* This I/O request is about swapping this key */
564 robj *id; /* Unique identifier of this job:
565 this is the object to swap for REDIS_IOJOB_*_SWAP, or the
566 vmpointer object for REDIS_IOJOB_LOAD. */
567 robj *val; /* the value to swap for REDIS_IOJOB_*_SWAP, otherwise this
568 * field is populated by the I/O thread for REDIS_IOJOB_LOAD. */
569 off_t page; /* Swap page where to read/write the object */
570 off_t pages; /* Swap pages needed to save object. PREPARE_SWAP return val */
571 int canceled; /* True if this command was canceled by blocking side of VM */
572 pthread_t thread; /* ID of the thread processing this entry */
573} iojob;
574
575/* Structure to hold list iteration abstraction. */
576typedef struct {
577 robj *subject;
578 unsigned char encoding;
579 unsigned char direction; /* Iteration direction */
580 unsigned char *zi;
581 listNode *ln;
582} listTypeIterator;
583
584/* Structure for an entry while iterating over a list. */
585typedef struct {
586 listTypeIterator *li;
587 unsigned char *zi; /* Entry in ziplist */
588 listNode *ln; /* Entry in linked list */
589} listTypeEntry;
590
96ffb2fe
PN
591/* Structure to hold set iteration abstraction. */
592typedef struct {
593 robj *subject;
594 int encoding;
595 int ii; /* intset iterator */
596 dictIterator *di;
cb72d0f1 597} setTypeIterator;
96ffb2fe 598
e2641e09 599/* Structure to hold hash iteration abstraction. Note that iteration over
600 * hashes involves both fields and values. Because it is possible that
601 * not both are required, store pointers in the iterator to avoid
602 * unnecessary memory allocation for fields/values. */
603typedef struct {
604 int encoding;
605 unsigned char *zi;
606 unsigned char *zk, *zv;
607 unsigned int zklen, zvlen;
608
609 dictIterator *di;
610 dictEntry *de;
611} hashTypeIterator;
612
613#define REDIS_HASH_KEY 1
614#define REDIS_HASH_VALUE 2
615
616/*-----------------------------------------------------------------------------
617 * Extern declarations
618 *----------------------------------------------------------------------------*/
619
620extern struct redisServer server;
621extern struct sharedObjectsStruct shared;
622extern dictType setDictType;
623extern dictType zsetDictType;
624extern double R_Zero, R_PosInf, R_NegInf, R_Nan;
625dictType hashDictType;
626
627/*-----------------------------------------------------------------------------
628 * Functions prototypes
629 *----------------------------------------------------------------------------*/
630
631/* networking.c -- Networking and Client related operations */
632redisClient *createClient(int fd);
633void closeTimedoutClients(void);
634void freeClient(redisClient *c);
635void resetClient(redisClient *c);
636void sendReplyToClient(aeEventLoop *el, int fd, void *privdata, int mask);
637void sendReplyToClientWritev(aeEventLoop *el, int fd, void *privdata, int mask);
638void addReply(redisClient *c, robj *obj);
b301c1fc
PN
639void *addDeferredMultiBulkLength(redisClient *c);
640void setDeferredMultiBulkLength(redisClient *c, void *node, long length);
e2641e09 641void addReplySds(redisClient *c, sds s);
642void processInputBuffer(redisClient *c);
ab17b909
PN
643void acceptTcpHandler(aeEventLoop *el, int fd, void *privdata, int mask);
644void acceptUnixHandler(aeEventLoop *el, int fd, void *privdata, int mask);
e2641e09 645void readQueryFromClient(aeEventLoop *el, int fd, void *privdata, int mask);
646void addReplyBulk(redisClient *c, robj *obj);
647void addReplyBulkCString(redisClient *c, char *s);
648void acceptHandler(aeEventLoop *el, int fd, void *privdata, int mask);
649void addReply(redisClient *c, robj *obj);
650void addReplySds(redisClient *c, sds s);
3ab20376
PN
651void addReplyError(redisClient *c, char *err);
652void addReplyStatus(redisClient *c, char *status);
e2641e09 653void addReplyDouble(redisClient *c, double d);
654void addReplyLongLong(redisClient *c, long long ll);
0537e7bf 655void addReplyMultiBulkLen(redisClient *c, long length);
e2641e09 656void *dupClientReplyValue(void *o);
657
3ab20376
PN
658#ifdef __GNUC__
659void addReplyErrorFormat(redisClient *c, const char *fmt, ...)
660 __attribute__((format(printf, 2, 3)));
661void addReplyStatusFormat(redisClient *c, const char *fmt, ...)
662 __attribute__((format(printf, 2, 3)));
663#else
664void addReplyErrorFormat(redisClient *c, const char *fmt, ...);
665void addReplyStatusFormat(redisClient *c, const char *fmt, ...);
666#endif
667
e2641e09 668/* List data type */
669void listTypeTryConversion(robj *subject, robj *value);
670void listTypePush(robj *subject, robj *value, int where);
671robj *listTypePop(robj *subject, int where);
672unsigned long listTypeLength(robj *subject);
673listTypeIterator *listTypeInitIterator(robj *subject, int index, unsigned char direction);
674void listTypeReleaseIterator(listTypeIterator *li);
675int listTypeNext(listTypeIterator *li, listTypeEntry *entry);
676robj *listTypeGet(listTypeEntry *entry);
677void listTypeInsert(listTypeEntry *entry, robj *value, int where);
678int listTypeEqual(listTypeEntry *entry, robj *o);
679void listTypeDelete(listTypeEntry *entry);
680void listTypeConvert(robj *subject, int enc);
681void unblockClientWaitingData(redisClient *c);
682int handleClientsWaitingListPush(redisClient *c, robj *key, robj *ele);
683void popGenericCommand(redisClient *c, int where);
684
685/* MULTI/EXEC/WATCH... */
686void unwatchAllKeys(redisClient *c);
687void initClientMultiState(redisClient *c);
688void freeClientMultiState(redisClient *c);
689void queueMultiCommand(redisClient *c, struct redisCommand *cmd);
690void touchWatchedKey(redisDb *db, robj *key);
691void touchWatchedKeysOnFlush(int dbid);
692
693/* Redis object implementation */
694void decrRefCount(void *o);
695void incrRefCount(robj *o);
696void freeStringObject(robj *o);
697void freeListObject(robj *o);
698void freeSetObject(robj *o);
699void freeZsetObject(robj *o);
700void freeHashObject(robj *o);
701robj *createObject(int type, void *ptr);
702robj *createStringObject(char *ptr, size_t len);
703robj *dupStringObject(robj *o);
704robj *tryObjectEncoding(robj *o);
705robj *getDecodedObject(robj *o);
706size_t stringObjectLen(robj *o);
e2641e09 707robj *createStringObjectFromLongLong(long long value);
708robj *createListObject(void);
709robj *createZiplistObject(void);
710robj *createSetObject(void);
96ffb2fe 711robj *createIntsetObject(void);
e2641e09 712robj *createHashObject(void);
713robj *createZsetObject(void);
714int getLongFromObjectOrReply(redisClient *c, robj *o, long *target, const char *msg);
715int checkType(redisClient *c, robj *o, int type);
716int getLongLongFromObjectOrReply(redisClient *c, robj *o, long long *target, const char *msg);
717int getDoubleFromObjectOrReply(redisClient *c, robj *o, double *target, const char *msg);
718int getLongLongFromObject(robj *o, long long *target);
719char *strEncoding(int encoding);
720int compareStringObjects(robj *a, robj *b);
721int equalStringObjects(robj *a, robj *b);
ef59a8bc 722unsigned long estimateObjectIdleTime(robj *o);
e2641e09 723
19e61097 724/* Synchronous I/O with timeout */
725int syncWrite(int fd, char *ptr, ssize_t size, int timeout);
726int syncRead(int fd, char *ptr, ssize_t size, int timeout);
727int syncReadLine(int fd, char *ptr, ssize_t size, int timeout);
d08fac3e 728int fwriteBulkString(FILE *fp, char *s, unsigned long len);
729int fwriteBulkDouble(FILE *fp, double d);
730int fwriteBulkLongLong(FILE *fp, long long l);
244201f6 731int fwriteBulkObject(FILE *fp, robj *obj);
19e61097 732
e2641e09 733/* Replication */
734void replicationFeedSlaves(list *slaves, int dictid, robj **argv, int argc);
735void replicationFeedMonitors(list *monitors, int dictid, robj **argv, int argc);
736int syncWithMaster(void);
737void updateSlavesWaitingBgsave(int bgsaveerr);
f4aa600b 738void replicationCron(void);
e2641e09 739
97e7f8ae 740/* Generic persistence functions */
741void startLoading(FILE *fp);
742void loadingProgress(off_t pos);
743void stopLoading(void);
744
e2641e09 745/* RDB persistence */
746int rdbLoad(char *filename);
747int rdbSaveBackground(char *filename);
748void rdbRemoveTempFile(pid_t childpid);
749int rdbSave(char *filename);
750int rdbSaveObject(FILE *fp, robj *o);
bd70a5f5
PN
751off_t rdbSavedObjectLen(robj *o);
752off_t rdbSavedObjectPages(robj *o);
e2641e09 753robj *rdbLoadObject(int type, FILE *fp);
754void backgroundSaveDoneHandler(int statloc);
755
756/* AOF persistence */
757void flushAppendOnlyFile(void);
758void feedAppendOnlyFile(struct redisCommand *cmd, int dictid, robj **argv, int argc);
759void aofRemoveTempFile(pid_t childpid);
760int rewriteAppendOnlyFileBackground(void);
761int loadAppendOnlyFile(char *filename);
762void stopAppendOnly(void);
763int startAppendOnly(void);
764void backgroundRewriteDoneHandler(int statloc);
765
766/* Sorted sets data type */
/* Skiplist primitives: create a list, free it, and insert an (score, obj)
 * pair; zslInsert() returns a pointer to a zskiplistNode.
 * NOTE(review): ownership of `obj` after zslInsert() and whether zslFree()
 * releases the stored objects are not visible here -- confirm. */
767zskiplist *zslCreate(void);
768void zslFree(zskiplist *zsl);
69ef89f2 769zskiplistNode *zslInsert(zskiplist *zsl, double score, robj *obj);
e2641e09 770
771/* Core functions */
/* Server-wide entry points (prototypes only; bodies live in the .c files).
 * Functions that take no arguments are declared with (void): before C23 an
 * empty list `()` declares a function with unspecified arguments, so the
 * compiler would silently accept calls that pass arguments by mistake.
 * redisLog() is printf-style: a level, a format string and variadic
 * arguments. */
772void freeMemoryIfNeeded(void);
773int processCommand(redisClient *c);
774void setupSigSegvAction(void);
1b1f47c9 775struct redisCommand *lookupCommand(sds name);
776struct redisCommand *lookupCommandByCString(char *s);
e2641e09 777void call(redisClient *c, struct redisCommand *cmd);
778int prepareForShutdown(void);
779void redisLog(int level, const char *fmt, ...);
780void usage(void);
781void updateDictResizePolicy(void);
782int htNeedsResize(dict *dict);
783void oom(const char *msg);
1b1f47c9 784void populateCommandTable(void);
e2641e09 785
786/* Virtual Memory */
/* Swap-related prototypes. Page positions and counts are expressed as off_t;
 * several functions come in Blocking and Threaded variants, and the
 * *BlockClientOnSwappedKeys functions all take the client plus the command
 * being executed.
 * NOTE(review): vmThreadedIOCompletedJob() has the (aeEventLoop *, fd,
 * privdata, mask) shape, so it is presumably registered as an ae file-event
 * handler; lockThreadedIO()/unlockThreadedIO() presumably guard the shared
 * I/O job state -- confirm against the definitions. */
787void vmInit(void);
788void vmMarkPagesFree(off_t page, off_t count);
789robj *vmLoadObject(robj *o);
790robj *vmPreviewObject(robj *o);
791int vmSwapOneObjectBlocking(void);
792int vmSwapOneObjectThreaded(void);
793int vmCanSwapOut(void);
794void vmThreadedIOCompletedJob(aeEventLoop *el, int fd, void *privdata, int mask);
795void vmCancelThreadedIOJob(robj *o);
796void lockThreadedIO(void);
797void unlockThreadedIO(void);
798int vmSwapObjectThreaded(robj *key, robj *val, redisDb *db);
799void freeIOJob(iojob *j);
800void queueIOJob(iojob *j);
801int vmWriteObjectOnSwap(robj *o, off_t page);
802robj *vmReadObjectFromSwap(off_t page, int type);
803void waitEmptyIOJobsQueue(void);
804void vmReopenSwapFile(void);
805int vmFreePage(off_t page);
806void zunionInterBlockClientOnSwappedKeys(redisClient *c, struct redisCommand *cmd, int argc, robj **argv);
807void execBlockClientOnSwappedKeys(redisClient *c, struct redisCommand *cmd, int argc, robj **argv);
808int blockClientOnSwappedKeys(redisClient *c, struct redisCommand *cmd);
809int dontWaitForSwappedKey(redisClient *c, robj *key);
810void handleClientsBlockedOnSwappedKey(redisDb *db, robj *key);
811vmpointer *vmSwapObjectBlocking(robj *val);
812
96ffb2fe
PN
813/* Set data type */
/* Operations on a set-valued robj (`subject`): membership changes and tests
 * return int, iteration goes through a setTypeIterator obtained from
 * setTypeInitIterator() and released with setTypeReleaseIterator().
 * NOTE(review): the int result convention of add/remove/is-member and the
 * accepted values of `enc` in setTypeConvert() are not visible here --
 * confirm against the definitions. */
814robj *setTypeCreate(robj *value);
815int setTypeAdd(robj *subject, robj *value);
816int setTypeRemove(robj *subject, robj *value);
817int setTypeIsMember(robj *subject, robj *value);
cb72d0f1
PN
818setTypeIterator *setTypeInitIterator(robj *subject);
819void setTypeReleaseIterator(setTypeIterator *si);
820robj *setTypeNext(setTypeIterator *si);
96ffb2fe
PN
821robj *setTypeRandomElement(robj *subject);
822unsigned long setTypeSize(robj *subject);
823void setTypeConvert(robj *subject, int enc);
824
e2641e09 825/* Hash data type */
/* Operations on a hash-valued robj. Iteration uses a hashTypeIterator:
 * hashTypeInitIterator() creates it, hashTypeNext() advances it,
 * hashTypeCurrent() reads the current entry and hashTypeReleaseIterator()
 * disposes of it.
 * NOTE(review): the accepted values of `what` in hashTypeCurrent()
 * (presumably key vs. value) and the int result conventions are not visible
 * here -- confirm against the definitions. */
826void convertToRealHash(robj *o);
827void hashTypeTryConversion(robj *subject, robj **argv, int start, int end);
828void hashTypeTryObjectEncoding(robj *subject, robj **o1, robj **o2);
829robj *hashTypeGet(robj *o, robj *key);
830int hashTypeExists(robj *o, robj *key);
831int hashTypeSet(robj *o, robj *key, robj *value);
832int hashTypeDelete(robj *o, robj *key);
833unsigned long hashTypeLength(robj *o);
834hashTypeIterator *hashTypeInitIterator(robj *subject);
835void hashTypeReleaseIterator(hashTypeIterator *hi);
836int hashTypeNext(hashTypeIterator *hi);
837robj *hashTypeCurrent(hashTypeIterator *hi, int what);
838robj *hashTypeLookupWriteOrCreate(redisClient *c, robj *key);
839
840/* Pub / Sub */
/* The two UnsubscribeAll functions act on one client and take a `notify`
 * flag; freePubsubPattern() and listMatchPubsubPattern() take untyped
 * pointers.
 * NOTE(review): the void* signatures suggest these two are installed as the
 * free/match callbacks of an adlist list of patterns -- confirm at the call
 * site. What the int results count is not visible here. */
841int pubsubUnsubscribeAllChannels(redisClient *c, int notify);
842int pubsubUnsubscribeAllPatterns(redisClient *c, int notify);
843void freePubsubPattern(void *p);
844int listMatchPubsubPattern(void *a, void *b);
845
846/* Utility functions */
/* Pattern matching and number/string conversion helpers. stringmatchlen()
 * takes explicit lengths for both pattern and string, while stringmatch()
 * takes only the two strings; both accept a `nocase` flag. memtoll() reports
 * failure through the `err` out-parameter, and the isXRepresentableAs*
 * functions hand back the parsed value through a pointer.
 * NOTE(review): the exact return conventions (e.g. what ll2string() returns)
 * are not visible here -- confirm against the definitions. */
847int stringmatchlen(const char *pattern, int patternLen,
848 const char *string, int stringLen, int nocase);
849int stringmatch(const char *pattern, const char *string, int nocase);
850long long memtoll(const char *p, int *err);
851int ll2string(char *s, size_t len, long long value);
852int isStringRepresentableAsLong(sds s, long *longval);
ec7e1389 853int isStringRepresentableAsLongLong(sds s, long long *longval);
854int isObjectRepresentableAsLongLong(robj *o, long long *llongval);
e2641e09 855
856/* Configuration */
/* loadServerConfig() takes the path of the configuration file;
 * appendServerSaveParams() takes a (seconds, changes) pair.
 * resetServerSaveParams() is declared with (void) rather than an empty list:
 * before C23 `()` leaves the arguments unspecified and disables argument
 * checking at call sites.
 * NOTE(review): presumably the save params are the automatic-save rules and
 * reset clears them -- confirm against the definitions. */
857void loadServerConfig(char *filename);
858void appendServerSaveParams(time_t seconds, int changes);
859void resetServerSaveParams(void);
860
861/* db.c -- Keyspace access API */
/* Key lookup, insertion, deletion and expiry handling for one redisDb. The
 * *OrReply lookup variants take the client and a reply object in addition to
 * the key. Expiry times are expressed as time_t.
 * emptyDb() is declared with (void) rather than an empty list: before C23
 * `()` leaves the arguments unspecified and disables argument checking at
 * call sites.
 * NOTE(review): the int result conventions and what emptyDb()'s long long
 * counts are not visible here -- confirm against db.c. */
862int removeExpire(redisDb *db, robj *key);
bcf2995c 863void propagateExpire(redisDb *db, robj *key);
e2641e09 864int expireIfNeeded(redisDb *db, robj *key);
e2641e09 865time_t getExpire(redisDb *db, robj *key);
0cf5b7b5 866void setExpire(redisDb *db, robj *key, time_t when);
e2641e09 867robj *lookupKey(redisDb *db, robj *key);
868robj *lookupKeyRead(redisDb *db, robj *key);
869robj *lookupKeyWrite(redisDb *db, robj *key);
870robj *lookupKeyReadOrReply(redisClient *c, robj *key, robj *reply);
871robj *lookupKeyWriteOrReply(redisClient *c, robj *key, robj *reply);
872int dbAdd(redisDb *db, robj *key, robj *val);
873int dbReplace(redisDb *db, robj *key, robj *val);
874int dbExists(redisDb *db, robj *key);
875robj *dbRandomKey(redisDb *db);
876int dbDelete(redisDb *db, robj *key);
877long long emptyDb(void);
878int selectDb(redisClient *c, int id);
879
880/* Git SHA1 */
/* Both accessors take no arguments and return a char pointer.
 * NOTE(review): presumably build-time strings identifying the git commit and
 * whether the tree had local modifications; ownership of the returned
 * pointer is not visible here -- confirm against the definitions. */
881char *redisGitSHA1(void);
882char *redisGitDirty(void);
883
884/* Command prototypes */
/* Every command handler below has the same signature: it receives the
 * issuing client and returns void.
 * NOTE(review): presumably results and errors are delivered through the
 * client object rather than a return value -- confirm against the
 * implementations. */
885void authCommand(redisClient *c);
886void pingCommand(redisClient *c);
887void echoCommand(redisClient *c);
888void setCommand(redisClient *c);
889void setnxCommand(redisClient *c);
890void setexCommand(redisClient *c);
891void getCommand(redisClient *c);
892void delCommand(redisClient *c);
893void existsCommand(redisClient *c);
894void incrCommand(redisClient *c);
895void decrCommand(redisClient *c);
896void incrbyCommand(redisClient *c);
897void decrbyCommand(redisClient *c);
898void selectCommand(redisClient *c);
899void randomkeyCommand(redisClient *c);
900void keysCommand(redisClient *c);
901void dbsizeCommand(redisClient *c);
902void lastsaveCommand(redisClient *c);
903void saveCommand(redisClient *c);
904void bgsaveCommand(redisClient *c);
905void bgrewriteaofCommand(redisClient *c);
906void shutdownCommand(redisClient *c);
907void moveCommand(redisClient *c);
908void renameCommand(redisClient *c);
909void renamenxCommand(redisClient *c);
910void lpushCommand(redisClient *c);
911void rpushCommand(redisClient *c);
912void lpushxCommand(redisClient *c);
913void rpushxCommand(redisClient *c);
914void linsertCommand(redisClient *c);
915void lpopCommand(redisClient *c);
916void rpopCommand(redisClient *c);
917void llenCommand(redisClient *c);
918void lindexCommand(redisClient *c);
919void lrangeCommand(redisClient *c);
920void ltrimCommand(redisClient *c);
921void typeCommand(redisClient *c);
922void lsetCommand(redisClient *c);
923void saddCommand(redisClient *c);
924void sremCommand(redisClient *c);
925void smoveCommand(redisClient *c);
926void sismemberCommand(redisClient *c);
927void scardCommand(redisClient *c);
928void spopCommand(redisClient *c);
929void srandmemberCommand(redisClient *c);
930void sinterCommand(redisClient *c);
931void sinterstoreCommand(redisClient *c);
932void sunionCommand(redisClient *c);
933void sunionstoreCommand(redisClient *c);
934void sdiffCommand(redisClient *c);
935void sdiffstoreCommand(redisClient *c);
936void syncCommand(redisClient *c);
937void flushdbCommand(redisClient *c);
938void flushallCommand(redisClient *c);
939void sortCommand(redisClient *c);
940void lremCommand(redisClient *c);
8a979f03 941void rpoplpushCommand(redisClient *c);
e2641e09 942void infoCommand(redisClient *c);
943void mgetCommand(redisClient *c);
944void monitorCommand(redisClient *c);
945void expireCommand(redisClient *c);
946void expireatCommand(redisClient *c);
947void getsetCommand(redisClient *c);
948void ttlCommand(redisClient *c);
a539d29a 949void persistCommand(redisClient *c);
e2641e09 950void slaveofCommand(redisClient *c);
951void debugCommand(redisClient *c);
952void msetCommand(redisClient *c);
953void msetnxCommand(redisClient *c);
954void zaddCommand(redisClient *c);
955void zincrbyCommand(redisClient *c);
956void zrangeCommand(redisClient *c);
957void zrangebyscoreCommand(redisClient *c);
25bb8a44 958void zrevrangebyscoreCommand(redisClient *c);
e2641e09 959void zcountCommand(redisClient *c);
960void zrevrangeCommand(redisClient *c);
961void zcardCommand(redisClient *c);
962void zremCommand(redisClient *c);
963void zscoreCommand(redisClient *c);
964void zremrangebyscoreCommand(redisClient *c);
965void multiCommand(redisClient *c);
966void execCommand(redisClient *c);
967void discardCommand(redisClient *c);
968void blpopCommand(redisClient *c);
969void brpopCommand(redisClient *c);
b2a7fd0c 970void brpoplpushCommand(redisClient *c);
e2641e09 971void appendCommand(redisClient *c);
972void substrCommand(redisClient *c);
80091bba 973void strlenCommand(redisClient *c);
e2641e09 974void zrankCommand(redisClient *c);
975void zrevrankCommand(redisClient *c);
976void hsetCommand(redisClient *c);
977void hsetnxCommand(redisClient *c);
978void hgetCommand(redisClient *c);
979void hmsetCommand(redisClient *c);
980void hmgetCommand(redisClient *c);
981void hdelCommand(redisClient *c);
982void hlenCommand(redisClient *c);
983void zremrangebyrankCommand(redisClient *c);
984void zunionstoreCommand(redisClient *c);
985void zinterstoreCommand(redisClient *c);
986void hkeysCommand(redisClient *c);
987void hvalsCommand(redisClient *c);
988void hgetallCommand(redisClient *c);
989void hexistsCommand(redisClient *c);
990void configCommand(redisClient *c);
991void hincrbyCommand(redisClient *c);
992void subscribeCommand(redisClient *c);
993void unsubscribeCommand(redisClient *c);
994void psubscribeCommand(redisClient *c);
995void punsubscribeCommand(redisClient *c);
996void publishCommand(redisClient *c);
997void watchCommand(redisClient *c);
998void unwatchCommand(redisClient *c);
999
/* Under GCC-compatible compilers, redeclare the libc allocator functions with
 * the `deprecated` attribute so that any direct call to them produces a
 * compile-time warning.
 * NOTE(review): presumably this steers code in files including this header
 * toward the zmalloc.h wrappers included at the top -- confirm. */
b3aa6d71 1000#if defined(__GNUC__)
b3aa6d71 1001void *calloc(size_t count, size_t size) __attribute__ ((deprecated));
1002void free(void *ptr) __attribute__ ((deprecated));
1003void *malloc(size_t size) __attribute__ ((deprecated));
1004void *realloc(void *ptr, size_t size) __attribute__ ((deprecated));
1005#endif
1006
e2641e09 1007#endif /* __REDIS_H */