]> git.saurik.com Git - redis.git/blame_incremental - src/redis.h
syslog support
[redis.git] / src / redis.h
... / ...
CommitLineData
1#ifndef __REDIS_H
2#define __REDIS_H
3
4#include "fmacros.h"
5#include "config.h"
6
7#if defined(__sun)
8#include "solarisfixes.h"
9#endif
10
11#include <stdio.h>
12#include <stdlib.h>
13#include <string.h>
14#include <time.h>
15#include <limits.h>
16#include <unistd.h>
17#include <errno.h>
18#include <inttypes.h>
19#include <pthread.h>
20#include <syslog.h>
21
22#include "ae.h" /* Event driven programming library */
23#include "sds.h" /* Dynamic safe strings */
24#include "dict.h" /* Hash tables */
25#include "adlist.h" /* Linked lists */
26#include "zmalloc.h" /* total memory usage aware version of malloc/free */
27#include "anet.h" /* Networking the easy way */
28#include "zipmap.h" /* Compact string -> string data structure */
29#include "ziplist.h" /* Compact list data structure */
30#include "intset.h" /* Compact integer set structure */
31#include "version.h"
32
/* Error codes */
#define REDIS_OK 0
#define REDIS_ERR (-1) /* parenthesized so it is safe inside larger expressions */
36
/* Static server configuration */
#define REDIS_SERVERPORT 6379 /* TCP port */
#define REDIS_MAXIDLETIME (60*5) /* default client timeout */
#define REDIS_IOBUF_LEN 1024
#define REDIS_LOADBUF_LEN 1024
#define REDIS_STATIC_ARGS 8
#define REDIS_DEFAULT_DBNUM 16
#define REDIS_CONFIGLINE_MAX 1024
#define REDIS_MAX_SYNC_TIME 60 /* Slave can't take more to sync */
#define REDIS_EXPIRELOOKUPS_PER_CRON 10 /* lookup 10 expires per loop */
#define REDIS_MAX_WRITE_PER_EVENT (1024*64)
#define REDIS_REQUEST_MAX_SIZE (1024*1024*256) /* max bytes in inline command */
#define REDIS_SHARED_INTEGERS 10000
#define REDIS_REPLY_CHUNK_BYTES (5*1500) /* 5 TCP packets with default MTU */
#define REDIS_MAX_LOGMSG_LEN 1024 /* Default maximum length of syslog messages */
52
/* If more than REDIS_WRITEV_THRESHOLD write packets are pending use writev */
#define REDIS_WRITEV_THRESHOLD 3
/* Max number of iovecs used for each writev call */
#define REDIS_WRITEV_IOVEC_COUNT 256

/* Hash table parameters */
#define REDIS_HT_MINFILL 10 /* Minimal hash table fill 10% */
60
/* Command flags:
 *   REDIS_CMD_DENYOOM:
 *     Commands marked with this flag will return an error when 'maxmemory' is
 *     set and the server is using more than 'maxmemory' bytes of memory.
 *     In short: commands with this flag are denied on low memory conditions.
 *   REDIS_CMD_FORCE_REPLICATION:
 *     Force replication even if dirty is 0. */
#define REDIS_CMD_DENYOOM 4
#define REDIS_CMD_FORCE_REPLICATION 8
70
/* Object types */
#define REDIS_STRING 0
#define REDIS_LIST 1
#define REDIS_SET 2
#define REDIS_ZSET 3
#define REDIS_HASH 4
#define REDIS_VMPOINTER 8

/* Object encodings. Some kinds of objects, like Strings and Hashes, can be
 * internally represented in multiple ways. The 'encoding' field of the object
 * is set to one of these values. */
#define REDIS_ENCODING_RAW 0 /* Raw representation */
#define REDIS_ENCODING_INT 1 /* Encoded as integer */
#define REDIS_ENCODING_HT 2 /* Encoded as hash table */
#define REDIS_ENCODING_ZIPMAP 3 /* Encoded as zipmap */
#define REDIS_ENCODING_LINKEDLIST 4 /* Encoded as regular linked list */
#define REDIS_ENCODING_ZIPLIST 5 /* Encoded as ziplist */
#define REDIS_ENCODING_INTSET 6 /* Encoded as intset */

/* Object types only used for dumping to disk */
#define REDIS_EXPIRETIME 253
#define REDIS_SELECTDB 254
#define REDIS_EOF 255
94
/* Defines related to the dump file format. Storing 32 bit lengths for short
 * keys requires a lot of space, so we check the most significant 2 bits of
 * the first byte to interpret the length:
 *
 * 00|000000 => if the two MSB are 00 the len is the 6 bits of this byte
 * 01|000000 00000000 => 01, the len is 14 bits, 6 bits + 8 bits of next byte
 * 10|000000 [32 bit integer] => if it's 10, a full 32 bit len will follow
 * 11|000000 this means: specially encoded object will follow. The six bits
 *           number specify the kind of object that follows.
 *           See the REDIS_RDB_ENC_* defines.
 *
 * Lengths up to 63 are stored using a single byte; most DB keys, and many
 * values, will fit inside. */
#define REDIS_RDB_6BITLEN 0
#define REDIS_RDB_14BITLEN 1
#define REDIS_RDB_32BITLEN 2
#define REDIS_RDB_ENCVAL 3
#define REDIS_RDB_LENERR UINT_MAX
113
/* When the length of a string object stored on disk has the first two bits
 * set, the remaining bits of that byte specify a special encoding for the
 * object according to the following defines: */
#define REDIS_RDB_ENC_INT8 0 /* 8 bit signed integer */
#define REDIS_RDB_ENC_INT16 1 /* 16 bit signed integer */
#define REDIS_RDB_ENC_INT32 2 /* 32 bit signed integer */
#define REDIS_RDB_ENC_LZF 3 /* string compressed with FASTLZ */
121
/* Virtual memory object->where field. */
#define REDIS_VM_MEMORY 0 /* The object is on memory */
#define REDIS_VM_SWAPPED 1 /* The object is on disk */
#define REDIS_VM_SWAPPING 2 /* Redis is swapping this object on disk */
#define REDIS_VM_LOADING 3 /* Redis is loading this object from disk */

/* Virtual memory static configuration stuff.
 * Check vmFindContiguousPages() to know more about these magic numbers. */
#define REDIS_VM_MAX_NEAR_PAGES 65536
#define REDIS_VM_MAX_RANDOM_JUMP 4096
#define REDIS_VM_MAX_THREADS 32
#define REDIS_THREAD_STACK_SIZE (1024*1024*4)
/* The following is the *percentage* of completed I/O jobs to process when the
 * handler is called. While Virtual Memory I/O operations are performed by
 * threads, these operations must be processed by the main thread when
 * completed in order to take effect. */
#define REDIS_MAX_COMPLETED_JOBS_PROCESSED 1
139
/* Client flags (bit mask values, combined in redisClient.flags) */
#define REDIS_SLAVE 1 /* This client is a slave server */
#define REDIS_MASTER 2 /* This client is a master server */
#define REDIS_MONITOR 4 /* This client is a slave monitor, see MONITOR */
#define REDIS_MULTI 8 /* This client is in a MULTI context */
#define REDIS_BLOCKED 16 /* The client is waiting in a blocking operation */
#define REDIS_IO_WAIT 32 /* The client is waiting for Virtual Memory I/O */
#define REDIS_DIRTY_CAS 64 /* Watched keys modified. EXEC will fail. */
#define REDIS_CLOSE_AFTER_REPLY 128 /* Close after writing entire reply. */

/* Client request types */
#define REDIS_REQ_INLINE 1
#define REDIS_REQ_MULTIBULK 2
153
/* Slave replication state - slave side */
#define REDIS_REPL_NONE 0 /* No active replication */
#define REDIS_REPL_CONNECT 1 /* Must connect to master */
#define REDIS_REPL_TRANSFER 2 /* Receiving .rdb from master */
#define REDIS_REPL_CONNECTED 3 /* Connected to master */

/* Slave replication state - from the point of view of master
 * Note that in SEND_BULK and ONLINE state the slave receives new updates
 * in its output queue. In the WAIT_BGSAVE state instead the server is waiting
 * to start the next background saving in order to send updates to it.
 *
 * The numeric values below overlap with the slave-side states above
 * (REDIS_REPL_WAIT_BGSAVE_START == REDIS_REPL_CONNECTED == 3), so the two
 * sets must not be compared against each other. */
#define REDIS_REPL_WAIT_BGSAVE_START 3 /* master waits bgsave to start feeding it */
#define REDIS_REPL_WAIT_BGSAVE_END 4 /* master waits bgsave to start bulk DB transmission */
#define REDIS_REPL_SEND_BULK 5 /* master is sending the bulk DB */
#define REDIS_REPL_ONLINE 6 /* bulk DB already transmitted, receive updates */
168
/* List related stuff */
#define REDIS_HEAD 0
#define REDIS_TAIL 1

/* Sort operations */
#define REDIS_SORT_GET 0
#define REDIS_SORT_ASC 1
#define REDIS_SORT_DESC 2
#define REDIS_SORTKEY_MAX 1024

/* Log levels */
#define REDIS_DEBUG 0
#define REDIS_VERBOSE 1
#define REDIS_NOTICE 2
#define REDIS_WARNING 3
184
/* Anti-warning macro: evaluates V and discards the result so the compiler
 * does not complain about an unused variable or parameter. */
#define REDIS_NOTUSED(V) ((void) (V))

#define ZSKIPLIST_MAXLEVEL 32 /* Should be enough for 2^32 elements */
#define ZSKIPLIST_P 0.25 /* Skiplist P = 1/4 */
190
/* Append only defines */
#define APPENDFSYNC_NO 0
#define APPENDFSYNC_ALWAYS 1
#define APPENDFSYNC_EVERYSEC 2

/* Zip structure related defaults */
#define REDIS_HASH_MAX_ZIPMAP_ENTRIES 64
#define REDIS_HASH_MAX_ZIPMAP_VALUE 512
#define REDIS_LIST_MAX_ZIPLIST_ENTRIES 1024
#define REDIS_LIST_MAX_ZIPLIST_VALUE 32
#define REDIS_SET_MAX_INTSET_ENTRIES 4096

/* Sets operations codes */
#define REDIS_OP_UNION 0
#define REDIS_OP_DIFF 1
#define REDIS_OP_INTER 2

/* Redis maxmemory strategies */
#define REDIS_MAXMEMORY_VOLATILE_LRU 0
#define REDIS_MAXMEMORY_VOLATILE_TTL 1
#define REDIS_MAXMEMORY_VOLATILE_RANDOM 2
#define REDIS_MAXMEMORY_ALLKEYS_LRU 3
#define REDIS_MAXMEMORY_ALLKEYS_RANDOM 4
#define REDIS_MAXMEMORY_NO_EVICTION 5
215
/* We can print the stacktrace, so our assert is defined this way.
 *
 * redisAssert(_e): if expression _e is false, calls _redisAssert() with the
 * stringified expression, file and line, then _exit(1).
 * redisPanic(_e): unconditionally calls _redisPanic() with the stringified
 * argument, file and line, then _exit(1).
 *
 * Both macros expand to a single parenthesized expression so they can be used
 * safely anywhere an expression is expected. */
#define redisAssert(_e) ((_e)?(void)0 : (_redisAssert(#_e,__FILE__,__LINE__),_exit(1)))
#define redisPanic(_e) (_redisPanic(#_e,__FILE__,__LINE__),_exit(1))
void _redisAssert(char *estr, char *file, int line);
void _redisPanic(char *msg, char *file, int line);
221
222/*-----------------------------------------------------------------------------
223 * Data types
224 *----------------------------------------------------------------------------*/
225
/* A redis object, that is a type able to hold a string / list / set */

/* The actual Redis Object */
/* NOTE(review): 'lru' below is a 22 bit field while this maximum only covers
 * 21 bits -- confirm which of the two is intended before changing either. */
#define REDIS_LRU_CLOCK_MAX ((1<<21)-1) /* Max value of obj->lru */
#define REDIS_LRU_CLOCK_RESOLUTION 10 /* LRU clock resolution in seconds */
typedef struct redisObject {
    unsigned type:4;        /* object type, e.g. REDIS_STRING */
    unsigned storage:2;     /* REDIS_VM_MEMORY or REDIS_VM_SWAPPING */
    unsigned encoding:4;    /* internal representation, e.g. REDIS_ENCODING_RAW */
    unsigned lru:22;        /* lru time (relative to server.lruclock) */
    int refcount;
    void *ptr;
    /* NOTE(review): an older comment here described trailing VM-only fields
     * (a "redisObjectVM" part) that were allocated only when VM is active.
     * No such fields exist in this definition. */
} robj;
243
/* The VM pointer structure - identifies an object in the swap file.
 *
 * This object is stored in place of the value
 * object in the main key->value hash table representing a database.
 * Note that the first fields (type, storage) are the same as the redisObject
 * structure so that vmPointer structures can be accessed even when cast
 * as redisObject structures.
 *
 * This is useful as we don't know if a value object is or not on disk, but we
 * are always able to read obj->storage to check this. For vmPointer
 * structures "type" is set to REDIS_VMPOINTER (even if without this field
 * it is still possible to check the kind of object from the value of
 * 'storage'). */
typedef struct vmPointer {
    unsigned type:4;
    unsigned storage:2;     /* REDIS_VM_SWAPPED or REDIS_VM_LOADING */
    unsigned notused:26;
    unsigned int vtype;     /* type of the object stored in the swap file */
    off_t page;             /* the page at which the object is stored on disk */
    off_t usedpages;        /* number of pages used on disk */
} vmpointer;
264
/* Macro used to initialize a Redis object allocated on the stack.
 * Note that this macro is kept near the structure definition to make sure
 * we'll update it when the structure is changed, to avoid bugs like
 * bug #85 introduced exactly in this way.
 *
 * _var is the object itself (not a pointer to it); _ptr is stored in its
 * 'ptr' field. The 'lru' field is not touched by this macro.
 *
 * The macro deliberately has no trailing semicolon: the caller supplies it,
 * which keeps "if (x) initStaticStringObject(o,p); else ..." well formed. */
#define initStaticStringObject(_var,_ptr) do { \
    (_var).refcount = 1; \
    (_var).type = REDIS_STRING; \
    (_var).encoding = REDIS_ENCODING_RAW; \
    (_var).ptr = (_ptr); \
    (_var).storage = REDIS_VM_MEMORY; \
} while(0)
276
277typedef struct redisDb {
278 dict *dict; /* The keyspace for this DB */
279 dict *expires; /* Timeout of keys with a timeout set */
280 dict *blocking_keys; /* Keys with clients waiting for data (BLPOP) */
281 dict *io_keys; /* Keys with clients waiting for VM I/O */
282 dict *watched_keys; /* WATCHED keys for MULTI/EXEC CAS */
283 int id;
284} redisDb;
285
286/* Client MULTI/EXEC state */
287typedef struct multiCmd {
288 robj **argv;
289 int argc;
290 struct redisCommand *cmd;
291} multiCmd;
292
293typedef struct multiState {
294 multiCmd *commands; /* Array of MULTI commands */
295 int count; /* Total number of MULTI commands */
296} multiState;
297
298/* With multiplexing we need to take per-clinet state.
299 * Clients are taken in a liked list. */
300typedef struct redisClient {
301 int fd;
302 redisDb *db;
303 int dictid;
304 sds querybuf;
305 int argc;
306 robj **argv;
307 int reqtype;
308 int multibulklen; /* number of multi bulk arguments left to read */
309 long bulklen; /* length of bulk argument in multi bulk request */
310 list *reply;
311 int sentlen;
312 time_t lastinteraction; /* time of the last interaction, used for timeout */
313 int flags; /* REDIS_SLAVE | REDIS_MONITOR | REDIS_MULTI ... */
314 int slaveseldb; /* slave selected db, if this client is a slave */
315 int authenticated; /* when requirepass is non-NULL */
316 int replstate; /* replication state if this is a slave */
317 int repldbfd; /* replication DB file descriptor */
318 long repldboff; /* replication DB file offset */
319 off_t repldbsize; /* replication DB file size */
320 multiState mstate; /* MULTI/EXEC state */
321 robj **blocking_keys; /* The key we are waiting to terminate a blocking
322 * operation such as BLPOP. Otherwise NULL. */
323 int blocking_keys_num; /* Number of blocking keys */
324 time_t blockingto; /* Blocking operation timeout. If UNIX current time
325 * is >= blockingto then the operation timed out. */
326 list *io_keys; /* Keys this client is waiting to be loaded from the
327 * swap file in order to continue. */
328 list *watched_keys; /* Keys WATCHED for MULTI/EXEC CAS */
329 dict *pubsub_channels; /* channels a client is interested in (SUBSCRIBE) */
330 list *pubsub_patterns; /* patterns a client is interested in (SUBSCRIBE) */
331
332 /* Response buffer */
333 int bufpos;
334 char buf[REDIS_REPLY_CHUNK_BYTES];
335} redisClient;
336
/* One save point: a number of seconds paired with a number of changes. */
struct saveparam {
    time_t seconds;
    int changes;
};
341
342struct sharedObjectsStruct {
343 robj *crlf, *ok, *err, *emptybulk, *czero, *cone, *cnegone, *pong, *space,
344 *colon, *nullbulk, *nullmultibulk, *queued,
345 *emptymultibulk, *wrongtypeerr, *nokeyerr, *syntaxerr, *sameobjecterr,
346 *outofrangeerr, *loadingerr, *plus,
347 *select0, *select1, *select2, *select3, *select4,
348 *select5, *select6, *select7, *select8, *select9,
349 *messagebulk, *pmessagebulk, *subscribebulk, *unsubscribebulk, *mbulk3,
350 *mbulk4, *psubscribebulk, *punsubscribebulk,
351 *integers[REDIS_SHARED_INTEGERS];
352};
353
354/* Global server state structure */
355struct redisServer {
356 pthread_t mainthread;
357 int port;
358 char *bindaddr;
359 char *unixsocket;
360 int ipfd;
361 int sofd;
362 redisDb *db;
363 long long dirty; /* changes to DB from the last save */
364 long long dirty_before_bgsave; /* used to restore dirty on failed BGSAVE */
365 list *clients;
366 dict *commands; /* Command table hahs table */
367 /* RDB / AOF loading information */
368 int loading;
369 off_t loading_total_bytes;
370 off_t loading_loaded_bytes;
371 time_t loading_start_time;
372 /* Fast pointers to often looked up command */
373 struct redisCommand *delCommand, *multiCommand;
374 list *slaves, *monitors;
375 char neterr[ANET_ERR_LEN];
376 aeEventLoop *el;
377 int cronloops; /* number of times the cron function run */
378 time_t lastsave; /* Unix time of last save succeeede */
379 /* Fields used only for stats */
380 time_t stat_starttime; /* server start time */
381 long long stat_numcommands; /* number of processed commands */
382 long long stat_numconnections; /* number of connections received */
383 long long stat_expiredkeys; /* number of expired keys */
384 long long stat_keyspace_hits; /* number of successful lookups of keys */
385 long long stat_keyspace_misses; /* number of failed lookups of keys */
386 /* Configuration */
387 int verbosity;
388 int glueoutputbuf;
389 int maxidletime;
390 int dbnum;
391 int daemonize;
392 int appendonly;
393 int appendfsync;
394 int no_appendfsync_on_rewrite;
395 int shutdown_asap;
396 time_t lastfsync;
397 int appendfd;
398 int appendseldb;
399 char *pidfile;
400 pid_t bgsavechildpid;
401 pid_t bgrewritechildpid;
402 sds bgrewritebuf; /* buffer taken by parent during oppend only rewrite */
403 sds aofbuf; /* AOF buffer, written before entering the event loop */
404 struct saveparam *saveparams;
405 int saveparamslen;
406 char *logfile;
407 int syslog_enabled;
408 char *syslog_ident;
409 int syslog_facility;
410 char *dbfilename;
411 char *appendfilename;
412 char *requirepass;
413 int rdbcompression;
414 int activerehashing;
415 /* Replication related */
416 int isslave;
417 /* Slave specific fields */
418 char *masterauth;
419 char *masterhost;
420 int masterport;
421 redisClient *master; /* client that is master for this slave */
422 int replstate; /* replication status if the instance is a slave */
423 off_t repl_transfer_left; /* bytes left reading .rdb */
424 int repl_transfer_s; /* slave -> master SYNC socket */
425 int repl_transfer_fd; /* slave -> master SYNC temp file descriptor */
426 char *repl_transfer_tmpfile; /* slave-> master SYNC temp file name */
427 time_t repl_transfer_lastio; /* unix time of the latest read, for timeout */
428 int repl_serve_stale_data; /* Serve stale data when link is down? */
429 /* Limits */
430 unsigned int maxclients;
431 unsigned long long maxmemory;
432 int maxmemory_policy;
433 int maxmemory_samples;
434 /* Blocked clients */
435 unsigned int blpop_blocked_clients;
436 unsigned int vm_blocked_clients;
437 /* Sort parameters - qsort_r() is only available under BSD so we
438 * have to take this state global, in order to pass it to sortCompare() */
439 int sort_desc;
440 int sort_alpha;
441 int sort_bypattern;
442 /* Virtual memory configuration */
443 int vm_enabled;
444 char *vm_swap_file;
445 off_t vm_page_size;
446 off_t vm_pages;
447 unsigned long long vm_max_memory;
448 /* Zip structure config */
449 size_t hash_max_zipmap_entries;
450 size_t hash_max_zipmap_value;
451 size_t list_max_ziplist_entries;
452 size_t list_max_ziplist_value;
453 size_t set_max_intset_entries;
454 /* Virtual memory state */
455 FILE *vm_fp;
456 int vm_fd;
457 off_t vm_next_page; /* Next probably empty page */
458 off_t vm_near_pages; /* Number of pages allocated sequentially */
459 unsigned char *vm_bitmap; /* Bitmap of free/used pages */
460 time_t unixtime; /* Unix time sampled every second. */
461 /* Virtual memory I/O threads stuff */
462 /* An I/O thread process an element taken from the io_jobs queue and
463 * put the result of the operation in the io_done list. While the
464 * job is being processed, it's put on io_processing queue. */
465 list *io_newjobs; /* List of VM I/O jobs yet to be processed */
466 list *io_processing; /* List of VM I/O jobs being processed */
467 list *io_processed; /* List of VM I/O jobs already processed */
468 list *io_ready_clients; /* Clients ready to be unblocked. All keys loaded */
469 pthread_mutex_t io_mutex; /* lock to access io_jobs/io_done/io_thread_job */
470 pthread_mutex_t io_swapfile_mutex; /* So we can lseek + write */
471 pthread_attr_t io_threads_attr; /* attributes for threads creation */
472 int io_active_threads; /* Number of running I/O threads */
473 int vm_max_threads; /* Max number of I/O threads running at the same time */
474 /* Our main thread is blocked on the event loop, locking for sockets ready
475 * to be read or written, so when a threaded I/O operation is ready to be
476 * processed by the main thread, the I/O thread will use a unix pipe to
477 * awake the main thread. The followings are the two pipe FDs. */
478 int io_ready_pipe_read;
479 int io_ready_pipe_write;
480 /* Virtual memory stats */
481 unsigned long long vm_stats_used_pages;
482 unsigned long long vm_stats_swapped_objects;
483 unsigned long long vm_stats_swapouts;
484 unsigned long long vm_stats_swapins;
485 /* Pubsub */
486 dict *pubsub_channels; /* Map channels to list of subscribed clients */
487 list *pubsub_patterns; /* A list of pubsub_patterns */
488 /* Misc */
489 unsigned lruclock:22; /* clock incrementing every minute, for LRU */
490 unsigned lruclock_padding:10;
491};
492
493typedef struct pubsubPattern {
494 redisClient *client;
495 robj *pattern;
496} pubsubPattern;
497
498typedef void redisCommandProc(redisClient *c);
499typedef void redisVmPreloadProc(redisClient *c, struct redisCommand *cmd, int argc, robj **argv);
500struct redisCommand {
501 char *name;
502 redisCommandProc *proc;
503 int arity;
504 int flags;
505 /* Use a function to determine which keys need to be loaded
506 * in the background prior to executing this command. Takes precedence
507 * over vm_firstkey and others, ignored when NULL */
508 redisVmPreloadProc *vm_preload_proc;
509 /* What keys should be loaded in background when calling this command? */
510 int vm_firstkey; /* The first argument that's a key (0 = no keys) */
511 int vm_lastkey; /* THe last argument that's a key */
512 int vm_keystep; /* The step between first and last key */
513};
514
/* Associates a name with a value stored as an unsigned long 'pointer'. */
struct redisFunctionSym {
    char *name;
    unsigned long pointer;
};
519
520typedef struct _redisSortObject {
521 robj *obj;
522 union {
523 double score;
524 robj *cmpobj;
525 } u;
526} redisSortObject;
527
528typedef struct _redisSortOperation {
529 int type;
530 robj *pattern;
531} redisSortOperation;
532
533/* ZSETs use a specialized version of Skiplists */
534typedef struct zskiplistNode {
535 robj *obj;
536 double score;
537 struct zskiplistNode *backward;
538 struct zskiplistLevel {
539 struct zskiplistNode *forward;
540 unsigned int span;
541 } level[];
542} zskiplistNode;
543
/* A skiplist: header and tail nodes, a length, and a level. */
typedef struct zskiplist {
    struct zskiplistNode *header, *tail;
    unsigned long length;
    int level;
} zskiplist;
549
550typedef struct zset {
551 dict *dict;
552 zskiplist *zsl;
553} zset;
554
555/* VM threaded I/O request message */
556#define REDIS_IOJOB_LOAD 0 /* Load from disk to memory */
557#define REDIS_IOJOB_PREPARE_SWAP 1 /* Compute needed pages */
558#define REDIS_IOJOB_DO_SWAP 2 /* Swap from memory to disk */
559typedef struct iojob {
560 int type; /* Request type, REDIS_IOJOB_* */
561 redisDb *db;/* Redis database */
562 robj *key; /* This I/O request is about swapping this key */
563 robj *id; /* Unique identifier of this job:
564 this is the object to swap for REDIS_IOREQ_*_SWAP, or the
565 vmpointer objct for REDIS_IOREQ_LOAD. */
566 robj *val; /* the value to swap for REDIS_IOREQ_*_SWAP, otherwise this
567 * field is populated by the I/O thread for REDIS_IOREQ_LOAD. */
568 off_t page; /* Swap page where to read/write the object */
569 off_t pages; /* Swap pages needed to save object. PREPARE_SWAP return val */
570 int canceled; /* True if this command was canceled by blocking side of VM */
571 pthread_t thread; /* ID of the thread processing this entry */
572} iojob;
573
574/* Structure to hold list iteration abstraction. */
575typedef struct {
576 robj *subject;
577 unsigned char encoding;
578 unsigned char direction; /* Iteration direction */
579 unsigned char *zi;
580 listNode *ln;
581} listTypeIterator;
582
583/* Structure for an entry while iterating over a list. */
584typedef struct {
585 listTypeIterator *li;
586 unsigned char *zi; /* Entry in ziplist */
587 listNode *ln; /* Entry in linked list */
588} listTypeEntry;
589
590/* Structure to hold set iteration abstraction. */
591typedef struct {
592 robj *subject;
593 int encoding;
594 int ii; /* intset iterator */
595 dictIterator *di;
596} setTypeIterator;
597
598/* Structure to hold hash iteration abstration. Note that iteration over
599 * hashes involves both fields and values. Because it is possible that
600 * not both are required, store pointers in the iterator to avoid
601 * unnecessary memory allocation for fields/values. */
602typedef struct {
603 int encoding;
604 unsigned char *zi;
605 unsigned char *zk, *zv;
606 unsigned int zklen, zvlen;
607
608 dictIterator *di;
609 dictEntry *de;
610} hashTypeIterator;
611
/* Selectors for the field or the value of a hash entry. */
#define REDIS_HASH_KEY 1
#define REDIS_HASH_VALUE 2
614
615/*-----------------------------------------------------------------------------
616 * Extern declarations
617 *----------------------------------------------------------------------------*/
618
619extern struct redisServer server;
620extern struct sharedObjectsStruct shared;
621extern dictType setDictType;
622extern dictType zsetDictType;
623extern double R_Zero, R_PosInf, R_NegInf, R_Nan;
624dictType hashDictType;
625
626/*-----------------------------------------------------------------------------
627 * Functions prototypes
628 *----------------------------------------------------------------------------*/
629
630/* networking.c -- Networking and Client related operations */
631redisClient *createClient(int fd);
632void closeTimedoutClients(void);
633void freeClient(redisClient *c);
634void resetClient(redisClient *c);
635void sendReplyToClient(aeEventLoop *el, int fd, void *privdata, int mask);
636void sendReplyToClientWritev(aeEventLoop *el, int fd, void *privdata, int mask);
637void addReply(redisClient *c, robj *obj);
638void *addDeferredMultiBulkLength(redisClient *c);
639void setDeferredMultiBulkLength(redisClient *c, void *node, long length);
640void addReplySds(redisClient *c, sds s);
641void processInputBuffer(redisClient *c);
642void acceptTcpHandler(aeEventLoop *el, int fd, void *privdata, int mask);
643void acceptUnixHandler(aeEventLoop *el, int fd, void *privdata, int mask);
644void readQueryFromClient(aeEventLoop *el, int fd, void *privdata, int mask);
645void addReplyBulk(redisClient *c, robj *obj);
646void addReplyBulkCString(redisClient *c, char *s);
647void addReplyBulkCBuffer(redisClient *c, void *p, size_t len);
648void addReplyBulkLongLong(redisClient *c, long long ll);
649void acceptHandler(aeEventLoop *el, int fd, void *privdata, int mask);
650void addReply(redisClient *c, robj *obj);
651void addReplySds(redisClient *c, sds s);
652void addReplyError(redisClient *c, char *err);
653void addReplyStatus(redisClient *c, char *status);
654void addReplyDouble(redisClient *c, double d);
655void addReplyLongLong(redisClient *c, long long ll);
656void addReplyMultiBulkLen(redisClient *c, long length);
657void *dupClientReplyValue(void *o);
658
659#ifdef __GNUC__
660void addReplyErrorFormat(redisClient *c, const char *fmt, ...)
661 __attribute__((format(printf, 2, 3)));
662void addReplyStatusFormat(redisClient *c, const char *fmt, ...)
663 __attribute__((format(printf, 2, 3)));
664#else
665void addReplyErrorFormat(redisClient *c, const char *fmt, ...);
666void addReplyStatusFormat(redisClient *c, const char *fmt, ...);
667#endif
668
669/* List data type */
670void listTypeTryConversion(robj *subject, robj *value);
671void listTypePush(robj *subject, robj *value, int where);
672robj *listTypePop(robj *subject, int where);
673unsigned long listTypeLength(robj *subject);
674listTypeIterator *listTypeInitIterator(robj *subject, int index, unsigned char direction);
675void listTypeReleaseIterator(listTypeIterator *li);
676int listTypeNext(listTypeIterator *li, listTypeEntry *entry);
677robj *listTypeGet(listTypeEntry *entry);
678void listTypeInsert(listTypeEntry *entry, robj *value, int where);
679int listTypeEqual(listTypeEntry *entry, robj *o);
680void listTypeDelete(listTypeEntry *entry);
681void listTypeConvert(robj *subject, int enc);
682void unblockClientWaitingData(redisClient *c);
683int handleClientsWaitingListPush(redisClient *c, robj *key, robj *ele);
684void popGenericCommand(redisClient *c, int where);
685
686/* MULTI/EXEC/WATCH... */
687void unwatchAllKeys(redisClient *c);
688void initClientMultiState(redisClient *c);
689void freeClientMultiState(redisClient *c);
690void queueMultiCommand(redisClient *c, struct redisCommand *cmd);
691void touchWatchedKey(redisDb *db, robj *key);
692void touchWatchedKeysOnFlush(int dbid);
693
694/* Redis object implementation */
695void decrRefCount(void *o);
696void incrRefCount(robj *o);
697void freeStringObject(robj *o);
698void freeListObject(robj *o);
699void freeSetObject(robj *o);
700void freeZsetObject(robj *o);
701void freeHashObject(robj *o);
702robj *createObject(int type, void *ptr);
703robj *createStringObject(char *ptr, size_t len);
704robj *dupStringObject(robj *o);
705robj *tryObjectEncoding(robj *o);
706robj *getDecodedObject(robj *o);
707size_t stringObjectLen(robj *o);
708robj *createStringObjectFromLongLong(long long value);
709robj *createListObject(void);
710robj *createZiplistObject(void);
711robj *createSetObject(void);
712robj *createIntsetObject(void);
713robj *createHashObject(void);
714robj *createZsetObject(void);
715int getLongFromObjectOrReply(redisClient *c, robj *o, long *target, const char *msg);
716int checkType(redisClient *c, robj *o, int type);
717int getLongLongFromObjectOrReply(redisClient *c, robj *o, long long *target, const char *msg);
718int getDoubleFromObjectOrReply(redisClient *c, robj *o, double *target, const char *msg);
719int getLongLongFromObject(robj *o, long long *target);
720char *strEncoding(int encoding);
721int compareStringObjects(robj *a, robj *b);
722int equalStringObjects(robj *a, robj *b);
723unsigned long estimateObjectIdleTime(robj *o);
724
725/* Synchronous I/O with timeout */
726int syncWrite(int fd, char *ptr, ssize_t size, int timeout);
727int syncRead(int fd, char *ptr, ssize_t size, int timeout);
728int syncReadLine(int fd, char *ptr, ssize_t size, int timeout);
729int fwriteBulkString(FILE *fp, char *s, unsigned long len);
730int fwriteBulkDouble(FILE *fp, double d);
731int fwriteBulkLongLong(FILE *fp, long long l);
732int fwriteBulkObject(FILE *fp, robj *obj);
733
734/* Replication */
735void replicationFeedSlaves(list *slaves, int dictid, robj **argv, int argc);
736void replicationFeedMonitors(list *monitors, int dictid, robj **argv, int argc);
737int syncWithMaster(void);
738void updateSlavesWaitingBgsave(int bgsaveerr);
739void replicationCron(void);
740
/* Generic persistence functions */
void startLoading(FILE *fp);
void loadingProgress(off_t pos);
void stopLoading(void);
745
746/* RDB persistence */
747int rdbLoad(char *filename);
748int rdbSaveBackground(char *filename);
749void rdbRemoveTempFile(pid_t childpid);
750int rdbSave(char *filename);
751int rdbSaveObject(FILE *fp, robj *o);
752off_t rdbSavedObjectLen(robj *o);
753off_t rdbSavedObjectPages(robj *o);
754robj *rdbLoadObject(int type, FILE *fp);
755void backgroundSaveDoneHandler(int statloc);
756
757/* AOF persistence */
758void flushAppendOnlyFile(void);
759void feedAppendOnlyFile(struct redisCommand *cmd, int dictid, robj **argv, int argc);
760void aofRemoveTempFile(pid_t childpid);
761int rewriteAppendOnlyFileBackground(void);
762int loadAppendOnlyFile(char *filename);
763void stopAppendOnly(void);
764int startAppendOnly(void);
765void backgroundRewriteDoneHandler(int statloc);
766
767/* Sorted sets data type */
768zskiplist *zslCreate(void);
769void zslFree(zskiplist *zsl);
770zskiplistNode *zslInsert(zskiplist *zsl, double score, robj *obj);
771
772/* Core functions */
773void freeMemoryIfNeeded(void);
774int processCommand(redisClient *c);
775void setupSigSegvAction(void);
776struct redisCommand *lookupCommand(sds name);
777struct redisCommand *lookupCommandByCString(char *s);
778void call(redisClient *c, struct redisCommand *cmd);
779int prepareForShutdown();
780void redisLog(int level, const char *fmt, ...);
781void usage();
782void updateDictResizePolicy(void);
783int htNeedsResize(dict *dict);
784void oom(const char *msg);
785void populateCommandTable(void);
786
787/* Virtual Memory (prototypes only). Pages are passed as off_t; iojob and vmpointer are declared outside this section. */
788void vmInit(void);
789void vmMarkPagesFree(off_t page, off_t count); /* page and count are both off_t */
790robj *vmLoadObject(robj *o);
791robj *vmPreviewObject(robj *o);
792int vmSwapOneObjectBlocking(void);
793int vmSwapOneObjectThreaded(void);
794int vmCanSwapOut(void);
795void vmThreadedIOCompletedJob(aeEventLoop *el, int fd, void *privdata, int mask); /* (loop, fd, privdata, mask): presumably an ae.h file-event callback -- confirm */
796void vmCancelThreadedIOJob(robj *o);
797void lockThreadedIO(void);
798void unlockThreadedIO(void);
799int vmSwapObjectThreaded(robj *key, robj *val, redisDb *db);
800void freeIOJob(iojob *j);
801void queueIOJob(iojob *j);
802int vmWriteObjectOnSwap(robj *o, off_t page);
803robj *vmReadObjectFromSwap(off_t page, int type);
804void waitEmptyIOJobsQueue(void);
805void vmReopenSwapFile(void);
806int vmFreePage(off_t page);
807void zunionInterBlockClientOnSwappedKeys(redisClient *c, struct redisCommand *cmd, int argc, robj **argv); /* note: argc precedes argv here, unlike feedAppendOnlyFile() */
808void execBlockClientOnSwappedKeys(redisClient *c, struct redisCommand *cmd, int argc, robj **argv); /* same (c, cmd, argc, argv) signature as the line above */
809int blockClientOnSwappedKeys(redisClient *c, struct redisCommand *cmd);
810int dontWaitForSwappedKey(redisClient *c, robj *key);
811void handleClientsBlockedOnSwappedKey(redisDb *db, robj *key);
812vmpointer *vmSwapObjectBlocking(robj *val); /* returns a vmpointer pointer; ownership is not documented here */
813
814/* Set data type (prototypes only; setTypeIterator is declared outside this section) */
815robj *setTypeCreate(robj *value);
816int setTypeAdd(robj *subject, robj *value); /* int result; its meaning is not visible in this header */
817int setTypeRemove(robj *subject, robj *value);
818int setTypeIsMember(robj *subject, robj *value);
819setTypeIterator *setTypeInitIterator(robj *subject); /* presumably paired with setTypeReleaseIterator() -- confirm */
820void setTypeReleaseIterator(setTypeIterator *si);
821robj *setTypeNext(setTypeIterator *si); /* returns an robj pointer; the end-of-iteration value is not documented here */
822robj *setTypeRandomElement(robj *subject);
823unsigned long setTypeSize(robj *subject);
824void setTypeConvert(robj *subject, int enc); /* enc: presumably one of the object encoding constants -- confirm */
825
826/* Hash data type (prototypes only; hashTypeIterator is declared outside this section) */
827void convertToRealHash(robj *o);
828void hashTypeTryConversion(robj *subject, robj **argv, int start, int end); /* start/end: presumably index bounds into argv; inclusiveness is not visible here */
829void hashTypeTryObjectEncoding(robj *subject, robj **o1, robj **o2); /* o1/o2 are passed by address, so the callee can replace them */
830robj *hashTypeGet(robj *o, robj *key);
831int hashTypeExists(robj *o, robj *key);
832int hashTypeSet(robj *o, robj *key, robj *value);
833int hashTypeDelete(robj *o, robj *key);
834unsigned long hashTypeLength(robj *o);
835hashTypeIterator *hashTypeInitIterator(robj *subject); /* presumably paired with hashTypeReleaseIterator() -- confirm */
836void hashTypeReleaseIterator(hashTypeIterator *hi);
837int hashTypeNext(hashTypeIterator *hi); /* int result; the end-of-iteration value is not visible in this header */
838robj *hashTypeCurrent(hashTypeIterator *hi, int what); /* what: presumably selects key or value -- confirm */
839robj *hashTypeLookupWriteOrCreate(redisClient *c, robj *key);
840
841/* Pub / Sub (prototypes only) */
842int pubsubUnsubscribeAllChannels(redisClient *c, int notify); /* int result; presumably a count -- confirm in the definition */
843int pubsubUnsubscribeAllPatterns(redisClient *c, int notify); /* same signature as the channel variant above */
844void freePubsubPattern(void *p); /* void * parameter: presumably a list free callback (adlist.h) -- confirm */
845int listMatchPubsubPattern(void *a, void *b); /* void * parameters: presumably a list match callback (adlist.h) -- confirm */
846
847/* Utility functions (prototypes only) */
848int stringmatchlen(const char *pattern, int patternLen,
849 const char *string, int stringLen, int nocase); /* both inputs carry explicit int lengths; nocase is an int flag */
850int stringmatch(const char *pattern, const char *string, int nocase); /* no length arguments, unlike stringmatchlen() */
851long long memtoll(const char *p, int *err); /* err is passed by pointer; presumably set on a parse failure -- confirm */
852int ll2string(char *s, size_t len, long long value); /* s/len: presumably the destination buffer and its capacity -- confirm */
853int isStringRepresentableAsLong(sds s, long *longval); /* longval is passed by pointer (out-parameter shape) */
854int isStringRepresentableAsLongLong(sds s, long long *longval);
855int isObjectRepresentableAsLongLong(robj *o, long long *llongval);
856
857/* Configuration (prototypes only) */
858void loadServerConfig(char *filename);
859void appendServerSaveParams(time_t seconds, int changes); /* one (seconds, changes) pair per call */
860void resetServerSaveParams(void); /* (void): an explicit zero-argument prototype; an empty () leaves the parameters unspecified before C23 */
861
862/* db.c -- Keyspace access API (prototypes only) */
863int removeExpire(redisDb *db, robj *key);
864void propagateExpire(redisDb *db, robj *key);
865int expireIfNeeded(redisDb *db, robj *key);
866time_t getExpire(redisDb *db, robj *key); /* result is a time_t; the "no expire" value is not visible in this header */
867void setExpire(redisDb *db, robj *key, time_t when); /* when is a time_t, the type getExpire() returns */
868robj *lookupKey(redisDb *db, robj *key);
869robj *lookupKeyRead(redisDb *db, robj *key);
870robj *lookupKeyWrite(redisDb *db, robj *key);
871robj *lookupKeyReadOrReply(redisClient *c, robj *key, robj *reply); /* takes the client and a reply object instead of a db */
872robj *lookupKeyWriteOrReply(redisClient *c, robj *key, robj *reply);
873int dbAdd(redisDb *db, robj *key, robj *val);
874int dbReplace(redisDb *db, robj *key, robj *val);
875int dbExists(redisDb *db, robj *key);
876robj *dbRandomKey(redisDb *db);
877int dbDelete(redisDb *db, robj *key);
878long long emptyDb(void); /* (void): an explicit zero-argument prototype; an empty () leaves the parameters unspecified before C23 */
879int selectDb(redisClient *c, int id);
880
881/* Git SHA1 (prototypes only): both functions return a char *; string ownership is not documented here */
882char *redisGitSHA1(void);
883char *redisGitDirty(void);
884
885/* Commands prototypes: every handler declared here has the shape void name(redisClient *c) */
886void authCommand(redisClient *c);
887void pingCommand(redisClient *c);
888void echoCommand(redisClient *c);
889void setCommand(redisClient *c);
890void setnxCommand(redisClient *c);
891void setexCommand(redisClient *c);
892void getCommand(redisClient *c);
893void delCommand(redisClient *c);
894void existsCommand(redisClient *c);
895void incrCommand(redisClient *c);
896void decrCommand(redisClient *c);
897void incrbyCommand(redisClient *c);
898void decrbyCommand(redisClient *c);
899void selectCommand(redisClient *c);
900void randomkeyCommand(redisClient *c);
901void keysCommand(redisClient *c);
902void dbsizeCommand(redisClient *c);
903void lastsaveCommand(redisClient *c);
904void saveCommand(redisClient *c);
905void bgsaveCommand(redisClient *c);
906void bgrewriteaofCommand(redisClient *c);
907void shutdownCommand(redisClient *c);
908void moveCommand(redisClient *c);
909void renameCommand(redisClient *c);
910void renamenxCommand(redisClient *c);
911void lpushCommand(redisClient *c);
912void rpushCommand(redisClient *c);
913void lpushxCommand(redisClient *c);
914void rpushxCommand(redisClient *c);
915void linsertCommand(redisClient *c);
916void lpopCommand(redisClient *c);
917void rpopCommand(redisClient *c);
918void llenCommand(redisClient *c);
919void lindexCommand(redisClient *c);
920void lrangeCommand(redisClient *c);
921void ltrimCommand(redisClient *c);
922void typeCommand(redisClient *c);
923void lsetCommand(redisClient *c);
924void saddCommand(redisClient *c);
925void sremCommand(redisClient *c);
926void smoveCommand(redisClient *c);
927void sismemberCommand(redisClient *c);
928void scardCommand(redisClient *c);
929void spopCommand(redisClient *c);
930void srandmemberCommand(redisClient *c);
931void sinterCommand(redisClient *c);
932void sinterstoreCommand(redisClient *c);
933void sunionCommand(redisClient *c);
934void sunionstoreCommand(redisClient *c);
935void sdiffCommand(redisClient *c);
936void sdiffstoreCommand(redisClient *c);
937void syncCommand(redisClient *c);
938void flushdbCommand(redisClient *c);
939void flushallCommand(redisClient *c);
940void sortCommand(redisClient *c);
941void lremCommand(redisClient *c);
942void rpoplpushcommand(redisClient *c); /* NOTE(review): lowercase "command" breaks the *Command naming used by every other handler; a rename must change the definition and its users together */
943void infoCommand(redisClient *c);
944void mgetCommand(redisClient *c);
945void monitorCommand(redisClient *c);
946void expireCommand(redisClient *c);
947void expireatCommand(redisClient *c);
948void getsetCommand(redisClient *c);
949void ttlCommand(redisClient *c);
950void persistCommand(redisClient *c);
951void slaveofCommand(redisClient *c);
952void debugCommand(redisClient *c);
953void msetCommand(redisClient *c);
954void msetnxCommand(redisClient *c);
955void zaddCommand(redisClient *c);
956void zincrbyCommand(redisClient *c);
957void zrangeCommand(redisClient *c);
958void zrangebyscoreCommand(redisClient *c);
959void zrevrangebyscoreCommand(redisClient *c);
960void zcountCommand(redisClient *c);
961void zrevrangeCommand(redisClient *c);
962void zcardCommand(redisClient *c);
963void zremCommand(redisClient *c);
964void zscoreCommand(redisClient *c);
965void zremrangebyscoreCommand(redisClient *c);
966void multiCommand(redisClient *c);
967void execCommand(redisClient *c);
968void discardCommand(redisClient *c);
969void blpopCommand(redisClient *c);
970void brpopCommand(redisClient *c);
971void appendCommand(redisClient *c);
972void substrCommand(redisClient *c);
973void strlenCommand(redisClient *c);
974void zrankCommand(redisClient *c);
975void zrevrankCommand(redisClient *c);
976void hsetCommand(redisClient *c);
977void hsetnxCommand(redisClient *c);
978void hgetCommand(redisClient *c);
979void hmsetCommand(redisClient *c);
980void hmgetCommand(redisClient *c);
981void hdelCommand(redisClient *c);
982void hlenCommand(redisClient *c);
983void zremrangebyrankCommand(redisClient *c);
984void zunionstoreCommand(redisClient *c);
985void zinterstoreCommand(redisClient *c);
986void hkeysCommand(redisClient *c);
987void hvalsCommand(redisClient *c);
988void hgetallCommand(redisClient *c);
989void hexistsCommand(redisClient *c);
990void configCommand(redisClient *c);
991void hincrbyCommand(redisClient *c);
992void subscribeCommand(redisClient *c);
993void unsubscribeCommand(redisClient *c);
994void psubscribeCommand(redisClient *c);
995void punsubscribeCommand(redisClient *c);
996void publishCommand(redisClient *c);
997void watchCommand(redisClient *c);
998void unwatchCommand(redisClient *c);
999
1000#if defined(__GNUC__) /* GNU-compatible compilers only: the redeclarations below use __attribute__ */
1001void *calloc(size_t count, size_t size) __attribute__ ((deprecated)); /* "deprecated" makes the compiler warn at each direct use */
1002void free(void *ptr) __attribute__ ((deprecated)); /* presumably steers callers to the zmalloc.h wrappers included by this header -- confirm */
1003void *malloc(size_t size) __attribute__ ((deprecated));
1004void *realloc(void *ptr, size_t size) __attribute__ ((deprecated));
1005#endif /* __GNUC__ */
1006
1007#endif