]>
git.saurik.com Git - redis.git/blob - src/ziplist.c
1c492f25dac15f814ffda5e7f061a4159e69af31
1 /* The ziplist is a specially encoded dually linked list that is designed
2 * to be very memory efficient. It stores both strings and integer values,
3 * where integers are encoded as actual integers instead of a series of
4 * characters. It allows push and pop operations on either side of the list
5 * in O(1) time. However, because every operation requires a reallocation of
6 * the memory used by the ziplist, the actual complexity is related to the
7 * amount of memory used by the ziplist.
9 * ----------------------------------------------------------------------------
11 * ZIPLIST OVERALL LAYOUT:
12 * The general layout of the ziplist is as follows:
13 * <zlbytes><zltail><zllen><entry><entry><zlend>
15 * <zlbytes> is an unsigned integer to hold the number of bytes that the
16 * ziplist occupies. This value needs to be stored to be able to resize the
17 * entire structure without the need to traverse it first.
19 * <zltail> is the offset to the last entry in the list. This allows a pop
20 * operation on the far side of the list without the need for full traversal.
22 * <zllen> is the number of entries.When this value is larger than 2**16-2,
23 * we need to traverse the entire list to know how many items it holds.
25 * <zlend> is a single byte special value, equal to 255, which indicates the
29 * Every entry in the ziplist is prefixed by a header that contains two pieces
30 * of information. First, the length of the previous entry is stored to be
31 * able to traverse the list from back to front. Second, the encoding with an
32 * optional string length of the entry itself is stored.
34 * The length of the previous entry is encoded in the following way:
35 * If this length is smaller than 254 bytes, it will only consume a single
36 * byte that takes the length as value. When the length is greater than or
37 * equal to 254, it will consume 5 bytes. The first byte is set to 254 to
38 * indicate a larger value is following. The remaining 4 bytes take the
39 * length of the previous entry as value.
41 * The other header field of the entry itself depends on the contents of the
42 * entry. When the entry is a string, the first 2 bits of this header will hold
43 * the type of encoding used to store the length of the string, followed by the
44 * actual length of the string. When the entry is an integer the first 2 bits
45 * are both set to 1. The following 2 bits are used to specify what kind of
46 * integer will be stored after this header. An overview of the different
47 * types and encodings is as follows:
50 * String value with length less than or equal to 63 bytes (6 bits).
51 * |01pppppp|qqqqqqqq| - 2 bytes
52 * String value with length less than or equal to 16383 bytes (14 bits).
53 * |10______|qqqqqqqq|rrrrrrrr|ssssssss|tttttttt| - 5 bytes
54 * String value with length greater than or equal to 16384 bytes.
56 * Integer encoded as int16_t (2 bytes).
58 * Integer encoded as int32_t (4 bytes).
60 * Integer encoded as int64_t (8 bytes).
73 int ll2string(char *s
, size_t len
, long long value
);
76 #define ZIP_BIGLEN 254
78 /* Different encoding/length possibilities */
79 #define ZIP_STR_06B (0 << 6)
80 #define ZIP_STR_14B (1 << 6)
81 #define ZIP_STR_32B (2 << 6)
82 #define ZIP_INT_16B (0xc0 | 0<<4)
83 #define ZIP_INT_32B (0xc0 | 1<<4)
84 #define ZIP_INT_64B (0xc0 | 2<<4)
86 /* Macro's to determine type */
87 #define ZIP_IS_STR(enc) (((enc) & 0xc0) < 0xc0)
88 #define ZIP_IS_INT(enc) (!ZIP_IS_STR(enc) && ((enc) & 0x30) < 0x30)
91 #define ZIPLIST_BYTES(zl) (*((uint32_t*)(zl)))
92 #define ZIPLIST_TAIL_OFFSET(zl) (*((uint32_t*)((zl)+sizeof(uint32_t))))
93 #define ZIPLIST_LENGTH(zl) (*((uint16_t*)((zl)+sizeof(uint32_t)*2)))
94 #define ZIPLIST_HEADER_SIZE (sizeof(uint32_t)*2+sizeof(uint16_t))
95 #define ZIPLIST_ENTRY_HEAD(zl) ((zl)+ZIPLIST_HEADER_SIZE)
96 #define ZIPLIST_ENTRY_TAIL(zl) ((zl)+ZIPLIST_TAIL_OFFSET(zl))
97 #define ZIPLIST_ENTRY_END(zl) ((zl)+ZIPLIST_BYTES(zl)-1)
99 /* We know a positive increment can only be 1 because entries can only be
100 * pushed one at a time. */
101 #define ZIPLIST_INCR_LENGTH(zl,incr) { \
102 if (ZIPLIST_LENGTH(zl) < UINT16_MAX) ZIPLIST_LENGTH(zl)+=incr; }
104 typedef struct zlentry
{
105 unsigned int prevrawlensize
, prevrawlen
;
106 unsigned int lensize
, len
;
107 unsigned int headersize
;
108 unsigned char encoding
;
112 /* Return the encoding pointer to by 'p'. */
113 static unsigned int zipEntryEncoding(unsigned char *p
) {
114 /* String encoding: 2 MSBs */
115 unsigned char b
= p
[0] & 0xc0;
119 /* Integer encoding: 4 MSBs */
126 /* Return bytes needed to store integer encoded by 'encoding' */
127 static unsigned int zipIntSize(unsigned char encoding
) {
129 case ZIP_INT_16B
: return sizeof(int16_t);
130 case ZIP_INT_32B
: return sizeof(int32_t);
131 case ZIP_INT_64B
: return sizeof(int64_t);
137 /* Decode the encoded length pointed by 'p'. If a pointer to 'lensize' is
138 * provided, it is set to the number of bytes required to encode the length. */
139 static unsigned int zipDecodeLength(unsigned char *p
, unsigned int *lensize
) {
140 unsigned char encoding
= zipEntryEncoding(p
);
141 unsigned int len
= 0;
143 if (ZIP_IS_STR(encoding
)) {
147 if (lensize
) *lensize
= 1;
150 len
= ((p
[0] & 0x3f) << 8) | p
[1];
151 if (lensize
) *lensize
= 2;
154 len
= (p
[1] << 24) | (p
[2] << 16) | (p
[3] << 8) | p
[4];
155 if (lensize
) *lensize
= 5;
161 len
= zipIntSize(encoding
);
162 if (lensize
) *lensize
= 1;
167 /* Encode the length 'l' writing it in 'p'. If p is NULL it just returns
168 * the amount of bytes required to encode such a length. */
169 static unsigned int zipEncodeLength(unsigned char *p
, unsigned char encoding
, unsigned int rawlen
) {
170 unsigned char len
= 1, buf
[5];
172 if (ZIP_IS_STR(encoding
)) {
173 /* Although encoding is given it may not be set for strings,
174 * so we determine it here using the raw length. */
175 if (rawlen
<= 0x3f) {
177 buf
[0] = ZIP_STR_06B
| rawlen
;
178 } else if (rawlen
<= 0x3fff) {
181 buf
[0] = ZIP_STR_14B
| ((rawlen
>> 8) & 0x3f);
182 buf
[1] = rawlen
& 0xff;
186 buf
[0] = ZIP_STR_32B
;
187 buf
[1] = (rawlen
>> 24) & 0xff;
188 buf
[2] = (rawlen
>> 16) & 0xff;
189 buf
[3] = (rawlen
>> 8) & 0xff;
190 buf
[4] = rawlen
& 0xff;
193 /* Implies integer encoding, so length is always 1. */
198 /* Store this length at p */
203 /* Decode the length of the previous element stored at "p". */
204 static unsigned int zipPrevDecodeLength(unsigned char *p
, unsigned int *lensize
) {
205 unsigned int len
= *p
;
206 if (len
< ZIP_BIGLEN
) {
207 if (lensize
) *lensize
= 1;
209 if (lensize
) *lensize
= 1+sizeof(len
);
210 memcpy(&len
,p
+1,sizeof(len
));
216 /* Encode the length of the previous entry and write it to "p". Return the
217 * number of bytes needed to encode this length if "p" is NULL. */
218 static unsigned int zipPrevEncodeLength(unsigned char *p
, unsigned int len
) {
220 return (len
< ZIP_BIGLEN
) ? 1 : sizeof(len
)+1;
222 if (len
< ZIP_BIGLEN
) {
227 memcpy(p
+1,&len
,sizeof(len
));
229 return 1+sizeof(len
);
234 /* Encode the length of the previous entry and write it to "p". This only
235 * uses the larger encoding (required in __ziplistCascadeUpdate). */
236 static void zipPrevEncodeLengthForceLarge(unsigned char *p
, unsigned int len
) {
237 if (p
== NULL
) return;
239 memcpy(p
+1,&len
,sizeof(len
));
243 /* Return the difference in number of bytes needed to store the new length
244 * "len" on the entry pointed to by "p". */
245 static int zipPrevLenByteDiff(unsigned char *p
, unsigned int len
) {
246 unsigned int prevlensize
;
247 zipPrevDecodeLength(p
,&prevlensize
);
248 return zipPrevEncodeLength(NULL
,len
)-prevlensize
;
251 /* Check if string pointed to by 'entry' can be encoded as an integer.
252 * Stores the integer value in 'v' and its encoding in 'encoding'. */
253 static int zipTryEncoding(unsigned char *entry
, unsigned int entrylen
, long long *v
, unsigned char *encoding
) {
258 if (entrylen
>= 32 || entrylen
== 0) return 0;
259 if (entry
[0] == '-' || (entry
[0] >= '0' && entry
[0] <= '9')) {
262 /* Perform a back-and-forth conversion to make sure that
263 * the string turned into an integer is not losing any info. */
264 memcpy(buf
,entry
,entrylen
);
265 buf
[entrylen
] = '\0';
266 value
= strtoll(buf
,&eptr
,10);
267 if (eptr
[0] != '\0') return 0;
268 slen
= ll2string(buf
,32,value
);
269 if (entrylen
!= (unsigned)slen
|| memcmp(buf
,entry
,slen
)) return 0;
271 /* Great, the string can be encoded. Check what's the smallest
272 * of our encoding types that can hold this value. */
273 if (value
>= INT16_MIN
&& value
<= INT16_MAX
) {
274 *encoding
= ZIP_INT_16B
;
275 } else if (value
>= INT32_MIN
&& value
<= INT32_MAX
) {
276 *encoding
= ZIP_INT_32B
;
278 *encoding
= ZIP_INT_64B
;
286 /* Store integer 'value' at 'p', encoded as 'encoding' */
287 static void zipSaveInteger(unsigned char *p
, int64_t value
, unsigned char encoding
) {
291 if (encoding
== ZIP_INT_16B
) {
293 memcpy(p
,&i16
,sizeof(i16
));
295 } else if (encoding
== ZIP_INT_32B
) {
297 memcpy(p
,&i32
,sizeof(i32
));
299 } else if (encoding
== ZIP_INT_64B
) {
301 memcpy(p
,&i64
,sizeof(i64
));
308 /* Read integer encoded as 'encoding' from 'p' */
309 static int64_t zipLoadInteger(unsigned char *p
, unsigned char encoding
) {
312 int64_t i64
, ret
= 0;
313 if (encoding
== ZIP_INT_16B
) {
314 memcpy(&i16
,p
,sizeof(i16
));
317 } else if (encoding
== ZIP_INT_32B
) {
318 memcpy(&i32
,p
,sizeof(i32
));
321 } else if (encoding
== ZIP_INT_64B
) {
322 memcpy(&i64
,p
,sizeof(i64
));
331 /* Return a struct with all information about an entry. */
332 static zlentry
zipEntry(unsigned char *p
) {
334 e
.prevrawlen
= zipPrevDecodeLength(p
,&e
.prevrawlensize
);
335 e
.len
= zipDecodeLength(p
+e
.prevrawlensize
,&e
.lensize
);
336 e
.headersize
= e
.prevrawlensize
+e
.lensize
;
337 e
.encoding
= zipEntryEncoding(p
+e
.prevrawlensize
);
342 /* Return the total number of bytes used by the entry at "p". */
343 static unsigned int zipRawEntryLength(unsigned char *p
) {
344 zlentry e
= zipEntry(p
);
345 return e
.headersize
+ e
.len
;
348 /* Create a new empty ziplist. */
349 unsigned char *ziplistNew(void) {
350 unsigned int bytes
= ZIPLIST_HEADER_SIZE
+1;
351 unsigned char *zl
= zmalloc(bytes
);
352 ZIPLIST_BYTES(zl
) = bytes
;
353 ZIPLIST_TAIL_OFFSET(zl
) = ZIPLIST_HEADER_SIZE
;
354 ZIPLIST_LENGTH(zl
) = 0;
355 zl
[bytes
-1] = ZIP_END
;
359 /* Resize the ziplist. */
360 static unsigned char *ziplistResize(unsigned char *zl
, unsigned int len
) {
361 zl
= zrealloc(zl
,len
);
362 ZIPLIST_BYTES(zl
) = len
;
367 /* When an entry is inserted, we need to set the prevlen field of the next
368 * entry to equal the length of the inserted entry. It can occur that this
369 * length cannot be encoded in 1 byte and the next entry needs to be grow
370 * a bit larger to hold the 5-byte encoded prevlen. This can be done for free,
371 * because this only happens when an entry is already being inserted (which
372 * causes a realloc and memmove). However, encoding the prevlen may require
373 * that this entry is grown as well. This effect may cascade throughout
374 * the ziplist when there are consecutive entries with a size close to
375 * ZIP_BIGLEN, so we need to check that the prevlen can be encoded in every
378 * Note that this effect can also happen in reverse, where the bytes required
379 * to encode the prevlen field can shrink. This effect is deliberately ignored,
380 * because it can cause a "flapping" effect where a chain prevlen fields is
381 * first grown and then shrunk again after consecutive inserts. Rather, the
382 * field is allowed to stay larger than necessary, because a large prevlen
383 * field implies the ziplist is holding large entries anyway.
385 * The pointer "p" points to the first entry that does NOT need to be
386 * updated, i.e. consecutive fields MAY need an update. */
387 static unsigned char *__ziplistCascadeUpdate(unsigned char *zl
, unsigned char *p
) {
388 size_t curlen
= ZIPLIST_BYTES(zl
), rawlen
, rawlensize
;
389 size_t offset
, noffset
, extra
;
393 while (p
[0] != ZIP_END
) {
395 rawlen
= cur
.headersize
+ cur
.len
;
396 rawlensize
= zipPrevEncodeLength(NULL
,rawlen
);
398 /* Abort if there is no next entry. */
399 if (p
[rawlen
] == ZIP_END
) break;
400 next
= zipEntry(p
+rawlen
);
402 /* Abort when "prevlen" has not changed. */
403 if (next
.prevrawlen
== rawlen
) break;
405 if (next
.prevrawlensize
< rawlensize
) {
406 /* The "prevlen" field of "next" needs more bytes to hold
407 * the raw length of "cur". */
409 extra
= rawlensize
-next
.prevrawlensize
;
410 zl
= ziplistResize(zl
,curlen
+extra
);
411 ZIPLIST_TAIL_OFFSET(zl
) += extra
;
414 /* Move the tail to the back. */
417 memmove(np
+rawlensize
,
418 np
+next
.prevrawlensize
,
419 curlen
-noffset
-next
.prevrawlensize
-1);
420 zipPrevEncodeLength(np
,rawlen
);
422 /* Advance the cursor */
426 if (next
.prevrawlensize
> rawlensize
) {
427 /* This would result in shrinking, which we want to avoid.
428 * So, set "rawlen" in the available bytes. */
429 zipPrevEncodeLengthForceLarge(p
+rawlen
,rawlen
);
431 zipPrevEncodeLength(p
+rawlen
,rawlen
);
434 /* Stop here, as the raw length of "next" has not changed. */
441 /* Delete "num" entries, starting at "p". Returns pointer to the ziplist. */
442 static unsigned char *__ziplistDelete(unsigned char *zl
, unsigned char *p
, unsigned int num
) {
443 unsigned int i
, totlen
, deleted
= 0;
449 for (i
= 0; p
[0] != ZIP_END
&& i
< num
; i
++) {
450 p
+= zipRawEntryLength(p
);
456 if (p
[0] != ZIP_END
) {
457 /* Tricky: storing the prevlen in this entry might reduce or
458 * increase the number of bytes needed, compared to the current
459 * prevlen. Note that we can always store this length because
460 * it was previously stored by an entry that is being deleted. */
461 nextdiff
= zipPrevLenByteDiff(p
,first
.prevrawlen
);
462 zipPrevEncodeLength(p
-nextdiff
,first
.prevrawlen
);
464 /* Update offset for tail */
465 ZIPLIST_TAIL_OFFSET(zl
) -= totlen
;
467 /* When the tail contains more than one entry, we need to take
468 * "nextdiff" in account as well. Otherwise, a change in the
469 * size of prevlen doesn't have an effect on the *tail* offset. */
471 if (p
[tail
.headersize
+tail
.len
] != ZIP_END
)
472 ZIPLIST_TAIL_OFFSET(zl
) += nextdiff
;
474 /* Move tail to the front of the ziplist */
475 memmove(first
.p
,p
-nextdiff
,ZIPLIST_BYTES(zl
)-(p
-zl
)-1+nextdiff
);
477 /* The entire tail was deleted. No need to move memory. */
478 ZIPLIST_TAIL_OFFSET(zl
) = (first
.p
-zl
)-first
.prevrawlen
;
481 /* Resize and update length */
483 zl
= ziplistResize(zl
, ZIPLIST_BYTES(zl
)-totlen
+nextdiff
);
484 ZIPLIST_INCR_LENGTH(zl
,-deleted
);
487 /* When nextdiff != 0, the raw length of the next entry has changed, so
488 * we need to cascade the update throughout the ziplist */
490 zl
= __ziplistCascadeUpdate(zl
,p
);
495 /* Insert item at "p". */
496 static unsigned char *__ziplistInsert(unsigned char *zl
, unsigned char *p
, unsigned char *s
, unsigned int slen
) {
497 size_t curlen
= ZIPLIST_BYTES(zl
), reqlen
, prevlen
= 0;
500 unsigned char encoding
= 0;
504 /* Find out prevlen for the entry that is inserted. */
505 if (p
[0] != ZIP_END
) {
507 prevlen
= entry
.prevrawlen
;
509 unsigned char *ptail
= ZIPLIST_ENTRY_TAIL(zl
);
510 if (ptail
[0] != ZIP_END
) {
511 prevlen
= zipRawEntryLength(ptail
);
515 /* See if the entry can be encoded */
516 if (zipTryEncoding(s
,slen
,&value
,&encoding
)) {
517 /* 'encoding' is set to the appropriate integer encoding */
518 reqlen
= zipIntSize(encoding
);
520 /* 'encoding' is untouched, however zipEncodeLength will use the
521 * string length to figure out how to encode it. */
524 /* We need space for both the length of the previous entry and
525 * the length of the payload. */
526 reqlen
+= zipPrevEncodeLength(NULL
,prevlen
);
527 reqlen
+= zipEncodeLength(NULL
,encoding
,slen
);
529 /* When the insert position is not equal to the tail, we need to
530 * make sure that the next entry can hold this entry's length in
531 * its prevlen field. */
532 nextdiff
= (p
[0] != ZIP_END
) ? zipPrevLenByteDiff(p
,reqlen
) : 0;
534 /* Store offset because a realloc may change the address of zl. */
536 zl
= ziplistResize(zl
,curlen
+reqlen
+nextdiff
);
539 /* Apply memory move when necessary and update tail offset. */
540 if (p
[0] != ZIP_END
) {
541 /* Subtract one because of the ZIP_END bytes */
542 memmove(p
+reqlen
,p
-nextdiff
,curlen
-offset
-1+nextdiff
);
544 /* Encode this entry's raw length in the next entry. */
545 zipPrevEncodeLength(p
+reqlen
,reqlen
);
547 /* Update offset for tail */
548 ZIPLIST_TAIL_OFFSET(zl
) += reqlen
;
550 /* When the tail contains more than one entry, we need to take
551 * "nextdiff" in account as well. Otherwise, a change in the
552 * size of prevlen doesn't have an effect on the *tail* offset. */
553 tail
= zipEntry(p
+reqlen
);
554 if (p
[reqlen
+tail
.headersize
+tail
.len
] != ZIP_END
)
555 ZIPLIST_TAIL_OFFSET(zl
) += nextdiff
;
557 /* This element will be the new tail. */
558 ZIPLIST_TAIL_OFFSET(zl
) = p
-zl
;
561 /* When nextdiff != 0, the raw length of the next entry has changed, so
562 * we need to cascade the update throughout the ziplist */
565 zl
= __ziplistCascadeUpdate(zl
,p
+reqlen
);
569 /* Write the entry */
570 p
+= zipPrevEncodeLength(p
,prevlen
);
571 p
+= zipEncodeLength(p
,encoding
,slen
);
572 if (ZIP_IS_STR(encoding
)) {
575 zipSaveInteger(p
,value
,encoding
);
577 ZIPLIST_INCR_LENGTH(zl
,1);
581 unsigned char *ziplistPush(unsigned char *zl
, unsigned char *s
, unsigned int slen
, int where
) {
583 p
= (where
== ZIPLIST_HEAD
) ? ZIPLIST_ENTRY_HEAD(zl
) : ZIPLIST_ENTRY_END(zl
);
584 return __ziplistInsert(zl
,p
,s
,slen
);
587 /* Returns an offset to use for iterating with ziplistNext. When the given
588 * index is negative, the list is traversed back to front. When the list
589 * doesn't contain an element at the provided index, NULL is returned. */
590 unsigned char *ziplistIndex(unsigned char *zl
, int index
) {
595 p
= ZIPLIST_ENTRY_TAIL(zl
);
596 if (p
[0] != ZIP_END
) {
598 while (entry
.prevrawlen
> 0 && index
--) {
599 p
-= entry
.prevrawlen
;
604 p
= ZIPLIST_ENTRY_HEAD(zl
);
605 while (p
[0] != ZIP_END
&& index
--) {
606 p
+= zipRawEntryLength(p
);
609 return (p
[0] == ZIP_END
|| index
> 0) ? NULL
: p
;
612 /* Return pointer to next entry in ziplist.
614 * zl is the pointer to the ziplist
615 * p is the pointer to the current element
617 * The element after 'p' is returned, otherwise NULL if we are at the end. */
618 unsigned char *ziplistNext(unsigned char *zl
, unsigned char *p
) {
621 /* "p" could be equal to ZIP_END, caused by ziplistDelete,
622 * and we should return NULL. Otherwise, we should return NULL
623 * when the *next* element is ZIP_END (there is no next entry). */
624 if (p
[0] == ZIP_END
) {
627 p
= p
+zipRawEntryLength(p
);
628 return (p
[0] == ZIP_END
) ? NULL
: p
;
632 /* Return pointer to previous entry in ziplist. */
633 unsigned char *ziplistPrev(unsigned char *zl
, unsigned char *p
) {
636 /* Iterating backwards from ZIP_END should return the tail. When "p" is
637 * equal to the first element of the list, we're already at the head,
638 * and should return NULL. */
639 if (p
[0] == ZIP_END
) {
640 p
= ZIPLIST_ENTRY_TAIL(zl
);
641 return (p
[0] == ZIP_END
) ? NULL
: p
;
642 } else if (p
== ZIPLIST_ENTRY_HEAD(zl
)) {
646 assert(entry
.prevrawlen
> 0);
647 return p
-entry
.prevrawlen
;
651 /* Get entry pointer to by 'p' and store in either 'e' or 'v' depending
652 * on the encoding of the entry. 'e' is always set to NULL to be able
653 * to find out whether the string pointer or the integer value was set.
654 * Return 0 if 'p' points to the end of the zipmap, 1 otherwise. */
655 unsigned int ziplistGet(unsigned char *p
, unsigned char **sstr
, unsigned int *slen
, long long *sval
) {
657 if (p
== NULL
|| p
[0] == ZIP_END
) return 0;
658 if (sstr
) *sstr
= NULL
;
661 if (ZIP_IS_STR(entry
.encoding
)) {
664 *sstr
= p
+entry
.headersize
;
668 *sval
= zipLoadInteger(p
+entry
.headersize
,entry
.encoding
);
674 /* Insert an entry at "p". */
675 unsigned char *ziplistInsert(unsigned char *zl
, unsigned char *p
, unsigned char *s
, unsigned int slen
) {
676 return __ziplistInsert(zl
,p
,s
,slen
);
679 /* Delete a single entry from the ziplist, pointed to by *p.
680 * Also update *p in place, to be able to iterate over the
681 * ziplist, while deleting entries. */
682 unsigned char *ziplistDelete(unsigned char *zl
, unsigned char **p
) {
683 size_t offset
= *p
-zl
;
684 zl
= __ziplistDelete(zl
,*p
,1);
686 /* Store pointer to current element in p, because ziplistDelete will
687 * do a realloc which might result in a different "zl"-pointer.
688 * When the delete direction is back to front, we might delete the last
689 * entry and end up with "p" pointing to ZIP_END, so check this. */
694 /* Delete a range of entries from the ziplist. */
695 unsigned char *ziplistDeleteRange(unsigned char *zl
, unsigned int index
, unsigned int num
) {
696 unsigned char *p
= ziplistIndex(zl
,index
);
697 return (p
== NULL
) ? zl
: __ziplistDelete(zl
,p
,num
);
700 /* Compare entry pointer to by 'p' with 'entry'. Return 1 if equal. */
701 unsigned int ziplistCompare(unsigned char *p
, unsigned char *sstr
, unsigned int slen
) {
703 unsigned char sencoding
;
704 long long zval
, sval
;
705 if (p
[0] == ZIP_END
) return 0;
708 if (ZIP_IS_STR(entry
.encoding
)) {
710 if (entry
.len
== slen
) {
711 return memcmp(p
+entry
.headersize
,sstr
,slen
) == 0;
716 /* Try to compare encoded values */
717 if (zipTryEncoding(sstr
,slen
,&sval
,&sencoding
)) {
718 if (entry
.encoding
== sencoding
) {
719 zval
= zipLoadInteger(p
+entry
.headersize
,entry
.encoding
);
727 /* Return length of ziplist. */
728 unsigned int ziplistLen(unsigned char *zl
) {
729 unsigned int len
= 0;
730 if (ZIPLIST_LENGTH(zl
) < UINT16_MAX
) {
731 len
= ZIPLIST_LENGTH(zl
);
733 unsigned char *p
= zl
+ZIPLIST_HEADER_SIZE
;
734 while (*p
!= ZIP_END
) {
735 p
+= zipRawEntryLength(p
);
739 /* Re-store length if small enough */
740 if (len
< UINT16_MAX
) ZIPLIST_LENGTH(zl
) = len
;
745 /* Return ziplist blob size in bytes. */
746 size_t ziplistBlobLen(unsigned char *zl
) {
747 return ZIPLIST_BYTES(zl
);
750 void ziplistRepr(unsigned char *zl
) {
758 "{tail offset %u}\n",
761 ZIPLIST_TAIL_OFFSET(zl
));
762 p
= ZIPLIST_ENTRY_HEAD(zl
);
763 while(*p
!= ZIP_END
) {
778 (unsigned long) (p
-zl
),
779 entry
.headersize
+entry
.len
,
782 entry
.prevrawlensize
,
784 p
+= entry
.headersize
;
785 if (ZIP_IS_STR(entry
.encoding
)) {
786 if (entry
.len
> 40) {
787 if (fwrite(p
,40,1,stdout
) == 0) perror("fwrite");
791 fwrite(p
,entry
.len
,1,stdout
) == 0) perror("fwrite");
794 printf("%lld", (long long) zipLoadInteger(p
,entry
.encoding
));
803 #ifdef ZIPLIST_TEST_MAIN
804 #include <sys/time.h>
808 #define debug(f, ...) { if (DEBUG) printf(f, __VA_ARGS__); }
810 unsigned char *createList() {
811 unsigned char *zl
= ziplistNew();
812 zl
= ziplistPush(zl
, (unsigned char*)"foo", 3, ZIPLIST_TAIL
);
813 zl
= ziplistPush(zl
, (unsigned char*)"quux", 4, ZIPLIST_TAIL
);
814 zl
= ziplistPush(zl
, (unsigned char*)"hello", 5, ZIPLIST_HEAD
);
815 zl
= ziplistPush(zl
, (unsigned char*)"1024", 4, ZIPLIST_TAIL
);
819 unsigned char *createIntList() {
820 unsigned char *zl
= ziplistNew();
824 zl
= ziplistPush(zl
, (unsigned char*)buf
, strlen(buf
), ZIPLIST_TAIL
);
825 sprintf(buf
, "128000");
826 zl
= ziplistPush(zl
, (unsigned char*)buf
, strlen(buf
), ZIPLIST_TAIL
);
827 sprintf(buf
, "-100");
828 zl
= ziplistPush(zl
, (unsigned char*)buf
, strlen(buf
), ZIPLIST_HEAD
);
829 sprintf(buf
, "4294967296");
830 zl
= ziplistPush(zl
, (unsigned char*)buf
, strlen(buf
), ZIPLIST_HEAD
);
831 sprintf(buf
, "non integer");
832 zl
= ziplistPush(zl
, (unsigned char*)buf
, strlen(buf
), ZIPLIST_TAIL
);
833 sprintf(buf
, "much much longer non integer");
834 zl
= ziplistPush(zl
, (unsigned char*)buf
, strlen(buf
), ZIPLIST_TAIL
);
838 long long usec(void) {
840 gettimeofday(&tv
,NULL
);
841 return (((long long)tv
.tv_sec
)*1000000)+tv
.tv_usec
;
844 void stress(int pos
, int num
, int maxsize
, int dnum
) {
847 char posstr
[2][5] = { "HEAD", "TAIL" };
849 for (i
= 0; i
< maxsize
; i
+=dnum
) {
851 for (j
= 0; j
< i
; j
++) {
852 zl
= ziplistPush(zl
,(unsigned char*)"quux",4,ZIPLIST_TAIL
);
855 /* Do num times a push+pop from pos */
857 for (k
= 0; k
< num
; k
++) {
858 zl
= ziplistPush(zl
,(unsigned char*)"quux",4,pos
);
859 zl
= ziplistDeleteRange(zl
,0,1);
861 printf("List size: %8d, bytes: %8d, %dx push+pop (%s): %6lld usec\n",
862 i
,ZIPLIST_BYTES(zl
),num
,posstr
[pos
],usec()-start
);
867 void pop(unsigned char *zl
, int where
) {
868 unsigned char *p
, *vstr
;
872 p
= ziplistIndex(zl
,where
== ZIPLIST_HEAD
? 0 : -1);
873 if (ziplistGet(p
,&vstr
,&vlen
,&vlong
)) {
874 if (where
== ZIPLIST_HEAD
)
875 printf("Pop head: ");
877 printf("Pop tail: ");
880 if (vlen
&& fwrite(vstr
,vlen
,1,stdout
) == 0) perror("fwrite");
882 printf("%lld", vlong
);
885 ziplistDeleteRange(zl
,-1,1);
887 printf("ERROR: Could not pop\n");
892 void randstring(char *target
, unsigned int min
, unsigned int max
) {
893 int p
, len
= min
+rand()%(max
-min
+1);
913 target
[p
++] = minval
+rand()%(maxval
-minval
+1);
918 int main(int argc
, char **argv
) {
919 unsigned char *zl
, *p
;
920 unsigned char *entry
;
924 /* If an argument is given, use it as the random seed. */
926 srand(atoi(argv
[1]));
928 zl
= createIntList();
934 pop(zl
,ZIPLIST_TAIL
);
937 pop(zl
,ZIPLIST_HEAD
);
940 pop(zl
,ZIPLIST_TAIL
);
943 pop(zl
,ZIPLIST_TAIL
);
946 printf("Get element at index 3:\n");
949 p
= ziplistIndex(zl
, 3);
950 if (!ziplistGet(p
, &entry
, &elen
, &value
)) {
951 printf("ERROR: Could not access index 3\n");
955 if (elen
&& fwrite(entry
,elen
,1,stdout
) == 0) perror("fwrite");
958 printf("%lld\n", value
);
963 printf("Get element at index 4 (out of range):\n");
966 p
= ziplistIndex(zl
, 4);
968 printf("No entry\n");
970 printf("ERROR: Out of range index should return NULL, returned offset: %ld\n", p
-zl
);
976 printf("Get element at index -1 (last element):\n");
979 p
= ziplistIndex(zl
, -1);
980 if (!ziplistGet(p
, &entry
, &elen
, &value
)) {
981 printf("ERROR: Could not access index -1\n");
985 if (elen
&& fwrite(entry
,elen
,1,stdout
) == 0) perror("fwrite");
988 printf("%lld\n", value
);
993 printf("Get element at index -4 (first element):\n");
996 p
= ziplistIndex(zl
, -4);
997 if (!ziplistGet(p
, &entry
, &elen
, &value
)) {
998 printf("ERROR: Could not access index -4\n");
1002 if (elen
&& fwrite(entry
,elen
,1,stdout
) == 0) perror("fwrite");
1005 printf("%lld\n", value
);
1010 printf("Get element at index -5 (reverse out of range):\n");
1013 p
= ziplistIndex(zl
, -5);
1015 printf("No entry\n");
1017 printf("ERROR: Out of range index should return NULL, returned offset: %ld\n", p
-zl
);
1023 printf("Iterate list from 0 to end:\n");
1026 p
= ziplistIndex(zl
, 0);
1027 while (ziplistGet(p
, &entry
, &elen
, &value
)) {
1030 if (elen
&& fwrite(entry
,elen
,1,stdout
) == 0) perror("fwrite");
1032 printf("%lld", value
);
1034 p
= ziplistNext(zl
,p
);
1040 printf("Iterate list from 1 to end:\n");
1043 p
= ziplistIndex(zl
, 1);
1044 while (ziplistGet(p
, &entry
, &elen
, &value
)) {
1047 if (elen
&& fwrite(entry
,elen
,1,stdout
) == 0) perror("fwrite");
1049 printf("%lld", value
);
1051 p
= ziplistNext(zl
,p
);
1057 printf("Iterate list from 2 to end:\n");
1060 p
= ziplistIndex(zl
, 2);
1061 while (ziplistGet(p
, &entry
, &elen
, &value
)) {
1064 if (elen
&& fwrite(entry
,elen
,1,stdout
) == 0) perror("fwrite");
1066 printf("%lld", value
);
1068 p
= ziplistNext(zl
,p
);
1074 printf("Iterate starting out of range:\n");
1077 p
= ziplistIndex(zl
, 4);
1078 if (!ziplistGet(p
, &entry
, &elen
, &value
)) {
1079 printf("No entry\n");
1086 printf("Iterate from back to front:\n");
1089 p
= ziplistIndex(zl
, -1);
1090 while (ziplistGet(p
, &entry
, &elen
, &value
)) {
1093 if (elen
&& fwrite(entry
,elen
,1,stdout
) == 0) perror("fwrite");
1095 printf("%lld", value
);
1097 p
= ziplistPrev(zl
,p
);
1103 printf("Iterate from back to front, deleting all items:\n");
1106 p
= ziplistIndex(zl
, -1);
1107 while (ziplistGet(p
, &entry
, &elen
, &value
)) {
1110 if (elen
&& fwrite(entry
,elen
,1,stdout
) == 0) perror("fwrite");
1112 printf("%lld", value
);
1114 zl
= ziplistDelete(zl
,&p
);
1115 p
= ziplistPrev(zl
,p
);
1121 printf("Delete inclusive range 0,0:\n");
1124 zl
= ziplistDeleteRange(zl
, 0, 1);
1128 printf("Delete inclusive range 0,1:\n");
1131 zl
= ziplistDeleteRange(zl
, 0, 2);
1135 printf("Delete inclusive range 1,2:\n");
1138 zl
= ziplistDeleteRange(zl
, 1, 2);
1142 printf("Delete with start index out of range:\n");
1145 zl
= ziplistDeleteRange(zl
, 5, 1);
1149 printf("Delete with num overflow:\n");
1152 zl
= ziplistDeleteRange(zl
, 1, 5);
1156 printf("Delete foo while iterating:\n");
1159 p
= ziplistIndex(zl
,0);
1160 while (ziplistGet(p
,&entry
,&elen
,&value
)) {
1161 if (entry
&& strncmp("foo",(char*)entry
,elen
) == 0) {
1162 printf("Delete foo\n");
1163 zl
= ziplistDelete(zl
,&p
);
1167 if (elen
&& fwrite(entry
,elen
,1,stdout
) == 0)
1170 printf("%lld",value
);
1172 p
= ziplistNext(zl
,p
);
1180 printf("Regression test for >255 byte strings:\n");
1182 char v1
[257],v2
[257];
1186 zl
= ziplistPush(zl
,(unsigned char*)v1
,strlen(v1
),ZIPLIST_TAIL
);
1187 zl
= ziplistPush(zl
,(unsigned char*)v2
,strlen(v2
),ZIPLIST_TAIL
);
1189 /* Pop values again and compare their value. */
1190 p
= ziplistIndex(zl
,0);
1191 assert(ziplistGet(p
,&entry
,&elen
,&value
));
1192 assert(strncmp(v1
,(char*)entry
,elen
) == 0);
1193 p
= ziplistIndex(zl
,1);
1194 assert(ziplistGet(p
,&entry
,&elen
,&value
));
1195 assert(strncmp(v2
,(char*)entry
,elen
) == 0);
1196 printf("SUCCESS\n\n");
1199 printf("Create long list and check indices:\n");
1204 for (i
= 0; i
< 1000; i
++) {
1205 len
= sprintf(buf
,"%d",i
);
1206 zl
= ziplistPush(zl
,(unsigned char*)buf
,len
,ZIPLIST_TAIL
);
1208 for (i
= 0; i
< 1000; i
++) {
1209 p
= ziplistIndex(zl
,i
);
1210 assert(ziplistGet(p
,NULL
,NULL
,&value
));
1213 p
= ziplistIndex(zl
,-i
-1);
1214 assert(ziplistGet(p
,NULL
,NULL
,&value
));
1215 assert(999-i
== value
);
1217 printf("SUCCESS\n\n");
1220 printf("Compare strings with ziplist entries:\n");
1223 p
= ziplistIndex(zl
,0);
1224 if (!ziplistCompare(p
,(unsigned char*)"hello",5)) {
1225 printf("ERROR: not \"hello\"\n");
1228 if (ziplistCompare(p
,(unsigned char*)"hella",5)) {
1229 printf("ERROR: \"hella\"\n");
1233 p
= ziplistIndex(zl
,3);
1234 if (!ziplistCompare(p
,(unsigned char*)"1024",4)) {
1235 printf("ERROR: not \"1024\"\n");
1238 if (ziplistCompare(p
,(unsigned char*)"1025",4)) {
1239 printf("ERROR: \"1025\"\n");
1242 printf("SUCCESS\n\n");
1245 printf("Stress with random payloads of different encoding:\n");
1253 /* Hold temp vars from ziplist */
1254 unsigned char *sstr
;
1258 /* In the regression for the cascade bug, it was triggered
1259 * with a random seed of 2. */
1262 for (i
= 0; i
< 20000; i
++) {
1265 listSetFreeMethod(ref
,sdsfree
);
1269 for (j
= 0; j
< len
; j
++) {
1270 where
= (rand() & 1) ? ZIPLIST_HEAD
: ZIPLIST_TAIL
;
1271 switch(rand() % 4) {
1273 sprintf(buf
,"%lld",(0LL + rand()) >> 20);
1276 sprintf(buf
,"%lld",(0LL + rand()));
1279 sprintf(buf
,"%lld",(0LL + rand()) << 20);
1282 randstring(buf
,0,256);
1288 /* Add to ziplist */
1289 zl
= ziplistPush(zl
, (unsigned char*)buf
, strlen(buf
), where
);
1291 /* Add to reference list */
1292 if (where
== ZIPLIST_HEAD
) {
1293 listAddNodeHead(ref
,sdsnew(buf
));
1294 } else if (where
== ZIPLIST_TAIL
) {
1295 listAddNodeTail(ref
,sdsnew(buf
));
1301 assert(listLength(ref
) == ziplistLen(zl
));
1302 for (j
= 0; j
< len
; j
++) {
1303 /* Naive way to get elements, but similar to the stresser
1304 * executed from the Tcl test suite. */
1305 p
= ziplistIndex(zl
,j
);
1306 refnode
= listIndex(ref
,j
);
1308 assert(ziplistGet(p
,&sstr
,&slen
,&sval
));
1310 sprintf(buf
,"%lld",sval
);
1312 memcpy(buf
,sstr
,slen
);
1315 assert(strcmp(buf
,listNodeValue(refnode
)) == 0);
1320 printf("SUCCESS\n\n");
1323 printf("Stress with variable ziplist size:\n");
1325 stress(ZIPLIST_HEAD
,100000,16384,256);
1326 stress(ZIPLIST_TAIL
,100000,16384,256);