2 * Copyright (c) 2009-2012, Salvatore Sanfilippo <antirez at gmail dot com>
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are met:
8 * * Redistributions of source code must retain the above copyright notice,
9 * this list of conditions and the following disclaimer.
10 * * Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
13 * * Neither the name of Redis nor the names of its contributors may be used
14 * to endorse or promote products derived from this software without
15 * specific prior written permission.
17 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
18 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
21 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
22 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
23 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
24 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
25 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
26 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
27 * POSSIBILITY OF SUCH DAMAGE.
32 /*-----------------------------------------------------------------------------
34 *----------------------------------------------------------------------------*/
36 void sunionDiffGenericCommand(redisClient
*c
, robj
**setkeys
, int setnum
, robj
*dstkey
, int op
);
38 /* Factory method to return a set that *can* hold "value". When the object has
39 * an integer-encodable value, an intset will be returned. Otherwise a regular
41 robj
*setTypeCreate(robj
*value
) {
42 if (isObjectRepresentableAsLongLong(value
,NULL
) == REDIS_OK
)
43 return createIntsetObject();
44 return createSetObject();
47 int setTypeAdd(robj
*subject
, robj
*value
) {
49 if (subject
->encoding
== REDIS_ENCODING_HT
) {
50 if (dictAdd(subject
->ptr
,value
,NULL
) == DICT_OK
) {
54 } else if (subject
->encoding
== REDIS_ENCODING_INTSET
) {
55 if (isObjectRepresentableAsLongLong(value
,&llval
) == REDIS_OK
) {
57 subject
->ptr
= intsetAdd(subject
->ptr
,llval
,&success
);
59 /* Convert to regular set when the intset contains
60 * too many entries. */
61 if (intsetLen(subject
->ptr
) > server
.set_max_intset_entries
)
62 setTypeConvert(subject
,REDIS_ENCODING_HT
);
66 /* Failed to get integer from object, convert to regular set. */
67 setTypeConvert(subject
,REDIS_ENCODING_HT
);
69 /* The set *was* an intset and this value is not integer
70 * encodable, so dictAdd should always work. */
71 redisAssertWithInfo(NULL
,value
,dictAdd(subject
->ptr
,value
,NULL
) == DICT_OK
);
76 redisPanic("Unknown set encoding");
81 int setTypeRemove(robj
*setobj
, robj
*value
) {
83 if (setobj
->encoding
== REDIS_ENCODING_HT
) {
84 if (dictDelete(setobj
->ptr
,value
) == DICT_OK
) {
85 if (htNeedsResize(setobj
->ptr
)) dictResize(setobj
->ptr
);
88 } else if (setobj
->encoding
== REDIS_ENCODING_INTSET
) {
89 if (isObjectRepresentableAsLongLong(value
,&llval
) == REDIS_OK
) {
91 setobj
->ptr
= intsetRemove(setobj
->ptr
,llval
,&success
);
92 if (success
) return 1;
95 redisPanic("Unknown set encoding");
100 int setTypeIsMember(robj
*subject
, robj
*value
) {
102 if (subject
->encoding
== REDIS_ENCODING_HT
) {
103 return dictFind((dict
*)subject
->ptr
,value
) != NULL
;
104 } else if (subject
->encoding
== REDIS_ENCODING_INTSET
) {
105 if (isObjectRepresentableAsLongLong(value
,&llval
) == REDIS_OK
) {
106 return intsetFind((intset
*)subject
->ptr
,llval
);
109 redisPanic("Unknown set encoding");
114 setTypeIterator
*setTypeInitIterator(robj
*subject
) {
115 setTypeIterator
*si
= zmalloc(sizeof(setTypeIterator
));
116 si
->subject
= subject
;
117 si
->encoding
= subject
->encoding
;
118 if (si
->encoding
== REDIS_ENCODING_HT
) {
119 si
->di
= dictGetIterator(subject
->ptr
);
120 } else if (si
->encoding
== REDIS_ENCODING_INTSET
) {
123 redisPanic("Unknown set encoding");
128 void setTypeReleaseIterator(setTypeIterator
*si
) {
129 if (si
->encoding
== REDIS_ENCODING_HT
)
130 dictReleaseIterator(si
->di
);
134 /* Move to the next entry in the set. Returns the object at the current
137 * Since set elements can be internally be stored as redis objects or
138 * simple arrays of integers, setTypeNext returns the encoding of the
139 * set object you are iterating, and will populate the appropriate pointer
140 * (eobj) or (llobj) accordingly.
142 * When there are no longer elements -1 is returned.
143 * Returned objects ref count is not incremented, so this function is
144 * copy on write friendly. */
145 int setTypeNext(setTypeIterator
*si
, robj
**objele
, int64_t *llele
) {
146 if (si
->encoding
== REDIS_ENCODING_HT
) {
147 dictEntry
*de
= dictNext(si
->di
);
148 if (de
== NULL
) return -1;
149 *objele
= dictGetKey(de
);
150 } else if (si
->encoding
== REDIS_ENCODING_INTSET
) {
151 if (!intsetGet(si
->subject
->ptr
,si
->ii
++,llele
))
157 /* The not copy on write friendly version but easy to use version
158 * of setTypeNext() is setTypeNextObject(), returning new objects
159 * or incrementing the ref count of returned objects. So if you don't
160 * retain a pointer to this object you should call decrRefCount() against it.
162 * This function is the way to go for write operations where COW is not
163 * an issue as the result will be anyway of incrementing the ref count. */
164 robj
*setTypeNextObject(setTypeIterator
*si
) {
169 encoding
= setTypeNext(si
,&objele
,&intele
);
171 case -1: return NULL
;
172 case REDIS_ENCODING_INTSET
:
173 return createStringObjectFromLongLong(intele
);
174 case REDIS_ENCODING_HT
:
175 incrRefCount(objele
);
178 redisPanic("Unsupported encoding");
180 return NULL
; /* just to suppress warnings */
183 /* Return random element from a non empty set.
184 * The returned element can be a int64_t value if the set is encoded
185 * as an "intset" blob of integers, or a redis object if the set
188 * The caller provides both pointers to be populated with the right
189 * object. The return value of the function is the object->encoding
190 * field of the object and is used by the caller to check if the
191 * int64_t pointer or the redis object pointere was populated.
193 * When an object is returned (the set was a real set) the ref count
194 * of the object is not incremented so this function can be considered
195 * copy on write friendly. */
196 int setTypeRandomElement(robj
*setobj
, robj
**objele
, int64_t *llele
) {
197 if (setobj
->encoding
== REDIS_ENCODING_HT
) {
198 dictEntry
*de
= dictGetRandomKey(setobj
->ptr
);
199 *objele
= dictGetKey(de
);
200 } else if (setobj
->encoding
== REDIS_ENCODING_INTSET
) {
201 *llele
= intsetRandom(setobj
->ptr
);
203 redisPanic("Unknown set encoding");
205 return setobj
->encoding
;
208 unsigned long setTypeSize(robj
*subject
) {
209 if (subject
->encoding
== REDIS_ENCODING_HT
) {
210 return dictSize((dict
*)subject
->ptr
);
211 } else if (subject
->encoding
== REDIS_ENCODING_INTSET
) {
212 return intsetLen((intset
*)subject
->ptr
);
214 redisPanic("Unknown set encoding");
218 /* Convert the set to specified encoding. The resulting dict (when converting
219 * to a hash table) is presized to hold the number of elements in the original
221 void setTypeConvert(robj
*setobj
, int enc
) {
223 redisAssertWithInfo(NULL
,setobj
,setobj
->type
== REDIS_SET
&&
224 setobj
->encoding
== REDIS_ENCODING_INTSET
);
226 if (enc
== REDIS_ENCODING_HT
) {
228 dict
*d
= dictCreate(&setDictType
,NULL
);
231 /* Presize the dict to avoid rehashing */
232 dictExpand(d
,intsetLen(setobj
->ptr
));
234 /* To add the elements we extract integers and create redis objects */
235 si
= setTypeInitIterator(setobj
);
236 while (setTypeNext(si
,NULL
,&intele
) != -1) {
237 element
= createStringObjectFromLongLong(intele
);
238 redisAssertWithInfo(NULL
,element
,dictAdd(d
,element
,NULL
) == DICT_OK
);
240 setTypeReleaseIterator(si
);
242 setobj
->encoding
= REDIS_ENCODING_HT
;
246 redisPanic("Unsupported set conversion");
250 void saddCommand(redisClient
*c
) {
254 set
= lookupKeyWrite(c
->db
,c
->argv
[1]);
256 set
= setTypeCreate(c
->argv
[2]);
257 dbAdd(c
->db
,c
->argv
[1],set
);
259 if (set
->type
!= REDIS_SET
) {
260 addReply(c
,shared
.wrongtypeerr
);
265 for (j
= 2; j
< c
->argc
; j
++) {
266 c
->argv
[j
] = tryObjectEncoding(c
->argv
[j
]);
267 if (setTypeAdd(set
,c
->argv
[j
])) added
++;
269 if (added
) signalModifiedKey(c
->db
,c
->argv
[1]);
270 server
.dirty
+= added
;
271 addReplyLongLong(c
,added
);
274 void sremCommand(redisClient
*c
) {
278 if ((set
= lookupKeyWriteOrReply(c
,c
->argv
[1],shared
.czero
)) == NULL
||
279 checkType(c
,set
,REDIS_SET
)) return;
281 for (j
= 2; j
< c
->argc
; j
++) {
282 if (setTypeRemove(set
,c
->argv
[j
])) {
284 if (setTypeSize(set
) == 0) {
285 dbDelete(c
->db
,c
->argv
[1]);
291 signalModifiedKey(c
->db
,c
->argv
[1]);
292 server
.dirty
+= deleted
;
294 addReplyLongLong(c
,deleted
);
297 void smoveCommand(redisClient
*c
) {
298 robj
*srcset
, *dstset
, *ele
;
299 srcset
= lookupKeyWrite(c
->db
,c
->argv
[1]);
300 dstset
= lookupKeyWrite(c
->db
,c
->argv
[2]);
301 ele
= c
->argv
[3] = tryObjectEncoding(c
->argv
[3]);
303 /* If the source key does not exist return 0 */
304 if (srcset
== NULL
) {
305 addReply(c
,shared
.czero
);
309 /* If the source key has the wrong type, or the destination key
310 * is set and has the wrong type, return with an error. */
311 if (checkType(c
,srcset
,REDIS_SET
) ||
312 (dstset
&& checkType(c
,dstset
,REDIS_SET
))) return;
314 /* If srcset and dstset are equal, SMOVE is a no-op */
315 if (srcset
== dstset
) {
316 addReply(c
,shared
.cone
);
320 /* If the element cannot be removed from the src set, return 0. */
321 if (!setTypeRemove(srcset
,ele
)) {
322 addReply(c
,shared
.czero
);
326 /* Remove the src set from the database when empty */
327 if (setTypeSize(srcset
) == 0) dbDelete(c
->db
,c
->argv
[1]);
328 signalModifiedKey(c
->db
,c
->argv
[1]);
329 signalModifiedKey(c
->db
,c
->argv
[2]);
332 /* Create the destination set when it doesn't exist */
334 dstset
= setTypeCreate(ele
);
335 dbAdd(c
->db
,c
->argv
[2],dstset
);
338 /* An extra key has changed when ele was successfully added to dstset */
339 if (setTypeAdd(dstset
,ele
)) server
.dirty
++;
340 addReply(c
,shared
.cone
);
343 void sismemberCommand(redisClient
*c
) {
346 if ((set
= lookupKeyReadOrReply(c
,c
->argv
[1],shared
.czero
)) == NULL
||
347 checkType(c
,set
,REDIS_SET
)) return;
349 c
->argv
[2] = tryObjectEncoding(c
->argv
[2]);
350 if (setTypeIsMember(set
,c
->argv
[2]))
351 addReply(c
,shared
.cone
);
353 addReply(c
,shared
.czero
);
356 void scardCommand(redisClient
*c
) {
359 if ((o
= lookupKeyReadOrReply(c
,c
->argv
[1],shared
.czero
)) == NULL
||
360 checkType(c
,o
,REDIS_SET
)) return;
362 addReplyLongLong(c
,setTypeSize(o
));
365 void spopCommand(redisClient
*c
) {
366 robj
*set
, *ele
, *aux
;
370 if ((set
= lookupKeyWriteOrReply(c
,c
->argv
[1],shared
.nullbulk
)) == NULL
||
371 checkType(c
,set
,REDIS_SET
)) return;
373 encoding
= setTypeRandomElement(set
,&ele
,&llele
);
374 if (encoding
== REDIS_ENCODING_INTSET
) {
375 ele
= createStringObjectFromLongLong(llele
);
376 set
->ptr
= intsetRemove(set
->ptr
,llele
,NULL
);
379 setTypeRemove(set
,ele
);
382 /* Replicate/AOF this command as an SREM operation */
383 aux
= createStringObject("SREM",4);
384 rewriteClientCommandVector(c
,3,aux
,c
->argv
[1],ele
);
389 if (setTypeSize(set
) == 0) dbDelete(c
->db
,c
->argv
[1]);
390 signalModifiedKey(c
->db
,c
->argv
[1]);
394 /* handle the "SRANDMEMBER key <count>" variant. The normal version of the
395 * command is handled by the srandmemberCommand() function itself. */
397 /* How many times bigger should be the set compared to the requested size
398 * for us to don't use the "remove elements" strategy? Read later in the
399 * implementation for more info. */
400 #define SRANDMEMBER_SUB_STRATEGY_MUL 3
402 void srandmemberWithCountCommand(redisClient
*c
) {
404 unsigned long count
, size
;
412 if (getLongFromObjectOrReply(c
,c
->argv
[2],&l
,NULL
) != REDIS_OK
) return;
414 count
= (unsigned) l
;
416 /* A negative count means: return the same elements multiple times
417 * (i.e. don't remove the extracted element after every extraction). */
422 if ((set
= lookupKeyReadOrReply(c
,c
->argv
[1],shared
.emptymultibulk
))
423 == NULL
|| checkType(c
,set
,REDIS_SET
)) return;
424 size
= setTypeSize(set
);
426 /* If count is zero, serve it ASAP to avoid special cases later. */
428 addReply(c
,shared
.emptymultibulk
);
432 /* CASE 1: The count was negative, so the extraction method is just:
433 * "return N random elements" sampling the whole set every time.
434 * This case is trivial and can be served without auxiliary data
437 addReplyMultiBulkLen(c
,count
);
439 encoding
= setTypeRandomElement(set
,&ele
,&llele
);
440 if (encoding
== REDIS_ENCODING_INTSET
) {
441 addReplyBulkLongLong(c
,llele
);
450 * The number of requested elements is greater than the number of
451 * elements inside the set: simply return the whole set. */
453 sunionDiffGenericCommand(c
,c
->argv
,c
->argc
-1,NULL
,REDIS_OP_UNION
);
457 /* For CASE 3 and CASE 4 we need an auxiliary dictionary. */
458 d
= dictCreate(&setDictType
,NULL
);
461 * The number of elements inside the set is not greater than
462 * SRANDMEMBER_SUB_STRATEGY_MUL times the number of requested elements.
463 * In this case we create a set from scratch with all the elements, and
464 * subtract random elements to reach the requested number of elements.
466 * This is done because if the number of requsted elements is just
467 * a bit less than the number of elements in the set, the natural approach
468 * used into CASE 3 is highly inefficient. */
469 if (count
*SRANDMEMBER_SUB_STRATEGY_MUL
> size
) {
472 /* Add all the elements into the temporary dictionary. */
473 si
= setTypeInitIterator(set
);
474 while((encoding
= setTypeNext(si
,&ele
,&llele
)) != -1) {
477 if (encoding
== REDIS_ENCODING_INTSET
) {
478 retval
= dictAdd(d
,createStringObjectFromLongLong(llele
),NULL
);
479 } else if (ele
->encoding
== REDIS_ENCODING_RAW
) {
480 retval
= dictAdd(d
,dupStringObject(ele
),NULL
);
481 } else if (ele
->encoding
== REDIS_ENCODING_INT
) {
483 createStringObjectFromLongLong((long)ele
->ptr
),NULL
);
485 redisAssert(retval
== DICT_OK
);
487 setTypeReleaseIterator(si
);
488 redisAssert(dictSize(d
) == size
);
490 /* Remove random elements to reach the right count. */
491 while(size
> count
) {
494 de
= dictGetRandomKey(d
);
495 dictDelete(d
,dictGetKey(de
));
500 /* CASE 4: We have a big set compared to the requested number of elements.
501 * In this case we can simply get random elements from the set and add
502 * to the temporary set, trying to eventually get enough unique elements
503 * to reach the specified count. */
505 unsigned long added
= 0;
507 while(added
< count
) {
508 encoding
= setTypeRandomElement(set
,&ele
,&llele
);
509 if (encoding
== REDIS_ENCODING_INTSET
) {
510 ele
= createStringObjectFromLongLong(llele
);
511 } else if (ele
->encoding
== REDIS_ENCODING_RAW
) {
512 ele
= dupStringObject(ele
);
513 } else if (ele
->encoding
== REDIS_ENCODING_INT
) {
514 ele
= createStringObjectFromLongLong((long)ele
->ptr
);
516 /* Try to add the object to the dictionary. If it already exists
517 * free it, otherwise increment the number of objects we have
518 * in the result dictionary. */
519 if (dictAdd(d
,ele
,NULL
) == DICT_OK
)
526 /* CASE 3 & 4: send the result to the user. */
531 addReplyMultiBulkLen(c
,count
);
532 di
= dictGetIterator(d
);
533 while((de
= dictNext(di
)) != NULL
)
534 addReplyBulk(c
,dictGetKey(de
));
535 dictReleaseIterator(di
);
540 void srandmemberCommand(redisClient
*c
) {
546 srandmemberWithCountCommand(c
);
548 } else if (c
->argc
> 3) {
549 addReply(c
,shared
.syntaxerr
);
553 if ((set
= lookupKeyReadOrReply(c
,c
->argv
[1],shared
.nullbulk
)) == NULL
||
554 checkType(c
,set
,REDIS_SET
)) return;
556 encoding
= setTypeRandomElement(set
,&ele
,&llele
);
557 if (encoding
== REDIS_ENCODING_INTSET
) {
558 addReplyBulkLongLong(c
,llele
);
564 int qsortCompareSetsByCardinality(const void *s1
, const void *s2
) {
565 return setTypeSize(*(robj
**)s1
)-setTypeSize(*(robj
**)s2
);
568 /* This is used by SDIFF and in this case we can receive NULL that should
569 * be handled as empty sets. */
570 int qsortCompareSetsByRevCardinality(const void *s1
, const void *s2
) {
571 robj
*o1
= *(robj
**)s1
, *o2
= *(robj
**)s2
;
573 return (o2
? setTypeSize(o2
) : 0) - (o1
? setTypeSize(o1
) : 0);
576 void sinterGenericCommand(redisClient
*c
, robj
**setkeys
, unsigned long setnum
, robj
*dstkey
) {
577 robj
**sets
= zmalloc(sizeof(robj
*)*setnum
);
579 robj
*eleobj
, *dstset
= NULL
;
581 void *replylen
= NULL
;
582 unsigned long j
, cardinality
= 0;
585 for (j
= 0; j
< setnum
; j
++) {
586 robj
*setobj
= dstkey
?
587 lookupKeyWrite(c
->db
,setkeys
[j
]) :
588 lookupKeyRead(c
->db
,setkeys
[j
]);
592 if (dbDelete(c
->db
,dstkey
)) {
593 signalModifiedKey(c
->db
,dstkey
);
596 addReply(c
,shared
.czero
);
598 addReply(c
,shared
.emptymultibulk
);
602 if (checkType(c
,setobj
,REDIS_SET
)) {
608 /* Sort sets from the smallest to largest, this will improve our
609 * algorithm's performace */
610 qsort(sets
,setnum
,sizeof(robj
*),qsortCompareSetsByCardinality
);
612 /* The first thing we should output is the total number of elements...
613 * since this is a multi-bulk write, but at this stage we don't know
614 * the intersection set size, so we use a trick, append an empty object
615 * to the output list and save the pointer to later modify it with the
618 replylen
= addDeferredMultiBulkLength(c
);
620 /* If we have a target key where to store the resulting set
621 * create this key with an empty set inside */
622 dstset
= createIntsetObject();
625 /* Iterate all the elements of the first (smallest) set, and test
626 * the element against all the other sets, if at least one set does
627 * not include the element it is discarded */
628 si
= setTypeInitIterator(sets
[0]);
629 while((encoding
= setTypeNext(si
,&eleobj
,&intobj
)) != -1) {
630 for (j
= 1; j
< setnum
; j
++) {
631 if (sets
[j
] == sets
[0]) continue;
632 if (encoding
== REDIS_ENCODING_INTSET
) {
633 /* intset with intset is simple... and fast */
634 if (sets
[j
]->encoding
== REDIS_ENCODING_INTSET
&&
635 !intsetFind((intset
*)sets
[j
]->ptr
,intobj
))
638 /* in order to compare an integer with an object we
639 * have to use the generic function, creating an object
641 } else if (sets
[j
]->encoding
== REDIS_ENCODING_HT
) {
642 eleobj
= createStringObjectFromLongLong(intobj
);
643 if (!setTypeIsMember(sets
[j
],eleobj
)) {
644 decrRefCount(eleobj
);
647 decrRefCount(eleobj
);
649 } else if (encoding
== REDIS_ENCODING_HT
) {
650 /* Optimization... if the source object is integer
651 * encoded AND the target set is an intset, we can get
652 * a much faster path. */
653 if (eleobj
->encoding
== REDIS_ENCODING_INT
&&
654 sets
[j
]->encoding
== REDIS_ENCODING_INTSET
&&
655 !intsetFind((intset
*)sets
[j
]->ptr
,(long)eleobj
->ptr
))
658 /* else... object to object check is easy as we use the
659 * type agnostic API here. */
660 } else if (!setTypeIsMember(sets
[j
],eleobj
)) {
666 /* Only take action when all sets contain the member */
669 if (encoding
== REDIS_ENCODING_HT
)
670 addReplyBulk(c
,eleobj
);
672 addReplyBulkLongLong(c
,intobj
);
675 if (encoding
== REDIS_ENCODING_INTSET
) {
676 eleobj
= createStringObjectFromLongLong(intobj
);
677 setTypeAdd(dstset
,eleobj
);
678 decrRefCount(eleobj
);
680 setTypeAdd(dstset
,eleobj
);
685 setTypeReleaseIterator(si
);
688 /* Store the resulting set into the target, if the intersection
689 * is not an empty set. */
690 dbDelete(c
->db
,dstkey
);
691 if (setTypeSize(dstset
) > 0) {
692 dbAdd(c
->db
,dstkey
,dstset
);
693 addReplyLongLong(c
,setTypeSize(dstset
));
695 decrRefCount(dstset
);
696 addReply(c
,shared
.czero
);
698 signalModifiedKey(c
->db
,dstkey
);
701 setDeferredMultiBulkLength(c
,replylen
,cardinality
);
706 void sinterCommand(redisClient
*c
) {
707 sinterGenericCommand(c
,c
->argv
+1,c
->argc
-1,NULL
);
710 void sinterstoreCommand(redisClient
*c
) {
711 sinterGenericCommand(c
,c
->argv
+2,c
->argc
-2,c
->argv
[1]);
714 #define REDIS_OP_UNION 0
715 #define REDIS_OP_DIFF 1
716 #define REDIS_OP_INTER 2
718 void sunionDiffGenericCommand(redisClient
*c
, robj
**setkeys
, int setnum
, robj
*dstkey
, int op
) {
719 robj
**sets
= zmalloc(sizeof(robj
*)*setnum
);
721 robj
*ele
, *dstset
= NULL
;
722 int j
, cardinality
= 0;
725 for (j
= 0; j
< setnum
; j
++) {
726 robj
*setobj
= dstkey
?
727 lookupKeyWrite(c
->db
,setkeys
[j
]) :
728 lookupKeyRead(c
->db
,setkeys
[j
]);
733 if (checkType(c
,setobj
,REDIS_SET
)) {
740 /* Select what DIFF algorithm to use.
742 * Algorithm 1 is O(N*M) where N is the size of the element first set
743 * and M the total number of sets.
745 * Algorithm 2 is O(N) where N is the total number of elements in all
748 * We compute what is the best bet with the current input here. */
749 if (op
== REDIS_OP_DIFF
&& sets
[0]) {
750 long long algo_one_work
= 0, algo_two_work
= 0;
752 for (j
= 0; j
< setnum
; j
++) {
753 if (sets
[j
] == NULL
) continue;
755 algo_one_work
+= setTypeSize(sets
[0]);
756 algo_two_work
+= setTypeSize(sets
[j
]);
759 /* Algorithm 1 has better constant times and performs less operations
760 * if there are elements in common. Give it some advantage. */
762 diff_algo
= (algo_one_work
<= algo_two_work
) ? 1 : 2;
764 if (diff_algo
== 1 && setnum
> 1) {
765 /* With algorithm 1 it is better to order the sets to subtract
766 * by decreasing size, so that we are more likely to find
767 * duplicated elements ASAP. */
768 qsort(sets
+1,setnum
-1,sizeof(robj
*),
769 qsortCompareSetsByRevCardinality
);
773 /* We need a temp set object to store our union. If the dstkey
774 * is not NULL (that is, we are inside an SUNIONSTORE operation) then
775 * this set object will be the resulting object to set into the target key*/
776 dstset
= createIntsetObject();
778 if (op
== REDIS_OP_UNION
) {
779 /* Union is trivial, just add every element of every set to the
781 for (j
= 0; j
< setnum
; j
++) {
782 if (!sets
[j
]) continue; /* non existing keys are like empty sets */
784 si
= setTypeInitIterator(sets
[j
]);
785 while((ele
= setTypeNextObject(si
)) != NULL
) {
786 if (setTypeAdd(dstset
,ele
)) cardinality
++;
789 setTypeReleaseIterator(si
);
791 } else if (op
== REDIS_OP_DIFF
&& sets
[0] && diff_algo
== 1) {
794 * We perform the diff by iterating all the elements of the first set,
795 * and only adding it to the target set if the element does not exist
796 * into all the other sets.
798 * This way we perform at max N*M operations, where N is the size of
799 * the first set, and M the number of sets. */
800 si
= setTypeInitIterator(sets
[0]);
801 while((ele
= setTypeNextObject(si
)) != NULL
) {
802 for (j
= 1; j
< setnum
; j
++) {
803 if (!sets
[j
]) continue; /* no key is an empty set. */
804 if (setTypeIsMember(sets
[j
],ele
)) break;
807 /* There is no other set with this element. Add it. */
808 setTypeAdd(dstset
,ele
);
813 setTypeReleaseIterator(si
);
814 } else if (op
== REDIS_OP_DIFF
&& sets
[0] && diff_algo
== 2) {
817 * Add all the elements of the first set to the auxiliary set.
818 * Then remove all the elements of all the next sets from it.
820 * This is O(N) where N is the sum of all the elements in every
822 for (j
= 0; j
< setnum
; j
++) {
823 if (!sets
[j
]) continue; /* non existing keys are like empty sets */
825 si
= setTypeInitIterator(sets
[j
]);
826 while((ele
= setTypeNextObject(si
)) != NULL
) {
828 if (setTypeAdd(dstset
,ele
)) cardinality
++;
830 if (setTypeRemove(dstset
,ele
)) cardinality
--;
834 setTypeReleaseIterator(si
);
836 /* Exit if result set is empty as any additional removal
837 * of elements will have no effect. */
838 if (cardinality
== 0) break;
842 /* Output the content of the resulting set, if not in STORE mode */
844 addReplyMultiBulkLen(c
,cardinality
);
845 si
= setTypeInitIterator(dstset
);
846 while((ele
= setTypeNextObject(si
)) != NULL
) {
850 setTypeReleaseIterator(si
);
851 decrRefCount(dstset
);
853 /* If we have a target key where to store the resulting set
854 * create this key with the result set inside */
855 dbDelete(c
->db
,dstkey
);
856 if (setTypeSize(dstset
) > 0) {
857 dbAdd(c
->db
,dstkey
,dstset
);
858 addReplyLongLong(c
,setTypeSize(dstset
));
860 decrRefCount(dstset
);
861 addReply(c
,shared
.czero
);
863 signalModifiedKey(c
->db
,dstkey
);
869 void sunionCommand(redisClient
*c
) {
870 sunionDiffGenericCommand(c
,c
->argv
+1,c
->argc
-1,NULL
,REDIS_OP_UNION
);
873 void sunionstoreCommand(redisClient
*c
) {
874 sunionDiffGenericCommand(c
,c
->argv
+2,c
->argc
-2,c
->argv
[1],REDIS_OP_UNION
);
877 void sdiffCommand(redisClient
*c
) {
878 sunionDiffGenericCommand(c
,c
->argv
+1,c
->argc
-1,NULL
,REDIS_OP_DIFF
);
881 void sdiffstoreCommand(redisClient
*c
) {
882 sunionDiffGenericCommand(c
,c
->argv
+2,c
->argc
-2,c
->argv
[1],REDIS_OP_DIFF
);