Commit | Line | Data |
---|---|---|
e2641e09 | 1 | #include "redis.h" |
2 | #include "pqsort.h" /* Partial qsort for SORT+LIMIT */ | |
2c861050 | 3 | #include <math.h> /* isnan() */ |
e2641e09 | 4 | |
5 | redisSortOperation *createSortOperation(int type, robj *pattern) { | |
6 | redisSortOperation *so = zmalloc(sizeof(*so)); | |
7 | so->type = type; | |
8 | so->pattern = pattern; | |
9 | return so; | |
10 | } | |
11 | ||
68ee1855 | 12 | /* Return the value associated to the key with a name obtained using |
13 | * the following rules: | |
14 | * | |
15 | * 1) The first occurence of '*' in 'pattern' is substituted with 'subst'. | |
16 | * | |
17 | * 2) If 'pattern' matches the "->" string, everything on the left of | |
18 | * the arrow is treated as the name of an hash field, and the part on the | |
19 | * left as the key name containing an hash. The value of the specified | |
20 | * field is returned. | |
21 | * | |
22 | * 3) If 'pattern' equals "#", the function simply returns 'subst' itself so | |
23 | * that the SORT command can be used like: SORT key GET # to retrieve | |
24 | * the Set/List elements directly. | |
25 | * | |
e2641e09 | 26 | * The returned object will always have its refcount increased by 1 |
27 | * when it is non-NULL. */ | |
28 | robj *lookupKeyByPattern(redisDb *db, robj *pattern, robj *subst) { | |
68ee1855 | 29 | char *p, *f, *k; |
e2641e09 | 30 | sds spat, ssub; |
ae55245d | 31 | robj *keyobj, *fieldobj = NULL, *o; |
e2641e09 | 32 | int prefixlen, sublen, postfixlen, fieldlen; |
e2641e09 | 33 | |
34 | /* If the pattern is "#" return the substitution object itself in order | |
35 | * to implement the "SORT ... GET #" feature. */ | |
36 | spat = pattern->ptr; | |
37 | if (spat[0] == '#' && spat[1] == '\0') { | |
38 | incrRefCount(subst); | |
39 | return subst; | |
40 | } | |
41 | ||
42 | /* The substitution object may be specially encoded. If so we create | |
43 | * a decoded object on the fly. Otherwise getDecodedObject will just | |
44 | * increment the ref count, that we'll decrement later. */ | |
45 | subst = getDecodedObject(subst); | |
e2641e09 | 46 | ssub = subst->ptr; |
68ee1855 | 47 | |
48 | /* If we can't find '*' in the pattern we return NULL as to GET a | |
49 | * fixed key does not make sense. */ | |
e2641e09 | 50 | p = strchr(spat,'*'); |
51 | if (!p) { | |
52 | decrRefCount(subst); | |
53 | return NULL; | |
54 | } | |
55 | ||
56 | /* Find out if we're dealing with a hash dereference. */ | |
68ee1855 | 57 | if ((f = strstr(p+1, "->")) != NULL && *(f+2) != '\0') { |
58 | fieldlen = sdslen(spat)-(f-spat)-2; | |
59 | fieldobj = createStringObject(f+2,fieldlen); | |
e2641e09 | 60 | } else { |
61 | fieldlen = 0; | |
62 | } | |
63 | ||
68ee1855 | 64 | /* Perform the '*' substitution. */ |
e2641e09 | 65 | prefixlen = p-spat; |
66 | sublen = sdslen(ssub); | |
68ee1855 | 67 | postfixlen = sdslen(spat)-(prefixlen+1)-(fieldlen ? fieldlen+2 : 0); |
68 | keyobj = createStringObject(NULL,prefixlen+sublen+postfixlen); | |
69 | k = keyobj->ptr; | |
70 | memcpy(k,spat,prefixlen); | |
71 | memcpy(k+prefixlen,ssub,sublen); | |
72 | memcpy(k+prefixlen+sublen,p+1,postfixlen); | |
73 | decrRefCount(subst); /* Incremented by decodeObject() */ | |
e2641e09 | 74 | |
75 | /* Lookup substituted key */ | |
68ee1855 | 76 | o = lookupKeyRead(db,keyobj); |
77 | if (o == NULL) goto noobj; | |
e2641e09 | 78 | |
ae55245d | 79 | if (fieldobj) { |
68ee1855 | 80 | if (o->type != REDIS_HASH) goto noobj; |
e2641e09 | 81 | |
82 | /* Retrieve value from hash by the field name. This operation | |
83 | * already increases the refcount of the returned object. */ | |
68ee1855 | 84 | o = hashTypeGetObject(o, fieldobj); |
e2641e09 | 85 | } else { |
68ee1855 | 86 | if (o->type != REDIS_STRING) goto noobj; |
e2641e09 | 87 | |
88 | /* Every object that this function returns needs to have its refcount | |
89 | * increased. sortCommand decreases it again. */ | |
90 | incrRefCount(o); | |
91 | } | |
68ee1855 | 92 | decrRefCount(keyobj); |
ae55245d | 93 | if (fieldobj) decrRefCount(fieldobj); |
e2641e09 | 94 | return o; |
68ee1855 | 95 | |
96 | noobj: | |
97 | decrRefCount(keyobj); | |
98 | if (fieldlen) decrRefCount(fieldobj); | |
99 | return NULL; | |
e2641e09 | 100 | } |
101 | ||
102 | /* sortCompare() is used by qsort in sortCommand(). Given that qsort_r with | |
103 | * the additional parameter is not standard but a BSD-specific we have to | |
104 | * pass sorting parameters via the global 'server' structure */ | |
105 | int sortCompare(const void *s1, const void *s2) { | |
106 | const redisSortObject *so1 = s1, *so2 = s2; | |
107 | int cmp; | |
108 | ||
109 | if (!server.sort_alpha) { | |
110 | /* Numeric sorting. Here it's trivial as we precomputed scores */ | |
111 | if (so1->u.score > so2->u.score) { | |
112 | cmp = 1; | |
113 | } else if (so1->u.score < so2->u.score) { | |
114 | cmp = -1; | |
115 | } else { | |
2c861050 | 116 | /* Objects have the same score, but we don't want the comparison |
117 | * to be undefined, so we compare objects lexicographycally. | |
118 | * This way the result of SORT is deterministic. */ | |
119 | cmp = compareStringObjects(so1->obj,so2->obj); | |
e2641e09 | 120 | } |
121 | } else { | |
122 | /* Alphanumeric sorting */ | |
123 | if (server.sort_bypattern) { | |
124 | if (!so1->u.cmpobj || !so2->u.cmpobj) { | |
125 | /* At least one compare object is NULL */ | |
126 | if (so1->u.cmpobj == so2->u.cmpobj) | |
127 | cmp = 0; | |
128 | else if (so1->u.cmpobj == NULL) | |
129 | cmp = -1; | |
130 | else | |
131 | cmp = 1; | |
132 | } else { | |
133 | /* We have both the objects, use strcoll */ | |
134 | cmp = strcoll(so1->u.cmpobj->ptr,so2->u.cmpobj->ptr); | |
135 | } | |
136 | } else { | |
137 | /* Compare elements directly. */ | |
138 | cmp = compareStringObjects(so1->obj,so2->obj); | |
139 | } | |
140 | } | |
141 | return server.sort_desc ? -cmp : cmp; | |
142 | } | |
143 | ||
144 | /* The SORT command is the most complex command in Redis. Warning: this code | |
145 | * is optimized for speed and a bit less for readability */ | |
146 | void sortCommand(redisClient *c) { | |
147 | list *operations; | |
148 | unsigned int outputlen = 0; | |
149 | int desc = 0, alpha = 0; | |
706b32e0 | 150 | long limit_start = 0, limit_count = -1, start, end; |
e2641e09 | 151 | int j, dontsort = 0, vectorlen; |
152 | int getop = 0; /* GET operation counter */ | |
2c861050 | 153 | int int_convertion_error = 0; |
e2641e09 | 154 | robj *sortval, *sortby = NULL, *storekey = NULL; |
155 | redisSortObject *vector; /* Resulting vector to sort */ | |
156 | ||
157 | /* Lookup the key to sort. It must be of the right types */ | |
158 | sortval = lookupKeyRead(c->db,c->argv[1]); | |
237194b7 | 159 | if (sortval && sortval->type != REDIS_SET && sortval->type != REDIS_LIST && |
e2641e09 | 160 | sortval->type != REDIS_ZSET) |
161 | { | |
162 | addReply(c,shared.wrongtypeerr); | |
163 | return; | |
164 | } | |
165 | ||
166 | /* Create a list of operations to perform for every sorted element. | |
167 | * Operations can be GET/DEL/INCR/DECR */ | |
168 | operations = listCreate(); | |
169 | listSetFreeMethod(operations,zfree); | |
170 | j = 2; | |
171 | ||
172 | /* Now we need to protect sortval incrementing its count, in the future | |
173 | * SORT may have options able to overwrite/delete keys during the sorting | |
174 | * and the sorted key itself may get destroied */ | |
237194b7 | 175 | if (sortval) |
176 | incrRefCount(sortval); | |
177 | else | |
178 | sortval = createListObject(); | |
e2641e09 | 179 | |
180 | /* The SORT command has an SQL-alike syntax, parse it */ | |
181 | while(j < c->argc) { | |
182 | int leftargs = c->argc-j-1; | |
183 | if (!strcasecmp(c->argv[j]->ptr,"asc")) { | |
184 | desc = 0; | |
185 | } else if (!strcasecmp(c->argv[j]->ptr,"desc")) { | |
186 | desc = 1; | |
187 | } else if (!strcasecmp(c->argv[j]->ptr,"alpha")) { | |
188 | alpha = 1; | |
189 | } else if (!strcasecmp(c->argv[j]->ptr,"limit") && leftargs >= 2) { | |
706b32e0 B |
190 | if ((getLongFromObjectOrReply(c, c->argv[j+1], &limit_start, NULL) != REDIS_OK) || |
191 | (getLongFromObjectOrReply(c, c->argv[j+2], &limit_count, NULL) != REDIS_OK)) return; | |
e2641e09 | 192 | j+=2; |
193 | } else if (!strcasecmp(c->argv[j]->ptr,"store") && leftargs >= 1) { | |
194 | storekey = c->argv[j+1]; | |
195 | j++; | |
196 | } else if (!strcasecmp(c->argv[j]->ptr,"by") && leftargs >= 1) { | |
197 | sortby = c->argv[j+1]; | |
198 | /* If the BY pattern does not contain '*', i.e. it is constant, | |
199 | * we don't need to sort nor to lookup the weight keys. */ | |
200 | if (strchr(c->argv[j+1]->ptr,'*') == NULL) dontsort = 1; | |
201 | j++; | |
202 | } else if (!strcasecmp(c->argv[j]->ptr,"get") && leftargs >= 1) { | |
203 | listAddNodeTail(operations,createSortOperation( | |
204 | REDIS_SORT_GET,c->argv[j+1])); | |
205 | getop++; | |
206 | j++; | |
207 | } else { | |
208 | decrRefCount(sortval); | |
209 | listRelease(operations); | |
210 | addReply(c,shared.syntaxerr); | |
211 | return; | |
212 | } | |
213 | j++; | |
214 | } | |
215 | ||
de79a2ee | 216 | /* If we have STORE we need to force sorting for deterministic output |
217 | * and replication. We use alpha sorting since this is guaranteed to | |
5ddee9b7 | 218 | * work with any input. |
219 | * | |
220 | * We also want determinism when SORT is called from Lua scripts, so | |
221 | * in this case we also force alpha sorting. */ | |
222 | if ((storekey || c->flags & REDIS_LUA_CLIENT) && dontsort) { | |
de79a2ee | 223 | dontsort = 0; |
224 | alpha = 1; | |
225 | sortby = NULL; | |
226 | } | |
227 | ||
dddf5335 | 228 | /* Destructively convert encoded sorted sets for SORT. */ |
237194b7 | 229 | if (sortval->type == REDIS_ZSET) |
230 | zsetConvert(sortval, REDIS_ENCODING_SKIPLIST); | |
dddf5335 | 231 | |
e2641e09 | 232 | /* Load the sorting vector with all the objects to sort */ |
233 | switch(sortval->type) { | |
234 | case REDIS_LIST: vectorlen = listTypeLength(sortval); break; | |
029e5577 | 235 | case REDIS_SET: vectorlen = setTypeSize(sortval); break; |
e2641e09 | 236 | case REDIS_ZSET: vectorlen = dictSize(((zset*)sortval->ptr)->dict); break; |
237 | default: vectorlen = 0; redisPanic("Bad SORT type"); /* Avoid GCC warning */ | |
238 | } | |
239 | vector = zmalloc(sizeof(redisSortObject)*vectorlen); | |
240 | j = 0; | |
241 | ||
242 | if (sortval->type == REDIS_LIST) { | |
243 | listTypeIterator *li = listTypeInitIterator(sortval,0,REDIS_TAIL); | |
244 | listTypeEntry entry; | |
245 | while(listTypeNext(li,&entry)) { | |
246 | vector[j].obj = listTypeGet(&entry); | |
247 | vector[j].u.score = 0; | |
248 | vector[j].u.cmpobj = NULL; | |
249 | j++; | |
250 | } | |
251 | listTypeReleaseIterator(li); | |
029e5577 | 252 | } else if (sortval->type == REDIS_SET) { |
cb72d0f1 | 253 | setTypeIterator *si = setTypeInitIterator(sortval); |
029e5577 | 254 | robj *ele; |
1b508da7 | 255 | while((ele = setTypeNextObject(si)) != NULL) { |
029e5577 PN |
256 | vector[j].obj = ele; |
257 | vector[j].u.score = 0; | |
258 | vector[j].u.cmpobj = NULL; | |
259 | j++; | |
260 | } | |
261 | setTypeReleaseIterator(si); | |
262 | } else if (sortval->type == REDIS_ZSET) { | |
263 | dict *set = ((zset*)sortval->ptr)->dict; | |
e2641e09 | 264 | dictIterator *di; |
265 | dictEntry *setele; | |
e2641e09 | 266 | di = dictGetIterator(set); |
267 | while((setele = dictNext(di)) != NULL) { | |
c0ba9ebe | 268 | vector[j].obj = dictGetKey(setele); |
e2641e09 | 269 | vector[j].u.score = 0; |
270 | vector[j].u.cmpobj = NULL; | |
271 | j++; | |
272 | } | |
273 | dictReleaseIterator(di); | |
029e5577 PN |
274 | } else { |
275 | redisPanic("Unknown type"); | |
e2641e09 | 276 | } |
eab0e26e | 277 | redisAssertWithInfo(c,sortval,j == vectorlen); |
e2641e09 | 278 | |
279 | /* Now it's time to load the right scores in the sorting vector */ | |
280 | if (dontsort == 0) { | |
281 | for (j = 0; j < vectorlen; j++) { | |
282 | robj *byval; | |
283 | if (sortby) { | |
284 | /* lookup value to sort by */ | |
285 | byval = lookupKeyByPattern(c->db,sortby,vector[j].obj); | |
286 | if (!byval) continue; | |
287 | } else { | |
288 | /* use object itself to sort by */ | |
289 | byval = vector[j].obj; | |
290 | } | |
291 | ||
292 | if (alpha) { | |
293 | if (sortby) vector[j].u.cmpobj = getDecodedObject(byval); | |
294 | } else { | |
295 | if (byval->encoding == REDIS_ENCODING_RAW) { | |
2c861050 | 296 | char *eptr; |
297 | ||
298 | vector[j].u.score = strtod(byval->ptr,&eptr); | |
299 | if (eptr[0] != '\0' || errno == ERANGE || | |
300 | isnan(vector[j].u.score)) | |
301 | { | |
302 | int_convertion_error = 1; | |
303 | } | |
e2641e09 | 304 | } else if (byval->encoding == REDIS_ENCODING_INT) { |
305 | /* Don't need to decode the object if it's | |
306 | * integer-encoded (the only encoding supported) so | |
307 | * far. We can just cast it */ | |
308 | vector[j].u.score = (long)byval->ptr; | |
309 | } else { | |
eab0e26e | 310 | redisAssertWithInfo(c,sortval,1 != 1); |
e2641e09 | 311 | } |
312 | } | |
313 | ||
314 | /* when the object was retrieved using lookupKeyByPattern, | |
315 | * its refcount needs to be decreased. */ | |
316 | if (sortby) { | |
317 | decrRefCount(byval); | |
318 | } | |
319 | } | |
320 | } | |
321 | ||
322 | /* We are ready to sort the vector... perform a bit of sanity check | |
323 | * on the LIMIT option too. We'll use a partial version of quicksort. */ | |
324 | start = (limit_start < 0) ? 0 : limit_start; | |
325 | end = (limit_count < 0) ? vectorlen-1 : start+limit_count-1; | |
326 | if (start >= vectorlen) { | |
327 | start = vectorlen-1; | |
328 | end = vectorlen-2; | |
329 | } | |
330 | if (end >= vectorlen) end = vectorlen-1; | |
331 | ||
332 | if (dontsort == 0) { | |
333 | server.sort_desc = desc; | |
334 | server.sort_alpha = alpha; | |
335 | server.sort_bypattern = sortby ? 1 : 0; | |
336 | if (sortby && (start != 0 || end != vectorlen-1)) | |
337 | pqsort(vector,vectorlen,sizeof(redisSortObject),sortCompare, start,end); | |
338 | else | |
339 | qsort(vector,vectorlen,sizeof(redisSortObject),sortCompare); | |
340 | } | |
341 | ||
342 | /* Send command output to the output buffer, performing the specified | |
343 | * GET/DEL/INCR/DECR operations if any. */ | |
344 | outputlen = getop ? getop*(end-start+1) : end-start+1; | |
2c861050 | 345 | if (int_convertion_error) { |
346 | addReplyError(c,"One or more scores can't be converted into double"); | |
347 | } else if (storekey == NULL) { | |
e2641e09 | 348 | /* STORE option not specified, sent the sorting result to client */ |
0537e7bf | 349 | addReplyMultiBulkLen(c,outputlen); |
e2641e09 | 350 | for (j = start; j <= end; j++) { |
351 | listNode *ln; | |
352 | listIter li; | |
353 | ||
354 | if (!getop) addReplyBulk(c,vector[j].obj); | |
355 | listRewind(operations,&li); | |
356 | while((ln = listNext(&li))) { | |
357 | redisSortOperation *sop = ln->value; | |
358 | robj *val = lookupKeyByPattern(c->db,sop->pattern, | |
359 | vector[j].obj); | |
360 | ||
361 | if (sop->type == REDIS_SORT_GET) { | |
362 | if (!val) { | |
363 | addReply(c,shared.nullbulk); | |
364 | } else { | |
365 | addReplyBulk(c,val); | |
366 | decrRefCount(val); | |
367 | } | |
368 | } else { | |
eab0e26e | 369 | /* Always fails */ |
370 | redisAssertWithInfo(c,sortval,sop->type == REDIS_SORT_GET); | |
e2641e09 | 371 | } |
372 | } | |
373 | } | |
374 | } else { | |
375 | robj *sobj = createZiplistObject(); | |
376 | ||
377 | /* STORE option specified, set the sorting result as a List object */ | |
378 | for (j = start; j <= end; j++) { | |
379 | listNode *ln; | |
380 | listIter li; | |
381 | ||
382 | if (!getop) { | |
383 | listTypePush(sobj,vector[j].obj,REDIS_TAIL); | |
384 | } else { | |
385 | listRewind(operations,&li); | |
386 | while((ln = listNext(&li))) { | |
387 | redisSortOperation *sop = ln->value; | |
388 | robj *val = lookupKeyByPattern(c->db,sop->pattern, | |
389 | vector[j].obj); | |
390 | ||
391 | if (sop->type == REDIS_SORT_GET) { | |
392 | if (!val) val = createStringObject("",0); | |
393 | ||
394 | /* listTypePush does an incrRefCount, so we should take care | |
395 | * care of the incremented refcount caused by either | |
396 | * lookupKeyByPattern or createStringObject("",0) */ | |
397 | listTypePush(sobj,val,REDIS_TAIL); | |
398 | decrRefCount(val); | |
399 | } else { | |
eab0e26e | 400 | /* Always fails */ |
401 | redisAssertWithInfo(c,sortval,sop->type == REDIS_SORT_GET); | |
e2641e09 | 402 | } |
403 | } | |
404 | } | |
405 | } | |
a0bf8d0a MK |
406 | if (outputlen) { |
407 | setKey(c->db,storekey,sobj); | |
408 | server.dirty += outputlen; | |
409 | } else if (dbDelete(c->db,storekey)) { | |
410 | signalModifiedKey(c->db,storekey); | |
411 | server.dirty++; | |
412 | } | |
f85cd526 | 413 | decrRefCount(sobj); |
b70d3555 | 414 | addReplyLongLong(c,outputlen); |
e2641e09 | 415 | } |
416 | ||
417 | /* Cleanup */ | |
029e5577 | 418 | if (sortval->type == REDIS_LIST || sortval->type == REDIS_SET) |
e2641e09 | 419 | for (j = 0; j < vectorlen; j++) |
420 | decrRefCount(vector[j].obj); | |
421 | decrRefCount(sortval); | |
422 | listRelease(operations); | |
423 | for (j = 0; j < vectorlen; j++) { | |
424 | if (alpha && vector[j].u.cmpobj) | |
425 | decrRefCount(vector[j].u.cmpobj); | |
426 | } | |
427 | zfree(vector); | |
428 | } | |
429 | ||
430 |