git.saurik.com Git - apple/xnu.git/blob - libkern/kxld/WKdmDecompress.c

1 #include <sys/cdefs.h>

2 #include "WKdm.h"

4 /***************************************************************************

5 * THE UNPACKING ROUTINES should GO HERE

6 */

8 const char hashLookupTable[] = HASH_LOOKUP_TABLE_CONTENTS;

10 #if 0

11 #define GET_NEXT_TAG tags[tagsIndex++]

12 #define GET_NEXT_FULL_PATTERN fullPatterns[fullPatternsIndex++]

13 #define GET_NEXT_LOW_BITS lowBits[lowBitsIndex++]

14 #define GET_NEXT_DICTIONARY_INDEX dictionaryIndices[dictionaryIndicesIndex++]

15 #endif

17 /* WK_unpack_2bits takes any number of words containing 16 two-bit values

18 * and unpacks them into four times as many words containg those

19 * two bit values as bytes (with the low two bits of each byte holding

20 * the actual value.

21 */

22 static WK_word*

23 WK_unpack_2bits(WK_word *input_buf,

24 WK_word *input_end,

25 WK_word *output_buf)

26 {

27 WK_word *input_next = input_buf;

28 WK_word *output_next = output_buf;

29 WK_word packing_mask = TWO_BITS_PACKING_MASK;

31 /* loop to repeatedly grab one input word and unpack it into

32 * 4 output words. This loop could be unrolled a little---it's

33 * designed to be easy to do that.

34 */

35 while (input_next < input_end) {

36 WK_word temp = input_next[0];

                 DEBUG_PRINT_2("Unpacked tags word: %.8x\n", temp);

                 output_next[0] = temp & packing_mask;

                 output_next[1] = (temp >> 2) & packing_mask;

                 output_next[2] = (temp >> 4) & packing_mask;

                 output_next[3] = (temp >> 6) & packing_mask;

43 output_next += 4;

44 input_next++;

45 }

47 return output_next;

48 }

50 /* unpack four bits consumes any number of words (between input_buf

51 * and input_end) holding 8 4-bit values per word, and unpacks them

52 * into twice as many words, with each value in a separate byte.

53 * (The four-bit values occupy the low halves of the bytes in the

54 * result).

55 */

56 static WK_word*

57 WK_unpack_4bits(WK_word *input_buf,

58 WK_word *input_end,

59 WK_word *output_buf)

60 {

61 WK_word *input_next = input_buf;

62 WK_word *output_next = output_buf;

63 WK_word packing_mask = FOUR_BITS_PACKING_MASK;

66 /* loop to repeatedly grab one input word and unpack it into

67 * 4 output words. This loop should probably be unrolled

68 * a little---it's designed to be easy to do that.

69 */

70 while (input_next < input_end) {

71 WK_word temp = input_next[0];

                 DEBUG_PRINT_2("Unpacked dictionary indices word: %.8x\n", temp);

                 output_next[0] = temp & packing_mask;

                 output_next[1] = (temp >> 4) & packing_mask;

76 output_next += 2;

77 input_next++;

78 }

80 return output_next;

81 }

83 /* unpack_3_tenbits unpacks three 10-bit items from (the low 30 bits of)

84 * a 32-bit word

85 */

86 static WK_word*

87 WK_unpack_3_tenbits(WK_word *input_buf,

88 WK_word *input_end,

89 WK_word *output_buf)

90 {

91 WK_word *input_next = input_buf;

92 WK_word *output_next = output_buf;

93 WK_word packing_mask = LOW_BITS_MASK;

95 /* loop to fetch words of input, splitting each into three

96 * words of output with 10 meaningful low bits. This loop

97 * probably ought to be unrolled and maybe coiled

98 */

99 while (input_next < input_end) {

100 WK_word temp = input_next[0];

101

                 output_next[0] = temp & packing_mask;

                 output_next[1] = (temp >> 10) & packing_mask;

                 output_next[2] = temp >> 20;

105

106 input_next++;

107 output_next += 3;

108 }

109

110 return output_next;

111 }

112

113 /*********************************************************************

114 * WKdm_decompress --- THE DECOMPRESSOR

115 * Expects WORD pointers to the source and destination buffers

116 * and a page size in words. The page size had better be 1024 unless

117 * somebody finds the places that are dependent on the page size and

118 * fixes them

119 */

120

121 void

122 WKdm_decompress(WK_word* src_buf,

123 WK_word* dest_buf,

124 __unused unsigned int words)

125 {

126 DictionaryElement dictionary[DICTIONARY_SIZE];

127

128 /* arrays that hold output data in intermediate form during modeling */

129 /* and whose contents are packed into the actual output after modeling */

130

131 /* sizes of these arrays should be increased if you want to compress

132 * pages larger than 4KB

133 */

134 WK_word tempTagsArray[300]; /* tags for everything */

135 WK_word tempQPosArray[300]; /* queue positions for matches */

136 WK_word tempLowBitsArray[1200]; /* low bits for partial matches */

137

138 PRELOAD_DICTIONARY;

139

140 #ifdef WK_DEBUG

         printf("\nIn DECOMPRESSOR\n");

         printf("tempTagsArray is at %p\n", tempTagsArray);

         printf("tempQPosArray is at %p\n", tempQPosArray);

         printf("tempLowBitsArray is at %p\n", tempLowBitsArray);

145

         printf(" first four words of source buffer are:\n");

         printf("   %u\n   %u\n   %u\n   %u\n",

             src_buf[0], src_buf[1], src_buf[2], src_buf[3]);

149

150 { int i;

           WK_word *arr = (src_buf + TAGS_AREA_OFFSET + (PAGE_SIZE_IN_WORDS / 16));

152

           printf("  first 20 full patterns are: \n");

           for (i = 0; i < 20; i++) {

                   printf(" %d", arr[i]);

156 }

           printf("\n");}

158 #endif

159

         WK_unpack_2bits(TAGS_AREA_START(src_buf),

161 TAGS_AREA_END(src_buf),

162 tempTagsArray);

163

164 #ifdef WK_DEBUG

165 { int i;

           char* arr = (char *) tempTagsArray;

167

           printf("  first 200 tags are: \n");

           for (i = 0; i < 200; i++) {

                   printf(" %d", arr[i]);

171 }

           printf("\n");}

173 #endif

174

         WK_unpack_4bits(QPOS_AREA_START(src_buf),

176 QPOS_AREA_END(src_buf),

177 tempQPosArray);

178

179 #ifdef WK_DEBUG

180 { int i;

           char* arr = (char *) tempQPosArray;

182

           printf("  first 200 queue positions are: \n");

           for (i = 0; i < 200; i++) {

                   printf(" %d", arr[i]);

186 }

           printf("\n");}

188 #endif

189

         WK_unpack_3_tenbits(LOW_BITS_AREA_START(src_buf),

191 LOW_BITS_AREA_END(src_buf),

192 tempLowBitsArray);

193

194 #ifdef WK_DEBUG

         printf("AFTER UNPACKING, about to enter main block \n");

196 #endif

197

198 {

                 char *next_tag = (char *) tempTagsArray;

200 char *tags_area_end =

                     ((char *) tempTagsArray) + PAGE_SIZE_IN_WORDS;

                 char *next_q_pos = (char *) tempQPosArray;

203 WK_word *next_low_bits = tempLowBitsArray;

                 WK_word *next_full_word = FULL_WORD_AREA_START(src_buf);

205

206 WK_word *next_output = dest_buf;

207

208 #ifdef WK_DEBUG

                 printf("next_output is %u\n", next_output);

210

                 printf("next_tag is %u \n", next_tag);

                 printf("tags_area_end is %u\n", tags_area_end);

                 printf("next_q_pos is %u\n", next_q_pos);

                 printf("next_low_bits is %u\n", next_low_bits);

                 printf("next_full_word is %u\n", next_full_word);

216 #endif

217

218 /* this loop should probably be unrolled. Maybe we should unpack

219 * as 4 bit values, giving two consecutive tags, and switch on

220 * that 16 ways to decompress 2 words at a whack

221 */

222 while (next_tag < tags_area_end) {

                         char tag = next_tag[0];

224

225 switch (tag) {

226 case ZERO_TAG: {

227 *next_output = 0;

228 break;

229 }

230 case EXACT_TAG: {

231 WK_word *dict_location = dictionary + *(next_q_pos++);

232 /* no need to replace dict. entry if matched exactly */

233 *next_output = *dict_location;

234 break;

235 }

236 case PARTIAL_TAG: {

237 WK_word *dict_location = dictionary + *(next_q_pos++);

238 {

239 WK_word temp = *dict_location;

240

241 /* strip out low bits */

242 temp = ((temp >> NUM_LOW_BITS) << NUM_LOW_BITS);

243

244 /* add in stored low bits from temp array */

245 temp = temp | *(next_low_bits++);

246

247 *dict_location = temp; /* replace old value in dict. */

248 *next_output = temp; /* and echo it to output */

249 }

250 break;

251 }

252 case MISS_TAG: {

253 WK_word missed_word = *(next_full_word++);

254 WK_word *dict_location =

255 (WK_word *)

                                     ((void *) (((char *) dictionary) + HASH_TO_DICT_BYTE_OFFSET(missed_word)));

257 *dict_location = missed_word;

258 *next_output = missed_word;

259 break;

260 }

261 }

262 next_tag++;

263 next_output++;

264 }

265

266 #ifdef WK_DEBUG

                 printf("AFTER DECOMPRESSING\n");

                 printf("next_output is %p\n", next_output);

                 printf("next_tag is %p\n", next_tag);

                 printf("next_full_word is %p\n", next_full_word);

                 printf("next_q_pos is %p\n", next_q_pos);

272 #endif

273 }

274 }