2 * Copyright (c) 2000-2013 Apple Inc. All rights reserved.
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
29 /* direct-mapped partial matching compressor with simple 22/10 split
31 * Compresses buffers using a dictionary based match and partial match
32 * (high bits only or full match) scheme.
34 * Paul Wilson -- wilson@cs.utexas.edu
35 * Scott F. Kaplan -- sfkaplan@cs.utexas.edu
39 /* compressed output format, in memory order
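40 * 1. a HEADER of one-word values (described here as four words, but
 * HEADER_SIZE_IN_WORDS is 3 and the header macros below store only the
 * three offsets ii-iv, in words 0-2; item i has no slot in that layout):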
41 * i. a one-word code saying what algorithm compressed the data
42 * ii. an integer WORD offset into the page saying
43 * where the queue position area starts
44 * iii. an integer WORD offset into the page saying where
45 * the low-bits area starts
46 * iv. an integer WORD offset into the page saying where the low-bits area ends
49 * 2. a 64-word TAGS AREA holding one two-bit tag for each word in
50 * the original (1024-word) page, packed 16 per word
52 * 3. a variable-sized FULL WORDS AREA (always word aligned and an
53 * integral number of words) holding full-word patterns that
54 * were not in the dictionary when encoded (i.e., dictionary misses)
56 * 4. a variable-sized QUEUE POSITIONS AREA (always word aligned and
57 * an integral number of words) holding four-bit queue positions,
58 * packed eight per word.
60 * 5. a variable-sized LOW BITS AREA (always word aligned and an
61 * integral number of words) holding ten-bit low-bit patterns
62 * (from partial matches), packed three per word.
70 /* ============================================================ */
/* WK_word is the unit the compressor works in: source buffers are passed as
 * WK_word pointers and each dictionary element is one WK_word. The
 * BITS_PER_WORD / BYTES_PER_WORD constants describe it as 32 bits / 4 bytes. */
80 typedef unsigned int WK_word
;
82 /* at the moment we have dependencies on the page size. That should
83 * be changed to work for any power-of-two size that's at least 16
84 * words, or something like that
/* Size of one uncompressed page, expressed in words and in bytes
 * (1024 words of 4 bytes each). */
87 #define PAGE_SIZE_IN_WORDS 1024
88 #define PAGE_SIZE_IN_BYTES 4096
/* Number of slots in the match dictionary. */
90 #define DICTIONARY_SIZE 16
93 * macros defining the basic layout of stuff in a page
/* The header occupies the first three words of the compressed buffer
 * (words 0-2, written by the SET_*_AREA_* macros). */
95 #define HEADER_SIZE_IN_WORDS 3
/* Word offset of the tags area; equal to the header size, so the tags
 * area starts directly after the header. */
96 #define TAGS_AREA_OFFSET 3
/* Length of the tags area in words. */
97 #define TAGS_AREA_SIZE 64
/*
 * Header writers, used during compression.
 *
 * Each macro stores into one header word of compr_dest_buf the distance,
 * in buffer elements, from the start of compr_dest_buf to an area boundary:
 *   word 0 - start of the queue positions area
 *   word 1 - start of the low bits area
 *   word 2 - end of the low bits area
 *
 * Every parameter is parenthesized so that compound arguments such as
 * "buf + 1" or a conditional expression expand as one operand.
 * compr_dest_buf is evaluated twice and must therefore be free of side
 * effects.
 */
#define SET_QPOS_AREA_START(compr_dest_buf,qpos_start_addr)  \
        ((compr_dest_buf)[0] = (qpos_start_addr) - (compr_dest_buf))
#define SET_LOW_BITS_AREA_START(compr_dest_buf,lb_start_addr) \
        ((compr_dest_buf)[1] = (lb_start_addr) - (compr_dest_buf))
#define SET_LOW_BITS_AREA_END(compr_dest_buf,lb_end_addr) \
        ((compr_dest_buf)[2] = (lb_end_addr) - (compr_dest_buf))
/*
 * Header readers, only used during decompression.
 *
 * Given the start of a compressed buffer, each macro yields a pointer to an
 * area boundary inside it:
 *   - the tags area sits at a fixed offset (TAGS_AREA_OFFSET) and has a
 *     fixed length (TAGS_AREA_SIZE); the full-word area starts where the
 *     tags area ends;
 *   - the queue positions area starts at the offset stored in word 0 and
 *     ends where the low bits area starts (offset stored in word 1);
 *   - the low bits area ends at the offset stored in word 2.
 *
 * The buffer parameter is parenthesized so that compound arguments such as
 * "buf + 1" expand correctly. It is evaluated more than once by the
 * offset-reading macros, so it must be free of side effects.
 */
#define TAGS_AREA_START(decomp_src_buf)       \
        ((decomp_src_buf) + TAGS_AREA_OFFSET)
#define TAGS_AREA_END(decomp_src_buf)         \
        (TAGS_AREA_START(decomp_src_buf) + TAGS_AREA_SIZE)
#define FULL_WORD_AREA_START(the_buf) TAGS_AREA_END(the_buf)
#define QPOS_AREA_START(decomp_src_buf)       \
        ((decomp_src_buf) + (decomp_src_buf)[0])
#define LOW_BITS_AREA_START(decomp_src_buf)   \
        ((decomp_src_buf) + (decomp_src_buf)[1])
#define QPOS_AREA_END(the_buf) LOW_BITS_AREA_START(the_buf)
#define LOW_BITS_AREA_END(decomp_src_buf)     \
        ((decomp_src_buf) + (decomp_src_buf)[2])
121 /* ============================================================ */
122 /* Types and structures */
124 /* A structure to store each element of the dictionary. */
/* DictionaryElement is an alias for WK_word: each dictionary slot holds a
 * single word rather than an aggregate. */
125 typedef WK_word DictionaryElement
;
127 /* ============================================================ */
/* Geometry of one word. */
130 #define BITS_PER_WORD 32
131 #define BYTES_PER_WORD 4
/* Width of the low-bits field and the mask selecting it; HIGH_BITS() shifts
 * by NUM_LOW_BITS and LOW_BITS() masks with LOW_BITS_MASK. */
132 #define NUM_LOW_BITS 10
133 #define LOW_BITS_MASK 0x3FF
134 #define ALL_ONES_MASK 0xFFFFFFFF
/* Masks keeping the low two / low four bits of every byte in a word.
 * NOTE(review): presumably used when packing tags and queue positions;
 * the packing code is not visible here -- confirm. */
136 #define TWO_BITS_PACKING_MASK 0x03030303
137 #define FOUR_BITS_PACKING_MASK 0x0F0F0F0F
/* Complementary masks splitting a word into its 10 low and 22 high bits. */
138 #define TEN_LOW_BITS_MASK 0x000003FF
139 #define TWENTY_TWO_HIGH_BITS_MASK 0xFFFFFC00
141 /* Tag values. NOTE THAT CODE MAY DEPEND ON THE NUMBERS USED.
142 * Check for conditionals doing arithmetic on these things
143 * before changing them
/* Tag value written by RECORD_PARTIAL. */
146 #define PARTIAL_TAG 0x1
/* Tag value written by RECORD_EXACT. */
148 #define EXACT_TAG 0x3
150 #define BITS_PER_BYTE 8
152 /* ============================================================ */
/* Shift out the low bits of a pattern to give the high bits pattern.
   The stripped patterns are used for initial tests of partial
   matches. The argument is parenthesized so that an expression such
   as (a | b) is shifted as a whole. */
#define HIGH_BITS(word_pattern) ((word_pattern) >> NUM_LOW_BITS)

/* Strip the high bits of a pattern so the low order bits can
   be included in an encoding of a partial match. The argument is
   parenthesized so that an expression such as (a | b) is masked
   as a whole. */
#define LOW_BITS(word_pattern) ((word_pattern) & LOW_BITS_MASK)
/*
 * Debug tracing hooks.
 *
 * When the debug guard is defined the macros forward to printf; otherwise
 * they expand to nothing, so their arguments are not evaluated at all.
 * Without a guard the two pairs of definitions conflict and the printf
 * variants can never take effect.
 *
 * NOTE(review): the guard symbol DEBUG_WK is an assumption -- confirm it
 * against the build configuration. The debug variants use `string` as the
 * printf format, so only trusted format strings may be passed, and printf
 * must be declared wherever a debug build expands them.
 */
#if defined DEBUG_WK
#define DEBUG_PRINT_1(string) printf (string)
#define DEBUG_PRINT_2(string,value) printf(string, value)
#else
#define DEBUG_PRINT_1(string)
#define DEBUG_PRINT_2(string, value)
#endif
172 /* Set up the dictionary before performing compression or
173 decompression. Each element is a single word (DictionaryElement),
174 and every entry assigned here is preloaded with the value 1. */
/* Expands to a brace-opened run of assignments to an array named
 * `dictionary`, which must be in scope and assignable wherever the macro
 * is expanded. */
175 #define PRELOAD_DICTIONARY { \
186 dictionary[10] = 1; \
187 dictionary[11] = 1; \
188 dictionary[12] = 1; \
189 dictionary[13] = 1; \
190 dictionary[14] = 1; \
191 dictionary[15] = 1; \
194 /* these are the constants for the hash function lookup table.
195 * Only zero maps to zero. The rest of the table is the result
196 * of appending 17 randomizations of the multiples of 4 from
197 * 4 to 60. Generated by a Scheme script in hash.scm.
/* Initializer contents for the hash lookup table: 16 rows of 16 values.
 * The first value is 0; every other value is a non-zero multiple of 4 no
 * larger than 60.
 * NOTE(review): presumably this initializes hashLookupTable, which
 * HASH_TO_DICT_BYTE_OFFSET indexes with an 8-bit value; the table's
 * definition is not visible here -- confirm. */
199 #define HASH_LOOKUP_TABLE_CONTENTS { \
200 0, 52, 8, 56, 16, 12, 28, 20, 4, 36, 48, 24, 44, 40, 32, 60, \
201 8, 12, 28, 20, 4, 60, 16, 36, 24, 48, 44, 32, 52, 56, 40, 12, \
202 8, 48, 16, 52, 60, 28, 56, 32, 20, 24, 36, 40, 44, 4, 8, 40, \
203 60, 32, 20, 44, 4, 36, 52, 24, 16, 56, 48, 12, 28, 16, 8, 40, \
204 36, 28, 32, 12, 4, 44, 52, 20, 24, 48, 60, 56, 40, 48, 8, 32, \
205 28, 36, 4, 44, 20, 56, 60, 24, 52, 16, 12, 12, 4, 48, 20, 8, \
206 52, 16, 60, 24, 36, 44, 28, 56, 40, 32, 36, 20, 24, 60, 40, 44, \
207 52, 16, 32, 4, 48, 8, 28, 56, 12, 28, 32, 40, 52, 36, 16, 20, \
208 48, 8, 4, 60, 24, 56, 44, 12, 8, 36, 24, 28, 16, 60, 20, 56, \
209 32, 40, 48, 12, 4, 44, 52, 44, 40, 12, 56, 8, 36, 24, 60, 28, \
210 48, 4, 32, 20, 16, 52, 60, 12, 24, 36, 8, 4, 16, 56, 48, 44, \
211 40, 52, 32, 20, 28, 32, 12, 36, 28, 24, 56, 40, 16, 52, 44, 4, \
212 20, 60, 8, 48, 48, 52, 12, 20, 32, 44, 36, 28, 4, 40, 24, 8, \
213 56, 60, 16, 36, 32, 8, 40, 4, 52, 24, 44, 20, 12, 28, 48, 56, \
214 16, 60, 4, 52, 60, 48, 20, 16, 56, 44, 24, 8, 40, 12, 32, 28, \
215 36, 24, 32, 12, 4, 20, 16, 60, 36, 28, 8, 52, 40, 48, 44, 56 \
/*
 * Map a word pattern to its hash table entry.
 *
 * The pattern's low-bits field (NUM_LOW_BITS wide) is shifted out and the
 * next eight bits index hashLookupTable, so two words that differ only in
 * their low bits select the same entry. The shift count is taken from
 * NUM_LOW_BITS rather than repeated as a literal, keeping the hash in step
 * with HIGH_BITS()/LOW_BITS().
 */
#define HASH_TO_DICT_BYTE_OFFSET(pattern)   \
        (hashLookupTable[((pattern) >> NUM_LOW_BITS) & 0xFF])

/* Lookup table indexed by HASH_TO_DICT_BYTE_OFFSET; defined elsewhere. */
extern const char hashLookupTable[];
/* EMIT... macros emit bytes or words into the intermediate arrays.
 *
 * Each stores one value through fill_ptr and then advances fill_ptr by one
 * element. fill_ptr must be a modifiable pointer lvalue. Both parameters
 * are parenthesized so compound arguments expand as a single operand.
 */
#define EMIT_BYTE(fill_ptr, byte_value) {*(fill_ptr)++ = (byte_value); }
#define EMIT_WORD(fill_ptr,word_value) {*(fill_ptr)++ = (word_value); }

/* RECORD... macros record the results of modeling in the intermediate
 * arrays.
 *
 * They append through the pointers next_tag, next_qp, next_low_bits and
 * next_full_patt, which must be in scope at the point of use. Every
 * RECORD macro expands to a single brace-enclosed block, so a use such as
 * "if (cond) RECORD_EXACT(q);" guards the whole record rather than only
 * its tag byte.
 */
#define RECORD_ZERO { EMIT_BYTE(next_tag,ZERO_TAG); }

#define RECORD_EXACT(queue_posn) { \
        EMIT_BYTE(next_tag,EXACT_TAG); \
        EMIT_BYTE(next_qp,(queue_posn)); }

#define RECORD_PARTIAL(queue_posn,low_bits_pattern) { \
        EMIT_BYTE(next_tag,PARTIAL_TAG); \
        EMIT_BYTE(next_qp,(queue_posn)); \
        EMIT_WORD(next_low_bits,(low_bits_pattern)) }

#define RECORD_MISS(word_pattern) { \
        EMIT_BYTE(next_tag,MISS_TAG); \
        EMIT_WORD(next_full_patt,(word_pattern)); }
/* Size of the scratch buffer used by the WKdm routines.
 * NOTE(review): presumably in bytes (the value equals PAGE_SIZE_IN_BYTES);
 * the consumers are not visible here -- confirm. */
247 #define WKdm_SCRATCH_BUF_SIZE 4096
250 WKdm_decompress_new (WK_word
* src_buf
,
255 WKdm_compress_new (WK_word
* src_buf
,