Parolin 0.7.9 6796
Console (soon DLLs) to do a tar like job
Loading...
Searching...
No Matches
range_encoder.h
Go to the documentation of this file.
1// SPDX-License-Identifier: 0BSD
2
4//
8// Authors: Igor Pavlov
9// Lasse Collin
10//
12
13#ifndef LZMA_RANGE_ENCODER_H
14#define LZMA_RANGE_ENCODER_H
15
16#include "range_common.h"
17#include "price.h"
18
19
23#define RC_SYMBOLS_MAX 53
24
25
26typedef struct {
27 uint64_t low;
28 uint64_t cache_size;
29 uint32_t range;
30 uint8_t cache;
31
33 uint64_t out_total;
34
36 size_t count;
37
39 size_t pos;
40
42 enum {
45 RC_DIRECT_0,
46 RC_DIRECT_1,
47 RC_FLUSH,
48 } symbols[RC_SYMBOLS_MAX];
49
52
54
55
56static inline void
58{
59 rc->low = 0;
60 rc->cache_size = 1;
61 rc->range = UINT32_MAX;
62 rc->cache = 0;
63 rc->out_total = 0;
64 rc->count = 0;
65 rc->pos = 0;
66}
67
68
69static inline void
70rc_forget(lzma_range_encoder *rc)
71{
72 // This must not be called when rc_encode() is partially done.
73 assert(rc->pos == 0);
74 rc->count = 0;
75}
76
77
78static inline void
79rc_bit(lzma_range_encoder *rc, probability *prob, uint32_t bit)
80{
81 rc->symbols[rc->count] = bit;
82 rc->probs[rc->count] = prob;
83 ++rc->count;
84}
85
86
87static inline void
88rc_bittree(lzma_range_encoder *rc, probability *probs,
89 uint32_t bit_count, uint32_t symbol)
90{
91 uint32_t model_index = 1;
92
93 do {
94 const uint32_t bit = (symbol >> --bit_count) & 1;
95 rc_bit(rc, &probs[model_index], bit);
96 model_index = (model_index << 1) + bit;
97 } while (bit_count != 0);
98}
99
100
101static inline void
102rc_bittree_reverse(lzma_range_encoder *rc, probability *probs,
103 uint32_t bit_count, uint32_t symbol)
104{
105 uint32_t model_index = 1;
106
107 do {
108 const uint32_t bit = symbol & 1;
109 symbol >>= 1;
110 rc_bit(rc, &probs[model_index], bit);
111 model_index = (model_index << 1) + bit;
112 } while (--bit_count != 0);
113}
114
115
116static inline void
118 uint32_t value, uint32_t bit_count)
119{
120 do {
121 rc->symbols[rc->count++]
122 = RC_DIRECT_0 + ((value >> --bit_count) & 1);
123 } while (bit_count != 0);
124}
125
126
127static inline void
128rc_flush(lzma_range_encoder *rc)
129{
130 for (size_t i = 0; i < 5; ++i)
131 rc->symbols[rc->count++] = RC_FLUSH;
132}
133
134
135static inline bool
136rc_shift_low(lzma_range_encoder *rc,
137 uint8_t *out, size_t *out_pos, size_t out_size)
138{
139 if ((uint32_t)(rc->low) < (uint32_t)(0xFF000000)
140 || (uint32_t)(rc->low >> 32) != 0) {
141 do {
142 if (*out_pos == out_size)
143 return true;
144
145 out[*out_pos] = rc->cache + (uint8_t)(rc->low >> 32);
146 ++*out_pos;
147 ++rc->out_total;
148 rc->cache = 0xFF;
149
150 } while (--rc->cache_size != 0);
151
152 rc->cache = (rc->low >> 24) & 0xFF;
153 }
154
155 ++rc->cache_size;
156 rc->low = (rc->low & 0x00FFFFFF) << RC_SHIFT_BITS;
157
158 return false;
159}
160
161
162// NOTE: The last two arguments are uint64_t instead of size_t because in
163// the dummy version these refer to the size of the whole range-encoded
164// output stream, not just to the currently available output buffer space.
165static inline bool
166rc_shift_low_dummy(uint64_t *low, uint64_t *cache_size, uint8_t *cache,
167 uint64_t *out_pos, uint64_t out_size)
168{
169 if ((uint32_t)(*low) < (uint32_t)(0xFF000000)
170 || (uint32_t)(*low >> 32) != 0) {
171 do {
172 if (*out_pos == out_size)
173 return true;
174
175 ++*out_pos;
176 *cache = 0xFF;
177
178 } while (--*cache_size != 0);
179
180 *cache = (*low >> 24) & 0xFF;
181 }
182
183 ++*cache_size;
184 *low = (*low & 0x00FFFFFF) << RC_SHIFT_BITS;
185
186 return false;
187}
188
189
190static inline bool
191rc_encode(lzma_range_encoder *rc,
192 uint8_t *out, size_t *out_pos, size_t out_size)
193{
195
196 while (rc->pos < rc->count) {
197 // Normalize
198 if (rc->range < RC_TOP_VALUE) {
199 if (rc_shift_low(rc, out, out_pos, out_size))
200 return true;
201
202 rc->range <<= RC_SHIFT_BITS;
203 }
204
205 // Encode a bit
206 switch (rc->symbols[rc->pos]) {
207 case RC_BIT_0: {
208 probability prob = *rc->probs[rc->pos];
209 rc->range = (rc->range >> RC_BIT_MODEL_TOTAL_BITS)
210 * prob;
211 prob += (RC_BIT_MODEL_TOTAL - prob) >> RC_MOVE_BITS;
212 *rc->probs[rc->pos] = prob;
213 break;
214 }
215
216 case RC_BIT_1: {
217 probability prob = *rc->probs[rc->pos];
218 const uint32_t bound = prob * (rc->range
220 rc->low += bound;
221 rc->range -= bound;
222 prob -= prob >> RC_MOVE_BITS;
223 *rc->probs[rc->pos] = prob;
224 break;
225 }
226
227 case RC_DIRECT_0:
228 rc->range >>= 1;
229 break;
230
231 case RC_DIRECT_1:
232 rc->range >>= 1;
233 rc->low += rc->range;
234 break;
235
236 case RC_FLUSH:
237 // Prevent further normalizations.
238 rc->range = UINT32_MAX;
239
240 // Flush the last five bytes (see rc_flush()).
241 do {
242 if (rc_shift_low(rc, out, out_pos, out_size))
243 return true;
244 } while (++rc->pos < rc->count);
245
246 // Reset the range encoder so we are ready to continue
247 // encoding if we weren't finishing the stream.
248 rc_reset(rc);
249 return false;
250
251 default:
252 assert(0);
253 break;
254 }
255
256 ++rc->pos;
257 }
258
259 rc->count = 0;
260 rc->pos = 0;
261
262 return false;
263}
264
265
266static inline bool
267rc_encode_dummy(const lzma_range_encoder *rc, uint64_t out_limit)
268{
270
271 uint64_t low = rc->low;
272 uint64_t cache_size = rc->cache_size;
273 uint32_t range = rc->range;
274 uint8_t cache = rc->cache;
275 uint64_t out_pos = rc->out_total;
276
277 size_t pos = rc->pos;
278
279 while (true) {
280 // Normalize
281 if (range < RC_TOP_VALUE) {
282 if (rc_shift_low_dummy(&low, &cache_size, &cache,
283 &out_pos, out_limit))
284 return true;
285
286 range <<= RC_SHIFT_BITS;
287 }
288
289 // This check is here because the normalization above must
290 // be done before flushing the last bytes.
291 if (pos == rc->count)
292 break;
293
294 // Encode a bit
295 switch (rc->symbols[pos]) {
296 case RC_BIT_0: {
297 probability prob = *rc->probs[pos];
298 range = (range >> RC_BIT_MODEL_TOTAL_BITS)
299 * prob;
300 break;
301 }
302
303 case RC_BIT_1: {
304 probability prob = *rc->probs[pos];
305 const uint32_t bound = prob * (range
307 low += bound;
308 range -= bound;
309 break;
310 }
311
312 case RC_DIRECT_0:
313 range >>= 1;
314 break;
315
316 case RC_DIRECT_1:
317 range >>= 1;
318 low += range;
319 break;
320
321 case RC_FLUSH:
322 default:
323 assert(0);
324 break;
325 }
326
327 ++pos;
328 }
329
330 // Flush the last bytes. This isn't in rc->symbols[] so we do
331 // it after the above loop to take into account the size of
332 // the flushing that will be done at the end of the stream.
333 for (pos = 0; pos < 5; ++pos) {
334 if (rc_shift_low_dummy(&low, &cache_size,
335 &cache, &out_pos, out_limit))
336 return true;
337 }
338
339 return false;
340}
341
342
343static inline uint64_t
344rc_pending(const lzma_range_encoder *rc)
345{
346 return rc->cache_size + 5 - 1;
347}
348
349#endif
#define RC_BIT_1(p, prob)
Definition LzmaEnc.c:808
#define RC_BIT_0(p, prob)
Definition LzmaEnc.c:804
#define assert(condition)
Definition lz4.c:273
Definition range_encoder.h:27
probability * probs[RC_SYMBOLS_MAX]
Probabilities associated with RC_BIT_0 or RC_BIT_1.
Definition range_encoder.h:52
uint64_t cache_size
Definition range_encoder.h:29
size_t pos
rc_encode()'s position in the tables
Definition range_encoder.h:40
uint32_t range
Definition range_encoder.h:30
enum lzma_range_encoder::@106 symbols[RC_SYMBOLS_MAX]
Symbols to encode.
uint8_t cache
Definition range_encoder.h:31
size_t count
Number of symbols in the tables.
Definition range_encoder.h:37
uint64_t out_total
Number of bytes written out by rc_encode() -> rc_shift_low()
Definition range_encoder.h:34
uint64_t low
Definition range_encoder.h:28
const lzma_allocator const uint8_t size_t uint8_t size_t * out_pos
Definition block.h:528
const lzma_allocator const uint8_t size_t uint8_t * out
Definition block.h:528
lzma_index ** i
Definition index.h:629
#define UINT32_MAX
Definition lzma.h:158
uint16_t probability
Type of probabilities used with range coder.
Definition range_common.h:69
#define RC_BIT_MODEL_TOTAL_BITS
Definition range_common.h:27
#define RC_MOVE_BITS
Definition range_common.h:29
#define RC_SHIFT_BITS
Definition range_common.h:24
#define RC_TOP_VALUE
Definition range_common.h:26
#define RC_BIT_MODEL_TOTAL
Definition range_common.h:28
#define rc_direct(dest, seq)
Decode a bit without using a probability.
Definition range_decoder.h:171
#define rc_bit(prob, action0, action1, seq)
Definition range_decoder.h:154
#define rc_reset(range_decoder)
Resets the range decoder structure.
Definition range_decoder.h:69
#define RC_SYMBOLS_MAX
Definition range_encoder.h:24
Probability price calculation.
Common things for range encoder and decoder.