1 |
/* lzo1x_9x.c -- implementation of the LZO1X-999 compression algorithm
|
2 |
|
3 |
This file is part of the LZO real-time data compression library.
|
4 |
|
5 |
Copyright (C) 2008 Markus Franz Xaver Johannes Oberhumer
|
6 |
Copyright (C) 2007 Markus Franz Xaver Johannes Oberhumer
|
7 |
Copyright (C) 2006 Markus Franz Xaver Johannes Oberhumer
|
8 |
Copyright (C) 2005 Markus Franz Xaver Johannes Oberhumer
|
9 |
Copyright (C) 2004 Markus Franz Xaver Johannes Oberhumer
|
10 |
Copyright (C) 2003 Markus Franz Xaver Johannes Oberhumer
|
11 |
Copyright (C) 2002 Markus Franz Xaver Johannes Oberhumer
|
12 |
Copyright (C) 2001 Markus Franz Xaver Johannes Oberhumer
|
13 |
Copyright (C) 2000 Markus Franz Xaver Johannes Oberhumer
|
14 |
Copyright (C) 1999 Markus Franz Xaver Johannes Oberhumer
|
15 |
Copyright (C) 1998 Markus Franz Xaver Johannes Oberhumer
|
16 |
Copyright (C) 1997 Markus Franz Xaver Johannes Oberhumer
|
17 |
Copyright (C) 1996 Markus Franz Xaver Johannes Oberhumer
|
18 |
All Rights Reserved.
|
19 |
|
20 |
The LZO library is free software; you can redistribute it and/or
|
21 |
modify it under the terms of the GNU General Public License as
|
22 |
published by the Free Software Foundation; either version 2 of
|
23 |
the License, or (at your option) any later version.
|
24 |
|
25 |
The LZO library is distributed in the hope that it will be useful,
|
26 |
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
27 |
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
28 |
GNU General Public License for more details.
|
29 |
|
30 |
You should have received a copy of the GNU General Public License
|
31 |
along with the LZO library; see the file COPYING.
|
32 |
If not, write to the Free Software Foundation, Inc.,
|
33 |
51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
|
34 |
|
35 |
Markus F.X.J. Oberhumer
|
36 |
<markus@oberhumer.com>
|
37 |
http://www.oberhumer.com/opensource/lzo/
|
38 |
*/
|
39 |
|
40 |
|
41 |
#if !defined(LZO1X) && !defined(LZO1Y) && !defined(LZO1Z)
|
42 |
# define LZO1X
|
43 |
#endif
|
44 |
|
45 |
#if defined(LZO1X)
|
46 |
# include "config1x.h"
|
47 |
#elif defined(LZO1Y)
|
48 |
# include "config1y.h"
|
49 |
#elif defined(LZO1Z)
|
50 |
# include "config1z.h"
|
51 |
#else
|
52 |
# error
|
53 |
#endif
|
54 |
|
55 |
|
56 |
/***********************************************************************
|
57 |
//
|
58 |
************************************************************************/
|
59 |
|
60 |
#define N M4_MAX_OFFSET /* size of ring buffer */
|
61 |
#define THRESHOLD 1 /* lower limit for match length */
|
62 |
#define F 2048 /* upper limit for match length */
|
63 |
|
64 |
#define SWD_BEST_OFF (LZO_MAX3( M2_MAX_LEN, M3_MAX_LEN, M4_MAX_LEN ) + 1)
|
65 |
|
66 |
#if defined(LZO1X)
|
67 |
# define LZO_COMPRESS_T lzo1x_999_t
|
68 |
# define lzo_swd_t lzo1x_999_swd_t
|
69 |
#elif defined(LZO1Y)
|
70 |
# define LZO_COMPRESS_T lzo1y_999_t
|
71 |
# define lzo_swd_t lzo1y_999_swd_t
|
72 |
# define lzo1x_999_compress_internal lzo1y_999_compress_internal
|
73 |
# define lzo1x_999_compress_dict lzo1y_999_compress_dict
|
74 |
# define lzo1x_999_compress_level lzo1y_999_compress_level
|
75 |
# define lzo1x_999_compress lzo1y_999_compress
|
76 |
#elif defined(LZO1Z)
|
77 |
# define LZO_COMPRESS_T lzo1z_999_t
|
78 |
# define lzo_swd_t lzo1z_999_swd_t
|
79 |
# define lzo1x_999_compress_internal lzo1z_999_compress_internal
|
80 |
# define lzo1x_999_compress_dict lzo1z_999_compress_dict
|
81 |
# define lzo1x_999_compress_level lzo1z_999_compress_level
|
82 |
# define lzo1x_999_compress lzo1z_999_compress
|
83 |
#else
|
84 |
# error
|
85 |
#endif
|
86 |
|
87 |
#if 0
|
88 |
# define HEAD3(b,p) \
|
89 |
((((((lzo_xint)b[p]<<3)^b[p+1])<<3)^b[p+2]) & (SWD_HSIZE-1))
|
90 |
#endif
|
91 |
#if 0 && defined(LZO_UNALIGNED_OK_4) && defined(LZO_ABI_LITTLE_ENDIAN)
|
92 |
# define HEAD3(b,p) \
|
93 |
(((* (lzo_uint32p) &b[p]) ^ ((* (lzo_uint32p) &b[p])>>10)) & (SWD_HSIZE-1))
|
94 |
#endif
|
95 |
|
96 |
#include "lzo_mchw.ch"
|
97 |
|
98 |
|
99 |
/* this is a public functions, but there is no prototype in a header file */
|
100 |
LZO_EXTERN(int)
|
101 |
lzo1x_999_compress_internal ( const lzo_bytep in , lzo_uint in_len,
|
102 |
lzo_bytep out, lzo_uintp out_len,
|
103 |
lzo_voidp wrkmem,
|
104 |
const lzo_bytep dict, lzo_uint dict_len,
|
105 |
lzo_callback_p cb,
|
106 |
int try_lazy,
|
107 |
lzo_uint good_length,
|
108 |
lzo_uint max_lazy,
|
109 |
lzo_uint nice_length,
|
110 |
lzo_uint max_chain,
|
111 |
lzo_uint32 flags );
|
112 |
|
113 |
|
114 |
/***********************************************************************
|
115 |
//
|
116 |
************************************************************************/
|
117 |
|
118 |
static lzo_bytep
|
119 |
code_match ( LZO_COMPRESS_T *c, lzo_bytep op, lzo_uint m_len, lzo_uint m_off )
|
120 |
{
|
121 |
lzo_uint x_len = m_len;
|
122 |
lzo_uint x_off = m_off;
|
123 |
|
124 |
c->match_bytes += (unsigned long) m_len;
|
125 |
|
126 |
#if 0
|
127 |
/*
|
128 |
static lzo_uint last_m_len = 0, last_m_off = 0;
|
129 |
static lzo_uint prev_m_off[4];
|
130 |
static int prev_m_off_ptr = 0;
|
131 |
int i;
|
132 |
|
133 |
//if (m_len >= 3 && m_len <= M2_MAX_LEN && m_off <= M2_MAX_OFFSET)
|
134 |
if (m_len >= 3 && m_len <= M2_MAX_LEN)
|
135 |
{
|
136 |
//if (m_len == last_m_len && m_off == last_m_off)
|
137 |
//printf("last_m_len + last_m_off\n");
|
138 |
//else
|
139 |
if (m_off == last_m_off)
|
140 |
printf("last_m_off\n");
|
141 |
else
|
142 |
{
|
143 |
for (i = 0; i < 4; i++)
|
144 |
if (m_off == prev_m_off[i])
|
145 |
printf("prev_m_off %d: %5ld\n",i,(long)m_off);
|
146 |
}
|
147 |
}
|
148 |
last_m_len = m_len;
|
149 |
last_m_off = prev_m_off[prev_m_off_ptr] = m_off;
|
150 |
prev_m_off_ptr = (prev_m_off_ptr + 1) & 3;
|
151 |
*/
|
152 |
#endif
|
153 |
|
154 |
assert(op > c->out);
|
155 |
if (m_len == 2)
|
156 |
{
|
157 |
assert(m_off <= M1_MAX_OFFSET);
|
158 |
assert(c->r1_lit > 0); assert(c->r1_lit < 4);
|
159 |
m_off -= 1;
|
160 |
#if defined(LZO1Z)
|
161 |
*op++ = LZO_BYTE(M1_MARKER | (m_off >> 6));
|
162 |
*op++ = LZO_BYTE(m_off << 2);
|
163 |
#else
|
164 |
*op++ = LZO_BYTE(M1_MARKER | ((m_off & 3) << 2));
|
165 |
*op++ = LZO_BYTE(m_off >> 2);
|
166 |
#endif
|
167 |
c->m1a_m++;
|
168 |
}
|
169 |
#if defined(LZO1Z)
|
170 |
else if (m_len <= M2_MAX_LEN && (m_off <= M2_MAX_OFFSET || m_off == c->last_m_off))
|
171 |
#else
|
172 |
else if (m_len <= M2_MAX_LEN && m_off <= M2_MAX_OFFSET)
|
173 |
#endif
|
174 |
{
|
175 |
assert(m_len >= 3);
|
176 |
#if defined(LZO1X)
|
177 |
m_off -= 1;
|
178 |
*op++ = LZO_BYTE(((m_len - 1) << 5) | ((m_off & 7) << 2));
|
179 |
*op++ = LZO_BYTE(m_off >> 3);
|
180 |
assert(op[-2] >= M2_MARKER);
|
181 |
#elif defined(LZO1Y)
|
182 |
m_off -= 1;
|
183 |
*op++ = LZO_BYTE(((m_len + 1) << 4) | ((m_off & 3) << 2));
|
184 |
*op++ = LZO_BYTE(m_off >> 2);
|
185 |
assert(op[-2] >= M2_MARKER);
|
186 |
#elif defined(LZO1Z)
|
187 |
if (m_off == c->last_m_off)
|
188 |
*op++ = LZO_BYTE(((m_len - 1) << 5) | (0x700 >> 6));
|
189 |
else
|
190 |
{
|
191 |
m_off -= 1;
|
192 |
*op++ = LZO_BYTE(((m_len - 1) << 5) | (m_off >> 6));
|
193 |
*op++ = LZO_BYTE(m_off << 2);
|
194 |
}
|
195 |
#endif
|
196 |
c->m2_m++;
|
197 |
}
|
198 |
else if (m_len == M2_MIN_LEN && m_off <= MX_MAX_OFFSET && c->r1_lit >= 4)
|
199 |
{
|
200 |
assert(m_len == 3);
|
201 |
assert(m_off > M2_MAX_OFFSET);
|
202 |
m_off -= 1 + M2_MAX_OFFSET;
|
203 |
#if defined(LZO1Z)
|
204 |
*op++ = LZO_BYTE(M1_MARKER | (m_off >> 6));
|
205 |
*op++ = LZO_BYTE(m_off << 2);
|
206 |
#else
|
207 |
*op++ = LZO_BYTE(M1_MARKER | ((m_off & 3) << 2));
|
208 |
*op++ = LZO_BYTE(m_off >> 2);
|
209 |
#endif
|
210 |
c->m1b_m++;
|
211 |
}
|
212 |
else if (m_off <= M3_MAX_OFFSET)
|
213 |
{
|
214 |
assert(m_len >= 3);
|
215 |
m_off -= 1;
|
216 |
if (m_len <= M3_MAX_LEN)
|
217 |
*op++ = LZO_BYTE(M3_MARKER | (m_len - 2));
|
218 |
else
|
219 |
{
|
220 |
m_len -= M3_MAX_LEN;
|
221 |
*op++ = M3_MARKER | 0;
|
222 |
while (m_len > 255)
|
223 |
{
|
224 |
m_len -= 255;
|
225 |
*op++ = 0;
|
226 |
}
|
227 |
assert(m_len > 0);
|
228 |
*op++ = LZO_BYTE(m_len);
|
229 |
}
|
230 |
#if defined(LZO1Z)
|
231 |
*op++ = LZO_BYTE(m_off >> 6);
|
232 |
*op++ = LZO_BYTE(m_off << 2);
|
233 |
#else
|
234 |
*op++ = LZO_BYTE(m_off << 2);
|
235 |
*op++ = LZO_BYTE(m_off >> 6);
|
236 |
#endif
|
237 |
c->m3_m++;
|
238 |
}
|
239 |
else
|
240 |
{
|
241 |
lzo_uint k;
|
242 |
|
243 |
assert(m_len >= 3);
|
244 |
assert(m_off > 0x4000); assert(m_off <= 0xbfff);
|
245 |
m_off -= 0x4000;
|
246 |
k = (m_off & 0x4000) >> 11;
|
247 |
if (m_len <= M4_MAX_LEN)
|
248 |
*op++ = LZO_BYTE(M4_MARKER | k | (m_len - 2));
|
249 |
else
|
250 |
{
|
251 |
m_len -= M4_MAX_LEN;
|
252 |
*op++ = LZO_BYTE(M4_MARKER | k | 0);
|
253 |
while (m_len > 255)
|
254 |
{
|
255 |
m_len -= 255;
|
256 |
*op++ = 0;
|
257 |
}
|
258 |
assert(m_len > 0);
|
259 |
*op++ = LZO_BYTE(m_len);
|
260 |
}
|
261 |
#if defined(LZO1Z)
|
262 |
*op++ = LZO_BYTE(m_off >> 6);
|
263 |
*op++ = LZO_BYTE(m_off << 2);
|
264 |
#else
|
265 |
*op++ = LZO_BYTE(m_off << 2);
|
266 |
*op++ = LZO_BYTE(m_off >> 6);
|
267 |
#endif
|
268 |
c->m4_m++;
|
269 |
}
|
270 |
|
271 |
c->last_m_len = x_len;
|
272 |
c->last_m_off = x_off;
|
273 |
return op;
|
274 |
}
|
275 |
|
276 |
|
277 |
static lzo_bytep
|
278 |
STORE_RUN ( LZO_COMPRESS_T *c, lzo_bytep op, const lzo_bytep ii, lzo_uint t )
|
279 |
{
|
280 |
c->lit_bytes += (unsigned long) t;
|
281 |
|
282 |
if (op == c->out && t <= 238)
|
283 |
{
|
284 |
*op++ = LZO_BYTE(17 + t);
|
285 |
}
|
286 |
else if (t <= 3)
|
287 |
{
|
288 |
#if defined(LZO1Z)
|
289 |
op[-1] |= LZO_BYTE(t);
|
290 |
#else
|
291 |
op[-2] |= LZO_BYTE(t);
|
292 |
#endif
|
293 |
c->lit1_r++;
|
294 |
}
|
295 |
else if (t <= 18)
|
296 |
{
|
297 |
*op++ = LZO_BYTE(t - 3);
|
298 |
c->lit2_r++;
|
299 |
}
|
300 |
else
|
301 |
{
|
302 |
lzo_uint tt = t - 18;
|
303 |
|
304 |
*op++ = 0;
|
305 |
while (tt > 255)
|
306 |
{
|
307 |
tt -= 255;
|
308 |
*op++ = 0;
|
309 |
}
|
310 |
assert(tt > 0);
|
311 |
*op++ = LZO_BYTE(tt);
|
312 |
c->lit3_r++;
|
313 |
}
|
314 |
do *op++ = *ii++; while (--t > 0);
|
315 |
|
316 |
return op;
|
317 |
}
|
318 |
|
319 |
|
320 |
static lzo_bytep
|
321 |
code_run ( LZO_COMPRESS_T *c, lzo_bytep op, const lzo_bytep ii,
|
322 |
lzo_uint lit, lzo_uint m_len )
|
323 |
{
|
324 |
if (lit > 0)
|
325 |
{
|
326 |
assert(m_len >= 2);
|
327 |
op = STORE_RUN(c,op,ii,lit);
|
328 |
c->r1_m_len = m_len;
|
329 |
c->r1_lit = lit;
|
330 |
}
|
331 |
else
|
332 |
{
|
333 |
assert(m_len >= 3);
|
334 |
c->r1_m_len = 0;
|
335 |
c->r1_lit = 0;
|
336 |
}
|
337 |
|
338 |
return op;
|
339 |
}
|
340 |
|
341 |
|
342 |
/***********************************************************************
|
343 |
//
|
344 |
************************************************************************/
|
345 |
|
346 |
static int
|
347 |
len_of_coded_match ( lzo_uint m_len, lzo_uint m_off, lzo_uint lit )
|
348 |
{
|
349 |
int n = 4;
|
350 |
|
351 |
if (m_len < 2)
|
352 |
return -1;
|
353 |
if (m_len == 2)
|
354 |
return (m_off <= M1_MAX_OFFSET && lit > 0 && lit < 4) ? 2 : -1;
|
355 |
if (m_len <= M2_MAX_LEN && m_off <= M2_MAX_OFFSET)
|
356 |
return 2;
|
357 |
if (m_len == M2_MIN_LEN && m_off <= MX_MAX_OFFSET && lit >= 4)
|
358 |
return 2;
|
359 |
if (m_off <= M3_MAX_OFFSET)
|
360 |
{
|
361 |
if (m_len <= M3_MAX_LEN)
|
362 |
return 3;
|
363 |
m_len -= M3_MAX_LEN;
|
364 |
while (m_len > 255)
|
365 |
{
|
366 |
m_len -= 255;
|
367 |
n++;
|
368 |
}
|
369 |
return n;
|
370 |
}
|
371 |
if (m_off <= M4_MAX_OFFSET)
|
372 |
{
|
373 |
if (m_len <= M4_MAX_LEN)
|
374 |
return 3;
|
375 |
m_len -= M4_MAX_LEN;
|
376 |
while (m_len > 255)
|
377 |
{
|
378 |
m_len -= 255;
|
379 |
n++;
|
380 |
}
|
381 |
return n;
|
382 |
}
|
383 |
return -1;
|
384 |
}
|
385 |
|
386 |
|
387 |
static lzo_int
|
388 |
min_gain(lzo_uint ahead, lzo_uint lit1, lzo_uint lit2, int l1, int l2, int l3)
|
389 |
{
|
390 |
lzo_int lazy_match_min_gain = 0;
|
391 |
|
392 |
assert (ahead >= 1);
|
393 |
lazy_match_min_gain += ahead;
|
394 |
|
395 |
#if 0
|
396 |
if (l3 > 0)
|
397 |
lit2 -= ahead;
|
398 |
#endif
|
399 |
|
400 |
if (lit1 <= 3)
|
401 |
lazy_match_min_gain += (lit2 <= 3) ? 0 : 2;
|
402 |
else if (lit1 <= 18)
|
403 |
lazy_match_min_gain += (lit2 <= 18) ? 0 : 1;
|
404 |
|
405 |
lazy_match_min_gain += (l2 - l1) * 2;
|
406 |
if (l3 > 0)
|
407 |
lazy_match_min_gain -= (ahead - l3) * 2;
|
408 |
|
409 |
if (lazy_match_min_gain < 0)
|
410 |
lazy_match_min_gain = 0;
|
411 |
|
412 |
#if 0
|
413 |
if (l1 == 2)
|
414 |
if (lazy_match_min_gain == 0)
|
415 |
lazy_match_min_gain = 1;
|
416 |
#endif
|
417 |
|
418 |
return lazy_match_min_gain;
|
419 |
}
|
420 |
|
421 |
|
422 |
/***********************************************************************
|
423 |
//
|
424 |
************************************************************************/
|
425 |
|
426 |
#if !defined(NDEBUG)
|
427 |
static
|
428 |
void assert_match( const lzo_swd_p swd, lzo_uint m_len, lzo_uint m_off )
|
429 |
{
|
430 |
const LZO_COMPRESS_T *c = swd->c;
|
431 |
lzo_uint d_off;
|
432 |
|
433 |
assert(m_len >= 2);
|
434 |
if (m_off <= (lzo_uint) (c->bp - c->in))
|
435 |
{
|
436 |
assert(c->bp - m_off + m_len < c->ip);
|
437 |
assert(lzo_memcmp(c->bp, c->bp - m_off, m_len) == 0);
|
438 |
}
|
439 |
else
|
440 |
{
|
441 |
assert(swd->dict != NULL);
|
442 |
d_off = m_off - (lzo_uint) (c->bp - c->in);
|
443 |
assert(d_off <= swd->dict_len);
|
444 |
if (m_len > d_off)
|
445 |
{
|
446 |
assert(lzo_memcmp(c->bp, swd->dict_end - d_off, d_off) == 0);
|
447 |
assert(c->in + m_len - d_off < c->ip);
|
448 |
assert(lzo_memcmp(c->bp + d_off, c->in, m_len - d_off) == 0);
|
449 |
}
|
450 |
else
|
451 |
{
|
452 |
assert(lzo_memcmp(c->bp, swd->dict_end - d_off, m_len) == 0);
|
453 |
}
|
454 |
}
|
455 |
}
|
456 |
#else
|
457 |
# define assert_match(a,b,c) ((void)0)
|
458 |
#endif
|
459 |
|
460 |
|
461 |
#if defined(SWD_BEST_OFF)
|
462 |
|
463 |
static void
|
464 |
better_match ( const lzo_swd_p swd, lzo_uint *m_len, lzo_uint *m_off )
|
465 |
{
|
466 |
#if defined(LZO1Z)
|
467 |
const LZO_COMPRESS_T *c = swd->c;
|
468 |
#endif
|
469 |
|
470 |
if (*m_len <= M2_MIN_LEN)
|
471 |
return;
|
472 |
#if defined(LZO1Z)
|
473 |
if (*m_off == c->last_m_off && *m_len <= M2_MAX_LEN)
|
474 |
return;
|
475 |
#if 1
|
476 |
if (*m_len >= M2_MIN_LEN + 1 && *m_len <= M2_MAX_LEN + 1 &&
|
477 |
c->last_m_off && swd->best_off[*m_len-1] == c->last_m_off)
|
478 |
{
|
479 |
*m_len = *m_len - 1;
|
480 |
*m_off = swd->best_off[*m_len];
|
481 |
return;
|
482 |
}
|
483 |
#endif
|
484 |
#endif
|
485 |
|
486 |
if (*m_off <= M2_MAX_OFFSET)
|
487 |
return;
|
488 |
|
489 |
#if 1
|
490 |
/* M3/M4 -> M2 */
|
491 |
if (*m_off > M2_MAX_OFFSET &&
|
492 |
*m_len >= M2_MIN_LEN + 1 && *m_len <= M2_MAX_LEN + 1 &&
|
493 |
swd->best_off[*m_len-1] && swd->best_off[*m_len-1] <= M2_MAX_OFFSET)
|
494 |
{
|
495 |
*m_len = *m_len - 1;
|
496 |
*m_off = swd->best_off[*m_len];
|
497 |
return;
|
498 |
}
|
499 |
#endif
|
500 |
|
501 |
#if 1
|
502 |
/* M4 -> M2 */
|
503 |
if (*m_off > M3_MAX_OFFSET &&
|
504 |
*m_len >= M4_MAX_LEN + 1 && *m_len <= M2_MAX_LEN + 2 &&
|
505 |
swd->best_off[*m_len-2] && swd->best_off[*m_len-2] <= M2_MAX_OFFSET)
|
506 |
{
|
507 |
*m_len = *m_len - 2;
|
508 |
*m_off = swd->best_off[*m_len];
|
509 |
return;
|
510 |
}
|
511 |
#endif
|
512 |
|
513 |
#if 1
|
514 |
/* M4 -> M3 */
|
515 |
if (*m_off > M3_MAX_OFFSET &&
|
516 |
*m_len >= M4_MAX_LEN + 1 && *m_len <= M3_MAX_LEN + 1 &&
|
517 |
swd->best_off[*m_len-1] && swd->best_off[*m_len-1] <= M3_MAX_OFFSET)
|
518 |
{
|
519 |
*m_len = *m_len - 1;
|
520 |
*m_off = swd->best_off[*m_len];
|
521 |
}
|
522 |
#endif
|
523 |
}
|
524 |
|
525 |
#endif
|
526 |
|
527 |
|
528 |
/***********************************************************************
|
529 |
//
|
530 |
************************************************************************/
|
531 |
|
532 |
LZO_PUBLIC(int)
|
533 |
lzo1x_999_compress_internal ( const lzo_bytep in , lzo_uint in_len,
|
534 |
lzo_bytep out, lzo_uintp out_len,
|
535 |
lzo_voidp wrkmem,
|
536 |
const lzo_bytep dict, lzo_uint dict_len,
|
537 |
lzo_callback_p cb,
|
538 |
int try_lazy,
|
539 |
lzo_uint good_length,
|
540 |
lzo_uint max_lazy,
|
541 |
lzo_uint nice_length,
|
542 |
lzo_uint max_chain,
|
543 |
lzo_uint32 flags )
|
544 |
{
|
545 |
lzo_bytep op;
|
546 |
const lzo_bytep ii;
|
547 |
lzo_uint lit;
|
548 |
lzo_uint m_len, m_off;
|
549 |
LZO_COMPRESS_T cc;
|
550 |
LZO_COMPRESS_T * const c = &cc;
|
551 |
lzo_swd_p const swd = (lzo_swd_p) wrkmem;
|
552 |
int r;
|
553 |
|
554 |
/* sanity check */
|
555 |
#if defined(LZO1X)
|
556 |
LZO_COMPILE_TIME_ASSERT(LZO1X_999_MEM_COMPRESS >= SIZEOF_LZO_SWD_T)
|
557 |
#elif defined(LZO1Y)
|
558 |
LZO_COMPILE_TIME_ASSERT(LZO1Y_999_MEM_COMPRESS >= SIZEOF_LZO_SWD_T)
|
559 |
#elif defined(LZO1Z)
|
560 |
LZO_COMPILE_TIME_ASSERT(LZO1Z_999_MEM_COMPRESS >= SIZEOF_LZO_SWD_T)
|
561 |
#else
|
562 |
# error
|
563 |
#endif
|
564 |
|
565 |
/* setup parameter defaults */
|
566 |
/* number of lazy match tries */
|
567 |
if (try_lazy < 0)
|
568 |
try_lazy = 1;
|
569 |
/* reduce lazy match search if we already have a match with this length */
|
570 |
if (good_length <= 0)
|
571 |
good_length = 32;
|
572 |
/* do not try a lazy match if we already have a match with this length */
|
573 |
if (max_lazy <= 0)
|
574 |
max_lazy = 32;
|
575 |
/* stop searching for longer matches than this one */
|
576 |
if (nice_length <= 0)
|
577 |
nice_length = 0;
|
578 |
/* don't search more positions than this */
|
579 |
if (max_chain <= 0)
|
580 |
max_chain = SWD_MAX_CHAIN;
|
581 |
|
582 |
c->init = 0;
|
583 |
c->ip = c->in = in;
|
584 |
c->in_end = in + in_len;
|
585 |
c->out = out;
|
586 |
c->cb = cb;
|
587 |
c->m1a_m = c->m1b_m = c->m2_m = c->m3_m = c->m4_m = 0;
|
588 |
c->lit1_r = c->lit2_r = c->lit3_r = 0;
|
589 |
|
590 |
op = out;
|
591 |
ii = c->ip; /* point to start of literal run */
|
592 |
lit = 0;
|
593 |
c->r1_lit = c->r1_m_len = 0;
|
594 |
|
595 |
r = init_match(c,swd,dict,dict_len,flags);
|
596 |
if (r != 0)
|
597 |
return r;
|
598 |
if (max_chain > 0)
|
599 |
swd->max_chain = max_chain;
|
600 |
if (nice_length > 0)
|
601 |
swd->nice_length = nice_length;
|
602 |
|
603 |
r = find_match(c,swd,0,0);
|
604 |
if (r != 0)
|
605 |
return r;
|
606 |
while (c->look > 0)
|
607 |
{
|
608 |
lzo_uint ahead;
|
609 |
lzo_uint max_ahead;
|
610 |
int l1, l2, l3;
|
611 |
|
612 |
c->codesize = pd(op, out);
|
613 |
|
614 |
m_len = c->m_len;
|
615 |
m_off = c->m_off;
|
616 |
|
617 |
assert(c->bp == c->ip - c->look);
|
618 |
assert(c->bp >= in);
|
619 |
if (lit == 0)
|
620 |
ii = c->bp;
|
621 |
assert(ii + lit == c->bp);
|
622 |
assert(swd->b_char == *(c->bp));
|
623 |
|
624 |
if ( m_len < 2 ||
|
625 |
(m_len == 2 && (m_off > M1_MAX_OFFSET || lit == 0 || lit >= 4)) ||
|
626 |
#if 1
|
627 |
/* Do not accept this match for compressed-data compatibility
|
628 |
* with LZO v1.01 and before
|
629 |
* [ might be a problem for decompress() and optimize() ]
|
630 |
*/
|
631 |
(m_len == 2 && op == out) ||
|
632 |
#endif
|
633 |
(op == out && lit == 0))
|
634 |
{
|
635 |
/* a literal */
|
636 |
m_len = 0;
|
637 |
}
|
638 |
else if (m_len == M2_MIN_LEN)
|
639 |
{
|
640 |
/* compression ratio improves if we code a literal in some cases */
|
641 |
if (m_off > MX_MAX_OFFSET && lit >= 4)
|
642 |
m_len = 0;
|
643 |
}
|
644 |
|
645 |
if (m_len == 0)
|
646 |
{
|
647 |
/* a literal */
|
648 |
lit++;
|
649 |
swd->max_chain = max_chain;
|
650 |
r = find_match(c,swd,1,0);
|
651 |
assert(r == 0);
|
652 |
continue;
|
653 |
}
|
654 |
|
655 |
/* a match */
|
656 |
#if defined(SWD_BEST_OFF)
|
657 |
if (swd->use_best_off)
|
658 |
better_match(swd,&m_len,&m_off);
|
659 |
#endif
|
660 |
assert_match(swd,m_len,m_off);
|
661 |
|
662 |
|
663 |
|
664 |
/* shall we try a lazy match ? */
|
665 |
ahead = 0;
|
666 |
if (try_lazy <= 0 || m_len >= max_lazy)
|
667 |
{
|
668 |
/* no */
|
669 |
l1 = 0;
|
670 |
max_ahead = 0;
|
671 |
}
|
672 |
else
|
673 |
{
|
674 |
/* yes, try a lazy match */
|
675 |
l1 = len_of_coded_match(m_len,m_off,lit);
|
676 |
assert(l1 > 0);
|
677 |
#if 1
|
678 |
max_ahead = LZO_MIN((lzo_uint)try_lazy, (lzo_uint)l1 - 1);
|
679 |
#else
|
680 |
max_ahead = LZO_MIN3(try_lazy, l1, m_len - 1);
|
681 |
#endif
|
682 |
}
|
683 |
|
684 |
|
685 |
while (ahead < max_ahead && c->look > m_len)
|
686 |
{
|
687 |
lzo_int lazy_match_min_gain;
|
688 |
|
689 |
if (m_len >= good_length)
|
690 |
swd->max_chain = max_chain >> 2;
|
691 |
else
|
692 |
swd->max_chain = max_chain;
|
693 |
r = find_match(c,swd,1,0);
|
694 |
ahead++;
|
695 |
|
696 |
assert(r == 0);
|
697 |
assert(c->look > 0);
|
698 |
assert(ii + lit + ahead == c->bp);
|
699 |
|
700 |
#if defined(LZO1Z)
|
701 |
if (m_off == c->last_m_off && c->m_off != c->last_m_off)
|
702 |
if (m_len >= M2_MIN_LEN && m_len <= M2_MAX_LEN)
|
703 |
c->m_len = 0;
|
704 |
#endif
|
705 |
if (c->m_len < m_len)
|
706 |
continue;
|
707 |
#if 1
|
708 |
if (c->m_len == m_len && c->m_off >= m_off)
|
709 |
continue;
|
710 |
#endif
|
711 |
#if defined(SWD_BEST_OFF)
|
712 |
if (swd->use_best_off)
|
713 |
better_match(swd,&c->m_len,&c->m_off);
|
714 |
#endif
|
715 |
l2 = len_of_coded_match(c->m_len,c->m_off,lit+ahead);
|
716 |
if (l2 < 0)
|
717 |
continue;
|
718 |
#if 0
|
719 |
if (c->m_len == m_len && l2 >= l1)
|
720 |
continue;
|
721 |
#endif
|
722 |
|
723 |
|
724 |
#if 1
|
725 |
/* compressed-data compatibility [see above] */
|
726 |
l3 = (op == out) ? -1 : len_of_coded_match(ahead,m_off,lit);
|
727 |
#else
|
728 |
l3 = len_of_coded_match(ahead,m_off,lit);
|
729 |
#endif
|
730 |
|
731 |
lazy_match_min_gain = min_gain(ahead,lit,lit+ahead,l1,l2,l3);
|
732 |
if (c->m_len >= m_len + lazy_match_min_gain)
|
733 |
{
|
734 |
c->lazy++;
|
735 |
assert_match(swd,c->m_len,c->m_off);
|
736 |
|
737 |
if (l3 > 0)
|
738 |
{
|
739 |
/* code previous run */
|
740 |
op = code_run(c,op,ii,lit,ahead);
|
741 |
lit = 0;
|
742 |
/* code shortened match */
|
743 |
op = code_match(c,op,ahead,m_off);
|
744 |
}
|
745 |
else
|
746 |
{
|
747 |
lit += ahead;
|
748 |
assert(ii + lit == c->bp);
|
749 |
}
|
750 |
goto lazy_match_done;
|
751 |
}
|
752 |
}
|
753 |
|
754 |
|
755 |
assert(ii + lit + ahead == c->bp);
|
756 |
|
757 |
/* 1 - code run */
|
758 |
op = code_run(c,op,ii,lit,m_len);
|
759 |
lit = 0;
|
760 |
|
761 |
/* 2 - code match */
|
762 |
op = code_match(c,op,m_len,m_off);
|
763 |
swd->max_chain = max_chain;
|
764 |
r = find_match(c,swd,m_len,1+ahead);
|
765 |
assert(r == 0);
|
766 |
|
767 |
lazy_match_done: ;
|
768 |
}
|
769 |
|
770 |
|
771 |
/* store final run */
|
772 |
if (lit > 0)
|
773 |
op = STORE_RUN(c,op,ii,lit);
|
774 |
|
775 |
#if defined(LZO_EOF_CODE)
|
776 |
*op++ = M4_MARKER | 1;
|
777 |
*op++ = 0;
|
778 |
*op++ = 0;
|
779 |
#endif
|
780 |
|
781 |
c->codesize = pd(op, out);
|
782 |
assert(c->textsize == in_len);
|
783 |
|
784 |
*out_len = pd(op, out);
|
785 |
|
786 |
if (c->cb && c->cb->nprogress)
|
787 |
(*c->cb->nprogress)(c->cb, c->textsize, c->codesize, 0);
|
788 |
|
789 |
#if 0
|
790 |
printf("%ld %ld -> %ld %ld: %ld %ld %ld %ld %ld %ld: %ld %ld %ld %ld\n",
|
791 |
(long) c->textsize, (long) in_len, (long) c->codesize,
|
792 |
c->match_bytes, c->m1a_m, c->m1b_m, c->m2_m, c->m3_m, c->m4_m,
|
793 |
c->lit_bytes, c->lit1_r, c->lit2_r, c->lit3_r, c->lazy);
|
794 |
#endif
|
795 |
assert(c->lit_bytes + c->match_bytes == in_len);
|
796 |
|
797 |
return LZO_E_OK;
|
798 |
}
|
799 |
|
800 |
|
801 |
/***********************************************************************
|
802 |
//
|
803 |
************************************************************************/
|
804 |
|
805 |
LZO_PUBLIC(int)
|
806 |
lzo1x_999_compress_level ( const lzo_bytep in , lzo_uint in_len,
|
807 |
lzo_bytep out, lzo_uintp out_len,
|
808 |
lzo_voidp wrkmem,
|
809 |
const lzo_bytep dict, lzo_uint dict_len,
|
810 |
lzo_callback_p cb,
|
811 |
int compression_level )
|
812 |
{
|
813 |
static const struct
|
814 |
{
|
815 |
int try_lazy;
|
816 |
lzo_uint good_length;
|
817 |
lzo_uint max_lazy;
|
818 |
lzo_uint nice_length;
|
819 |
lzo_uint max_chain;
|
820 |
lzo_uint32 flags;
|
821 |
} c[9] = {
|
822 |
{ 0, 0, 0, 8, 4, 0 }, /* faster compression */
|
823 |
{ 0, 0, 0, 16, 8, 0 },
|
824 |
{ 0, 0, 0, 32, 16, 0 },
|
825 |
|
826 |
{ 1, 4, 4, 16, 16, 0 },
|
827 |
{ 1, 8, 16, 32, 32, 0 },
|
828 |
{ 1, 8, 16, 128, 128, 0 },
|
829 |
|
830 |
{ 2, 8, 32, 128, 256, 0 },
|
831 |
{ 2, 32, 128, F, 2048, 1 },
|
832 |
{ 2, F, F, F, 4096, 1 } /* max. compression */
|
833 |
};
|
834 |
|
835 |
if (compression_level < 1 || compression_level > 9)
|
836 |
return LZO_E_ERROR;
|
837 |
|
838 |
compression_level -= 1;
|
839 |
return lzo1x_999_compress_internal(in, in_len, out, out_len, wrkmem,
|
840 |
dict, dict_len, cb,
|
841 |
c[compression_level].try_lazy,
|
842 |
c[compression_level].good_length,
|
843 |
c[compression_level].max_lazy,
|
844 |
#if 0
|
845 |
c[compression_level].nice_length,
|
846 |
#else
|
847 |
0,
|
848 |
#endif
|
849 |
c[compression_level].max_chain,
|
850 |
c[compression_level].flags);
|
851 |
}
|
852 |
|
853 |
|
854 |
/***********************************************************************
|
855 |
//
|
856 |
************************************************************************/
|
857 |
|
858 |
LZO_PUBLIC(int)
|
859 |
lzo1x_999_compress_dict ( const lzo_bytep in , lzo_uint in_len,
|
860 |
lzo_bytep out, lzo_uintp out_len,
|
861 |
lzo_voidp wrkmem,
|
862 |
const lzo_bytep dict, lzo_uint dict_len )
|
863 |
{
|
864 |
return lzo1x_999_compress_level(in, in_len, out, out_len, wrkmem,
|
865 |
dict, dict_len, 0, 8);
|
866 |
}
|
867 |
|
868 |
LZO_PUBLIC(int)
|
869 |
lzo1x_999_compress ( const lzo_bytep in , lzo_uint in_len,
|
870 |
lzo_bytep out, lzo_uintp out_len,
|
871 |
lzo_voidp wrkmem )
|
872 |
{
|
873 |
return lzo1x_999_compress_level(in, in_len, out, out_len, wrkmem,
|
874 |
NULL, 0, (lzo_callback_p) 0, 8);
|
875 |
}
|
876 |
|
877 |
|
878 |
/*
|
879 |
vi:ts=4:et
|
880 |
*/
|
881 |
|