1 |
/* lzo1x_oo.ch -- LZO1X compressed data optimizer
|
2 |
|
3 |
This file is part of the LZO real-time data compression library.
|
4 |
|
5 |
Copyright (C) 2008 Markus Franz Xaver Johannes Oberhumer
|
6 |
Copyright (C) 2007 Markus Franz Xaver Johannes Oberhumer
|
7 |
Copyright (C) 2006 Markus Franz Xaver Johannes Oberhumer
|
8 |
Copyright (C) 2005 Markus Franz Xaver Johannes Oberhumer
|
9 |
Copyright (C) 2004 Markus Franz Xaver Johannes Oberhumer
|
10 |
Copyright (C) 2003 Markus Franz Xaver Johannes Oberhumer
|
11 |
Copyright (C) 2002 Markus Franz Xaver Johannes Oberhumer
|
12 |
Copyright (C) 2001 Markus Franz Xaver Johannes Oberhumer
|
13 |
Copyright (C) 2000 Markus Franz Xaver Johannes Oberhumer
|
14 |
Copyright (C) 1999 Markus Franz Xaver Johannes Oberhumer
|
15 |
Copyright (C) 1998 Markus Franz Xaver Johannes Oberhumer
|
16 |
Copyright (C) 1997 Markus Franz Xaver Johannes Oberhumer
|
17 |
Copyright (C) 1996 Markus Franz Xaver Johannes Oberhumer
|
18 |
All Rights Reserved.
|
19 |
|
20 |
The LZO library is free software; you can redistribute it and/or
|
21 |
modify it under the terms of the GNU General Public License as
|
22 |
published by the Free Software Foundation; either version 2 of
|
23 |
the License, or (at your option) any later version.
|
24 |
|
25 |
The LZO library is distributed in the hope that it will be useful,
|
26 |
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
27 |
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
28 |
GNU General Public License for more details.
|
29 |
|
30 |
You should have received a copy of the GNU General Public License
|
31 |
along with the LZO library; see the file COPYING.
|
32 |
If not, write to the Free Software Foundation, Inc.,
|
33 |
51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
|
34 |
|
35 |
Markus F.X.J. Oberhumer
|
36 |
<markus@oberhumer.com>
|
37 |
http://www.oberhumer.com/opensource/lzo/
|
38 |
*/
|
39 |
|
40 |
|
41 |
#define TEST_IP (ip < ip_end)
|
42 |
#define TEST_OP (op <= op_end)
|
43 |
|
44 |
#define NO_LIT LZO_UINT_MAX
|
45 |
|
46 |
|
47 |
/***********************************************************************
|
48 |
//
|
49 |
************************************************************************/
|
50 |
|
51 |
static void copy2(lzo_bytep ip, const lzo_bytep m_pos, lzo_uint off)
|
52 |
{
|
53 |
assert(off > 0);
|
54 |
ip[0] = m_pos[0];
|
55 |
if (off == 1)
|
56 |
ip[1] = m_pos[0];
|
57 |
else
|
58 |
ip[1] = m_pos[1];
|
59 |
}
|
60 |
|
61 |
|
62 |
static void copy3(lzo_bytep ip, const lzo_bytep m_pos, lzo_uint off)
|
63 |
{
|
64 |
assert(off > 0);
|
65 |
ip[0] = m_pos[0];
|
66 |
if (off == 1)
|
67 |
{
|
68 |
ip[2] = ip[1] = m_pos[0];
|
69 |
}
|
70 |
else if (off == 2)
|
71 |
{
|
72 |
ip[1] = m_pos[1];
|
73 |
ip[2] = m_pos[0];
|
74 |
}
|
75 |
else
|
76 |
{
|
77 |
ip[1] = m_pos[1];
|
78 |
ip[2] = m_pos[2];
|
79 |
}
|
80 |
}
|
81 |
|
82 |
|
83 |
/***********************************************************************
|
84 |
// optimize a block of data.
|
85 |
************************************************************************/
|
86 |
|
87 |
LZO_PUBLIC(int)
|
88 |
DO_OPTIMIZE ( lzo_bytep in , lzo_uint in_len,
|
89 |
lzo_bytep out, lzo_uintp out_len,
|
90 |
lzo_voidp wrkmem )
|
91 |
{
|
92 |
lzo_bytep op;
|
93 |
lzo_bytep ip;
|
94 |
lzo_uint t;
|
95 |
lzo_bytep m_pos;
|
96 |
lzo_bytep const ip_end = in + in_len;
|
97 |
lzo_bytep const op_end = out + *out_len;
|
98 |
lzo_bytep litp = NULL;
|
99 |
lzo_uint lit = 0;
|
100 |
lzo_uint next_lit = NO_LIT;
|
101 |
lzo_uint nl;
|
102 |
unsigned long o_m1_a = 0, o_m1_b = 0, o_m2 = 0, o_m3_a = 0, o_m3_b = 0;
|
103 |
|
104 |
LZO_UNUSED(wrkmem);
|
105 |
|
106 |
*out_len = 0;
|
107 |
|
108 |
op = out;
|
109 |
ip = in;
|
110 |
|
111 |
assert(in_len >= 3);
|
112 |
if (*ip > 17)
|
113 |
{
|
114 |
t = *ip++ - 17;
|
115 |
if (t < 4)
|
116 |
goto match_next;
|
117 |
goto first_literal_run;
|
118 |
}
|
119 |
assert(*ip < 16 || (*ip == 17 && in_len == 3));
|
120 |
|
121 |
while (TEST_IP && TEST_OP)
|
122 |
{
|
123 |
t = *ip++;
|
124 |
if (t >= 16)
|
125 |
goto match;
|
126 |
/* a literal run */
|
127 |
litp = ip - 1;
|
128 |
if (t == 0)
|
129 |
{
|
130 |
t = 15;
|
131 |
while (*ip == 0)
|
132 |
t += 255, ip++;
|
133 |
t += *ip++;
|
134 |
}
|
135 |
lit = t + 3;
|
136 |
/* copy literals */
|
137 |
copy_literal_run:
|
138 |
*op++ = *ip++; *op++ = *ip++; *op++ = *ip++;
|
139 |
first_literal_run:
|
140 |
do *op++ = *ip++; while (--t > 0);
|
141 |
|
142 |
|
143 |
t = *ip++;
|
144 |
|
145 |
if (t >= 16)
|
146 |
goto match;
|
147 |
#if defined(LZO1X)
|
148 |
m_pos = op - 1 - 0x800;
|
149 |
#elif defined(LZO1Y)
|
150 |
m_pos = op - 1 - 0x400;
|
151 |
#endif
|
152 |
m_pos -= t >> 2;
|
153 |
m_pos -= *ip++ << 2;
|
154 |
*op++ = *m_pos++; *op++ = *m_pos++; *op++ = *m_pos++;
|
155 |
lit = 0;
|
156 |
goto match_done;
|
157 |
|
158 |
|
159 |
/* handle matches */
|
160 |
do {
|
161 |
if (t < 16) /* a M1 match */
|
162 |
{
|
163 |
m_pos = op - 1;
|
164 |
m_pos -= t >> 2;
|
165 |
m_pos -= *ip++ << 2;
|
166 |
|
167 |
if (litp == NULL)
|
168 |
goto copy_m1;
|
169 |
|
170 |
/* assert that there was a match just before */
|
171 |
assert(lit >= 1 && lit <= 3);
|
172 |
assert(litp == ip - 2 - lit - 2);
|
173 |
assert((lzo_uint)(*litp & 3) == lit);
|
174 |
nl = ip[-2] & 3;
|
175 |
/* test if a match follows */
|
176 |
if (nl == 0 && lit == 1 && ip[0] >= 16)
|
177 |
{
|
178 |
next_lit = nl;
|
179 |
/* adjust length of previous short run */
|
180 |
lit += 2;
|
181 |
*litp = LZO_BYTE((*litp & ~3) | lit);
|
182 |
/* copy over the 2 literals that replace the match */
|
183 |
copy2(ip-2,m_pos,pd(op,m_pos));
|
184 |
o_m1_a++;
|
185 |
}
|
186 |
/* test if a literal run follows */
|
187 |
else if (nl == 0 && ip[0] < 16 && ip[0] != 0 &&
|
188 |
(lit + 2 + ip[0] < 16))
|
189 |
{
|
190 |
t = *ip++;
|
191 |
/* remove short run */
|
192 |
*litp &= ~3;
|
193 |
/* copy over the 2 literals that replace the match */
|
194 |
copy2(ip-3+1,m_pos,pd(op,m_pos));
|
195 |
/* move literals 1 byte ahead */
|
196 |
litp += 2;
|
197 |
if (lit > 0)
|
198 |
lzo_memmove(litp+1,litp,lit);
|
199 |
/* insert new length of long literal run */
|
200 |
lit += 2 + t + 3; assert(lit <= 18);
|
201 |
*litp = LZO_BYTE(lit - 3);
|
202 |
|
203 |
o_m1_b++;
|
204 |
*op++ = *m_pos++; *op++ = *m_pos++;
|
205 |
goto copy_literal_run;
|
206 |
}
|
207 |
copy_m1:
|
208 |
*op++ = *m_pos++; *op++ = *m_pos++;
|
209 |
}
|
210 |
else
|
211 |
{
|
212 |
match:
|
213 |
if (t >= 64) /* a M2 match */
|
214 |
{
|
215 |
m_pos = op - 1;
|
216 |
#if defined(LZO1X)
|
217 |
m_pos -= (t >> 2) & 7;
|
218 |
m_pos -= *ip++ << 3;
|
219 |
t = (t >> 5) - 1;
|
220 |
#elif defined(LZO1Y)
|
221 |
m_pos -= (t >> 2) & 3;
|
222 |
m_pos -= *ip++ << 2;
|
223 |
t = (t >> 4) - 3;
|
224 |
#endif
|
225 |
if (litp == NULL)
|
226 |
goto copy_m;
|
227 |
|
228 |
nl = ip[-2] & 3;
|
229 |
/* test if in beetween two long literal runs */
|
230 |
if (t == 1 && lit > 3 && nl == 0 &&
|
231 |
ip[0] < 16 && ip[0] != 0 && (lit + 3 + ip[0] < 16))
|
232 |
{
|
233 |
assert(*litp == lit - 3);
|
234 |
t = *ip++;
|
235 |
/* copy over the 3 literals that replace the match */
|
236 |
copy3(ip-1-2,m_pos,pd(op,m_pos));
|
237 |
/* set new length of previous literal run */
|
238 |
lit += 3 + t + 3; assert(lit <= 18);
|
239 |
*litp = LZO_BYTE(lit - 3);
|
240 |
o_m2++;
|
241 |
*op++ = *m_pos++; *op++ = *m_pos++; *op++ = *m_pos++;
|
242 |
goto copy_literal_run;
|
243 |
}
|
244 |
}
|
245 |
else
|
246 |
{
|
247 |
if (t >= 32) /* a M3 match */
|
248 |
{
|
249 |
t &= 31;
|
250 |
if (t == 0)
|
251 |
{
|
252 |
t = 31;
|
253 |
while (*ip == 0)
|
254 |
t += 255, ip++;
|
255 |
t += *ip++;
|
256 |
}
|
257 |
m_pos = op - 1;
|
258 |
m_pos -= *ip++ >> 2;
|
259 |
m_pos -= *ip++ << 6;
|
260 |
}
|
261 |
else /* a M4 match */
|
262 |
{
|
263 |
m_pos = op;
|
264 |
m_pos -= (t & 8) << 11;
|
265 |
t &= 7;
|
266 |
if (t == 0)
|
267 |
{
|
268 |
t = 7;
|
269 |
while (*ip == 0)
|
270 |
t += 255, ip++;
|
271 |
t += *ip++;
|
272 |
}
|
273 |
m_pos -= *ip++ >> 2;
|
274 |
m_pos -= *ip++ << 6;
|
275 |
if (m_pos == op)
|
276 |
goto eof_found;
|
277 |
m_pos -= 0x4000;
|
278 |
}
|
279 |
if (litp == NULL)
|
280 |
goto copy_m;
|
281 |
|
282 |
nl = ip[-2] & 3;
|
283 |
/* test if in beetween two matches */
|
284 |
if (t == 1 && lit == 0 && nl == 0 && ip[0] >= 16)
|
285 |
{
|
286 |
assert(litp == ip - 3 - lit - 2);
|
287 |
assert((lzo_uint)(*litp & 3) == lit);
|
288 |
next_lit = nl;
|
289 |
/* make a previous short run */
|
290 |
lit += 3;
|
291 |
*litp = LZO_BYTE((*litp & ~3) | lit);
|
292 |
/* copy over the 3 literals that replace the match */
|
293 |
copy3(ip-3,m_pos,pd(op,m_pos));
|
294 |
o_m3_a++;
|
295 |
}
|
296 |
/* test if a literal run follows */
|
297 |
else if (t == 1 && lit <= 3 && nl == 0 &&
|
298 |
ip[0] < 16 && ip[0] != 0 && (lit + 3 + ip[0] < 16))
|
299 |
{
|
300 |
assert(litp == ip - 3 - lit - 2);
|
301 |
assert((lzo_uint)(*litp & 3) == lit);
|
302 |
t = *ip++;
|
303 |
/* remove short run */
|
304 |
*litp &= ~3;
|
305 |
/* copy over the 3 literals that replace the match */
|
306 |
copy3(ip-4+1,m_pos,pd(op,m_pos));
|
307 |
/* move literals 1 byte ahead */
|
308 |
litp += 2;
|
309 |
if (lit > 0)
|
310 |
lzo_memmove(litp+1,litp,lit);
|
311 |
/* insert new length of long literal run */
|
312 |
lit += 3 + t + 3; assert(lit <= 18);
|
313 |
*litp = LZO_BYTE(lit - 3);
|
314 |
|
315 |
o_m3_b++;
|
316 |
*op++ = *m_pos++; *op++ = *m_pos++; *op++ = *m_pos++;
|
317 |
goto copy_literal_run;
|
318 |
}
|
319 |
}
|
320 |
copy_m:
|
321 |
*op++ = *m_pos++; *op++ = *m_pos++;
|
322 |
do *op++ = *m_pos++; while (--t > 0);
|
323 |
}
|
324 |
|
325 |
match_done:
|
326 |
if (next_lit == NO_LIT)
|
327 |
{
|
328 |
t = ip[-2] & 3;
|
329 |
lit = t;
|
330 |
litp = ip - 2;
|
331 |
}
|
332 |
else
|
333 |
t = next_lit;
|
334 |
assert(t <= 3);
|
335 |
next_lit = NO_LIT;
|
336 |
if (t == 0)
|
337 |
break;
|
338 |
/* copy literals */
|
339 |
match_next:
|
340 |
do *op++ = *ip++; while (--t > 0);
|
341 |
t = *ip++;
|
342 |
} while (TEST_IP && TEST_OP);
|
343 |
}
|
344 |
|
345 |
/* no EOF code was found */
|
346 |
*out_len = pd(op, out);
|
347 |
return LZO_E_EOF_NOT_FOUND;
|
348 |
|
349 |
eof_found:
|
350 |
assert(t == 1);
|
351 |
#if 0
|
352 |
printf("optimize: %5lu %5lu %5lu %5lu %5lu\n",
|
353 |
o_m1_a, o_m1_b, o_m2, o_m3_a, o_m3_b);
|
354 |
#endif
|
355 |
LZO_UNUSED(o_m1_a); LZO_UNUSED(o_m1_b); LZO_UNUSED(o_m2);
|
356 |
LZO_UNUSED(o_m3_a); LZO_UNUSED(o_m3_b);
|
357 |
*out_len = pd(op, out);
|
358 |
return (ip == ip_end ? LZO_E_OK :
|
359 |
(ip < ip_end ? LZO_E_INPUT_NOT_CONSUMED : LZO_E_INPUT_OVERRUN));
|
360 |
}
|
361 |
|
362 |
|
363 |
/*
|
364 |
vi:ts=4:et
|
365 |
*/
|
366 |
|