/* lzo_swd.ch -- sliding window dictionary This file is part of the LZO real-time data compression library. Copyright (C) 1996-2002 Markus Franz Xaver Johannes Oberhumer All Rights Reserved. The LZO library is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. The LZO library is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with the LZO library; see the file COPYING. If not, write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. Markus F.X.J. Oberhumer */ #if (LZO_UINT_MAX < LZO_0xffffffffL) # error "LZO_UINT_MAX" #endif /*********************************************************************** // ************************************************************************/ #ifndef SWD_N # define SWD_N N #endif #ifndef SWD_F # define SWD_F F #endif #ifndef SWD_THRESHOLD # define SWD_THRESHOLD THRESHOLD #endif /* unsigned type for dictionary access - don't waste memory here */ #if (SWD_N + SWD_F + SWD_F < USHRT_MAX) typedef unsigned short swd_uint; # define SWD_UINT_MAX USHRT_MAX #else typedef lzo_uint swd_uint; # define SWD_UINT_MAX LZO_UINT_MAX #endif #define SWD_UINT(x) ((swd_uint)(x)) #ifndef SWD_HSIZE # define SWD_HSIZE 16384 #endif #ifndef SWD_MAX_CHAIN # define SWD_MAX_CHAIN 2048 #endif #if !defined(HEAD3) #if 1 # define HEAD3(b,p) \ (((0x9f5f*(((((lzo_uint32)b[p]<<5)^b[p+1])<<5)^b[p+2]))>>5) & (SWD_HSIZE-1)) #else # define HEAD3(b,p) \ (((0x9f5f*(((((lzo_uint32)b[p+2]<<5)^b[p+1])<<5)^b[p]))>>5) & (SWD_HSIZE-1)) #endif #endif #if (SWD_THRESHOLD == 1) && !defined(HEAD2) # if 1 && defined(LZO_UNALIGNED_OK_2) # define HEAD2(b,p) (* (lzo_ushortp) &(b[p])) # else # define HEAD2(b,p) (b[p] ^ ((unsigned)b[p+1]<<8)) # endif # define NIL2 SWD_UINT_MAX #endif typedef struct { /* public - "built-in" */ lzo_uint n; lzo_uint f; lzo_uint threshold; /* public - configuration */ lzo_uint max_chain; lzo_uint nice_length; lzo_bool use_best_off; lzo_uint lazy_insert; /* public - output */ lzo_uint m_len; lzo_uint m_off; lzo_uint look; int b_char; #if defined(SWD_BEST_OFF) lzo_uint best_off[ SWD_BEST_OFF ]; #endif /* semi public */ LZO_COMPRESS_T *c; lzo_uint m_pos; #if defined(SWD_BEST_OFF) lzo_uint best_pos[ SWD_BEST_OFF ]; #endif /* private */ const lzo_byte *dict; const lzo_byte *dict_end; lzo_uint dict_len; /* private */ lzo_uint ip; /* input pointer (lookahead) */ lzo_uint bp; /* buffer pointer */ lzo_uint rp; /* remove pointer */ lzo_uint b_size; unsigned char *b_wrap; lzo_uint node_count; lzo_uint first_rp; #if defined(__LZO_CHECKER) /* malloc arrays of the exact size to detect any overrun */ unsigned char *b; swd_uint *head3; swd_uint *succ3; swd_uint *best3; swd_uint *llen3; #ifdef HEAD2 swd_uint *head2; #endif #else unsigned char b [ SWD_N + SWD_F + SWD_F ]; swd_uint head3 [ SWD_HSIZE ]; swd_uint succ3 [ SWD_N + SWD_F ]; swd_uint best3 [ SWD_N + SWD_F ]; swd_uint llen3 [ SWD_HSIZE ]; #ifdef HEAD2 swd_uint head2 [ 65536L ]; #endif #endif } lzo_swd_t; /* Access macro for head3. * head3[key] may be uninitialized, but then its value will never be used. */ #if defined(__LZO_CHECKER) # define s_head3(s,key) \ ((s->llen3[key] == 0) ? SWD_UINT_MAX : s->head3[key]) #else # define s_head3(s,key) s->head3[key] #endif /*********************************************************************** // ************************************************************************/ static void swd_initdict(lzo_swd_t *s, const lzo_byte *dict, lzo_uint dict_len) { s->dict = s->dict_end = NULL; s->dict_len = 0; if (!dict || dict_len <= 0) return; if (dict_len > s->n) { dict += dict_len - s->n; dict_len = s->n; } s->dict = dict; s->dict_len = dict_len; s->dict_end = dict + dict_len; memcpy(s->b,dict,dict_len); s->ip = dict_len; } static void swd_insertdict(lzo_swd_t *s, lzo_uint node, lzo_uint len) { lzo_uint key; s->node_count = s->n - len; s->first_rp = node; while (len-- > 0) { key = HEAD3(s->b,node); s->succ3[node] = s_head3(s,key); s->head3[key] = SWD_UINT(node); s->best3[node] = SWD_UINT(s->f + 1); s->llen3[key]++; assert(s->llen3[key] <= SWD_N); #ifdef HEAD2 key = HEAD2(s->b,node); s->head2[key] = SWD_UINT(node); #endif node++; } } /*********************************************************************** // ************************************************************************/ static int swd_init(lzo_swd_t *s, const lzo_byte *dict, lzo_uint dict_len) { lzo_uint i = 0; int c = 0; #if defined(__LZO_CHECKER) s->b = malloc(SWD_N + SWD_F + SWD_F); s->head3 = malloc(sizeof(swd_uint) * SWD_HSIZE); s->succ3 = malloc(sizeof(swd_uint) * (SWD_N + SWD_F)); s->best3 = malloc(sizeof(swd_uint) * (SWD_N + SWD_F)); s->llen3 = malloc(sizeof(swd_uint) * SWD_HSIZE); #ifdef HEAD2 s->head2 = malloc(sizeof(swd_uint) * 65536L); #endif #endif s->n = SWD_N; s->f = SWD_F; s->threshold = SWD_THRESHOLD; /* defaults */ s->max_chain = SWD_MAX_CHAIN; s->nice_length = SWD_F; s->use_best_off = 0; s->lazy_insert = 0; s->b_size = s->n + s->f; if (2 * s->f >= s->n || s->b_size + s->f >= SWD_UINT_MAX) return LZO_E_ERROR; s->b_wrap = s->b + s->b_size; s->node_count = s->n; memset(s->llen3, 0, sizeof(s->llen3[0]) * SWD_HSIZE); #ifdef HEAD2 #if 1 memset(s->head2, 0xff, sizeof(s->head2[0]) * 65536L); assert(s->head2[0] == NIL2); #else for (i = 0; i < 65536L; i++) s->head2[i] = NIL2; #endif #endif s->ip = 0; swd_initdict(s,dict,dict_len); s->bp = s->ip; s->first_rp = s->ip; assert(s->ip + s->f <= s->b_size); #if 1 s->look = (lzo_uint) (s->c->in_end - s->c->ip); if (s->look > 0) { if (s->look > s->f) s->look = s->f; memcpy(&s->b[s->ip],s->c->ip,s->look); s->c->ip += s->look; s->ip += s->look; } #else s->look = 0; while (s->look < s->f) { if ((c = getbyte(*(s->c))) < 0) break; s->b[s->ip] = LZO_BYTE(c); s->ip++; s->look++; } #endif if (s->ip == s->b_size) s->ip = 0; if (s->look >= 2 && s->dict_len > 0) swd_insertdict(s,0,s->dict_len); s->rp = s->first_rp; if (s->rp >= s->node_count) s->rp -= s->node_count; else s->rp += s->b_size - s->node_count; #if defined(__LZO_CHECKER) /* initialize memory for the first few HEAD3 (if s->ip is not far * enough ahead to do this job for us). The value doesn't matter. */ if (s->look < 3) memset(&s->b[s->bp+s->look],0,3); #endif LZO_UNUSED(i); LZO_UNUSED(c); return LZO_E_OK; } static void swd_exit(lzo_swd_t *s) { #if defined(__LZO_CHECKER) /* free in reverse order of allocations */ #ifdef HEAD2 free(s->head2); s->head2 = NULL; #endif free(s->llen3); s->llen3 = NULL; free(s->best3); s->best3 = NULL; free(s->succ3); s->succ3 = NULL; free(s->head3); s->head3 = NULL; free(s->b); s->b = NULL; #else LZO_UNUSED(s); #endif } #define swd_pos2off(s,pos) \ (s->bp > (pos) ? s->bp - (pos) : s->b_size - ((pos) - s->bp)) /*********************************************************************** // ************************************************************************/ static __inline__ void swd_getbyte(lzo_swd_t *s) { int c; if ((c = getbyte(*(s->c))) < 0) { if (s->look > 0) --s->look; #if defined(__LZO_CHECKER) /* initialize memory - value doesn't matter */ s->b[s->ip] = 0; if (s->ip < s->f) s->b_wrap[s->ip] = 0; #endif } else { s->b[s->ip] = LZO_BYTE(c); if (s->ip < s->f) s->b_wrap[s->ip] = LZO_BYTE(c); } if (++s->ip == s->b_size) s->ip = 0; if (++s->bp == s->b_size) s->bp = 0; if (++s->rp == s->b_size) s->rp = 0; } /*********************************************************************** // remove node from lists ************************************************************************/ static __inline__ void swd_remove_node(lzo_swd_t *s, lzo_uint node) { if (s->node_count == 0) { lzo_uint key; #ifdef LZO_DEBUG if (s->first_rp != LZO_UINT_MAX) { if (node != s->first_rp) printf("Remove %5d: %5d %5d %5d %5d %6d %6d\n", node, s->rp, s->ip, s->bp, s->first_rp, s->ip - node, s->ip - s->bp); assert(node == s->first_rp); s->first_rp = LZO_UINT_MAX; } #endif key = HEAD3(s->b,node); assert(s->llen3[key] > 0); --s->llen3[key]; #ifdef HEAD2 key = HEAD2(s->b,node); assert(s->head2[key] != NIL2); if ((lzo_uint) s->head2[key] == node) s->head2[key] = NIL2; #endif } else --s->node_count; } /*********************************************************************** // ************************************************************************/ static void swd_accept(lzo_swd_t *s, lzo_uint n) { assert(n <= s->look); while (n--) { lzo_uint key; swd_remove_node(s,s->rp); /* add bp into HEAD3 */ key = HEAD3(s->b,s->bp); s->succ3[s->bp] = s_head3(s,key); s->head3[key] = SWD_UINT(s->bp); s->best3[s->bp] = SWD_UINT(s->f + 1); s->llen3[key]++; assert(s->llen3[key] <= SWD_N); #ifdef HEAD2 /* add bp into HEAD2 */ key = HEAD2(s->b,s->bp); s->head2[key] = SWD_UINT(s->bp); #endif swd_getbyte(s); } } /*********************************************************************** // ************************************************************************/ static void swd_search(lzo_swd_t *s, lzo_uint node, lzo_uint cnt) { #if 0 && defined(__GNUC__) && defined(__i386__) register const unsigned char *p1 __asm__("%edi"); register const unsigned char *p2 __asm__("%esi"); register const unsigned char *px __asm__("%edx"); #else const unsigned char *p1; const unsigned char *p2; const unsigned char *px; #endif lzo_uint m_len = s->m_len; const unsigned char * b = s->b; const unsigned char * bp = s->b + s->bp; const unsigned char * bx = s->b + s->bp + s->look; unsigned char scan_end1; assert(s->m_len > 0); scan_end1 = bp[m_len - 1]; for ( ; cnt-- > 0; node = s->succ3[node]) { p1 = bp; p2 = b + node; px = bx; assert(m_len < s->look); if ( #if 1 p2[m_len - 1] == scan_end1 && p2[m_len] == p1[m_len] && #endif p2[0] == p1[0] && p2[1] == p1[1]) { lzo_uint i; assert(memcmp(bp,&b[node],3) == 0); #if 0 && defined(LZO_UNALIGNED_OK_4) p1 += 3; p2 += 3; while (p1 < px && * (const lzo_uint32p) p1 == * (const lzo_uint32p) p2) p1 += 4, p2 += 4; while (p1 < px && *p1 == *p2) p1 += 1, p2 += 1; #else p1 += 2; p2 += 2; do {} while (++p1 < px && *p1 == *++p2); #endif i = p1 - bp; #ifdef LZO_DEBUG if (memcmp(bp,&b[node],i) != 0) printf("%5ld %5ld %02x%02x %02x%02x\n", (long)s->bp, (long) node, bp[0], bp[1], b[node], b[node+1]); #endif assert(memcmp(bp,&b[node],i) == 0); #if defined(SWD_BEST_OFF) if (i < SWD_BEST_OFF) { if (s->best_pos[i] == 0) s->best_pos[i] = node + 1; } #endif if (i > m_len) { s->m_len = m_len = i; s->m_pos = node; if (m_len == s->look) return; if (m_len >= s->nice_length) return; if (m_len > (lzo_uint) s->best3[node]) return; scan_end1 = bp[m_len - 1]; } } } } /*********************************************************************** // ************************************************************************/ #ifdef HEAD2 static lzo_bool swd_search2(lzo_swd_t *s) { lzo_uint key; assert(s->look >= 2); assert(s->m_len > 0); key = s->head2[ HEAD2(s->b,s->bp) ]; if (key == NIL2) return 0; #ifdef LZO_DEBUG if (memcmp(&s->b[s->bp],&s->b[key],2) != 0) printf("%5ld %5ld %02x%02x %02x%02x\n", (long)s->bp, (long)key, s->b[s->bp], s->b[s->bp+1], s->b[key], s->b[key+1]); #endif assert(memcmp(&s->b[s->bp],&s->b[key],2) == 0); #if defined(SWD_BEST_OFF) if (s->best_pos[2] == 0) s->best_pos[2] = key + 1; #endif if (s->m_len < 2) { s->m_len = 2; s->m_pos = key; } return 1; } #endif /*********************************************************************** // ************************************************************************/ static void swd_findbest(lzo_swd_t *s) { lzo_uint key; lzo_uint cnt, node; lzo_uint len; assert(s->m_len > 0); /* get current head, add bp into HEAD3 */ key = HEAD3(s->b,s->bp); node = s->succ3[s->bp] = s_head3(s,key); cnt = s->llen3[key]++; assert(s->llen3[key] <= SWD_N + SWD_F); if (cnt > s->max_chain && s->max_chain > 0) cnt = s->max_chain; s->head3[key] = SWD_UINT(s->bp); s->b_char = s->b[s->bp]; len = s->m_len; if (s->m_len >= s->look) { if (s->look == 0) s->b_char = -1; s->m_off = 0; s->best3[s->bp] = SWD_UINT(s->f + 1); } else { #ifdef HEAD2 if (swd_search2(s)) #endif if (s->look >= 3) swd_search(s,node,cnt); if (s->m_len > len) s->m_off = swd_pos2off(s,s->m_pos); s->best3[s->bp] = SWD_UINT(s->m_len); #if defined(SWD_BEST_OFF) if (s->use_best_off) { int i; for (i = 2; i < SWD_BEST_OFF; i++) if (s->best_pos[i] > 0) s->best_off[i] = swd_pos2off(s,s->best_pos[i]-1); else s->best_off[i] = 0; } #endif } swd_remove_node(s,s->rp); #ifdef HEAD2 /* add bp into HEAD2 */ key = HEAD2(s->b,s->bp); s->head2[key] = SWD_UINT(s->bp); #endif } #undef HEAD3 #undef HEAD2 #undef s_head3 /* vi:ts=4:et */