1 /* Because this code is derived from the 4.3BSD compress source:
4 * Copyright (c) 1985, 1986 The Regents of the University of California.
7 * This code is derived from software contributed to Berkeley by
8 * James A. Woods, derived from original work by Spencer Thomas
11 * Redistribution and use in source and binary forms, with or without
12 * modification, are permitted provided that the following conditions
14 * 1. Redistributions of source code must retain the above copyright
15 * notice, this list of conditions and the following disclaimer.
16 * 2. Redistributions in binary form must reproduce the above copyright
17 * notice, this list of conditions and the following disclaimer in the
18 * documentation and/or other materials provided with the distribution.
19 * 3. All advertising materials mentioning features or use of this software
20 * must display the following acknowledgement:
21 * This product includes software developed by the University of
22 * California, Berkeley and its contributors.
23 * 4. Neither the name of the University nor the names of its contributors
24 * may be used to endorse or promote products derived from this software
25 * without specific prior written permission.
27 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
28 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
29 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
30 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
31 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
32 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
33 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
34 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
35 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
36 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
41 * $Id: bsd-comp.c,v 1.3 1999/04/16 11:35:59 paulus Exp $
44 #include <sys/types.h>
47 #ifdef PPP_DEFS_IN_NET
48 #include <net/ppp_defs.h>
57 * PPP "BSD compress" compression
58 * The differences between this compression and the classic BSD LZW
59 * source are obvious from the requirement that the classic code worked
60 * with files while this handles arbitrarily long streams that
61 * are broken into packets. They are:
63 * When the code size expands, a block of junk is not emitted by
64 * the compressor and not expected by the decompressor.
66 * New codes are not necessarily assigned every time an old
67 * code is output by the compressor. This is because a packet
68 * end forces a code to be emitted, but does not imply that a
69 * new sequence has been seen.
71 * The compression ratio is checked at the first end of a packet
72 * after the appropriate gap. Besides simplifying and speeding
73 * things up, this makes it more likely that the transmitter
74 * and receiver will agree when the dictionary is cleared when
75 * compression is not going well.
79 * A dictionary for doing BSD compress.
82 int totlen
; /* length of this structure */
83 u_int hsize
; /* size of the hash table */
84 u_char hshift
; /* used in hash function */
85 u_char n_bits
; /* current bits/code */
89 u_short seqno
; /* sequence number of next packet */
90 u_int hdrlen
; /* header length to preallocate */
92 u_int maxmaxcode
; /* largest valid code */
93 u_int max_ent
; /* largest code in use */
94 u_int in_count
; /* uncompressed bytes, aged */
95 u_int bytes_out
; /* compressed bytes, aged */
96 u_int ratio
; /* recent compression ratio */
97 u_int checkpoint
; /* when to next check the ratio */
98 u_int clear_count
; /* times dictionary cleared */
99 u_int incomp_count
; /* incompressible packets */
100 u_int incomp_bytes
; /* incompressible bytes */
101 u_int uncomp_count
; /* uncompressed packets */
102 u_int uncomp_bytes
; /* uncompressed bytes */
103 u_int comp_count
; /* compressed packets */
104 u_int comp_bytes
; /* compressed bytes */
105 u_short
*lens
; /* array of lengths of codes */
107 union { /* hash value */
110 #ifdef BSD_LITTLE_ENDIAN
111 u_short prefix
; /* preceding code */
112 u_char suffix
; /* last character of new code */
116 u_char suffix
; /* last character of new code */
117 u_short prefix
; /* preceding code */
121 u_short codem1
; /* output of hash table -1 */
122 u_short cptr
; /* map code to hash table entry */
126 #define BSD_OVHD 2 /* BSD compress overhead/packet */
127 #define BSD_INIT_BITS BSD_MIN_BITS
129 static void *bsd_decomp_alloc
__P((u_char
*options
, int opt_len
));
130 static void bsd_free
__P((void *state
));
131 static int bsd_decomp_init
__P((void *state
, u_char
*options
, int opt_len
,
132 int unit
, int hdrlen
, int mru
, int debug
));
133 static void bsd_incomp
__P((void *state
, u_char
*dmsg
, int len
));
134 static int bsd_decompress
__P((void *state
, u_char
*cmp
, int inlen
,
135 u_char
*dmp
, int *outlen
));
136 static void bsd_reset
__P((void *state
));
137 static void bsd_comp_stats
__P((void *state
, struct compstat
*stats
));
140 * Exported procedures.
142 struct compressor ppp_bsd_compress
= {
143 CI_BSD_COMPRESS
, /* compress_proto */
144 bsd_decomp_alloc
, /* decomp_alloc */
145 bsd_free
, /* decomp_free */
146 bsd_decomp_init
, /* decomp_init */
147 bsd_reset
, /* decomp_reset */
148 bsd_decompress
, /* decompress */
149 bsd_incomp
, /* incomp */
150 bsd_comp_stats
, /* decomp_stat */
154 * the next two codes should not be changed lightly, as they must not
155 * lie within the contiguous general code space.
#define CLEAR	256	/* table clear output code */
#define FIRST	257	/* first free entry */

/* Largest code value that fits in b bits. */
#define MAXCODE(b)	((1 << (b)) - 1)

/* codem1 value stored in a hash slot to mark it as holding no valid code. */
#define BADCODEM1	MAXCODE(BSD_MAX_BITS)

/* Initial probe index into the hash table for a (prefix, suffix) pair. */
#define BSD_HASH(prefix,suffix,hshift) \
	((((u_int32_t)(suffix)) << (hshift)) ^ (u_int32_t)(prefix))

/* 32-bit key kept in a slot's f.fcode: suffix in bits 16 and up, prefix below. */
#define BSD_KEY(prefix,suffix) \
	((((u_int32_t)(suffix)) << 16) + (u_int32_t)(prefix))

#define CHECK_GAP	10000	/* Ratio check interval */

/*
 * The compression ratio is held in fixed point with RATIO_SCALE_LOG
 * fractional bits.  RATIO_MAX is the largest count that can be shifted
 * left by RATIO_SCALE_LOG without exceeding 0x7fffffff.
 */
#define RATIO_SCALE_LOG	8
#define RATIO_SCALE	(1<<RATIO_SCALE_LOG)
#define RATIO_MAX	(0x7fffffff>>RATIO_SCALE_LOG)
176 * clear the dictionary
183 db
->max_ent
= FIRST
-1;
184 db
->n_bits
= BSD_INIT_BITS
;
188 db
->checkpoint
= CHECK_GAP
;
192 * If the dictionary is full, then see if it is time to reset it.
194 * Compute the compression ratio using fixed-point arithmetic
195 * with 8 fractional bits.
197 * Since we have an infinite stream instead of a single file,
198 * watch only the local compression ratio.
200 * Since both peers must reset the dictionary at the same time even in
201 * the absence of CLEAR codes (while packets are incompressible), they
202 * must compute the same ratio.
204 static int /* 1=output CLEAR */
210 if (db
->in_count
>= db
->checkpoint
) {
211 /* age the ratio by limiting the size of the counts */
212 if (db
->in_count
>= RATIO_MAX
213 || db
->bytes_out
>= RATIO_MAX
) {
214 db
->in_count
-= db
->in_count
/4;
215 db
->bytes_out
-= db
->bytes_out
/4;
218 db
->checkpoint
= db
->in_count
+ CHECK_GAP
;
220 if (db
->max_ent
>= db
->maxmaxcode
) {
221 /* Reset the dictionary only if the ratio is worse,
222 * or if it looks as if it has been poisoned
223 * by incompressible data.
225 * This does not overflow, because
226 * db->in_count <= RATIO_MAX.
228 new_ratio
= db
->in_count
<< RATIO_SCALE_LOG
;
229 if (db
->bytes_out
!= 0)
230 new_ratio
/= db
->bytes_out
;
232 if (new_ratio
< db
->ratio
|| new_ratio
< 1 * RATIO_SCALE
) {
236 db
->ratio
= new_ratio
;
246 bsd_comp_stats(state
, stats
)
248 struct compstat
*stats
;
250 struct bsd_db
*db
= (struct bsd_db
*) state
;
253 stats
->unc_bytes
= db
->uncomp_bytes
;
254 stats
->unc_packets
= db
->uncomp_count
;
255 stats
->comp_bytes
= db
->comp_bytes
;
256 stats
->comp_packets
= db
->comp_count
;
257 stats
->inc_bytes
= db
->incomp_bytes
;
258 stats
->inc_packets
= db
->incomp_count
;
259 stats
->ratio
= db
->in_count
;
261 if (stats
->ratio
<= 0x7fffff)
270 * Reset state, as on a CCP ResetReq.
276 struct bsd_db
*db
= (struct bsd_db
*) state
;
284 * Allocate space for a (de) compressor.
287 bsd_alloc(options
, opt_len
, decomp
)
292 u_int newlen
, hsize
, hshift
, maxmaxcode
;
295 if (opt_len
!= 3 || options
[0] != CI_BSD_COMPRESS
|| options
[1] != 3
296 || BSD_VERSION(options
[2]) != BSD_CURRENT_VERSION
)
299 bits
= BSD_NBITS(options
[2]);
301 case 9: /* needs 82152 for both directions */
302 case 10: /* needs 84144 */
303 case 11: /* needs 88240 */
304 case 12: /* needs 96432 */
308 case 13: /* needs 176784 */
312 case 14: /* needs 353744 */
316 case 15: /* needs 691440 */
320 case 16: /* needs 1366160--far too much, */
321 /* hsize = 69001; */ /* and 69001 is too big for cptr */
322 /* hshift = 8; */ /* in struct bsd_db */
328 maxmaxcode
= MAXCODE(bits
);
329 newlen
= sizeof(*db
) + (hsize
-1) * (sizeof(db
->dict
[0]));
330 db
= (struct bsd_db
*) malloc(newlen
);
333 memset(db
, 0, sizeof(*db
) - sizeof(db
->dict
));
338 db
->lens
= (u_short
*) malloc((maxmaxcode
+1) * sizeof(db
->lens
[0]));
348 db
->maxmaxcode
= maxmaxcode
;
358 struct bsd_db
*db
= (struct bsd_db
*) state
;
365 bsd_decomp_alloc(options
, opt_len
)
369 return bsd_alloc(options
, opt_len
, 1);
373 * Initialize the database.
376 bsd_init(db
, options
, opt_len
, unit
, hdrlen
, mru
, debug
, decomp
)
379 int opt_len
, unit
, hdrlen
, mru
, debug
, decomp
;
383 if (opt_len
< CILEN_BSD_COMPRESS
384 || options
[0] != CI_BSD_COMPRESS
|| options
[1] != CILEN_BSD_COMPRESS
385 || BSD_VERSION(options
[2]) != BSD_CURRENT_VERSION
386 || BSD_NBITS(options
[2]) != db
->maxbits
387 || decomp
&& db
->lens
== NULL
)
397 db
->dict
[--i
].codem1
= BADCODEM1
;
398 db
->dict
[i
].cptr
= 0;
413 bsd_decomp_init(state
, options
, opt_len
, unit
, hdrlen
, mru
, debug
)
416 int opt_len
, unit
, hdrlen
, mru
, debug
;
418 return bsd_init((struct bsd_db
*) state
, options
, opt_len
,
419 unit
, hdrlen
, mru
, debug
, 1);
424 * Update the "BSD Compress" dictionary on the receiver for
425 * incompressible data by pretending to compress the incoming data.
428 bsd_incomp(state
, dmsg
, mlen
)
433 struct bsd_db
*db
= (struct bsd_db
*) state
;
434 u_int hshift
= db
->hshift
;
435 u_int max_ent
= db
->max_ent
;
436 u_int n_bits
= db
->n_bits
;
437 struct bsd_dict
*dictp
;
447 ent
= rptr
[0]; /* get the protocol */
453 if ((ent
& 1) == 0 || ent
< 0x21 || ent
> 0xf9)
457 ilen
= 1; /* count the protocol as 1 byte */
459 slen
= dmsg
+ mlen
- rptr
;
461 for (; slen
> 0; --slen
) {
463 fcode
= BSD_KEY(ent
, c
);
464 hval
= BSD_HASH(ent
, c
, hshift
);
465 dictp
= &db
->dict
[hval
];
467 /* validate and then check the entry */
468 if (dictp
->codem1
>= max_ent
)
470 if (dictp
->f
.fcode
== fcode
) {
471 ent
= dictp
->codem1
+1;
472 continue; /* found (prefix,suffix) */
475 /* continue probing until a match or invalid entry */
476 disp
= (hval
== 0) ? 1 : hval
;
479 if (hval
>= db
->hsize
)
481 dictp
= &db
->dict
[hval
];
482 if (dictp
->codem1
>= max_ent
)
484 } while (dictp
->f
.fcode
!= fcode
);
485 ent
= dictp
->codem1
+1;
486 continue; /* finally found (prefix,suffix) */
488 nomatch
: /* output (count) the prefix */
491 /* code -> hashtable */
492 if (max_ent
< db
->maxmaxcode
) {
493 struct bsd_dict
*dictp2
;
494 /* expand code size if needed */
495 if (max_ent
>= MAXCODE(n_bits
))
496 db
->n_bits
= ++n_bits
;
498 /* Invalidate previous hash table entry
499 * assigned this code, and then take it over.
501 dictp2
= &db
->dict
[max_ent
+1];
502 if (db
->dict
[dictp2
->cptr
].codem1
== max_ent
)
503 db
->dict
[dictp2
->cptr
].codem1
= BADCODEM1
;
505 dictp
->codem1
= max_ent
;
506 dictp
->f
.fcode
= fcode
;
508 db
->max_ent
= ++max_ent
;
509 db
->lens
[max_ent
] = db
->lens
[ent
]+1;
513 bitno
+= n_bits
; /* output (count) the last code */
514 db
->bytes_out
+= bitno
/8;
515 db
->in_count
+= ilen
;
519 db
->incomp_bytes
+= ilen
;
521 db
->uncomp_bytes
+= ilen
;
523 /* Increase code size if we would have without the packet
524 * boundary and as the decompressor will.
526 if (max_ent
>= MAXCODE(n_bits
) && max_ent
< db
->maxmaxcode
)
532 * Decompress "BSD Compress"
534 * Because of patent problems, we return DECOMP_ERROR for errors
535 * found by inspecting the input data and for system problems, but
536 * DECOMP_FATALERROR for any errors which could possibly be said to
537 * be being detected "after" decompression. For DECOMP_ERROR,
538 * we can issue a CCP reset-request; for DECOMP_FATALERROR, we may be
539 * infringing a patent of Motorola's if we do, so we take CCP down
542 * Given that the frame has the correct sequence number and a good FCS,
543 * errors such as invalid codes in the input most likely indicate a
544 * bug, so we return DECOMP_FATALERROR for them in order to turn off
545 * compression, even though they are detected by inspecting the input.
548 bsd_decompress(state
, cmsg
, inlen
, dmp
, outlenp
)
553 struct bsd_db
*db
= (struct bsd_db
*) state
;
554 u_int max_ent
= db
->max_ent
;
556 u_int bitno
= 32; /* 1st valid bit in accm */
557 u_int n_bits
= db
->n_bits
;
558 u_int tgtbitno
= 32-n_bits
; /* bitno when we have a code */
559 struct bsd_dict
*dictp
;
560 int explen
, i
, seq
, len
;
561 u_int incode
, oldcode
, finchar
;
562 u_char
*p
, *rptr
, *wptr
;
564 int dlen
, space
, codelen
, extra
;
569 ++rptr
; /* skip protocol (assumed 0xfd) */
570 seq
= (rptr
[0] << 8) + rptr
[1];
572 ilen
= len
= cmsg
+ inlen
- rptr
;
575 * Check the sequence number and give up if it is not what we expect.
577 if (seq
!= db
->seqno
++) {
579 printf("bsd_decomp%d: bad sequence # %d, expected %d\n",
580 db
->unit
, seq
, db
->seqno
- 1);
584 wptr
= dmp
+ db
->hdrlen
;
590 * Accumulate bytes until we have a complete code.
591 * Then get the next code, relying on the 32-bit,
592 * unsigned accm to mask the result.
595 accm
|= *rptr
++ << bitno
;
597 if (tgtbitno
< bitno
)
599 incode
= accm
>> tgtbitno
;
603 if (incode
== CLEAR
) {
605 * The dictionary must only be cleared at
606 * the end of a packet. But there could be an
607 * empty message block at the end.
611 printf("bsd_decomp%d: bad CLEAR\n", db
->unit
);
612 return DECOMP_FATALERROR
;
619 if (incode
> max_ent
+ 2 || incode
> db
->maxmaxcode
620 || incode
> max_ent
&& oldcode
== CLEAR
) {
622 printf("bsd_decomp%d: bad code 0x%x oldcode=0x%x ",
623 db
->unit
, incode
, oldcode
);
624 printf("max_ent=0x%x dlen=%d seqno=%d\n",
625 max_ent
, dlen
, db
->seqno
);
627 return DECOMP_FATALERROR
; /* probably a bug */
630 /* Special case for KwKwK string. */
631 if (incode
> max_ent
) {
639 codelen
= db
->lens
[finchar
];
640 explen
+= codelen
+ extra
;
641 if (explen
> db
->mru
+ 1) {
643 printf("bsd_decomp%d: ran out of mru\n", db
->unit
);
644 return DECOMP_FATALERROR
;
648 * Decode this code and install it in the decompressed buffer.
650 p
= (wptr
+= codelen
);
651 while (finchar
> LAST
) {
652 dictp
= &db
->dict
[db
->dict
[finchar
].cptr
];
656 printf("bsd_decomp%d: fell off end of chain ", db
->unit
);
657 printf("0x%x at 0x%x by 0x%x, max_ent=0x%x\n",
658 incode
, finchar
, db
->dict
[finchar
].cptr
, max_ent
);
659 return DECOMP_FATALERROR
;
661 if (dictp
->codem1
!= finchar
-1) {
662 printf("bsd_decomp%d: bad code chain 0x%x finchar=0x%x ",
663 db
->unit
, incode
, finchar
);
664 printf("oldcode=0x%x cptr=0x%x codem1=0x%x\n", oldcode
,
665 db
->dict
[finchar
].cptr
, dictp
->codem1
);
666 return DECOMP_FATALERROR
;
669 *--p
= dictp
->f
.hs
.suffix
;
670 finchar
= dictp
->f
.hs
.prefix
;
676 printf("bsd_decomp%d: short by %d after code 0x%x, max_ent=0x%x\n",
677 db
->unit
, codelen
, incode
, max_ent
);
680 if (extra
) /* the KwKwK case again */
684 * If not first code in a packet, and
685 * if not out of code space, then allocate a new code.
687 * Keep the hash table correct so it can be used
688 * with uncompressed packets.
690 if (oldcode
!= CLEAR
&& max_ent
< db
->maxmaxcode
) {
691 struct bsd_dict
*dictp2
;
695 fcode
= BSD_KEY(oldcode
,finchar
);
696 hval
= BSD_HASH(oldcode
,finchar
,db
->hshift
);
697 dictp
= &db
->dict
[hval
];
699 /* look for a free hash table entry */
700 if (dictp
->codem1
< max_ent
) {
701 disp
= (hval
== 0) ? 1 : hval
;
704 if (hval
>= db
->hsize
)
706 dictp
= &db
->dict
[hval
];
707 } while (dictp
->codem1
< max_ent
);
711 * Invalidate previous hash table entry
712 * assigned this code, and then take it over
714 dictp2
= &db
->dict
[max_ent
+1];
715 if (db
->dict
[dictp2
->cptr
].codem1
== max_ent
) {
716 db
->dict
[dictp2
->cptr
].codem1
= BADCODEM1
;
719 dictp
->codem1
= max_ent
;
720 dictp
->f
.fcode
= fcode
;
722 db
->max_ent
= ++max_ent
;
723 db
->lens
[max_ent
] = db
->lens
[oldcode
]+1;
725 /* Expand code size if needed. */
726 if (max_ent
>= MAXCODE(n_bits
) && max_ent
< db
->maxmaxcode
) {
727 db
->n_bits
= ++n_bits
;
728 tgtbitno
= 32-n_bits
;
733 *outlenp
= wptr
- (dmp
+ db
->hdrlen
);
736 * Keep the checkpoint right so that incompressible packets
737 * clear the dictionary at the right times.
739 db
->bytes_out
+= ilen
;
740 db
->in_count
+= explen
;
741 if (bsd_check(db
) && db
->debug
) {
742 printf("bsd_decomp%d: peer should have cleared dictionary\n",
747 db
->comp_bytes
+= ilen
+ BSD_OVHD
;
749 db
->uncomp_bytes
+= explen
;
753 #endif /* DO_BSD_COMPRESS */