GNU Classpath (0.91) | |
Frames | No Frames |
1: /* Deflater.java - Compress a data stream 2: Copyright (C) 1999, 2000, 2001, 2004 Free Software Foundation, Inc. 3: 4: This file is part of GNU Classpath. 5: 6: GNU Classpath is free software; you can redistribute it and/or modify 7: it under the terms of the GNU General Public License as published by 8: the Free Software Foundation; either version 2, or (at your option) 9: any later version. 10: 11: GNU Classpath is distributed in the hope that it will be useful, but 12: WITHOUT ANY WARRANTY; without even the implied warranty of 13: MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 14: General Public License for more details. 15: 16: You should have received a copy of the GNU General Public License 17: along with GNU Classpath; see the file COPYING. If not, write to the 18: Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 19: 02110-1301 USA. 20: 21: Linking this library statically or dynamically with other modules is 22: making a combined work based on this library. Thus, the terms and 23: conditions of the GNU General Public License cover the whole 24: combination. 25: 26: As a special exception, the copyright holders of this library give you 27: permission to link this library with independent modules to produce an 28: executable, regardless of the license terms of these independent 29: modules, and to copy and distribute the resulting executable under 30: terms of your choice, provided that you also meet, for each linked 31: independent module, the terms and conditions of the license of that 32: module. An independent module is a module which is not derived from 33: or based on this library. If you modify this library, you may extend 34: this exception to your version of the library, but you are not 35: obligated to do so. If you do not wish to do so, delete this 36: exception statement from your version. */ 37: 38: package java.util.zip; 39: 40: /** 41: * This is the Deflater class. The deflater class compresses input 42: * with the deflate algorithm described in RFC 1951. It has several 43: * compression levels and three different strategies described below. 44: * 45: * This class is <i>not</i> thread safe. This is inherent in the API, due 46: * to the split of deflate and setInput. 47: * 48: * @author Jochen Hoenicke 49: * @author Tom Tromey 50: */ 51: public class Deflater 52: { 53: /** 54: * The best and slowest compression level. This tries to find very 55: * long and distant string repetitions. 56: */ 57: public static final int BEST_COMPRESSION = 9; 58: /** 59: * The worst but fastest compression level. 60: */ 61: public static final int BEST_SPEED = 1; 62: /** 63: * The default compression level. 64: */ 65: public static final int DEFAULT_COMPRESSION = -1; 66: /** 67: * This level won't compress at all but output uncompressed blocks. 68: */ 69: public static final int NO_COMPRESSION = 0; 70: 71: /** 72: * The default strategy. 73: */ 74: public static final int DEFAULT_STRATEGY = 0; 75: /** 76: * This strategy will only allow longer string repetitions. It is 77: * useful for random data with a small character set. 78: */ 79: public static final int FILTERED = 1; 80: 81: /** 82: * This strategy will not look for string repetitions at all. It 83: * only encodes with Huffman trees (which means, that more common 84: * characters get a smaller encoding. 85: */ 86: public static final int HUFFMAN_ONLY = 2; 87: 88: /** 89: * The compression method. This is the only method supported so far. 90: * There is no need to use this constant at all. 91: */ 92: public static final int DEFLATED = 8; 93: 94: /* 95: * The Deflater can do the following state transitions: 96: * 97: * (1) -> INIT_STATE ----> INIT_FINISHING_STATE ---. 98: * / | (2) (5) | 99: * / v (5) | 100: * (3)| SETDICT_STATE ---> SETDICT_FINISHING_STATE |(3) 101: * \ | (3) | ,-------' 102: * | | | (3) / 103: * v v (5) v v 104: * (1) -> BUSY_STATE ----> FINISHING_STATE 105: * | (6) 106: * v 107: * FINISHED_STATE 108: * \_____________________________________/ 109: * | (7) 110: * v 111: * CLOSED_STATE 112: * 113: * (1) If we should produce a header we start in INIT_STATE, otherwise 114: * we start in BUSY_STATE. 115: * (2) A dictionary may be set only when we are in INIT_STATE, then 116: * we change the state as indicated. 117: * (3) Whether a dictionary is set or not, on the first call of deflate 118: * we change to BUSY_STATE. 119: * (4) -- intentionally left blank -- :) 120: * (5) FINISHING_STATE is entered, when flush() is called to indicate that 121: * there is no more INPUT. There are also states indicating, that 122: * the header wasn't written yet. 123: * (6) FINISHED_STATE is entered, when everything has been flushed to the 124: * internal pending output buffer. 125: * (7) At any time (7) 126: * 127: */ 128: 129: private static final int IS_SETDICT = 0x01; 130: private static final int IS_FLUSHING = 0x04; 131: private static final int IS_FINISHING = 0x08; 132: 133: private static final int INIT_STATE = 0x00; 134: private static final int SETDICT_STATE = 0x01; 135: private static final int INIT_FINISHING_STATE = 0x08; 136: private static final int SETDICT_FINISHING_STATE = 0x09; 137: private static final int BUSY_STATE = 0x10; 138: private static final int FLUSHING_STATE = 0x14; 139: private static final int FINISHING_STATE = 0x1c; 140: private static final int FINISHED_STATE = 0x1e; 141: private static final int CLOSED_STATE = 0x7f; 142: 143: /** Compression level. */ 144: private int level; 145: 146: /** should we include a header. */ 147: private boolean noHeader; 148: 149: /** The current state. */ 150: private int state; 151: 152: /** The total bytes of output written. */ 153: private int totalOut; 154: 155: /** The pending output. */ 156: private DeflaterPending pending; 157: 158: /** The deflater engine. */ 159: private DeflaterEngine engine; 160: 161: /** 162: * Creates a new deflater with default compression level. 163: */ 164: public Deflater() 165: { 166: this(DEFAULT_COMPRESSION, false); 167: } 168: 169: /** 170: * Creates a new deflater with given compression level. 171: * @param lvl the compression level, a value between NO_COMPRESSION 172: * and BEST_COMPRESSION, or DEFAULT_COMPRESSION. 173: * @exception IllegalArgumentException if lvl is out of range. 174: */ 175: public Deflater(int lvl) 176: { 177: this(lvl, false); 178: } 179: 180: /** 181: * Creates a new deflater with given compression level. 182: * @param lvl the compression level, a value between NO_COMPRESSION 183: * and BEST_COMPRESSION. 184: * @param nowrap true, iff we should suppress the deflate header at the 185: * beginning and the adler checksum at the end of the output. This is 186: * useful for the GZIP format. 187: * @exception IllegalArgumentException if lvl is out of range. 188: */ 189: public Deflater(int lvl, boolean nowrap) 190: { 191: if (lvl == DEFAULT_COMPRESSION) 192: lvl = 6; 193: else if (lvl < NO_COMPRESSION || lvl > BEST_COMPRESSION) 194: throw new IllegalArgumentException(); 195: 196: pending = new DeflaterPending(); 197: engine = new DeflaterEngine(pending); 198: this.noHeader = nowrap; 199: setStrategy(DEFAULT_STRATEGY); 200: setLevel(lvl); 201: reset(); 202: } 203: 204: /** 205: * Resets the deflater. The deflater acts afterwards as if it was 206: * just created with the same compression level and strategy as it 207: * had before. 208: */ 209: public void reset() 210: { 211: state = (noHeader ? BUSY_STATE : INIT_STATE); 212: totalOut = 0; 213: pending.reset(); 214: engine.reset(); 215: } 216: 217: /** 218: * Frees all objects allocated by the compressor. There's no 219: * reason to call this, since you can just rely on garbage 220: * collection. Exists only for compatibility against Sun's JDK, 221: * where the compressor allocates native memory. 222: * If you call any method (even reset) afterwards the behaviour is 223: * <i>undefined</i>. 224: */ 225: public void end() 226: { 227: engine = null; 228: pending = null; 229: state = CLOSED_STATE; 230: } 231: 232: /** 233: * Gets the current adler checksum of the data that was processed so 234: * far. 235: */ 236: public int getAdler() 237: { 238: return engine.getAdler(); 239: } 240: 241: /** 242: * Gets the number of input bytes processed so far. 243: */ 244: public int getTotalIn() 245: { 246: return engine.getTotalIn(); 247: } 248: 249: /** 250: * Gets the number of output bytes so far. 251: */ 252: public int getTotalOut() 253: { 254: return totalOut; 255: } 256: 257: /** 258: * Finalizes this object. 259: */ 260: protected void finalize() 261: { 262: /* Exists solely for compatibility. We don't have any native state. */ 263: } 264: 265: /** 266: * Flushes the current input block. Further calls to deflate() will 267: * produce enough output to inflate everything in the current input 268: * block. This is not part of Sun's JDK so I have made it package 269: * private. It is used by DeflaterOutputStream to implement 270: * flush(). 271: */ 272: void flush() { 273: state |= IS_FLUSHING; 274: } 275: 276: /** 277: * Finishes the deflater with the current input block. It is an error 278: * to give more input after this method was called. This method must 279: * be called to force all bytes to be flushed. 280: */ 281: public void finish() { 282: state |= IS_FLUSHING | IS_FINISHING; 283: } 284: 285: /** 286: * Returns true iff the stream was finished and no more output bytes 287: * are available. 288: */ 289: public boolean finished() 290: { 291: return state == FINISHED_STATE && pending.isFlushed(); 292: } 293: 294: /** 295: * Returns true, if the input buffer is empty. 296: * You should then call setInput(). <br> 297: * 298: * <em>NOTE</em>: This method can also return true when the stream 299: * was finished. 300: */ 301: public boolean needsInput() 302: { 303: return engine.needsInput(); 304: } 305: 306: /** 307: * Sets the data which should be compressed next. This should be only 308: * called when needsInput indicates that more input is needed. 309: * If you call setInput when needsInput() returns false, the 310: * previous input that is still pending will be thrown away. 311: * The given byte array should not be changed, before needsInput() returns 312: * true again. 313: * This call is equivalent to <code>setInput(input, 0, input.length)</code>. 314: * @param input the buffer containing the input data. 315: * @exception IllegalStateException if the buffer was finished() or ended(). 316: */ 317: public void setInput(byte[] input) 318: { 319: setInput(input, 0, input.length); 320: } 321: 322: /** 323: * Sets the data which should be compressed next. This should be 324: * only called when needsInput indicates that more input is needed. 325: * The given byte array should not be changed, before needsInput() returns 326: * true again. 327: * @param input the buffer containing the input data. 328: * @param off the start of the data. 329: * @param len the length of the data. 330: * @exception IllegalStateException if the buffer was finished() or ended() 331: * or if previous input is still pending. 332: */ 333: public void setInput(byte[] input, int off, int len) 334: { 335: if ((state & IS_FINISHING) != 0) 336: throw new IllegalStateException("finish()/end() already called"); 337: engine.setInput(input, off, len); 338: } 339: 340: /** 341: * Sets the compression level. There is no guarantee of the exact 342: * position of the change, but if you call this when needsInput is 343: * true the change of compression level will occur somewhere near 344: * before the end of the so far given input. 345: * @param lvl the new compression level. 346: */ 347: public void setLevel(int lvl) 348: { 349: if (lvl == DEFAULT_COMPRESSION) 350: lvl = 6; 351: else if (lvl < NO_COMPRESSION || lvl > BEST_COMPRESSION) 352: throw new IllegalArgumentException(); 353: 354: 355: if (level != lvl) 356: { 357: level = lvl; 358: engine.setLevel(lvl); 359: } 360: } 361: 362: /** 363: * Sets the compression strategy. Strategy is one of 364: * DEFAULT_STRATEGY, HUFFMAN_ONLY and FILTERED. For the exact 365: * position where the strategy is changed, the same as for 366: * setLevel() applies. 367: * @param stgy the new compression strategy. 368: */ 369: public void setStrategy(int stgy) 370: { 371: if (stgy != DEFAULT_STRATEGY && stgy != FILTERED 372: && stgy != HUFFMAN_ONLY) 373: throw new IllegalArgumentException(); 374: engine.setStrategy(stgy); 375: } 376: 377: /** 378: * Deflates the current input block to the given array. It returns 379: * the number of bytes compressed, or 0 if either 380: * needsInput() or finished() returns true or length is zero. 381: * @param output the buffer where to write the compressed data. 382: */ 383: public int deflate(byte[] output) 384: { 385: return deflate(output, 0, output.length); 386: } 387: 388: /** 389: * Deflates the current input block to the given array. It returns 390: * the number of bytes compressed, or 0 if either 391: * needsInput() or finished() returns true or length is zero. 392: * @param output the buffer where to write the compressed data. 393: * @param offset the offset into the output array. 394: * @param length the maximum number of bytes that may be written. 395: * @exception IllegalStateException if end() was called. 396: * @exception IndexOutOfBoundsException if offset and/or length 397: * don't match the array length. 398: */ 399: public int deflate(byte[] output, int offset, int length) 400: { 401: int origLength = length; 402: 403: if (state == CLOSED_STATE) 404: throw new IllegalStateException("Deflater closed"); 405: 406: if (state < BUSY_STATE) 407: { 408: /* output header */ 409: int header = (DEFLATED + 410: ((DeflaterConstants.MAX_WBITS - 8) << 4)) << 8; 411: int level_flags = (level - 1) >> 1; 412: if (level_flags < 0 || level_flags > 3) 413: level_flags = 3; 414: header |= level_flags << 6; 415: if ((state & IS_SETDICT) != 0) 416: /* Dictionary was set */ 417: header |= DeflaterConstants.PRESET_DICT; 418: header += 31 - (header % 31); 419: 420: pending.writeShortMSB(header); 421: if ((state & IS_SETDICT) != 0) 422: { 423: int chksum = engine.getAdler(); 424: engine.resetAdler(); 425: pending.writeShortMSB(chksum >> 16); 426: pending.writeShortMSB(chksum & 0xffff); 427: } 428: 429: state = BUSY_STATE | (state & (IS_FLUSHING | IS_FINISHING)); 430: } 431: 432: for (;;) 433: { 434: int count = pending.flush(output, offset, length); 435: offset += count; 436: totalOut += count; 437: length -= count; 438: if (length == 0 || state == FINISHED_STATE) 439: break; 440: 441: if (!engine.deflate((state & IS_FLUSHING) != 0, 442: (state & IS_FINISHING) != 0)) 443: { 444: if (state == BUSY_STATE) 445: /* We need more input now */ 446: return origLength - length; 447: else if (state == FLUSHING_STATE) 448: { 449: if (level != NO_COMPRESSION) 450: { 451: /* We have to supply some lookahead. 8 bit lookahead 452: * are needed by the zlib inflater, and we must fill 453: * the next byte, so that all bits are flushed. 454: */ 455: int neededbits = 8 + ((-pending.getBitCount()) & 7); 456: while (neededbits > 0) 457: { 458: /* write a static tree block consisting solely of 459: * an EOF: 460: */ 461: pending.writeBits(2, 10); 462: neededbits -= 10; 463: } 464: } 465: state = BUSY_STATE; 466: } 467: else if (state == FINISHING_STATE) 468: { 469: pending.alignToByte(); 470: /* We have completed the stream */ 471: if (!noHeader) 472: { 473: int adler = engine.getAdler(); 474: pending.writeShortMSB(adler >> 16); 475: pending.writeShortMSB(adler & 0xffff); 476: } 477: state = FINISHED_STATE; 478: } 479: } 480: } 481: 482: return origLength - length; 483: } 484: 485: /** 486: * Sets the dictionary which should be used in the deflate process. 487: * This call is equivalent to <code>setDictionary(dict, 0, 488: * dict.length)</code>. 489: * @param dict the dictionary. 490: * @exception IllegalStateException if setInput () or deflate () 491: * were already called or another dictionary was already set. 492: */ 493: public void setDictionary(byte[] dict) 494: { 495: setDictionary(dict, 0, dict.length); 496: } 497: 498: /** 499: * Sets the dictionary which should be used in the deflate process. 500: * The dictionary should be a byte array containing strings that are 501: * likely to occur in the data which should be compressed. The 502: * dictionary is not stored in the compressed output, only a 503: * checksum. To decompress the output you need to supply the same 504: * dictionary again. 505: * @param dict the dictionary. 506: * @param offset an offset into the dictionary. 507: * @param length the length of the dictionary. 508: * @exception IllegalStateException if setInput () or deflate () were 509: * already called or another dictionary was already set. 510: */ 511: public void setDictionary(byte[] dict, int offset, int length) 512: { 513: if (state != INIT_STATE) 514: throw new IllegalStateException(); 515: 516: state = SETDICT_STATE; 517: engine.setDictionary(dict, offset, length); 518: } 519: }
GNU Classpath (0.91) |