BE THE CODER - com/itextpdf/text/pdf/codec/LZWStringTable.java


/*

 * Copyright 2003-2008 by Paulo Soares.

 *

 * This code was originally released in 2001 by SUN (see class

 * com.sun.media.imageio.plugins.tiff.TIFFDirectory.java)

 * using the BSD license in a specific wording. In a mail dating from

 * January 23, 2008, Brian Burkhalter (@sun.com) gave us permission

 * to use the code under the following version of the BSD license:

 *

 * Copyright (c) 2005 Sun Microsystems, Inc. All  Rights Reserved.

 * 

 * Redistribution and use in source and binary forms, with or without

 * modification, are permitted provided that the following conditions

 * are met: 

 * 

 * - Redistribution of source code must retain the above copyright 

 *   notice, this  list of conditions and the following disclaimer.

 * 

 * - Redistribution in binary form must reproduce the above copyright

 *   notice, this list of conditions and the following disclaimer in 

 *   the documentation and/or other materials provided with the

 *   distribution.

 * 

 * Neither the name of Sun Microsystems, Inc. or the names of 

 * contributors may be used to endorse or promote products derived 

 * from this software without specific prior written permission.

 * 

 * This software is provided "AS IS," without a warranty of any 

 * kind. ALL EXPRESS OR IMPLIED CONDITIONS, REPRESENTATIONS AND 

 * WARRANTIES, INCLUDING ANY IMPLIED WARRANTY OF MERCHANTABILITY, 

 * FITNESS FOR A PARTICULAR PURPOSE OR NON-INFRINGEMENT, ARE HEREBY

 * EXCLUDED. SUN MIDROSYSTEMS, INC. ("SUN") AND ITS LICENSORS SHALL 

 * NOT BE LIABLE FOR ANY DAMAGES SUFFERED BY LICENSEE AS A RESULT OF 

 * USING, MODIFYING OR DISTRIBUTING THIS SOFTWARE OR ITS

 * DERIVATIVES. IN NO EVENT WILL SUN OR ITS LICENSORS BE LIABLE FOR 

 * ANY LOST REVENUE, PROFIT OR DATA, OR FOR DIRECT, INDIRECT, SPECIAL,

 * CONSEQUENTIAL, INCIDENTAL OR PUNITIVE DAMAGES, HOWEVER CAUSED AND

 * REGARDLESS OF THE THEORY OF LIABILITY, ARISING OUT OF THE USE OF OR

 * INABILITY TO USE THIS SOFTWARE, EVEN IF SUN HAS BEEN ADVISED OF THE

 * POSSIBILITY OF SUCH DAMAGES. 

 * 

 * You acknowledge that this software is not designed or intended for 

 * use in the design, construction, operation or maintenance of any 

 * nuclear facility. 

 *

 * $Revision: 4540 $

 * $Date: 2010-07-13 14:57:54 +0200 (di, 13 jul 2010) $

 * $State: Exp $

 */



package com.itextpdf.text.pdf.codec;



import java.io.PrintStream;



/** 

 * General purpose LZW String Table.

 * Extracted from GIFEncoder by Adam Doppelt

 * Comments added by Robin Luiten

 * <code>expandCode</code> added by Robin Luiten

 * The strLen_ table to give quick access to the lenght of an expanded

 * code for use by the <code>expandCode</code> method added by Robin.

 * @since 5.0.2

 */

public class LZWStringTable

{

    /** codesize + Reserved Codes */

    private  final static int RES_CODES = 2;



    private  final static short HASH_FREE = (short)0xFFFF;

    private  final static short NEXT_FIRST =  (short)0xFFFF;



    private  final static int MAXBITS = 12;

    private  final static int MAXSTR  = (1 <<  MAXBITS);



    private  final static short HASHSIZE  = 9973;

    private  final static short HASHSTEP  = 2039;



    byte[]  strChr_;    // after predecessor character

    short[] strNxt_;    // predecessor string 

    short[] strHsh_;    // hash table to find  predecessor + char pairs

    short numStrings_;    // next code if adding new prestring + char



    /**

   * each entry corresponds to a code and contains the length of data

   * that the code expands to when decoded.

   **/

    int[] strLen_;



    /**

   * Constructor allocate memory for string store data

   **/

    public LZWStringTable()

    {

        strChr_  = new byte[MAXSTR];

        strNxt_  = new short[MAXSTR];

        strLen_  = new int[MAXSTR];

        strHsh_  = new short[HASHSIZE];    

    }



    /**

   * @param index value of -1 indicates no predecessor [used in initialization]

   * @param b the byte [character] to add to the string store which follows

   * the predecessor string specified the index.

   * @return 0xFFFF if no space in table left for addition of predecessor

   * index and byte b. Else return the code allocated for combination index + b.

   **/

    public int AddCharString(short index, byte b)

    {

        int  hshidx;



        if (numStrings_  >= MAXSTR)  // if used up all codes

            {

                return 0xFFFF;

            }

    

        hshidx = Hash(index, b);

        while (strHsh_[hshidx] != HASH_FREE)

            hshidx = (hshidx + HASHSTEP) % HASHSIZE;

    

        strHsh_[hshidx]  = numStrings_;

        strChr_[numStrings_] = b;

        if (index == HASH_FREE)

            {

                strNxt_[numStrings_] = NEXT_FIRST;

                strLen_[numStrings_] = 1;

            }

        else

            {

                strNxt_[numStrings_] = index;

                strLen_[numStrings_] = strLen_[index] + 1;

            }



        return numStrings_++;  // return the code and inc for next code

    }



    /**

   * @param index index to prefix string

   * @param b the character that follws the index prefix

   * @return b if param index is HASH_FREE. Else return the code

   * for this prefix and byte successor

   **/  

    public short FindCharString(short index, byte b)

    {

        int  hshidx,  nxtidx;



        if (index == HASH_FREE)

            return (short)(b & 0xFF);    // Rob fixed used to sign extend



        hshidx = Hash(index, b);

        while ((nxtidx = strHsh_[hshidx]) != HASH_FREE)  // search

            {

                if (strNxt_[nxtidx]  == index &&  strChr_[nxtidx]  == b)

                    return (short)nxtidx;

                hshidx = (hshidx + HASHSTEP) % HASHSIZE;

            }



        return (short)0xFFFF;

    }



    /**

   * @param codesize the size of code to be preallocated for the

   * string store.

   **/

    public void  ClearTable(int codesize)

    {

        numStrings_  = 0;



        for  (int q = 0;  q <  HASHSIZE; q++)

            strHsh_[q] = HASH_FREE;



        int  w =  (1 << codesize)  + RES_CODES;

        for  (int q = 0;  q <  w; q++)

            AddCharString((short)0xFFFF, (byte)q);  // init with no prefix

    }



    static public int Hash(short index,  byte lastbyte)

    {

        return ((int)((short)(lastbyte << 8) ^ index) &  0xFFFF)  % HASHSIZE;

    }



    /**

   * If expanded data doesn't fit into array only what will fit is written

   * to buf and the return value indicates how much of the expanded code has

   * been written to the buf. The next call to expandCode() should be with 

   * the same code and have the skip parameter set the negated value of the 

   * previous return. Successive negative return values should be negated and

   * added together for next skip parameter value with same code.

   *

   * @param buf buffer to place expanded data into

   * @param offset offset to place expanded data

   * @param code the code to expand to the byte array it represents.

   * PRECONDITION This code must already be in the LZSS

   * @param skipHead is the number of bytes at the start of the expanded code to 

   * be skipped before data is written to buf. It is possible that skipHead is

   * equal to codeLen.

   * @return the length of data expanded into buf. If the expanded code is longer

   * than space left in buf then the value returned is a negative number which when

   * negated is equal to the number of bytes that were used of the code being expanded.

   * This negative value also indicates the buffer is full.

   **/

    public int expandCode(byte[] buf, int offset, short code, int skipHead)

    {

        if (offset == -2) 

            {

                if (skipHead == 1) skipHead = 0;

            }

        if (code == (short)0xFFFF ||        // just in case

            skipHead == strLen_[code])        // DONE no more unpacked

            return 0;



        int expandLen;              // how much data we are actually expanding

        int codeLen = strLen_[code] - skipHead;  // length of expanded code left

        int bufSpace = buf.length - offset;    // how much space left

        if (bufSpace > codeLen)

            expandLen = codeLen;        // only got this many to unpack

        else

            expandLen = bufSpace;



        int skipTail = codeLen - expandLen;    // only > 0 if codeLen > bufSpace [left overs]



        int idx = offset + expandLen;      // initialise to exclusive end address of buffer area



        // NOTE: data unpacks in reverse direction and we are placing the

        // unpacked data directly into the array in the correct location.

        while ((idx > offset) && (code != (short)0xFFFF))

            {

                if (--skipTail < 0)          // skip required of expanded data

                    {

                        buf[--idx] = strChr_[code];

                    }

                code = strNxt_[code];        // to predecessor code

            }



        if (codeLen > expandLen)

            return -expandLen;          // indicate what part of codeLen used

        else

            return expandLen;          // indicate length of dat unpacked

    }



    public void dump(PrintStream out)

    {

        int i;

        for (i = 258; i < numStrings_; ++i)

            out.println(  " strNxt_[" + i + "] = " + strNxt_[i]

                          + " strChr_ " + Integer.toHexString(strChr_[i] & 0xFF)

                          + " strLen_ " + Integer.toHexString(strLen_[i]));

    }

}
Open Source Repository
Home	/itextpdf/itextpdf-5.1.2 \| Repository Home
Open Source Repository