diff options
Diffstat (limited to 'src/isa-l/igzip/huff_codes.c')
-rw-r--r-- | src/isa-l/igzip/huff_codes.c | 1625 |
1 files changed, 1625 insertions, 0 deletions
diff --git a/src/isa-l/igzip/huff_codes.c b/src/isa-l/igzip/huff_codes.c new file mode 100644 index 00000000..c8b2035d --- /dev/null +++ b/src/isa-l/igzip/huff_codes.c @@ -0,0 +1,1625 @@ +/********************************************************************** + Copyright(c) 2011-2016 Intel Corporation All rights reserved. + + Redistribution and use in source and binary forms, with or without + modification, are permitted provided that the following conditions + are met: + * Redistributions of source code must retain the above copyright + notice, this list of conditions and the following disclaimer. + * Redistributions in binary form must reproduce the above copyright + notice, this list of conditions and the following disclaimer in + the documentation and/or other materials provided with the + distribution. + * Neither the name of Intel Corporation nor the names of its + contributors may be used to endorse or promote products derived + from this software without specific prior written permission. + + THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS + "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT + LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR + A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT + OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, + SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT + LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, + DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY + THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT + (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE + OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. +**********************************************************************/ + +#include <immintrin.h> +#include <stdint.h> +#include <string.h> +#include <assert.h> +#include "igzip_lib.h" +#include "huff_codes.h" +#include "huffman.h" +#include "bitbuf2.h" +#include "flatten_ll.h" + +/* The order code length codes are written in the dynamic code header. This is + * defined in RFC 1951 page 13 */ +static const uint8_t code_length_code_order[] = + { 16, 17, 18, 0, 8, 7, 9, 6, 10, 5, 11, 4, 12, 3, 13, 2, 14, 1, 15 }; + +const uint32_t len_code_extra_bits[] = { + 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, + 0x1, 0x1, 0x1, 0x1, 0x2, 0x2, 0x2, 0x2, + 0x3, 0x3, 0x3, 0x3, 0x4, 0x4, 0x4, 0x4, + 0x5, 0x5, 0x5, 0x5, 0x0 +}; + +const uint32_t dist_code_extra_bits[] = { + 0x0, 0x0, 0x0, 0x0, 0x1, 0x1, 0x2, 0x2, + 0x3, 0x3, 0x4, 0x4, 0x5, 0x5, 0x6, 0x6, + 0x7, 0x7, 0x8, 0x8, 0x9, 0x9, 0xa, 0xa, + 0xb, 0xb, 0xc, 0xc, 0xd, 0xd +}; + +struct hufftables_icf static_hufftables = { + .lit_len_table = { + {.code_and_extra = 0x00c,.length2 = 0x8}, + {.code_and_extra = 0x08c,.length2 = 0x8}, + {.code_and_extra = 0x04c,.length2 = 0x8}, + {.code_and_extra = 0x0cc,.length2 = 0x8}, + {.code_and_extra = 0x02c,.length2 = 0x8}, + {.code_and_extra = 0x0ac,.length2 = 0x8}, + {.code_and_extra = 0x06c,.length2 = 0x8}, + {.code_and_extra = 0x0ec,.length2 = 0x8}, + {.code_and_extra = 0x01c,.length2 = 0x8}, + {.code_and_extra = 0x09c,.length2 = 0x8}, + {.code_and_extra = 0x05c,.length2 = 0x8}, + {.code_and_extra = 0x0dc,.length2 = 0x8}, + {.code_and_extra = 0x03c,.length2 = 0x8}, + {.code_and_extra = 0x0bc,.length2 = 0x8}, + {.code_and_extra = 0x07c,.length2 = 0x8}, + {.code_and_extra = 0x0fc,.length2 = 0x8}, + {.code_and_extra = 0x002,.length2 = 0x8}, + {.code_and_extra = 0x082,.length2 = 0x8}, + {.code_and_extra = 0x042,.length2 = 0x8}, + {.code_and_extra = 0x0c2,.length2 = 0x8}, + {.code_and_extra = 0x022,.length2 = 0x8}, + {.code_and_extra = 0x0a2,.length2 = 0x8}, + {.code_and_extra = 0x062,.length2 = 0x8}, + {.code_and_extra = 0x0e2,.length2 = 0x8}, + {.code_and_extra = 0x012,.length2 = 0x8}, + {.code_and_extra = 0x092,.length2 = 0x8}, + {.code_and_extra = 0x052,.length2 = 0x8}, + {.code_and_extra = 0x0d2,.length2 = 0x8}, + {.code_and_extra = 0x032,.length2 = 0x8}, + {.code_and_extra = 0x0b2,.length2 = 0x8}, + {.code_and_extra = 0x072,.length2 = 0x8}, + {.code_and_extra = 0x0f2,.length2 = 0x8}, + {.code_and_extra = 0x00a,.length2 = 0x8}, + {.code_and_extra = 0x08a,.length2 = 0x8}, + {.code_and_extra = 0x04a,.length2 = 0x8}, + {.code_and_extra = 0x0ca,.length2 = 0x8}, + {.code_and_extra = 0x02a,.length2 = 0x8}, + {.code_and_extra = 0x0aa,.length2 = 0x8}, + {.code_and_extra = 0x06a,.length2 = 0x8}, + {.code_and_extra = 0x0ea,.length2 = 0x8}, + {.code_and_extra = 0x01a,.length2 = 0x8}, + {.code_and_extra = 0x09a,.length2 = 0x8}, + {.code_and_extra = 0x05a,.length2 = 0x8}, + {.code_and_extra = 0x0da,.length2 = 0x8}, + {.code_and_extra = 0x03a,.length2 = 0x8}, + {.code_and_extra = 0x0ba,.length2 = 0x8}, + {.code_and_extra = 0x07a,.length2 = 0x8}, + {.code_and_extra = 0x0fa,.length2 = 0x8}, + {.code_and_extra = 0x006,.length2 = 0x8}, + {.code_and_extra = 0x086,.length2 = 0x8}, + {.code_and_extra = 0x046,.length2 = 0x8}, + {.code_and_extra = 0x0c6,.length2 = 0x8}, + {.code_and_extra = 0x026,.length2 = 0x8}, + {.code_and_extra = 0x0a6,.length2 = 0x8}, + {.code_and_extra = 0x066,.length2 = 0x8}, + {.code_and_extra = 0x0e6,.length2 = 0x8}, + {.code_and_extra = 0x016,.length2 = 0x8}, + {.code_and_extra = 0x096,.length2 = 0x8}, + {.code_and_extra = 0x056,.length2 = 0x8}, + {.code_and_extra = 0x0d6,.length2 = 0x8}, + {.code_and_extra = 0x036,.length2 = 0x8}, + {.code_and_extra = 0x0b6,.length2 = 0x8}, + {.code_and_extra = 0x076,.length2 = 0x8}, + {.code_and_extra = 0x0f6,.length2 = 0x8}, + {.code_and_extra = 0x00e,.length2 = 0x8}, + {.code_and_extra = 0x08e,.length2 = 0x8}, + {.code_and_extra = 0x04e,.length2 = 0x8}, + {.code_and_extra = 0x0ce,.length2 = 0x8}, + {.code_and_extra = 0x02e,.length2 = 0x8}, + {.code_and_extra = 0x0ae,.length2 = 0x8}, + {.code_and_extra = 0x06e,.length2 = 0x8}, + {.code_and_extra = 0x0ee,.length2 = 0x8}, + {.code_and_extra = 0x01e,.length2 = 0x8}, + {.code_and_extra = 0x09e,.length2 = 0x8}, + {.code_and_extra = 0x05e,.length2 = 0x8}, + {.code_and_extra = 0x0de,.length2 = 0x8}, + {.code_and_extra = 0x03e,.length2 = 0x8}, + {.code_and_extra = 0x0be,.length2 = 0x8}, + {.code_and_extra = 0x07e,.length2 = 0x8}, + {.code_and_extra = 0x0fe,.length2 = 0x8}, + {.code_and_extra = 0x001,.length2 = 0x8}, + {.code_and_extra = 0x081,.length2 = 0x8}, + {.code_and_extra = 0x041,.length2 = 0x8}, + {.code_and_extra = 0x0c1,.length2 = 0x8}, + {.code_and_extra = 0x021,.length2 = 0x8}, + {.code_and_extra = 0x0a1,.length2 = 0x8}, + {.code_and_extra = 0x061,.length2 = 0x8}, + {.code_and_extra = 0x0e1,.length2 = 0x8}, + {.code_and_extra = 0x011,.length2 = 0x8}, + {.code_and_extra = 0x091,.length2 = 0x8}, + {.code_and_extra = 0x051,.length2 = 0x8}, + {.code_and_extra = 0x0d1,.length2 = 0x8}, + {.code_and_extra = 0x031,.length2 = 0x8}, + {.code_and_extra = 0x0b1,.length2 = 0x8}, + {.code_and_extra = 0x071,.length2 = 0x8}, + {.code_and_extra = 0x0f1,.length2 = 0x8}, + {.code_and_extra = 0x009,.length2 = 0x8}, + {.code_and_extra = 0x089,.length2 = 0x8}, + {.code_and_extra = 0x049,.length2 = 0x8}, + {.code_and_extra = 0x0c9,.length2 = 0x8}, + {.code_and_extra = 0x029,.length2 = 0x8}, + {.code_and_extra = 0x0a9,.length2 = 0x8}, + {.code_and_extra = 0x069,.length2 = 0x8}, + {.code_and_extra = 0x0e9,.length2 = 0x8}, + {.code_and_extra = 0x019,.length2 = 0x8}, + {.code_and_extra = 0x099,.length2 = 0x8}, + {.code_and_extra = 0x059,.length2 = 0x8}, + {.code_and_extra = 0x0d9,.length2 = 0x8}, + {.code_and_extra = 0x039,.length2 = 0x8}, + {.code_and_extra = 0x0b9,.length2 = 0x8}, + {.code_and_extra = 0x079,.length2 = 0x8}, + {.code_and_extra = 0x0f9,.length2 = 0x8}, + {.code_and_extra = 0x005,.length2 = 0x8}, + {.code_and_extra = 0x085,.length2 = 0x8}, + {.code_and_extra = 0x045,.length2 = 0x8}, + {.code_and_extra = 0x0c5,.length2 = 0x8}, + {.code_and_extra = 0x025,.length2 = 0x8}, + {.code_and_extra = 0x0a5,.length2 = 0x8}, + {.code_and_extra = 0x065,.length2 = 0x8}, + {.code_and_extra = 0x0e5,.length2 = 0x8}, + {.code_and_extra = 0x015,.length2 = 0x8}, + {.code_and_extra = 0x095,.length2 = 0x8}, + {.code_and_extra = 0x055,.length2 = 0x8}, + {.code_and_extra = 0x0d5,.length2 = 0x8}, + {.code_and_extra = 0x035,.length2 = 0x8}, + {.code_and_extra = 0x0b5,.length2 = 0x8}, + {.code_and_extra = 0x075,.length2 = 0x8}, + {.code_and_extra = 0x0f5,.length2 = 0x8}, + {.code_and_extra = 0x00d,.length2 = 0x8}, + {.code_and_extra = 0x08d,.length2 = 0x8}, + {.code_and_extra = 0x04d,.length2 = 0x8}, + {.code_and_extra = 0x0cd,.length2 = 0x8}, + {.code_and_extra = 0x02d,.length2 = 0x8}, + {.code_and_extra = 0x0ad,.length2 = 0x8}, + {.code_and_extra = 0x06d,.length2 = 0x8}, + {.code_and_extra = 0x0ed,.length2 = 0x8}, + {.code_and_extra = 0x01d,.length2 = 0x8}, + {.code_and_extra = 0x09d,.length2 = 0x8}, + {.code_and_extra = 0x05d,.length2 = 0x8}, + {.code_and_extra = 0x0dd,.length2 = 0x8}, + {.code_and_extra = 0x03d,.length2 = 0x8}, + {.code_and_extra = 0x0bd,.length2 = 0x8}, + {.code_and_extra = 0x07d,.length2 = 0x8}, + {.code_and_extra = 0x0fd,.length2 = 0x8}, + {.code_and_extra = 0x013,.length2 = 0x9}, + {.code_and_extra = 0x113,.length2 = 0x9}, + {.code_and_extra = 0x093,.length2 = 0x9}, + {.code_and_extra = 0x193,.length2 = 0x9}, + {.code_and_extra = 0x053,.length2 = 0x9}, + {.code_and_extra = 0x153,.length2 = 0x9}, + {.code_and_extra = 0x0d3,.length2 = 0x9}, + {.code_and_extra = 0x1d3,.length2 = 0x9}, + {.code_and_extra = 0x033,.length2 = 0x9}, + {.code_and_extra = 0x133,.length2 = 0x9}, + {.code_and_extra = 0x0b3,.length2 = 0x9}, + {.code_and_extra = 0x1b3,.length2 = 0x9}, + {.code_and_extra = 0x073,.length2 = 0x9}, + {.code_and_extra = 0x173,.length2 = 0x9}, + {.code_and_extra = 0x0f3,.length2 = 0x9}, + {.code_and_extra = 0x1f3,.length2 = 0x9}, + {.code_and_extra = 0x00b,.length2 = 0x9}, + {.code_and_extra = 0x10b,.length2 = 0x9}, + {.code_and_extra = 0x08b,.length2 = 0x9}, + {.code_and_extra = 0x18b,.length2 = 0x9}, + {.code_and_extra = 0x04b,.length2 = 0x9}, + {.code_and_extra = 0x14b,.length2 = 0x9}, + {.code_and_extra = 0x0cb,.length2 = 0x9}, + {.code_and_extra = 0x1cb,.length2 = 0x9}, + {.code_and_extra = 0x02b,.length2 = 0x9}, + {.code_and_extra = 0x12b,.length2 = 0x9}, + {.code_and_extra = 0x0ab,.length2 = 0x9}, + {.code_and_extra = 0x1ab,.length2 = 0x9}, + {.code_and_extra = 0x06b,.length2 = 0x9}, + {.code_and_extra = 0x16b,.length2 = 0x9}, + {.code_and_extra = 0x0eb,.length2 = 0x9}, + {.code_and_extra = 0x1eb,.length2 = 0x9}, + {.code_and_extra = 0x01b,.length2 = 0x9}, + {.code_and_extra = 0x11b,.length2 = 0x9}, + {.code_and_extra = 0x09b,.length2 = 0x9}, + {.code_and_extra = 0x19b,.length2 = 0x9}, + {.code_and_extra = 0x05b,.length2 = 0x9}, + {.code_and_extra = 0x15b,.length2 = 0x9}, + {.code_and_extra = 0x0db,.length2 = 0x9}, + {.code_and_extra = 0x1db,.length2 = 0x9}, + {.code_and_extra = 0x03b,.length2 = 0x9}, + {.code_and_extra = 0x13b,.length2 = 0x9}, + {.code_and_extra = 0x0bb,.length2 = 0x9}, + {.code_and_extra = 0x1bb,.length2 = 0x9}, + {.code_and_extra = 0x07b,.length2 = 0x9}, + {.code_and_extra = 0x17b,.length2 = 0x9}, + {.code_and_extra = 0x0fb,.length2 = 0x9}, + {.code_and_extra = 0x1fb,.length2 = 0x9}, + {.code_and_extra = 0x007,.length2 = 0x9}, + {.code_and_extra = 0x107,.length2 = 0x9}, + {.code_and_extra = 0x087,.length2 = 0x9}, + {.code_and_extra = 0x187,.length2 = 0x9}, + {.code_and_extra = 0x047,.length2 = 0x9}, + {.code_and_extra = 0x147,.length2 = 0x9}, + {.code_and_extra = 0x0c7,.length2 = 0x9}, + {.code_and_extra = 0x1c7,.length2 = 0x9}, + {.code_and_extra = 0x027,.length2 = 0x9}, + {.code_and_extra = 0x127,.length2 = 0x9}, + {.code_and_extra = 0x0a7,.length2 = 0x9}, + {.code_and_extra = 0x1a7,.length2 = 0x9}, + {.code_and_extra = 0x067,.length2 = 0x9}, + {.code_and_extra = 0x167,.length2 = 0x9}, + {.code_and_extra = 0x0e7,.length2 = 0x9}, + {.code_and_extra = 0x1e7,.length2 = 0x9}, + {.code_and_extra = 0x017,.length2 = 0x9}, + {.code_and_extra = 0x117,.length2 = 0x9}, + {.code_and_extra = 0x097,.length2 = 0x9}, + {.code_and_extra = 0x197,.length2 = 0x9}, + {.code_and_extra = 0x057,.length2 = 0x9}, + {.code_and_extra = 0x157,.length2 = 0x9}, + {.code_and_extra = 0x0d7,.length2 = 0x9}, + {.code_and_extra = 0x1d7,.length2 = 0x9}, + {.code_and_extra = 0x037,.length2 = 0x9}, + {.code_and_extra = 0x137,.length2 = 0x9}, + {.code_and_extra = 0x0b7,.length2 = 0x9}, + {.code_and_extra = 0x1b7,.length2 = 0x9}, + {.code_and_extra = 0x077,.length2 = 0x9}, + {.code_and_extra = 0x177,.length2 = 0x9}, + {.code_and_extra = 0x0f7,.length2 = 0x9}, + {.code_and_extra = 0x1f7,.length2 = 0x9}, + {.code_and_extra = 0x00f,.length2 = 0x9}, + {.code_and_extra = 0x10f,.length2 = 0x9}, + {.code_and_extra = 0x08f,.length2 = 0x9}, + {.code_and_extra = 0x18f,.length2 = 0x9}, + {.code_and_extra = 0x04f,.length2 = 0x9}, + {.code_and_extra = 0x14f,.length2 = 0x9}, + {.code_and_extra = 0x0cf,.length2 = 0x9}, + {.code_and_extra = 0x1cf,.length2 = 0x9}, + {.code_and_extra = 0x02f,.length2 = 0x9}, + {.code_and_extra = 0x12f,.length2 = 0x9}, + {.code_and_extra = 0x0af,.length2 = 0x9}, + {.code_and_extra = 0x1af,.length2 = 0x9}, + {.code_and_extra = 0x06f,.length2 = 0x9}, + {.code_and_extra = 0x16f,.length2 = 0x9}, + {.code_and_extra = 0x0ef,.length2 = 0x9}, + {.code_and_extra = 0x1ef,.length2 = 0x9}, + {.code_and_extra = 0x01f,.length2 = 0x9}, + {.code_and_extra = 0x11f,.length2 = 0x9}, + {.code_and_extra = 0x09f,.length2 = 0x9}, + {.code_and_extra = 0x19f,.length2 = 0x9}, + {.code_and_extra = 0x05f,.length2 = 0x9}, + {.code_and_extra = 0x15f,.length2 = 0x9}, + {.code_and_extra = 0x0df,.length2 = 0x9}, + {.code_and_extra = 0x1df,.length2 = 0x9}, + {.code_and_extra = 0x03f,.length2 = 0x9}, + {.code_and_extra = 0x13f,.length2 = 0x9}, + {.code_and_extra = 0x0bf,.length2 = 0x9}, + {.code_and_extra = 0x1bf,.length2 = 0x9}, + {.code_and_extra = 0x07f,.length2 = 0x9}, + {.code_and_extra = 0x17f,.length2 = 0x9}, + {.code_and_extra = 0x0ff,.length2 = 0x9}, + {.code_and_extra = 0x1ff,.length2 = 0x9}, + {.code_and_extra = 0x000,.length2 = 0x7}, + {.code_and_extra = 0x040,.length2 = 0x7}, + {.code_and_extra = 0x020,.length2 = 0x7}, + {.code_and_extra = 0x060,.length2 = 0x7}, + {.code_and_extra = 0x010,.length2 = 0x7}, + {.code_and_extra = 0x050,.length2 = 0x7}, + {.code_and_extra = 0x030,.length2 = 0x7}, + {.code_and_extra = 0x070,.length2 = 0x7}, + {.code_and_extra = 0x008,.length2 = 0x7}, + {.code_and_extra = 0x048,.length2 = 0x7}, + {.code_and_extra = 0x028,.length2 = 0x7}, + {.code_and_extra = 0x068,.length2 = 0x7}, + {.code_and_extra = 0x018,.length2 = 0x7}, + {.code_and_extra = 0x058,.length2 = 0x7}, + {.code_and_extra = 0x038,.length2 = 0x7}, + {.code_and_extra = 0x078,.length2 = 0x7}, + {.code_and_extra = 0x004,.length2 = 0x7}, + {.code_and_extra = 0x044,.length2 = 0x7}, + {.code_and_extra = 0x024,.length2 = 0x7}, + {.code_and_extra = 0x064,.length2 = 0x7}, + {.code_and_extra = 0x014,.length2 = 0x7}, + {.code_and_extra = 0x054,.length2 = 0x7}, + {.code_and_extra = 0x034,.length2 = 0x7}, + {.code_and_extra = 0x074,.length2 = 0x7}, + {.code_and_extra = 0x003,.length2 = 0x8}, + {.code_and_extra = 0x083,.length2 = 0x8}, + {.code_and_extra = 0x043,.length2 = 0x8}, + {.code_and_extra = 0x0c3,.length2 = 0x8}, + {.code_and_extra = 0x023,.length2 = 0x8}, + {.code_and_extra = 0x0a3,.length2 = 0x8}, + {.code_and_extra = 0x063,.length2 = 0x8}, + {.code_and_extra = 0x0e3,.length2 = 0x8}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}, + {.code_and_extra = 0x000,.length2 = 0x0}}, + .dist_table = { + {.code_and_extra = 0x000,.length2 = 0x5}, + {.code_and_extra = 0x010,.length2 = 0x5}, + {.code_and_extra = 0x008,.length2 = 0x5}, + {.code_and_extra = 0x018,.length2 = 0x5}, + {.code_and_extra = 0x10004,.length2 = 0x5}, + {.code_and_extra = 0x10014,.length2 = 0x5}, + {.code_and_extra = 0x2000c,.length2 = 0x5}, + {.code_and_extra = 0x2001c,.length2 = 0x5}, + {.code_and_extra = 0x30002,.length2 = 0x5}, + {.code_and_extra = 0x30012,.length2 = 0x5}, + {.code_and_extra = 0x4000a,.length2 = 0x5}, + {.code_and_extra = 0x4001a,.length2 = 0x5}, + {.code_and_extra = 0x50006,.length2 = 0x5}, + {.code_and_extra = 0x50016,.length2 = 0x5}, + {.code_and_extra = 0x6000e,.length2 = 0x5}, + {.code_and_extra = 0x6001e,.length2 = 0x5}, + {.code_and_extra = 0x70001,.length2 = 0x5}, + {.code_and_extra = 0x70011,.length2 = 0x5}, + {.code_and_extra = 0x80009,.length2 = 0x5}, + {.code_and_extra = 0x80019,.length2 = 0x5}, + {.code_and_extra = 0x90005,.length2 = 0x5}, + {.code_and_extra = 0x90015,.length2 = 0x5}, + {.code_and_extra = 0xa000d,.length2 = 0x5}, + {.code_and_extra = 0xa001d,.length2 = 0x5}, + {.code_and_extra = 0xb0003,.length2 = 0x5}, + {.code_and_extra = 0xb0013,.length2 = 0x5}, + {.code_and_extra = 0xc000b,.length2 = 0x5}, + {.code_and_extra = 0xc001b,.length2 = 0x5}, + {.code_and_extra = 0xd0007,.length2 = 0x5}, + {.code_and_extra = 0xd0017,.length2 = 0x5}, + {.code_and_extra = 0x000,.length2 = 0x0}} +}; + +struct slver { + uint16_t snum; + uint8_t ver; + uint8_t core; +}; + +/* Version info */ +struct slver isal_update_histogram_slver_00010085; +struct slver isal_update_histogram_slver = { 0x0085, 0x01, 0x00 }; + +struct slver isal_create_hufftables_slver_00010086; +struct slver isal_create_hufftables_slver = { 0x0086, 0x01, 0x00 }; + +struct slver isal_create_hufftables_subset_slver_00010087; +struct slver isal_create_hufftables_subset_slver = { 0x0087, 0x01, 0x00 }; + +extern uint32_t build_huff_tree(struct heap_tree *heap, uint64_t heap_size, uint64_t node_ptr); +extern void build_heap(uint64_t * heap, uint64_t heap_size); + +static const uint8_t bitrev8[0x100] = { + 0x00, 0x80, 0x40, 0xC0, 0x20, 0xA0, 0x60, 0xE0, + 0x10, 0x90, 0x50, 0xD0, 0x30, 0xB0, 0x70, 0xF0, + 0x08, 0x88, 0x48, 0xC8, 0x28, 0xA8, 0x68, 0xE8, + 0x18, 0x98, 0x58, 0xD8, 0x38, 0xB8, 0x78, 0xF8, + 0x04, 0x84, 0x44, 0xC4, 0x24, 0xA4, 0x64, 0xE4, + 0x14, 0x94, 0x54, 0xD4, 0x34, 0xB4, 0x74, 0xF4, + 0x0C, 0x8C, 0x4C, 0xCC, 0x2C, 0xAC, 0x6C, 0xEC, + 0x1C, 0x9C, 0x5C, 0xDC, 0x3C, 0xBC, 0x7C, 0xFC, + 0x02, 0x82, 0x42, 0xC2, 0x22, 0xA2, 0x62, 0xE2, + 0x12, 0x92, 0x52, 0xD2, 0x32, 0xB2, 0x72, 0xF2, + 0x0A, 0x8A, 0x4A, 0xCA, 0x2A, 0xAA, 0x6A, 0xEA, + 0x1A, 0x9A, 0x5A, 0xDA, 0x3A, 0xBA, 0x7A, 0xFA, + 0x06, 0x86, 0x46, 0xC6, 0x26, 0xA6, 0x66, 0xE6, + 0x16, 0x96, 0x56, 0xD6, 0x36, 0xB6, 0x76, 0xF6, + 0x0E, 0x8E, 0x4E, 0xCE, 0x2E, 0xAE, 0x6E, 0xEE, + 0x1E, 0x9E, 0x5E, 0xDE, 0x3E, 0xBE, 0x7E, 0xFE, + 0x01, 0x81, 0x41, 0xC1, 0x21, 0xA1, 0x61, 0xE1, + 0x11, 0x91, 0x51, 0xD1, 0x31, 0xB1, 0x71, 0xF1, + 0x09, 0x89, 0x49, 0xC9, 0x29, 0xA9, 0x69, 0xE9, + 0x19, 0x99, 0x59, 0xD9, 0x39, 0xB9, 0x79, 0xF9, + 0x05, 0x85, 0x45, 0xC5, 0x25, 0xA5, 0x65, 0xE5, + 0x15, 0x95, 0x55, 0xD5, 0x35, 0xB5, 0x75, 0xF5, + 0x0D, 0x8D, 0x4D, 0xCD, 0x2D, 0xAD, 0x6D, 0xED, + 0x1D, 0x9D, 0x5D, 0xDD, 0x3D, 0xBD, 0x7D, 0xFD, + 0x03, 0x83, 0x43, 0xC3, 0x23, 0xA3, 0x63, 0xE3, + 0x13, 0x93, 0x53, 0xD3, 0x33, 0xB3, 0x73, 0xF3, + 0x0B, 0x8B, 0x4B, 0xCB, 0x2B, 0xAB, 0x6B, 0xEB, + 0x1B, 0x9B, 0x5B, 0xDB, 0x3B, 0xBB, 0x7B, 0xFB, + 0x07, 0x87, 0x47, 0xC7, 0x27, 0xA7, 0x67, 0xE7, + 0x17, 0x97, 0x57, 0xD7, 0x37, 0xB7, 0x77, 0xF7, + 0x0F, 0x8F, 0x4F, 0xCF, 0x2F, 0xAF, 0x6F, 0xEF, + 0x1F, 0x9F, 0x5F, 0xDF, 0x3F, 0xBF, 0x7F, 0xFF +}; + +// bit reverse low order LENGTH bits in code, and return result in low order bits +static inline uint16_t bit_reverse(uint16_t code, uint32_t length) +{ + code = (bitrev8[code & 0x00FF] << 8) | (bitrev8[code >> 8]); + return (code >> (16 - length)); +} + +void isal_update_histogram_base(uint8_t * start_stream, int length, + struct isal_huff_histogram *histogram) +{ + uint32_t literal = 0, hash; + uint16_t seen, *last_seen = histogram->hash_table; + uint8_t *current, *end_stream, *next_hash, *end; + uint32_t match_length; + uint32_t dist; + uint64_t *lit_len_histogram = histogram->lit_len_histogram; + uint64_t *dist_histogram = histogram->dist_histogram; + + if (length <= 0) + return; + + end_stream = start_stream + length; + memset(last_seen, 0, sizeof(histogram->hash_table)); /* Initialize last_seen to be 0. */ + for (current = start_stream; current < end_stream - 3; current++) { + literal = *(uint32_t *) current; + hash = compute_hash(literal) & HASH_MASK; + seen = last_seen[hash]; + last_seen[hash] = (current - start_stream) & 0xFFFF; + dist = (current - start_stream - seen) & 0xFFFF; + if (dist - 1 < D - 1) { + assert(start_stream <= current - dist); + match_length = + compare258(current - dist, current, end_stream - current); + if (match_length >= SHORTEST_MATCH) { + next_hash = current; +#ifdef ISAL_LIMIT_HASH_UPDATE + end = next_hash + 3; +#else + end = next_hash + match_length; +#endif + if (end > end_stream - 3) + end = end_stream - 3; + next_hash++; + for (; next_hash < end; next_hash++) { + literal = *(uint32_t *) next_hash; + hash = compute_hash(literal) & HASH_MASK; + last_seen[hash] = (next_hash - start_stream) & 0xFFFF; + } + + dist_histogram[convert_dist_to_dist_sym(dist)] += 1; + lit_len_histogram[convert_length_to_len_sym(match_length)] += + 1; + current += match_length - 1; + continue; + } + } + lit_len_histogram[literal & 0xFF] += 1; + } + literal = literal >> 8; + hash = compute_hash(literal) & HASH_MASK; + seen = last_seen[hash]; + last_seen[hash] = (current - start_stream) & 0xFFFF; + dist = (current - start_stream - seen) & 0xFFFF; + if (dist < D) { + match_length = compare258(current - dist, current, end_stream - current); + if (match_length >= SHORTEST_MATCH) { + dist_histogram[convert_dist_to_dist_sym(dist)] += 1; + lit_len_histogram[convert_length_to_len_sym(match_length)] += 1; + lit_len_histogram[256] += 1; + return; + } + } else + lit_len_histogram[literal & 0xFF] += 1; + lit_len_histogram[(literal >> 8) & 0xFF] += 1; + lit_len_histogram[(literal >> 16) & 0xFF] += 1; + lit_len_histogram[256] += 1; + return; +} + +uint32_t convert_dist_to_dist_sym(uint32_t dist) +{ + assert(dist <= 32768 && dist > 0); + if (dist <= 2) + return dist - 1; + else if (dist <= 4) + return 0 + (dist - 1) / 1; + else if (dist <= 8) + return 2 + (dist - 1) / 2; + else if (dist <= 16) + return 4 + (dist - 1) / 4; + else if (dist <= 32) + return 6 + (dist - 1) / 8; + else if (dist <= 64) + return 8 + (dist - 1) / 16; + else if (dist <= 128) + return 10 + (dist - 1) / 32; + else if (dist <= 256) + return 12 + (dist - 1) / 64; + else if (dist <= 512) + return 14 + (dist - 1) / 128; + else if (dist <= 1024) + return 16 + (dist - 1) / 256; + else if (dist <= 2048) + return 18 + (dist - 1) / 512; + else if (dist <= 4096) + return 20 + (dist - 1) / 1024; + else if (dist <= 8192) + return 22 + (dist - 1) / 2048; + else if (dist <= 16384) + return 24 + (dist - 1) / 4096; + else if (dist <= 32768) + return 26 + (dist - 1) / 8192; + else + return ~0; /* ~0 is an invalid distance code */ + +} + +uint32_t convert_length_to_len_sym(uint32_t length) +{ + assert(length > 2 && length < 259); + + /* Based on tables on page 11 in RFC 1951 */ + if (length < 11) + return 257 + length - 3; + else if (length < 19) + return 261 + (length - 3) / 2; + else if (length < 35) + return 265 + (length - 3) / 4; + else if (length < 67) + return 269 + (length - 3) / 8; + else if (length < 131) + return 273 + (length - 3) / 16; + else if (length < 258) + return 277 + (length - 3) / 32; + else + return 285; +} + +// Upon return, codes[] contains the code lengths, +// and bl_count is the count of the lengths + +/* Init heap with the histogram, and return the histogram size */ +static inline uint32_t init_heap32(struct heap_tree *heap_space, uint32_t * histogram, + uint32_t hist_size) +{ + uint32_t heap_size, i; + + memset(heap_space, 0, sizeof(struct heap_tree)); + + heap_size = 0; + for (i = 0; i < hist_size; i++) { + if (histogram[i] != 0) + heap_space->heap[++heap_size] = + (((uint64_t) histogram[i]) << FREQ_SHIFT) | i; + } + + // make sure heap has at least two elements in it + if (heap_size < 2) { + if (heap_size == 0) { + heap_space->heap[1] = 1ULL << FREQ_SHIFT; + heap_space->heap[2] = (1ULL << FREQ_SHIFT) | 1; + heap_size = 2; + } else { + // heap size == 1 + if (histogram[0] == 0) + heap_space->heap[2] = 1ULL << FREQ_SHIFT; + else + heap_space->heap[2] = (1ULL << FREQ_SHIFT) | 1; + heap_size = 2; + } + } + + build_heap(heap_space->heap, heap_size); + + return heap_size; +} + +static inline uint32_t init_heap64(struct heap_tree *heap_space, uint64_t * histogram, + uint64_t hist_size) +{ + uint32_t heap_size, i; + + memset(heap_space, 0, sizeof(struct heap_tree)); + + heap_size = 0; + for (i = 0; i < hist_size; i++) { + if (histogram[i] != 0) + heap_space->heap[++heap_size] = ((histogram[i]) << FREQ_SHIFT) | i; + } + + // make sure heap has at least two elements in it + if (heap_size < 2) { + if (heap_size == 0) { + heap_space->heap[1] = 1ULL << FREQ_SHIFT; + heap_space->heap[2] = (1ULL << FREQ_SHIFT) | 1; + heap_size = 2; + } else { + // heap size == 1 + if (histogram[0] == 0) + heap_space->heap[2] = 1ULL << FREQ_SHIFT; + else + heap_space->heap[2] = (1ULL << FREQ_SHIFT) | 1; + heap_size = 2; + } + } + + build_heap(heap_space->heap, heap_size); + + return heap_size; +} + +static inline uint32_t init_heap64_complete(struct heap_tree *heap_space, uint64_t * histogram, + uint64_t hist_size) +{ + uint32_t heap_size, i; + + memset(heap_space, 0, sizeof(struct heap_tree)); + + heap_size = 0; + for (i = 0; i < hist_size; i++) + heap_space->heap[++heap_size] = ((histogram[i]) << FREQ_SHIFT) | i; + + build_heap(heap_space->heap, heap_size); + + return heap_size; +} + +static inline uint32_t fix_code_lens(struct heap_tree *heap_space, uint32_t root_node, + uint32_t * bl_count, uint32_t max_code_len) +{ + struct tree_node *tree = heap_space->tree; + uint64_t *code_len_count = heap_space->code_len_count; + uint32_t i, j, k, child, depth, code_len; + + // compute code lengths and code length counts + code_len = 0; + j = root_node; + for (i = root_node; i <= HEAP_TREE_NODE_START; i++) { + child = tree[i].child; + if (child > MAX_HISTHEAP_SIZE) { + depth = 1 + tree[i].depth; + + tree[child].depth = depth; + tree[child - 1].depth = depth; + } else { + tree[j++] = tree[i]; + depth = tree[i].depth; + while (code_len < depth) { + code_len++; + code_len_count[code_len] = 0; + } + code_len_count[depth]++; + } + } + + if (code_len > max_code_len) { + while (code_len > max_code_len) { + assert(code_len_count[code_len] > 1); + for (i = max_code_len - 1; i != 0; i--) + if (code_len_count[i] != 0) + break; + assert(i != 0); + code_len_count[i]--; + code_len_count[i + 1] += 2; + code_len_count[code_len - 1]++; + code_len_count[code_len] -= 2; + if (code_len_count[code_len] == 0) + code_len--; + } + + for (i = 1; i <= code_len; i++) + bl_count[i] = code_len_count[i]; + for (; i <= max_code_len; i++) + bl_count[i] = 0; + + for (k = 1; code_len_count[k] == 0; k++) ; + for (i = root_node; i < j; i++) { + tree[i].depth = k; + code_len_count[k]--; + for (; code_len_count[k] == 0; k++) ; + } + } else { + for (i = 1; i <= code_len; i++) + bl_count[i] = code_len_count[i]; + for (; i <= max_code_len; i++) + bl_count[i] = 0; + } + + return j; + +} + +static inline void +gen_huff_code_lens(struct heap_tree *heap_space, uint32_t heap_size, uint32_t * bl_count, + struct huff_code *codes, uint32_t codes_count, uint32_t max_code_len) +{ + struct tree_node *tree = heap_space->tree; + uint32_t root_node = HEAP_TREE_NODE_START, node_ptr; + uint32_t end_node; + + root_node = build_huff_tree(heap_space, heap_size, root_node); + + end_node = fix_code_lens(heap_space, root_node, bl_count, max_code_len); + + memset(codes, 0, codes_count * sizeof(*codes)); + for (node_ptr = root_node; node_ptr < end_node; node_ptr++) + codes[tree[node_ptr].child].length = tree[node_ptr].depth; + +} + +inline uint32_t set_huff_codes(struct huff_code *huff_code_table, int table_length, + uint32_t * count) +{ + /* Uses the algorithm mentioned in the deflate standard, Rfc 1951. */ + int i; + uint16_t code = 0; + uint16_t next_code[MAX_HUFF_TREE_DEPTH + 1]; + uint32_t max_code = 0; + + next_code[0] = code; + + for (i = 1; i < MAX_HUFF_TREE_DEPTH + 1; i++) + next_code[i] = (next_code[i - 1] + count[i - 1]) << 1; + + for (i = 0; i < table_length; i++) { + if (huff_code_table[i].length != 0) { + huff_code_table[i].code = + bit_reverse(next_code[huff_code_table[i].length], + huff_code_table[i].length); + next_code[huff_code_table[i].length] += 1; + max_code = i; + } + } + + return max_code; +} + +// on input, codes contain the code lengths +// on output, code contains: +// 23:16 code length +// 15:0 code value in low order bits +// returns max code value +static inline uint32_t set_dist_huff_codes(struct huff_code *codes, uint32_t * bl_count) +{ + uint32_t code, code_len, bits, i; + uint32_t next_code[MAX_DEFLATE_CODE_LEN + 1]; + uint32_t max_code = 0; + const uint32_t num_codes = DIST_LEN; + + code = bl_count[0] = 0; + for (bits = 1; bits <= MAX_HUFF_TREE_DEPTH; bits++) { + code = (code + bl_count[bits - 1]) << 1; + next_code[bits] = code; + } + for (i = 0; i < num_codes; i++) { + code_len = codes[i].length; + if (code_len != 0) { + codes[i].code = bit_reverse(next_code[code_len], code_len); + codes[i].extra_bit_count = dist_code_extra_bits[i]; + next_code[code_len] += 1; + max_code = i; + } + } + return max_code; +} + +int create_huffman_header(struct BitBuf2 *header_bitbuf, + struct huff_code *lookup_table, + struct rl_code *huffman_rep, + uint16_t huffman_rep_length, uint32_t end_of_block, + uint32_t hclen, uint32_t hlit, uint32_t hdist) +{ + /* hlit, hdist, hclen are as defined in the deflate standard, head is the + * first three deflate header bits.*/ + int i; + uint64_t bit_count; + uint64_t data; + struct huff_code huffman_value; + const uint32_t extra_bits[3] = { 2, 3, 7 }; + + bit_count = buffer_bits_used(header_bitbuf); + + data = (end_of_block ? 5 : 4) | (hlit << 3) | (hdist << 8) | (hclen << 13); + data |= ((lookup_table[code_length_code_order[0]].length) << DYN_HDR_START_LEN); + write_bits(header_bitbuf, data, DYN_HDR_START_LEN + 3); + data = 0; + for (i = hclen + 3; i >= 1; i--) + data = (data << 3) | lookup_table[code_length_code_order[i]].length; + + write_bits(header_bitbuf, data, (hclen + 3) * 3); + + for (i = 0; i < huffman_rep_length; i++) { + huffman_value = lookup_table[huffman_rep[i].code]; + + write_bits(header_bitbuf, (uint64_t) huffman_value.code, + (uint32_t) huffman_value.length); + + if (huffman_rep[i].code > 15) { + write_bits(header_bitbuf, (uint64_t) huffman_rep[i].extra_bits, + (uint32_t) extra_bits[huffman_rep[i].code - 16]); + } + } + bit_count = buffer_bits_used(header_bitbuf) - bit_count; + + return bit_count; +} + +inline int create_header(struct BitBuf2 *header_bitbuf, struct rl_code *huffman_rep, + uint32_t length, uint64_t * histogram, uint32_t hlit, + uint32_t hdist, uint32_t end_of_block) +{ + int i; + + uint32_t heap_size; + struct heap_tree heap_space; + uint32_t code_len_count[MAX_HUFF_TREE_DEPTH + 1]; + struct huff_code lookup_table[HUFF_LEN]; + + /* hlit, hdist, and hclen are defined in RFC 1951 page 13 */ + uint32_t hclen; + uint64_t bit_count; + + /* Create a huffman tree to encode run length encoded representation. */ + heap_size = init_heap64(&heap_space, histogram, HUFF_LEN); + gen_huff_code_lens(&heap_space, heap_size, code_len_count, + (struct huff_code *)lookup_table, HUFF_LEN, 7); + set_huff_codes(lookup_table, HUFF_LEN, code_len_count); + + /* Calculate hclen */ + for (i = CODE_LEN_CODES - 1; i > 3; i--) /* i must be at least 4 */ + if (lookup_table[code_length_code_order[i]].length != 0) + break; + + hclen = i - 3; + + /* Generate actual header. */ + bit_count = create_huffman_header(header_bitbuf, lookup_table, huffman_rep, + length, end_of_block, hclen, hlit, hdist); + + return bit_count; +} + +static inline + struct rl_code *write_rl(struct rl_code *pout, uint16_t last_len, uint32_t run_len, + uint64_t * counts) +{ + if (last_len == 0) { + while (run_len > 138) { + pout->code = 18; + pout->extra_bits = 138 - 11; + pout++; + run_len -= 138; + counts[18]++; + } + // 1 <= run_len <= 138 + if (run_len > 10) { + pout->code = 18; + pout->extra_bits = run_len - 11; + pout++; + counts[18]++; + } else if (run_len > 2) { + pout->code = 17; + pout->extra_bits = run_len - 3; + pout++; + counts[17]++; + } else if (run_len == 1) { + pout->code = 0; + pout->extra_bits = 0; + pout++; + counts[0]++; + } else { + assert(run_len == 2); + pout[0].code = 0; + pout[0].extra_bits = 0; + pout[1].code = 0; + pout[1].extra_bits = 0; + pout += 2; + counts[0] += 2; + } + } else { + // last_len != 0 + pout->code = last_len; + pout->extra_bits = 0; + pout++; + counts[last_len]++; + run_len--; + if (run_len != 0) { + while (run_len > 6) { + pout->code = 16; + pout->extra_bits = 6 - 3; + pout++; + run_len -= 6; + counts[16]++; + } + // 1 <= run_len <= 6 + switch (run_len) { + case 1: + pout->code = last_len; + pout->extra_bits = 0; + pout++; + counts[last_len]++; + break; + case 2: + pout[0].code = last_len; + pout[0].extra_bits = 0; + pout[1].code = last_len; + pout[1].extra_bits = 0; + pout += 2; + counts[last_len] += 2; + break; + default: // 3...6 + pout->code = 16; + pout->extra_bits = run_len - 3; + pout++; + counts[16]++; + } + } + } + return pout; +} + +// convert codes into run-length symbols, write symbols into OUT +// generate histogram into COUNTS (assumed to be initialized to 0) +// Format of OUT: +// 4:0 code (0...18) +// 15:8 Extra bits (0...127) +// returns number of symbols in out +static inline uint32_t rl_encode(uint16_t * codes, uint32_t num_codes, uint64_t * counts, + struct rl_code *out) +{ + uint32_t i, run_len; + uint16_t last_len, len; + struct rl_code *pout; + + pout = out; + last_len = codes[0]; + run_len = 1; + for (i = 1; i < num_codes; i++) { + len = codes[i]; + if (len == last_len) { + run_len++; + continue; + } + pout = write_rl(pout, last_len, run_len, counts); + last_len = len; + run_len = 1; + } + pout = write_rl(pout, last_len, run_len, counts); + + return (uint32_t) (pout - out); +} + +void create_code_tables(uint16_t * code_table, uint8_t * code_length_table, uint32_t length, + struct huff_code *hufftable) +{ + int i; + for (i = 0; i < length; i++) { + code_table[i] = hufftable[i].code; + code_length_table[i] = hufftable[i].length; + } +} + +void create_packed_len_table(uint32_t * packed_table, struct huff_code *lit_len_hufftable) +{ + int i, count = 0; + uint16_t extra_bits; + uint16_t extra_bits_count = 0; + + /* Gain extra bits is the next place where the number of extra bits in + * lenght codes increases. */ + uint16_t gain_extra_bits = LEN_EXTRA_BITS_START; + + for (i = 257; i < LIT_LEN - 1; i++) { + for (extra_bits = 0; extra_bits < (1 << extra_bits_count); extra_bits++) { + if (count > 254) + break; + packed_table[count++] = + (extra_bits << (lit_len_hufftable[i].length + LENGTH_BITS)) | + (lit_len_hufftable[i].code << LENGTH_BITS) | + (lit_len_hufftable[i].length + extra_bits_count); + } + + if (i == gain_extra_bits) { + gain_extra_bits += LEN_EXTRA_BITS_INTERVAL; + extra_bits_count += 1; + } + } + + packed_table[count] = (lit_len_hufftable[LIT_LEN - 1].code << LENGTH_BITS) | + (lit_len_hufftable[LIT_LEN - 1].length); +} + +void create_packed_dist_table(uint32_t * packed_table, uint32_t length, + struct huff_code *dist_hufftable) +{ + int i, count = 0; + uint16_t extra_bits; + uint16_t extra_bits_count = 0; + + /* Gain extra bits is the next place where the number of extra bits in + * distance codes increases. */ + uint16_t gain_extra_bits = DIST_EXTRA_BITS_START; + + for (i = 0; i < DIST_LEN; i++) { + for (extra_bits = 0; extra_bits < (1 << extra_bits_count); extra_bits++) { + if (count >= length) + return; + + packed_table[count++] = + (extra_bits << (dist_hufftable[i].length + LENGTH_BITS)) | + (dist_hufftable[i].code << LENGTH_BITS) | + (dist_hufftable[i].length + extra_bits_count); + + } + + if (i == gain_extra_bits) { + gain_extra_bits += DIST_EXTRA_BITS_INTERVAL; + extra_bits_count += 1; + } + } +} + +int are_hufftables_useable(struct huff_code *lit_len_hufftable, + struct huff_code *dist_hufftable) +{ + int max_lit_code_len = 0, max_len_code_len = 0, max_dist_code_len = 0; + int dist_extra_bits = 0, len_extra_bits = 0; + int gain_dist_extra_bits = DIST_EXTRA_BITS_START; + int gain_len_extra_bits = LEN_EXTRA_BITS_START; + int max_code_len; + int i; + + for (i = 0; i < LIT_LEN; i++) + if (lit_len_hufftable[i].length > max_lit_code_len) + max_lit_code_len = lit_len_hufftable[i].length; + + for (i = 257; i < LIT_LEN - 1; i++) { + if (lit_len_hufftable[i].length + len_extra_bits > max_len_code_len) + max_len_code_len = lit_len_hufftable[i].length + len_extra_bits; + + if (i == gain_len_extra_bits) { + gain_len_extra_bits += LEN_EXTRA_BITS_INTERVAL; + len_extra_bits += 1; + } + } + + for (i = 0; i < DIST_LEN; i++) { + if (dist_hufftable[i].length + dist_extra_bits > max_dist_code_len) + max_dist_code_len = dist_hufftable[i].length + dist_extra_bits; + + if (i == gain_dist_extra_bits) { + gain_dist_extra_bits += DIST_EXTRA_BITS_INTERVAL; + dist_extra_bits += 1; + } + } + + max_code_len = max_lit_code_len + max_len_code_len + max_dist_code_len; + + /* Some versions of igzip can write upto one literal, one length and one + * distance code at the same time. This checks to make sure that is + * always writeable in bitbuf*/ + return (max_code_len > MAX_BITBUF_BIT_WRITE); +} + +int isal_create_hufftables(struct isal_hufftables *hufftables, + struct isal_huff_histogram *histogram) +{ + struct huff_code lit_huff_table[LIT_LEN], dist_huff_table[DIST_LEN]; + uint64_t bit_count; + int max_dist = convert_dist_to_dist_sym(IGZIP_HIST_SIZE); + struct heap_tree heap_space; + uint32_t heap_size; + uint32_t code_len_count[MAX_HUFF_TREE_DEPTH + 1]; + struct BitBuf2 header_bitbuf; + uint32_t max_lit_len_sym; + uint32_t max_dist_sym; + uint32_t hlit, hdist, i; + uint16_t combined_table[LIT_LEN + DIST_LEN]; + uint64_t count_histogram[HUFF_LEN]; + struct rl_code rl_huff[LIT_LEN + DIST_LEN]; + uint32_t rl_huff_len; + + uint32_t *dist_table = hufftables->dist_table; + uint32_t *len_table = hufftables->len_table; + uint16_t *lit_table = hufftables->lit_table; + uint16_t *dcodes = hufftables->dcodes; + uint8_t *lit_table_sizes = hufftables->lit_table_sizes; + uint8_t *dcodes_sizes = hufftables->dcodes_sizes; + uint8_t *deflate_hdr = hufftables->deflate_hdr; + uint64_t *lit_len_histogram = histogram->lit_len_histogram; + uint64_t *dist_histogram = histogram->dist_histogram; + + memset(hufftables, 0, sizeof(struct isal_hufftables)); + + heap_size = init_heap64_complete(&heap_space, lit_len_histogram, LIT_LEN); + gen_huff_code_lens(&heap_space, heap_size, code_len_count, + (struct huff_code *)lit_huff_table, LIT_LEN, MAX_DEFLATE_CODE_LEN); + max_lit_len_sym = set_huff_codes(lit_huff_table, LIT_LEN, code_len_count); + + heap_size = init_heap64_complete(&heap_space, dist_histogram, DIST_LEN); + gen_huff_code_lens(&heap_space, heap_size, code_len_count, + (struct huff_code *)dist_huff_table, max_dist, + MAX_DEFLATE_CODE_LEN); + max_dist_sym = set_huff_codes(dist_huff_table, DIST_LEN, code_len_count); + + if (are_hufftables_useable(lit_huff_table, dist_huff_table)) { + heap_size = init_heap64_complete(&heap_space, lit_len_histogram, LIT_LEN); + gen_huff_code_lens(&heap_space, heap_size, code_len_count, + (struct huff_code *)lit_huff_table, LIT_LEN, + MAX_SAFE_LIT_CODE_LEN); + max_lit_len_sym = set_huff_codes(lit_huff_table, LIT_LEN, code_len_count); + + heap_size = init_heap64_complete(&heap_space, dist_histogram, DIST_LEN); + gen_huff_code_lens(&heap_space, heap_size, code_len_count, + (struct huff_code *)dist_huff_table, max_dist, + MAX_SAFE_DIST_CODE_LEN); + max_dist_sym = set_huff_codes(dist_huff_table, DIST_LEN, code_len_count); + + } + + create_code_tables(dcodes, dcodes_sizes, DIST_LEN - DCODE_OFFSET, + dist_huff_table + DCODE_OFFSET); + + create_code_tables(lit_table, lit_table_sizes, IGZIP_LIT_TABLE_SIZE, lit_huff_table); + + create_packed_len_table(len_table, lit_huff_table); + create_packed_dist_table(dist_table, IGZIP_DIST_TABLE_SIZE, dist_huff_table); + + set_buf(&header_bitbuf, deflate_hdr, sizeof(deflate_hdr)); + init(&header_bitbuf); + + hlit = max_lit_len_sym - 256; + hdist = max_dist_sym; + + /* Run length encode the length and distance huffman codes */ + memset(count_histogram, 0, sizeof(count_histogram)); + for (i = 0; i < 257 + hlit; i++) + combined_table[i] = lit_huff_table[i].length; + for (i = 0; i < 1 + hdist; i++) + combined_table[i + hlit + 257] = dist_huff_table[i].length; + rl_huff_len = + rl_encode(combined_table, hlit + 257 + hdist + 1, count_histogram, rl_huff); + + /* Create header */ + bit_count = + create_header(&header_bitbuf, rl_huff, rl_huff_len, + count_histogram, hlit, hdist, LAST_BLOCK); + flush(&header_bitbuf); + + hufftables->deflate_hdr_count = bit_count / 8; + hufftables->deflate_hdr_extra_bits = bit_count % 8; + + return 0; +} + +int isal_create_hufftables_subset(struct isal_hufftables *hufftables, + struct isal_huff_histogram *histogram) +{ + struct huff_code lit_huff_table[LIT_LEN], dist_huff_table[DIST_LEN]; + uint64_t bit_count; + int max_dist = convert_dist_to_dist_sym(IGZIP_HIST_SIZE); + struct heap_tree heap_space; + uint32_t heap_size; + uint32_t code_len_count[MAX_HUFF_TREE_DEPTH + 1]; + struct BitBuf2 header_bitbuf; + uint32_t max_lit_len_sym; + uint32_t max_dist_sym; + uint32_t hlit, hdist, i; + uint16_t combined_table[LIT_LEN + DIST_LEN]; + uint64_t count_histogram[HUFF_LEN]; + struct rl_code rl_huff[LIT_LEN + DIST_LEN]; + uint32_t rl_huff_len; + + uint32_t *dist_table = hufftables->dist_table; + uint32_t *len_table = hufftables->len_table; + uint16_t *lit_table = hufftables->lit_table; + uint16_t *dcodes = hufftables->dcodes; + uint8_t *lit_table_sizes = hufftables->lit_table_sizes; + uint8_t *dcodes_sizes = hufftables->dcodes_sizes; + uint8_t *deflate_hdr = hufftables->deflate_hdr; + uint64_t *lit_len_histogram = histogram->lit_len_histogram; + uint64_t *dist_histogram = histogram->dist_histogram; + + memset(hufftables, 0, sizeof(struct isal_hufftables)); + + heap_size = init_heap64(&heap_space, lit_len_histogram, LIT_LEN); + gen_huff_code_lens(&heap_space, heap_size, code_len_count, + (struct huff_code *)lit_huff_table, LIT_LEN, MAX_DEFLATE_CODE_LEN); + max_lit_len_sym = set_huff_codes(lit_huff_table, LIT_LEN, code_len_count); + + heap_size = init_heap64_complete(&heap_space, dist_histogram, DIST_LEN); + gen_huff_code_lens(&heap_space, heap_size, code_len_count, + (struct huff_code *)dist_huff_table, max_dist, + MAX_DEFLATE_CODE_LEN); + max_dist_sym = set_huff_codes(dist_huff_table, DIST_LEN, code_len_count); + + if (are_hufftables_useable(lit_huff_table, dist_huff_table)) { + heap_size = init_heap64_complete(&heap_space, lit_len_histogram, LIT_LEN); + gen_huff_code_lens(&heap_space, heap_size, code_len_count, + (struct huff_code *)lit_huff_table, LIT_LEN, + MAX_SAFE_LIT_CODE_LEN); + max_lit_len_sym = set_huff_codes(lit_huff_table, LIT_LEN, code_len_count); + + heap_size = init_heap64_complete(&heap_space, dist_histogram, DIST_LEN); + gen_huff_code_lens(&heap_space, heap_size, code_len_count, + (struct huff_code *)dist_huff_table, max_dist, + MAX_SAFE_DIST_CODE_LEN); + max_dist_sym = set_huff_codes(dist_huff_table, DIST_LEN, code_len_count); + + } + + create_code_tables(dcodes, dcodes_sizes, DIST_LEN - DCODE_OFFSET, + dist_huff_table + DCODE_OFFSET); + + create_code_tables(lit_table, lit_table_sizes, IGZIP_LIT_TABLE_SIZE, lit_huff_table); + + create_packed_len_table(len_table, lit_huff_table); + create_packed_dist_table(dist_table, IGZIP_DIST_TABLE_SIZE, dist_huff_table); + + set_buf(&header_bitbuf, deflate_hdr, sizeof(deflate_hdr)); + init(&header_bitbuf); + + hlit = max_lit_len_sym - 256; + hdist = max_dist_sym; + + /* Run length encode the length and distance huffman codes */ + memset(count_histogram, 0, sizeof(count_histogram)); + for (i = 0; i < 257 + hlit; i++) + combined_table[i] = lit_huff_table[i].length; + for (i = 0; i < 1 + hdist; i++) + combined_table[i + hlit + 257] = dist_huff_table[i].length; + rl_huff_len = + rl_encode(combined_table, hlit + 257 + hdist + 1, count_histogram, rl_huff); + + /* Create header */ + bit_count = + create_header(&header_bitbuf, rl_huff, rl_huff_len, + count_histogram, hlit, hdist, LAST_BLOCK); + flush(&header_bitbuf); + + hufftables->deflate_hdr_count = bit_count / 8; + hufftables->deflate_hdr_extra_bits = bit_count % 8; + + return 0; +} + +void expand_hufftables_icf(struct hufftables_icf *hufftables) +{ + uint32_t i, eb, j, k, len, code; + struct huff_code orig[21], *p_code; + struct huff_code *lit_len_codes = hufftables->lit_len_table; + struct huff_code *dist_codes = hufftables->dist_table; + + for (i = 0; i < 21; i++) + orig[i] = lit_len_codes[i + 265]; + + p_code = &lit_len_codes[265]; + + i = 0; + for (eb = 1; eb < 6; eb++) { + for (k = 0; k < 4; k++) { + len = orig[i].length; + code = orig[i++].code; + for (j = 0; j < (1u << eb); j++) { + p_code->code_and_extra = code | (j << len); + p_code->length = len + eb; + p_code++; + } + } // end for k + } // end for eb + // fix up last record + p_code[-1] = orig[i]; + + dist_codes[DIST_LEN].code_and_extra = 0; + dist_codes[DIST_LEN].length = 0; +} + +void +create_hufftables_icf(struct BitBuf2 *bb, struct hufftables_icf *hufftables, + struct isal_mod_hist *hist, uint32_t end_of_block) +{ + uint32_t bl_count[MAX_DEFLATE_CODE_LEN + 1]; + uint32_t max_ll_code, max_d_code; + struct heap_tree heap_space; + uint32_t heap_size; + struct rl_code cl_tokens[LIT_LEN + DIST_LEN]; + uint32_t num_cl_tokens; + uint64_t cl_counts[CODE_LEN_CODES]; + uint16_t combined_table[LIT_LEN + DIST_LEN]; + int i; + uint64_t compressed_len = 0; + uint64_t static_compressed_len = 3; /* The static header size */ + struct BitBuf2 bb_tmp; + + struct huff_code *ll_codes = hufftables->lit_len_table; + struct huff_code *d_codes = hufftables->dist_table; + uint32_t *ll_hist = hist->ll_hist; + uint32_t *d_hist = hist->d_hist; + struct huff_code *static_ll_codes = static_hufftables.lit_len_table; + struct huff_code *static_d_codes = static_hufftables.dist_table; + + memcpy(&bb_tmp, bb, sizeof(struct BitBuf2)); + + flatten_ll(hist->ll_hist); + + // make sure EOB is present + if (ll_hist[256] == 0) + ll_hist[256] = 1; + + heap_size = init_heap32(&heap_space, ll_hist, LIT_LEN); + gen_huff_code_lens(&heap_space, heap_size, bl_count, + ll_codes, LIT_LEN, MAX_DEFLATE_CODE_LEN); + max_ll_code = set_huff_codes(ll_codes, LIT_LEN, bl_count); + + heap_size = init_heap32(&heap_space, d_hist, DIST_LEN); + gen_huff_code_lens(&heap_space, heap_size, bl_count, d_codes, + DIST_LEN, MAX_DEFLATE_CODE_LEN); + max_d_code = set_dist_huff_codes(d_codes, bl_count); + + assert(max_ll_code >= 256); // must be EOB code + assert(max_d_code != 0); + + /* Run length encode the length and distance huffman codes */ + memset(cl_counts, 0, sizeof(cl_counts)); + + for (i = 0; i <= 256; i++) { + combined_table[i] = ll_codes[i].length; + compressed_len += ll_codes[i].length * ll_hist[i]; + static_compressed_len += static_ll_codes[i].length * ll_hist[i]; + } + + for (; i < max_ll_code + 1; i++) { + combined_table[i] = ll_codes[i].length; + compressed_len += + (ll_codes[i].length + len_code_extra_bits[i - 257]) * ll_hist[i]; + static_compressed_len += + (static_ll_codes[i].length + len_code_extra_bits[i - 257]) * ll_hist[i]; + } + + for (i = 0; i < max_d_code + 1; i++) { + combined_table[i + max_ll_code + 1] = d_codes[i].length; + compressed_len += (d_codes[i].length + dist_code_extra_bits[i]) * d_hist[i]; + static_compressed_len += + (static_d_codes[i].length + dist_code_extra_bits[i]) * d_hist[i]; + } + + expand_hufftables_icf(hufftables); + + num_cl_tokens = + rl_encode(combined_table, max_ll_code + max_d_code + 2, cl_counts, cl_tokens); + + /* Create header */ + create_header(bb, cl_tokens, num_cl_tokens, cl_counts, max_ll_code - 256, max_d_code, + end_of_block); + compressed_len += 8 * buffer_used(bb) + bb->m_bit_count; + + if (static_compressed_len < compressed_len) { + memcpy(hufftables, &static_hufftables, sizeof(struct hufftables_icf)); + expand_hufftables_icf(hufftables); + memcpy(bb, &bb_tmp, sizeof(struct BitBuf2)); + end_of_block = end_of_block ? 1 : 0; + write_bits(bb, 0x2 | end_of_block, 3); + } +} |