summaryrefslogtreecommitdiffstats
path: root/src/isa-l/igzip/huff_codes.c
diff options
context:
space:
mode:
authorDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-27 18:24:20 +0000
committerDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-27 18:24:20 +0000
commit483eb2f56657e8e7f419ab1a4fab8dce9ade8609 (patch)
treee5d88d25d870d5dedacb6bbdbe2a966086a0a5cf /src/isa-l/igzip/huff_codes.c
parentInitial commit. (diff)
downloadceph-483eb2f56657e8e7f419ab1a4fab8dce9ade8609.tar.xz
ceph-483eb2f56657e8e7f419ab1a4fab8dce9ade8609.zip
Adding upstream version 14.2.21.upstream/14.2.21upstream
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'src/isa-l/igzip/huff_codes.c')
-rw-r--r--src/isa-l/igzip/huff_codes.c1625
1 files changed, 1625 insertions, 0 deletions
diff --git a/src/isa-l/igzip/huff_codes.c b/src/isa-l/igzip/huff_codes.c
new file mode 100644
index 00000000..c8b2035d
--- /dev/null
+++ b/src/isa-l/igzip/huff_codes.c
@@ -0,0 +1,1625 @@
+/**********************************************************************
+ Copyright(c) 2011-2016 Intel Corporation All rights reserved.
+
+ Redistribution and use in source and binary forms, with or without
+ modification, are permitted provided that the following conditions
+ are met:
+ * Redistributions of source code must retain the above copyright
+ notice, this list of conditions and the following disclaimer.
+ * Redistributions in binary form must reproduce the above copyright
+ notice, this list of conditions and the following disclaimer in
+ the documentation and/or other materials provided with the
+ distribution.
+ * Neither the name of Intel Corporation nor the names of its
+ contributors may be used to endorse or promote products derived
+ from this software without specific prior written permission.
+
+ THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+ "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+ LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+ A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
+ OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+ SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+ LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+ OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+**********************************************************************/
+
+#include <immintrin.h>
+#include <stdint.h>
+#include <string.h>
+#include <assert.h>
+#include "igzip_lib.h"
+#include "huff_codes.h"
+#include "huffman.h"
+#include "bitbuf2.h"
+#include "flatten_ll.h"
+
+/* The order code length codes are written in the dynamic code header. This is
+ * defined in RFC 1951 page 13 */
+static const uint8_t code_length_code_order[] =
+ { 16, 17, 18, 0, 8, 7, 9, 6, 10, 5, 11, 4, 12, 3, 13, 2, 14, 1, 15 };
+
+const uint32_t len_code_extra_bits[] = {
+ 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0,
+ 0x1, 0x1, 0x1, 0x1, 0x2, 0x2, 0x2, 0x2,
+ 0x3, 0x3, 0x3, 0x3, 0x4, 0x4, 0x4, 0x4,
+ 0x5, 0x5, 0x5, 0x5, 0x0
+};
+
+const uint32_t dist_code_extra_bits[] = {
+ 0x0, 0x0, 0x0, 0x0, 0x1, 0x1, 0x2, 0x2,
+ 0x3, 0x3, 0x4, 0x4, 0x5, 0x5, 0x6, 0x6,
+ 0x7, 0x7, 0x8, 0x8, 0x9, 0x9, 0xa, 0xa,
+ 0xb, 0xb, 0xc, 0xc, 0xd, 0xd
+};
+
+struct hufftables_icf static_hufftables = {
+ .lit_len_table = {
+ {.code_and_extra = 0x00c,.length2 = 0x8},
+ {.code_and_extra = 0x08c,.length2 = 0x8},
+ {.code_and_extra = 0x04c,.length2 = 0x8},
+ {.code_and_extra = 0x0cc,.length2 = 0x8},
+ {.code_and_extra = 0x02c,.length2 = 0x8},
+ {.code_and_extra = 0x0ac,.length2 = 0x8},
+ {.code_and_extra = 0x06c,.length2 = 0x8},
+ {.code_and_extra = 0x0ec,.length2 = 0x8},
+ {.code_and_extra = 0x01c,.length2 = 0x8},
+ {.code_and_extra = 0x09c,.length2 = 0x8},
+ {.code_and_extra = 0x05c,.length2 = 0x8},
+ {.code_and_extra = 0x0dc,.length2 = 0x8},
+ {.code_and_extra = 0x03c,.length2 = 0x8},
+ {.code_and_extra = 0x0bc,.length2 = 0x8},
+ {.code_and_extra = 0x07c,.length2 = 0x8},
+ {.code_and_extra = 0x0fc,.length2 = 0x8},
+ {.code_and_extra = 0x002,.length2 = 0x8},
+ {.code_and_extra = 0x082,.length2 = 0x8},
+ {.code_and_extra = 0x042,.length2 = 0x8},
+ {.code_and_extra = 0x0c2,.length2 = 0x8},
+ {.code_and_extra = 0x022,.length2 = 0x8},
+ {.code_and_extra = 0x0a2,.length2 = 0x8},
+ {.code_and_extra = 0x062,.length2 = 0x8},
+ {.code_and_extra = 0x0e2,.length2 = 0x8},
+ {.code_and_extra = 0x012,.length2 = 0x8},
+ {.code_and_extra = 0x092,.length2 = 0x8},
+ {.code_and_extra = 0x052,.length2 = 0x8},
+ {.code_and_extra = 0x0d2,.length2 = 0x8},
+ {.code_and_extra = 0x032,.length2 = 0x8},
+ {.code_and_extra = 0x0b2,.length2 = 0x8},
+ {.code_and_extra = 0x072,.length2 = 0x8},
+ {.code_and_extra = 0x0f2,.length2 = 0x8},
+ {.code_and_extra = 0x00a,.length2 = 0x8},
+ {.code_and_extra = 0x08a,.length2 = 0x8},
+ {.code_and_extra = 0x04a,.length2 = 0x8},
+ {.code_and_extra = 0x0ca,.length2 = 0x8},
+ {.code_and_extra = 0x02a,.length2 = 0x8},
+ {.code_and_extra = 0x0aa,.length2 = 0x8},
+ {.code_and_extra = 0x06a,.length2 = 0x8},
+ {.code_and_extra = 0x0ea,.length2 = 0x8},
+ {.code_and_extra = 0x01a,.length2 = 0x8},
+ {.code_and_extra = 0x09a,.length2 = 0x8},
+ {.code_and_extra = 0x05a,.length2 = 0x8},
+ {.code_and_extra = 0x0da,.length2 = 0x8},
+ {.code_and_extra = 0x03a,.length2 = 0x8},
+ {.code_and_extra = 0x0ba,.length2 = 0x8},
+ {.code_and_extra = 0x07a,.length2 = 0x8},
+ {.code_and_extra = 0x0fa,.length2 = 0x8},
+ {.code_and_extra = 0x006,.length2 = 0x8},
+ {.code_and_extra = 0x086,.length2 = 0x8},
+ {.code_and_extra = 0x046,.length2 = 0x8},
+ {.code_and_extra = 0x0c6,.length2 = 0x8},
+ {.code_and_extra = 0x026,.length2 = 0x8},
+ {.code_and_extra = 0x0a6,.length2 = 0x8},
+ {.code_and_extra = 0x066,.length2 = 0x8},
+ {.code_and_extra = 0x0e6,.length2 = 0x8},
+ {.code_and_extra = 0x016,.length2 = 0x8},
+ {.code_and_extra = 0x096,.length2 = 0x8},
+ {.code_and_extra = 0x056,.length2 = 0x8},
+ {.code_and_extra = 0x0d6,.length2 = 0x8},
+ {.code_and_extra = 0x036,.length2 = 0x8},
+ {.code_and_extra = 0x0b6,.length2 = 0x8},
+ {.code_and_extra = 0x076,.length2 = 0x8},
+ {.code_and_extra = 0x0f6,.length2 = 0x8},
+ {.code_and_extra = 0x00e,.length2 = 0x8},
+ {.code_and_extra = 0x08e,.length2 = 0x8},
+ {.code_and_extra = 0x04e,.length2 = 0x8},
+ {.code_and_extra = 0x0ce,.length2 = 0x8},
+ {.code_and_extra = 0x02e,.length2 = 0x8},
+ {.code_and_extra = 0x0ae,.length2 = 0x8},
+ {.code_and_extra = 0x06e,.length2 = 0x8},
+ {.code_and_extra = 0x0ee,.length2 = 0x8},
+ {.code_and_extra = 0x01e,.length2 = 0x8},
+ {.code_and_extra = 0x09e,.length2 = 0x8},
+ {.code_and_extra = 0x05e,.length2 = 0x8},
+ {.code_and_extra = 0x0de,.length2 = 0x8},
+ {.code_and_extra = 0x03e,.length2 = 0x8},
+ {.code_and_extra = 0x0be,.length2 = 0x8},
+ {.code_and_extra = 0x07e,.length2 = 0x8},
+ {.code_and_extra = 0x0fe,.length2 = 0x8},
+ {.code_and_extra = 0x001,.length2 = 0x8},
+ {.code_and_extra = 0x081,.length2 = 0x8},
+ {.code_and_extra = 0x041,.length2 = 0x8},
+ {.code_and_extra = 0x0c1,.length2 = 0x8},
+ {.code_and_extra = 0x021,.length2 = 0x8},
+ {.code_and_extra = 0x0a1,.length2 = 0x8},
+ {.code_and_extra = 0x061,.length2 = 0x8},
+ {.code_and_extra = 0x0e1,.length2 = 0x8},
+ {.code_and_extra = 0x011,.length2 = 0x8},
+ {.code_and_extra = 0x091,.length2 = 0x8},
+ {.code_and_extra = 0x051,.length2 = 0x8},
+ {.code_and_extra = 0x0d1,.length2 = 0x8},
+ {.code_and_extra = 0x031,.length2 = 0x8},
+ {.code_and_extra = 0x0b1,.length2 = 0x8},
+ {.code_and_extra = 0x071,.length2 = 0x8},
+ {.code_and_extra = 0x0f1,.length2 = 0x8},
+ {.code_and_extra = 0x009,.length2 = 0x8},
+ {.code_and_extra = 0x089,.length2 = 0x8},
+ {.code_and_extra = 0x049,.length2 = 0x8},
+ {.code_and_extra = 0x0c9,.length2 = 0x8},
+ {.code_and_extra = 0x029,.length2 = 0x8},
+ {.code_and_extra = 0x0a9,.length2 = 0x8},
+ {.code_and_extra = 0x069,.length2 = 0x8},
+ {.code_and_extra = 0x0e9,.length2 = 0x8},
+ {.code_and_extra = 0x019,.length2 = 0x8},
+ {.code_and_extra = 0x099,.length2 = 0x8},
+ {.code_and_extra = 0x059,.length2 = 0x8},
+ {.code_and_extra = 0x0d9,.length2 = 0x8},
+ {.code_and_extra = 0x039,.length2 = 0x8},
+ {.code_and_extra = 0x0b9,.length2 = 0x8},
+ {.code_and_extra = 0x079,.length2 = 0x8},
+ {.code_and_extra = 0x0f9,.length2 = 0x8},
+ {.code_and_extra = 0x005,.length2 = 0x8},
+ {.code_and_extra = 0x085,.length2 = 0x8},
+ {.code_and_extra = 0x045,.length2 = 0x8},
+ {.code_and_extra = 0x0c5,.length2 = 0x8},
+ {.code_and_extra = 0x025,.length2 = 0x8},
+ {.code_and_extra = 0x0a5,.length2 = 0x8},
+ {.code_and_extra = 0x065,.length2 = 0x8},
+ {.code_and_extra = 0x0e5,.length2 = 0x8},
+ {.code_and_extra = 0x015,.length2 = 0x8},
+ {.code_and_extra = 0x095,.length2 = 0x8},
+ {.code_and_extra = 0x055,.length2 = 0x8},
+ {.code_and_extra = 0x0d5,.length2 = 0x8},
+ {.code_and_extra = 0x035,.length2 = 0x8},
+ {.code_and_extra = 0x0b5,.length2 = 0x8},
+ {.code_and_extra = 0x075,.length2 = 0x8},
+ {.code_and_extra = 0x0f5,.length2 = 0x8},
+ {.code_and_extra = 0x00d,.length2 = 0x8},
+ {.code_and_extra = 0x08d,.length2 = 0x8},
+ {.code_and_extra = 0x04d,.length2 = 0x8},
+ {.code_and_extra = 0x0cd,.length2 = 0x8},
+ {.code_and_extra = 0x02d,.length2 = 0x8},
+ {.code_and_extra = 0x0ad,.length2 = 0x8},
+ {.code_and_extra = 0x06d,.length2 = 0x8},
+ {.code_and_extra = 0x0ed,.length2 = 0x8},
+ {.code_and_extra = 0x01d,.length2 = 0x8},
+ {.code_and_extra = 0x09d,.length2 = 0x8},
+ {.code_and_extra = 0x05d,.length2 = 0x8},
+ {.code_and_extra = 0x0dd,.length2 = 0x8},
+ {.code_and_extra = 0x03d,.length2 = 0x8},
+ {.code_and_extra = 0x0bd,.length2 = 0x8},
+ {.code_and_extra = 0x07d,.length2 = 0x8},
+ {.code_and_extra = 0x0fd,.length2 = 0x8},
+ {.code_and_extra = 0x013,.length2 = 0x9},
+ {.code_and_extra = 0x113,.length2 = 0x9},
+ {.code_and_extra = 0x093,.length2 = 0x9},
+ {.code_and_extra = 0x193,.length2 = 0x9},
+ {.code_and_extra = 0x053,.length2 = 0x9},
+ {.code_and_extra = 0x153,.length2 = 0x9},
+ {.code_and_extra = 0x0d3,.length2 = 0x9},
+ {.code_and_extra = 0x1d3,.length2 = 0x9},
+ {.code_and_extra = 0x033,.length2 = 0x9},
+ {.code_and_extra = 0x133,.length2 = 0x9},
+ {.code_and_extra = 0x0b3,.length2 = 0x9},
+ {.code_and_extra = 0x1b3,.length2 = 0x9},
+ {.code_and_extra = 0x073,.length2 = 0x9},
+ {.code_and_extra = 0x173,.length2 = 0x9},
+ {.code_and_extra = 0x0f3,.length2 = 0x9},
+ {.code_and_extra = 0x1f3,.length2 = 0x9},
+ {.code_and_extra = 0x00b,.length2 = 0x9},
+ {.code_and_extra = 0x10b,.length2 = 0x9},
+ {.code_and_extra = 0x08b,.length2 = 0x9},
+ {.code_and_extra = 0x18b,.length2 = 0x9},
+ {.code_and_extra = 0x04b,.length2 = 0x9},
+ {.code_and_extra = 0x14b,.length2 = 0x9},
+ {.code_and_extra = 0x0cb,.length2 = 0x9},
+ {.code_and_extra = 0x1cb,.length2 = 0x9},
+ {.code_and_extra = 0x02b,.length2 = 0x9},
+ {.code_and_extra = 0x12b,.length2 = 0x9},
+ {.code_and_extra = 0x0ab,.length2 = 0x9},
+ {.code_and_extra = 0x1ab,.length2 = 0x9},
+ {.code_and_extra = 0x06b,.length2 = 0x9},
+ {.code_and_extra = 0x16b,.length2 = 0x9},
+ {.code_and_extra = 0x0eb,.length2 = 0x9},
+ {.code_and_extra = 0x1eb,.length2 = 0x9},
+ {.code_and_extra = 0x01b,.length2 = 0x9},
+ {.code_and_extra = 0x11b,.length2 = 0x9},
+ {.code_and_extra = 0x09b,.length2 = 0x9},
+ {.code_and_extra = 0x19b,.length2 = 0x9},
+ {.code_and_extra = 0x05b,.length2 = 0x9},
+ {.code_and_extra = 0x15b,.length2 = 0x9},
+ {.code_and_extra = 0x0db,.length2 = 0x9},
+ {.code_and_extra = 0x1db,.length2 = 0x9},
+ {.code_and_extra = 0x03b,.length2 = 0x9},
+ {.code_and_extra = 0x13b,.length2 = 0x9},
+ {.code_and_extra = 0x0bb,.length2 = 0x9},
+ {.code_and_extra = 0x1bb,.length2 = 0x9},
+ {.code_and_extra = 0x07b,.length2 = 0x9},
+ {.code_and_extra = 0x17b,.length2 = 0x9},
+ {.code_and_extra = 0x0fb,.length2 = 0x9},
+ {.code_and_extra = 0x1fb,.length2 = 0x9},
+ {.code_and_extra = 0x007,.length2 = 0x9},
+ {.code_and_extra = 0x107,.length2 = 0x9},
+ {.code_and_extra = 0x087,.length2 = 0x9},
+ {.code_and_extra = 0x187,.length2 = 0x9},
+ {.code_and_extra = 0x047,.length2 = 0x9},
+ {.code_and_extra = 0x147,.length2 = 0x9},
+ {.code_and_extra = 0x0c7,.length2 = 0x9},
+ {.code_and_extra = 0x1c7,.length2 = 0x9},
+ {.code_and_extra = 0x027,.length2 = 0x9},
+ {.code_and_extra = 0x127,.length2 = 0x9},
+ {.code_and_extra = 0x0a7,.length2 = 0x9},
+ {.code_and_extra = 0x1a7,.length2 = 0x9},
+ {.code_and_extra = 0x067,.length2 = 0x9},
+ {.code_and_extra = 0x167,.length2 = 0x9},
+ {.code_and_extra = 0x0e7,.length2 = 0x9},
+ {.code_and_extra = 0x1e7,.length2 = 0x9},
+ {.code_and_extra = 0x017,.length2 = 0x9},
+ {.code_and_extra = 0x117,.length2 = 0x9},
+ {.code_and_extra = 0x097,.length2 = 0x9},
+ {.code_and_extra = 0x197,.length2 = 0x9},
+ {.code_and_extra = 0x057,.length2 = 0x9},
+ {.code_and_extra = 0x157,.length2 = 0x9},
+ {.code_and_extra = 0x0d7,.length2 = 0x9},
+ {.code_and_extra = 0x1d7,.length2 = 0x9},
+ {.code_and_extra = 0x037,.length2 = 0x9},
+ {.code_and_extra = 0x137,.length2 = 0x9},
+ {.code_and_extra = 0x0b7,.length2 = 0x9},
+ {.code_and_extra = 0x1b7,.length2 = 0x9},
+ {.code_and_extra = 0x077,.length2 = 0x9},
+ {.code_and_extra = 0x177,.length2 = 0x9},
+ {.code_and_extra = 0x0f7,.length2 = 0x9},
+ {.code_and_extra = 0x1f7,.length2 = 0x9},
+ {.code_and_extra = 0x00f,.length2 = 0x9},
+ {.code_and_extra = 0x10f,.length2 = 0x9},
+ {.code_and_extra = 0x08f,.length2 = 0x9},
+ {.code_and_extra = 0x18f,.length2 = 0x9},
+ {.code_and_extra = 0x04f,.length2 = 0x9},
+ {.code_and_extra = 0x14f,.length2 = 0x9},
+ {.code_and_extra = 0x0cf,.length2 = 0x9},
+ {.code_and_extra = 0x1cf,.length2 = 0x9},
+ {.code_and_extra = 0x02f,.length2 = 0x9},
+ {.code_and_extra = 0x12f,.length2 = 0x9},
+ {.code_and_extra = 0x0af,.length2 = 0x9},
+ {.code_and_extra = 0x1af,.length2 = 0x9},
+ {.code_and_extra = 0x06f,.length2 = 0x9},
+ {.code_and_extra = 0x16f,.length2 = 0x9},
+ {.code_and_extra = 0x0ef,.length2 = 0x9},
+ {.code_and_extra = 0x1ef,.length2 = 0x9},
+ {.code_and_extra = 0x01f,.length2 = 0x9},
+ {.code_and_extra = 0x11f,.length2 = 0x9},
+ {.code_and_extra = 0x09f,.length2 = 0x9},
+ {.code_and_extra = 0x19f,.length2 = 0x9},
+ {.code_and_extra = 0x05f,.length2 = 0x9},
+ {.code_and_extra = 0x15f,.length2 = 0x9},
+ {.code_and_extra = 0x0df,.length2 = 0x9},
+ {.code_and_extra = 0x1df,.length2 = 0x9},
+ {.code_and_extra = 0x03f,.length2 = 0x9},
+ {.code_and_extra = 0x13f,.length2 = 0x9},
+ {.code_and_extra = 0x0bf,.length2 = 0x9},
+ {.code_and_extra = 0x1bf,.length2 = 0x9},
+ {.code_and_extra = 0x07f,.length2 = 0x9},
+ {.code_and_extra = 0x17f,.length2 = 0x9},
+ {.code_and_extra = 0x0ff,.length2 = 0x9},
+ {.code_and_extra = 0x1ff,.length2 = 0x9},
+ {.code_and_extra = 0x000,.length2 = 0x7},
+ {.code_and_extra = 0x040,.length2 = 0x7},
+ {.code_and_extra = 0x020,.length2 = 0x7},
+ {.code_and_extra = 0x060,.length2 = 0x7},
+ {.code_and_extra = 0x010,.length2 = 0x7},
+ {.code_and_extra = 0x050,.length2 = 0x7},
+ {.code_and_extra = 0x030,.length2 = 0x7},
+ {.code_and_extra = 0x070,.length2 = 0x7},
+ {.code_and_extra = 0x008,.length2 = 0x7},
+ {.code_and_extra = 0x048,.length2 = 0x7},
+ {.code_and_extra = 0x028,.length2 = 0x7},
+ {.code_and_extra = 0x068,.length2 = 0x7},
+ {.code_and_extra = 0x018,.length2 = 0x7},
+ {.code_and_extra = 0x058,.length2 = 0x7},
+ {.code_and_extra = 0x038,.length2 = 0x7},
+ {.code_and_extra = 0x078,.length2 = 0x7},
+ {.code_and_extra = 0x004,.length2 = 0x7},
+ {.code_and_extra = 0x044,.length2 = 0x7},
+ {.code_and_extra = 0x024,.length2 = 0x7},
+ {.code_and_extra = 0x064,.length2 = 0x7},
+ {.code_and_extra = 0x014,.length2 = 0x7},
+ {.code_and_extra = 0x054,.length2 = 0x7},
+ {.code_and_extra = 0x034,.length2 = 0x7},
+ {.code_and_extra = 0x074,.length2 = 0x7},
+ {.code_and_extra = 0x003,.length2 = 0x8},
+ {.code_and_extra = 0x083,.length2 = 0x8},
+ {.code_and_extra = 0x043,.length2 = 0x8},
+ {.code_and_extra = 0x0c3,.length2 = 0x8},
+ {.code_and_extra = 0x023,.length2 = 0x8},
+ {.code_and_extra = 0x0a3,.length2 = 0x8},
+ {.code_and_extra = 0x063,.length2 = 0x8},
+ {.code_and_extra = 0x0e3,.length2 = 0x8},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0},
+ {.code_and_extra = 0x000,.length2 = 0x0}},
+ .dist_table = {
+ {.code_and_extra = 0x000,.length2 = 0x5},
+ {.code_and_extra = 0x010,.length2 = 0x5},
+ {.code_and_extra = 0x008,.length2 = 0x5},
+ {.code_and_extra = 0x018,.length2 = 0x5},
+ {.code_and_extra = 0x10004,.length2 = 0x5},
+ {.code_and_extra = 0x10014,.length2 = 0x5},
+ {.code_and_extra = 0x2000c,.length2 = 0x5},
+ {.code_and_extra = 0x2001c,.length2 = 0x5},
+ {.code_and_extra = 0x30002,.length2 = 0x5},
+ {.code_and_extra = 0x30012,.length2 = 0x5},
+ {.code_and_extra = 0x4000a,.length2 = 0x5},
+ {.code_and_extra = 0x4001a,.length2 = 0x5},
+ {.code_and_extra = 0x50006,.length2 = 0x5},
+ {.code_and_extra = 0x50016,.length2 = 0x5},
+ {.code_and_extra = 0x6000e,.length2 = 0x5},
+ {.code_and_extra = 0x6001e,.length2 = 0x5},
+ {.code_and_extra = 0x70001,.length2 = 0x5},
+ {.code_and_extra = 0x70011,.length2 = 0x5},
+ {.code_and_extra = 0x80009,.length2 = 0x5},
+ {.code_and_extra = 0x80019,.length2 = 0x5},
+ {.code_and_extra = 0x90005,.length2 = 0x5},
+ {.code_and_extra = 0x90015,.length2 = 0x5},
+ {.code_and_extra = 0xa000d,.length2 = 0x5},
+ {.code_and_extra = 0xa001d,.length2 = 0x5},
+ {.code_and_extra = 0xb0003,.length2 = 0x5},
+ {.code_and_extra = 0xb0013,.length2 = 0x5},
+ {.code_and_extra = 0xc000b,.length2 = 0x5},
+ {.code_and_extra = 0xc001b,.length2 = 0x5},
+ {.code_and_extra = 0xd0007,.length2 = 0x5},
+ {.code_and_extra = 0xd0017,.length2 = 0x5},
+ {.code_and_extra = 0x000,.length2 = 0x0}}
+};
+
+struct slver {
+ uint16_t snum;
+ uint8_t ver;
+ uint8_t core;
+};
+
+/* Version info */
+struct slver isal_update_histogram_slver_00010085;
+struct slver isal_update_histogram_slver = { 0x0085, 0x01, 0x00 };
+
+struct slver isal_create_hufftables_slver_00010086;
+struct slver isal_create_hufftables_slver = { 0x0086, 0x01, 0x00 };
+
+struct slver isal_create_hufftables_subset_slver_00010087;
+struct slver isal_create_hufftables_subset_slver = { 0x0087, 0x01, 0x00 };
+
+extern uint32_t build_huff_tree(struct heap_tree *heap, uint64_t heap_size, uint64_t node_ptr);
+extern void build_heap(uint64_t * heap, uint64_t heap_size);
+
+static const uint8_t bitrev8[0x100] = {
+ 0x00, 0x80, 0x40, 0xC0, 0x20, 0xA0, 0x60, 0xE0,
+ 0x10, 0x90, 0x50, 0xD0, 0x30, 0xB0, 0x70, 0xF0,
+ 0x08, 0x88, 0x48, 0xC8, 0x28, 0xA8, 0x68, 0xE8,
+ 0x18, 0x98, 0x58, 0xD8, 0x38, 0xB8, 0x78, 0xF8,
+ 0x04, 0x84, 0x44, 0xC4, 0x24, 0xA4, 0x64, 0xE4,
+ 0x14, 0x94, 0x54, 0xD4, 0x34, 0xB4, 0x74, 0xF4,
+ 0x0C, 0x8C, 0x4C, 0xCC, 0x2C, 0xAC, 0x6C, 0xEC,
+ 0x1C, 0x9C, 0x5C, 0xDC, 0x3C, 0xBC, 0x7C, 0xFC,
+ 0x02, 0x82, 0x42, 0xC2, 0x22, 0xA2, 0x62, 0xE2,
+ 0x12, 0x92, 0x52, 0xD2, 0x32, 0xB2, 0x72, 0xF2,
+ 0x0A, 0x8A, 0x4A, 0xCA, 0x2A, 0xAA, 0x6A, 0xEA,
+ 0x1A, 0x9A, 0x5A, 0xDA, 0x3A, 0xBA, 0x7A, 0xFA,
+ 0x06, 0x86, 0x46, 0xC6, 0x26, 0xA6, 0x66, 0xE6,
+ 0x16, 0x96, 0x56, 0xD6, 0x36, 0xB6, 0x76, 0xF6,
+ 0x0E, 0x8E, 0x4E, 0xCE, 0x2E, 0xAE, 0x6E, 0xEE,
+ 0x1E, 0x9E, 0x5E, 0xDE, 0x3E, 0xBE, 0x7E, 0xFE,
+ 0x01, 0x81, 0x41, 0xC1, 0x21, 0xA1, 0x61, 0xE1,
+ 0x11, 0x91, 0x51, 0xD1, 0x31, 0xB1, 0x71, 0xF1,
+ 0x09, 0x89, 0x49, 0xC9, 0x29, 0xA9, 0x69, 0xE9,
+ 0x19, 0x99, 0x59, 0xD9, 0x39, 0xB9, 0x79, 0xF9,
+ 0x05, 0x85, 0x45, 0xC5, 0x25, 0xA5, 0x65, 0xE5,
+ 0x15, 0x95, 0x55, 0xD5, 0x35, 0xB5, 0x75, 0xF5,
+ 0x0D, 0x8D, 0x4D, 0xCD, 0x2D, 0xAD, 0x6D, 0xED,
+ 0x1D, 0x9D, 0x5D, 0xDD, 0x3D, 0xBD, 0x7D, 0xFD,
+ 0x03, 0x83, 0x43, 0xC3, 0x23, 0xA3, 0x63, 0xE3,
+ 0x13, 0x93, 0x53, 0xD3, 0x33, 0xB3, 0x73, 0xF3,
+ 0x0B, 0x8B, 0x4B, 0xCB, 0x2B, 0xAB, 0x6B, 0xEB,
+ 0x1B, 0x9B, 0x5B, 0xDB, 0x3B, 0xBB, 0x7B, 0xFB,
+ 0x07, 0x87, 0x47, 0xC7, 0x27, 0xA7, 0x67, 0xE7,
+ 0x17, 0x97, 0x57, 0xD7, 0x37, 0xB7, 0x77, 0xF7,
+ 0x0F, 0x8F, 0x4F, 0xCF, 0x2F, 0xAF, 0x6F, 0xEF,
+ 0x1F, 0x9F, 0x5F, 0xDF, 0x3F, 0xBF, 0x7F, 0xFF
+};
+
+// bit reverse low order LENGTH bits in code, and return result in low order bits
+static inline uint16_t bit_reverse(uint16_t code, uint32_t length)
+{
+ code = (bitrev8[code & 0x00FF] << 8) | (bitrev8[code >> 8]);
+ return (code >> (16 - length));
+}
+
+void isal_update_histogram_base(uint8_t * start_stream, int length,
+ struct isal_huff_histogram *histogram)
+{
+ uint32_t literal = 0, hash;
+ uint16_t seen, *last_seen = histogram->hash_table;
+ uint8_t *current, *end_stream, *next_hash, *end;
+ uint32_t match_length;
+ uint32_t dist;
+ uint64_t *lit_len_histogram = histogram->lit_len_histogram;
+ uint64_t *dist_histogram = histogram->dist_histogram;
+
+ if (length <= 0)
+ return;
+
+ end_stream = start_stream + length;
+ memset(last_seen, 0, sizeof(histogram->hash_table)); /* Initialize last_seen to be 0. */
+ for (current = start_stream; current < end_stream - 3; current++) {
+ literal = *(uint32_t *) current;
+ hash = compute_hash(literal) & HASH_MASK;
+ seen = last_seen[hash];
+ last_seen[hash] = (current - start_stream) & 0xFFFF;
+ dist = (current - start_stream - seen) & 0xFFFF;
+ if (dist - 1 < D - 1) {
+ assert(start_stream <= current - dist);
+ match_length =
+ compare258(current - dist, current, end_stream - current);
+ if (match_length >= SHORTEST_MATCH) {
+ next_hash = current;
+#ifdef ISAL_LIMIT_HASH_UPDATE
+ end = next_hash + 3;
+#else
+ end = next_hash + match_length;
+#endif
+ if (end > end_stream - 3)
+ end = end_stream - 3;
+ next_hash++;
+ for (; next_hash < end; next_hash++) {
+ literal = *(uint32_t *) next_hash;
+ hash = compute_hash(literal) & HASH_MASK;
+ last_seen[hash] = (next_hash - start_stream) & 0xFFFF;
+ }
+
+ dist_histogram[convert_dist_to_dist_sym(dist)] += 1;
+ lit_len_histogram[convert_length_to_len_sym(match_length)] +=
+ 1;
+ current += match_length - 1;
+ continue;
+ }
+ }
+ lit_len_histogram[literal & 0xFF] += 1;
+ }
+ literal = literal >> 8;
+ hash = compute_hash(literal) & HASH_MASK;
+ seen = last_seen[hash];
+ last_seen[hash] = (current - start_stream) & 0xFFFF;
+ dist = (current - start_stream - seen) & 0xFFFF;
+ if (dist < D) {
+ match_length = compare258(current - dist, current, end_stream - current);
+ if (match_length >= SHORTEST_MATCH) {
+ dist_histogram[convert_dist_to_dist_sym(dist)] += 1;
+ lit_len_histogram[convert_length_to_len_sym(match_length)] += 1;
+ lit_len_histogram[256] += 1;
+ return;
+ }
+ } else
+ lit_len_histogram[literal & 0xFF] += 1;
+ lit_len_histogram[(literal >> 8) & 0xFF] += 1;
+ lit_len_histogram[(literal >> 16) & 0xFF] += 1;
+ lit_len_histogram[256] += 1;
+ return;
+}
+
+uint32_t convert_dist_to_dist_sym(uint32_t dist)
+{
+ assert(dist <= 32768 && dist > 0);
+ if (dist <= 2)
+ return dist - 1;
+ else if (dist <= 4)
+ return 0 + (dist - 1) / 1;
+ else if (dist <= 8)
+ return 2 + (dist - 1) / 2;
+ else if (dist <= 16)
+ return 4 + (dist - 1) / 4;
+ else if (dist <= 32)
+ return 6 + (dist - 1) / 8;
+ else if (dist <= 64)
+ return 8 + (dist - 1) / 16;
+ else if (dist <= 128)
+ return 10 + (dist - 1) / 32;
+ else if (dist <= 256)
+ return 12 + (dist - 1) / 64;
+ else if (dist <= 512)
+ return 14 + (dist - 1) / 128;
+ else if (dist <= 1024)
+ return 16 + (dist - 1) / 256;
+ else if (dist <= 2048)
+ return 18 + (dist - 1) / 512;
+ else if (dist <= 4096)
+ return 20 + (dist - 1) / 1024;
+ else if (dist <= 8192)
+ return 22 + (dist - 1) / 2048;
+ else if (dist <= 16384)
+ return 24 + (dist - 1) / 4096;
+ else if (dist <= 32768)
+ return 26 + (dist - 1) / 8192;
+ else
+ return ~0; /* ~0 is an invalid distance code */
+
+}
+
+uint32_t convert_length_to_len_sym(uint32_t length)
+{
+ assert(length > 2 && length < 259);
+
+ /* Based on tables on page 11 in RFC 1951 */
+ if (length < 11)
+ return 257 + length - 3;
+ else if (length < 19)
+ return 261 + (length - 3) / 2;
+ else if (length < 35)
+ return 265 + (length - 3) / 4;
+ else if (length < 67)
+ return 269 + (length - 3) / 8;
+ else if (length < 131)
+ return 273 + (length - 3) / 16;
+ else if (length < 258)
+ return 277 + (length - 3) / 32;
+ else
+ return 285;
+}
+
+// Upon return, codes[] contains the code lengths,
+// and bl_count is the count of the lengths
+
+/* Init heap with the histogram, and return the histogram size */
+static inline uint32_t init_heap32(struct heap_tree *heap_space, uint32_t * histogram,
+ uint32_t hist_size)
+{
+ uint32_t heap_size, i;
+
+ memset(heap_space, 0, sizeof(struct heap_tree));
+
+ heap_size = 0;
+ for (i = 0; i < hist_size; i++) {
+ if (histogram[i] != 0)
+ heap_space->heap[++heap_size] =
+ (((uint64_t) histogram[i]) << FREQ_SHIFT) | i;
+ }
+
+ // make sure heap has at least two elements in it
+ if (heap_size < 2) {
+ if (heap_size == 0) {
+ heap_space->heap[1] = 1ULL << FREQ_SHIFT;
+ heap_space->heap[2] = (1ULL << FREQ_SHIFT) | 1;
+ heap_size = 2;
+ } else {
+ // heap size == 1
+ if (histogram[0] == 0)
+ heap_space->heap[2] = 1ULL << FREQ_SHIFT;
+ else
+ heap_space->heap[2] = (1ULL << FREQ_SHIFT) | 1;
+ heap_size = 2;
+ }
+ }
+
+ build_heap(heap_space->heap, heap_size);
+
+ return heap_size;
+}
+
+static inline uint32_t init_heap64(struct heap_tree *heap_space, uint64_t * histogram,
+ uint64_t hist_size)
+{
+ uint32_t heap_size, i;
+
+ memset(heap_space, 0, sizeof(struct heap_tree));
+
+ heap_size = 0;
+ for (i = 0; i < hist_size; i++) {
+ if (histogram[i] != 0)
+ heap_space->heap[++heap_size] = ((histogram[i]) << FREQ_SHIFT) | i;
+ }
+
+ // make sure heap has at least two elements in it
+ if (heap_size < 2) {
+ if (heap_size == 0) {
+ heap_space->heap[1] = 1ULL << FREQ_SHIFT;
+ heap_space->heap[2] = (1ULL << FREQ_SHIFT) | 1;
+ heap_size = 2;
+ } else {
+ // heap size == 1
+ if (histogram[0] == 0)
+ heap_space->heap[2] = 1ULL << FREQ_SHIFT;
+ else
+ heap_space->heap[2] = (1ULL << FREQ_SHIFT) | 1;
+ heap_size = 2;
+ }
+ }
+
+ build_heap(heap_space->heap, heap_size);
+
+ return heap_size;
+}
+
+static inline uint32_t init_heap64_complete(struct heap_tree *heap_space, uint64_t * histogram,
+ uint64_t hist_size)
+{
+ uint32_t heap_size, i;
+
+ memset(heap_space, 0, sizeof(struct heap_tree));
+
+ heap_size = 0;
+ for (i = 0; i < hist_size; i++)
+ heap_space->heap[++heap_size] = ((histogram[i]) << FREQ_SHIFT) | i;
+
+ build_heap(heap_space->heap, heap_size);
+
+ return heap_size;
+}
+
+static inline uint32_t fix_code_lens(struct heap_tree *heap_space, uint32_t root_node,
+ uint32_t * bl_count, uint32_t max_code_len)
+{
+ struct tree_node *tree = heap_space->tree;
+ uint64_t *code_len_count = heap_space->code_len_count;
+ uint32_t i, j, k, child, depth, code_len;
+
+ // compute code lengths and code length counts
+ code_len = 0;
+ j = root_node;
+ for (i = root_node; i <= HEAP_TREE_NODE_START; i++) {
+ child = tree[i].child;
+ if (child > MAX_HISTHEAP_SIZE) {
+ depth = 1 + tree[i].depth;
+
+ tree[child].depth = depth;
+ tree[child - 1].depth = depth;
+ } else {
+ tree[j++] = tree[i];
+ depth = tree[i].depth;
+ while (code_len < depth) {
+ code_len++;
+ code_len_count[code_len] = 0;
+ }
+ code_len_count[depth]++;
+ }
+ }
+
+ if (code_len > max_code_len) {
+ while (code_len > max_code_len) {
+ assert(code_len_count[code_len] > 1);
+ for (i = max_code_len - 1; i != 0; i--)
+ if (code_len_count[i] != 0)
+ break;
+ assert(i != 0);
+ code_len_count[i]--;
+ code_len_count[i + 1] += 2;
+ code_len_count[code_len - 1]++;
+ code_len_count[code_len] -= 2;
+ if (code_len_count[code_len] == 0)
+ code_len--;
+ }
+
+ for (i = 1; i <= code_len; i++)
+ bl_count[i] = code_len_count[i];
+ for (; i <= max_code_len; i++)
+ bl_count[i] = 0;
+
+ for (k = 1; code_len_count[k] == 0; k++) ;
+ for (i = root_node; i < j; i++) {
+ tree[i].depth = k;
+ code_len_count[k]--;
+ for (; code_len_count[k] == 0; k++) ;
+ }
+ } else {
+ for (i = 1; i <= code_len; i++)
+ bl_count[i] = code_len_count[i];
+ for (; i <= max_code_len; i++)
+ bl_count[i] = 0;
+ }
+
+ return j;
+
+}
+
+static inline void
+gen_huff_code_lens(struct heap_tree *heap_space, uint32_t heap_size, uint32_t * bl_count,
+ struct huff_code *codes, uint32_t codes_count, uint32_t max_code_len)
+{
+ struct tree_node *tree = heap_space->tree;
+ uint32_t root_node = HEAP_TREE_NODE_START, node_ptr;
+ uint32_t end_node;
+
+ root_node = build_huff_tree(heap_space, heap_size, root_node);
+
+ end_node = fix_code_lens(heap_space, root_node, bl_count, max_code_len);
+
+ memset(codes, 0, codes_count * sizeof(*codes));
+ for (node_ptr = root_node; node_ptr < end_node; node_ptr++)
+ codes[tree[node_ptr].child].length = tree[node_ptr].depth;
+
+}
+
+inline uint32_t set_huff_codes(struct huff_code *huff_code_table, int table_length,
+ uint32_t * count)
+{
+ /* Uses the algorithm mentioned in the deflate standard, Rfc 1951. */
+ int i;
+ uint16_t code = 0;
+ uint16_t next_code[MAX_HUFF_TREE_DEPTH + 1];
+ uint32_t max_code = 0;
+
+ next_code[0] = code;
+
+ for (i = 1; i < MAX_HUFF_TREE_DEPTH + 1; i++)
+ next_code[i] = (next_code[i - 1] + count[i - 1]) << 1;
+
+ for (i = 0; i < table_length; i++) {
+ if (huff_code_table[i].length != 0) {
+ huff_code_table[i].code =
+ bit_reverse(next_code[huff_code_table[i].length],
+ huff_code_table[i].length);
+ next_code[huff_code_table[i].length] += 1;
+ max_code = i;
+ }
+ }
+
+ return max_code;
+}
+
+// on input, codes contain the code lengths
+// on output, code contains:
+// 23:16 code length
+// 15:0 code value in low order bits
+// returns max code value
+static inline uint32_t set_dist_huff_codes(struct huff_code *codes, uint32_t * bl_count)
+{
+ uint32_t code, code_len, bits, i;
+ uint32_t next_code[MAX_DEFLATE_CODE_LEN + 1];
+ uint32_t max_code = 0;
+ const uint32_t num_codes = DIST_LEN;
+
+ code = bl_count[0] = 0;
+ for (bits = 1; bits <= MAX_HUFF_TREE_DEPTH; bits++) {
+ code = (code + bl_count[bits - 1]) << 1;
+ next_code[bits] = code;
+ }
+ for (i = 0; i < num_codes; i++) {
+ code_len = codes[i].length;
+ if (code_len != 0) {
+ codes[i].code = bit_reverse(next_code[code_len], code_len);
+ codes[i].extra_bit_count = dist_code_extra_bits[i];
+ next_code[code_len] += 1;
+ max_code = i;
+ }
+ }
+ return max_code;
+}
+
+int create_huffman_header(struct BitBuf2 *header_bitbuf,
+ struct huff_code *lookup_table,
+ struct rl_code *huffman_rep,
+ uint16_t huffman_rep_length, uint32_t end_of_block,
+ uint32_t hclen, uint32_t hlit, uint32_t hdist)
+{
+ /* hlit, hdist, hclen are as defined in the deflate standard, head is the
+ * first three deflate header bits.*/
+ int i;
+ uint64_t bit_count;
+ uint64_t data;
+ struct huff_code huffman_value;
+ const uint32_t extra_bits[3] = { 2, 3, 7 };
+
+ bit_count = buffer_bits_used(header_bitbuf);
+
+ data = (end_of_block ? 5 : 4) | (hlit << 3) | (hdist << 8) | (hclen << 13);
+ data |= ((lookup_table[code_length_code_order[0]].length) << DYN_HDR_START_LEN);
+ write_bits(header_bitbuf, data, DYN_HDR_START_LEN + 3);
+ data = 0;
+ for (i = hclen + 3; i >= 1; i--)
+ data = (data << 3) | lookup_table[code_length_code_order[i]].length;
+
+ write_bits(header_bitbuf, data, (hclen + 3) * 3);
+
+ for (i = 0; i < huffman_rep_length; i++) {
+ huffman_value = lookup_table[huffman_rep[i].code];
+
+ write_bits(header_bitbuf, (uint64_t) huffman_value.code,
+ (uint32_t) huffman_value.length);
+
+ if (huffman_rep[i].code > 15) {
+ write_bits(header_bitbuf, (uint64_t) huffman_rep[i].extra_bits,
+ (uint32_t) extra_bits[huffman_rep[i].code - 16]);
+ }
+ }
+ bit_count = buffer_bits_used(header_bitbuf) - bit_count;
+
+ return bit_count;
+}
+
+inline int create_header(struct BitBuf2 *header_bitbuf, struct rl_code *huffman_rep,
+ uint32_t length, uint64_t * histogram, uint32_t hlit,
+ uint32_t hdist, uint32_t end_of_block)
+{
+ int i;
+
+ uint32_t heap_size;
+ struct heap_tree heap_space;
+ uint32_t code_len_count[MAX_HUFF_TREE_DEPTH + 1];
+ struct huff_code lookup_table[HUFF_LEN];
+
+ /* hlit, hdist, and hclen are defined in RFC 1951 page 13 */
+ uint32_t hclen;
+ uint64_t bit_count;
+
+ /* Create a huffman tree to encode run length encoded representation. */
+ heap_size = init_heap64(&heap_space, histogram, HUFF_LEN);
+ gen_huff_code_lens(&heap_space, heap_size, code_len_count,
+ (struct huff_code *)lookup_table, HUFF_LEN, 7);
+ set_huff_codes(lookup_table, HUFF_LEN, code_len_count);
+
+ /* Calculate hclen */
+ for (i = CODE_LEN_CODES - 1; i > 3; i--) /* i must be at least 4 */
+ if (lookup_table[code_length_code_order[i]].length != 0)
+ break;
+
+ hclen = i - 3;
+
+ /* Generate actual header. */
+ bit_count = create_huffman_header(header_bitbuf, lookup_table, huffman_rep,
+ length, end_of_block, hclen, hlit, hdist);
+
+ return bit_count;
+}
+
+static inline
+ struct rl_code *write_rl(struct rl_code *pout, uint16_t last_len, uint32_t run_len,
+ uint64_t * counts)
+{
+ if (last_len == 0) {
+ while (run_len > 138) {
+ pout->code = 18;
+ pout->extra_bits = 138 - 11;
+ pout++;
+ run_len -= 138;
+ counts[18]++;
+ }
+ // 1 <= run_len <= 138
+ if (run_len > 10) {
+ pout->code = 18;
+ pout->extra_bits = run_len - 11;
+ pout++;
+ counts[18]++;
+ } else if (run_len > 2) {
+ pout->code = 17;
+ pout->extra_bits = run_len - 3;
+ pout++;
+ counts[17]++;
+ } else if (run_len == 1) {
+ pout->code = 0;
+ pout->extra_bits = 0;
+ pout++;
+ counts[0]++;
+ } else {
+ assert(run_len == 2);
+ pout[0].code = 0;
+ pout[0].extra_bits = 0;
+ pout[1].code = 0;
+ pout[1].extra_bits = 0;
+ pout += 2;
+ counts[0] += 2;
+ }
+ } else {
+ // last_len != 0
+ pout->code = last_len;
+ pout->extra_bits = 0;
+ pout++;
+ counts[last_len]++;
+ run_len--;
+ if (run_len != 0) {
+ while (run_len > 6) {
+ pout->code = 16;
+ pout->extra_bits = 6 - 3;
+ pout++;
+ run_len -= 6;
+ counts[16]++;
+ }
+ // 1 <= run_len <= 6
+ switch (run_len) {
+ case 1:
+ pout->code = last_len;
+ pout->extra_bits = 0;
+ pout++;
+ counts[last_len]++;
+ break;
+ case 2:
+ pout[0].code = last_len;
+ pout[0].extra_bits = 0;
+ pout[1].code = last_len;
+ pout[1].extra_bits = 0;
+ pout += 2;
+ counts[last_len] += 2;
+ break;
+ default: // 3...6
+ pout->code = 16;
+ pout->extra_bits = run_len - 3;
+ pout++;
+ counts[16]++;
+ }
+ }
+ }
+ return pout;
+}
+
+// convert codes into run-length symbols, write symbols into OUT
+// generate histogram into COUNTS (assumed to be initialized to 0)
+// Format of OUT:
+// 4:0 code (0...18)
+// 15:8 Extra bits (0...127)
+// returns number of symbols in out
+static inline uint32_t rl_encode(uint16_t * codes, uint32_t num_codes, uint64_t * counts,
+ struct rl_code *out)
+{
+ uint32_t i, run_len;
+ uint16_t last_len, len;
+ struct rl_code *pout;
+
+ pout = out;
+ last_len = codes[0];
+ run_len = 1;
+ for (i = 1; i < num_codes; i++) {
+ len = codes[i];
+ if (len == last_len) {
+ run_len++;
+ continue;
+ }
+ pout = write_rl(pout, last_len, run_len, counts);
+ last_len = len;
+ run_len = 1;
+ }
+ pout = write_rl(pout, last_len, run_len, counts);
+
+ return (uint32_t) (pout - out);
+}
+
+void create_code_tables(uint16_t * code_table, uint8_t * code_length_table, uint32_t length,
+ struct huff_code *hufftable)
+{
+ int i;
+ for (i = 0; i < length; i++) {
+ code_table[i] = hufftable[i].code;
+ code_length_table[i] = hufftable[i].length;
+ }
+}
+
+void create_packed_len_table(uint32_t * packed_table, struct huff_code *lit_len_hufftable)
+{
+ int i, count = 0;
+ uint16_t extra_bits;
+ uint16_t extra_bits_count = 0;
+
+ /* Gain extra bits is the next place where the number of extra bits in
+ * lenght codes increases. */
+ uint16_t gain_extra_bits = LEN_EXTRA_BITS_START;
+
+ for (i = 257; i < LIT_LEN - 1; i++) {
+ for (extra_bits = 0; extra_bits < (1 << extra_bits_count); extra_bits++) {
+ if (count > 254)
+ break;
+ packed_table[count++] =
+ (extra_bits << (lit_len_hufftable[i].length + LENGTH_BITS)) |
+ (lit_len_hufftable[i].code << LENGTH_BITS) |
+ (lit_len_hufftable[i].length + extra_bits_count);
+ }
+
+ if (i == gain_extra_bits) {
+ gain_extra_bits += LEN_EXTRA_BITS_INTERVAL;
+ extra_bits_count += 1;
+ }
+ }
+
+ packed_table[count] = (lit_len_hufftable[LIT_LEN - 1].code << LENGTH_BITS) |
+ (lit_len_hufftable[LIT_LEN - 1].length);
+}
+
+void create_packed_dist_table(uint32_t * packed_table, uint32_t length,
+ struct huff_code *dist_hufftable)
+{
+ int i, count = 0;
+ uint16_t extra_bits;
+ uint16_t extra_bits_count = 0;
+
+ /* Gain extra bits is the next place where the number of extra bits in
+ * distance codes increases. */
+ uint16_t gain_extra_bits = DIST_EXTRA_BITS_START;
+
+ for (i = 0; i < DIST_LEN; i++) {
+ for (extra_bits = 0; extra_bits < (1 << extra_bits_count); extra_bits++) {
+ if (count >= length)
+ return;
+
+ packed_table[count++] =
+ (extra_bits << (dist_hufftable[i].length + LENGTH_BITS)) |
+ (dist_hufftable[i].code << LENGTH_BITS) |
+ (dist_hufftable[i].length + extra_bits_count);
+
+ }
+
+ if (i == gain_extra_bits) {
+ gain_extra_bits += DIST_EXTRA_BITS_INTERVAL;
+ extra_bits_count += 1;
+ }
+ }
+}
+
+int are_hufftables_useable(struct huff_code *lit_len_hufftable,
+ struct huff_code *dist_hufftable)
+{
+ int max_lit_code_len = 0, max_len_code_len = 0, max_dist_code_len = 0;
+ int dist_extra_bits = 0, len_extra_bits = 0;
+ int gain_dist_extra_bits = DIST_EXTRA_BITS_START;
+ int gain_len_extra_bits = LEN_EXTRA_BITS_START;
+ int max_code_len;
+ int i;
+
+ for (i = 0; i < LIT_LEN; i++)
+ if (lit_len_hufftable[i].length > max_lit_code_len)
+ max_lit_code_len = lit_len_hufftable[i].length;
+
+ for (i = 257; i < LIT_LEN - 1; i++) {
+ if (lit_len_hufftable[i].length + len_extra_bits > max_len_code_len)
+ max_len_code_len = lit_len_hufftable[i].length + len_extra_bits;
+
+ if (i == gain_len_extra_bits) {
+ gain_len_extra_bits += LEN_EXTRA_BITS_INTERVAL;
+ len_extra_bits += 1;
+ }
+ }
+
+ for (i = 0; i < DIST_LEN; i++) {
+ if (dist_hufftable[i].length + dist_extra_bits > max_dist_code_len)
+ max_dist_code_len = dist_hufftable[i].length + dist_extra_bits;
+
+ if (i == gain_dist_extra_bits) {
+ gain_dist_extra_bits += DIST_EXTRA_BITS_INTERVAL;
+ dist_extra_bits += 1;
+ }
+ }
+
+ max_code_len = max_lit_code_len + max_len_code_len + max_dist_code_len;
+
+ /* Some versions of igzip can write upto one literal, one length and one
+ * distance code at the same time. This checks to make sure that is
+ * always writeable in bitbuf*/
+ return (max_code_len > MAX_BITBUF_BIT_WRITE);
+}
+
+int isal_create_hufftables(struct isal_hufftables *hufftables,
+ struct isal_huff_histogram *histogram)
+{
+ struct huff_code lit_huff_table[LIT_LEN], dist_huff_table[DIST_LEN];
+ uint64_t bit_count;
+ int max_dist = convert_dist_to_dist_sym(IGZIP_HIST_SIZE);
+ struct heap_tree heap_space;
+ uint32_t heap_size;
+ uint32_t code_len_count[MAX_HUFF_TREE_DEPTH + 1];
+ struct BitBuf2 header_bitbuf;
+ uint32_t max_lit_len_sym;
+ uint32_t max_dist_sym;
+ uint32_t hlit, hdist, i;
+ uint16_t combined_table[LIT_LEN + DIST_LEN];
+ uint64_t count_histogram[HUFF_LEN];
+ struct rl_code rl_huff[LIT_LEN + DIST_LEN];
+ uint32_t rl_huff_len;
+
+ uint32_t *dist_table = hufftables->dist_table;
+ uint32_t *len_table = hufftables->len_table;
+ uint16_t *lit_table = hufftables->lit_table;
+ uint16_t *dcodes = hufftables->dcodes;
+ uint8_t *lit_table_sizes = hufftables->lit_table_sizes;
+ uint8_t *dcodes_sizes = hufftables->dcodes_sizes;
+ uint8_t *deflate_hdr = hufftables->deflate_hdr;
+ uint64_t *lit_len_histogram = histogram->lit_len_histogram;
+ uint64_t *dist_histogram = histogram->dist_histogram;
+
+ memset(hufftables, 0, sizeof(struct isal_hufftables));
+
+ heap_size = init_heap64_complete(&heap_space, lit_len_histogram, LIT_LEN);
+ gen_huff_code_lens(&heap_space, heap_size, code_len_count,
+ (struct huff_code *)lit_huff_table, LIT_LEN, MAX_DEFLATE_CODE_LEN);
+ max_lit_len_sym = set_huff_codes(lit_huff_table, LIT_LEN, code_len_count);
+
+ heap_size = init_heap64_complete(&heap_space, dist_histogram, DIST_LEN);
+ gen_huff_code_lens(&heap_space, heap_size, code_len_count,
+ (struct huff_code *)dist_huff_table, max_dist,
+ MAX_DEFLATE_CODE_LEN);
+ max_dist_sym = set_huff_codes(dist_huff_table, DIST_LEN, code_len_count);
+
+ if (are_hufftables_useable(lit_huff_table, dist_huff_table)) {
+ heap_size = init_heap64_complete(&heap_space, lit_len_histogram, LIT_LEN);
+ gen_huff_code_lens(&heap_space, heap_size, code_len_count,
+ (struct huff_code *)lit_huff_table, LIT_LEN,
+ MAX_SAFE_LIT_CODE_LEN);
+ max_lit_len_sym = set_huff_codes(lit_huff_table, LIT_LEN, code_len_count);
+
+ heap_size = init_heap64_complete(&heap_space, dist_histogram, DIST_LEN);
+ gen_huff_code_lens(&heap_space, heap_size, code_len_count,
+ (struct huff_code *)dist_huff_table, max_dist,
+ MAX_SAFE_DIST_CODE_LEN);
+ max_dist_sym = set_huff_codes(dist_huff_table, DIST_LEN, code_len_count);
+
+ }
+
+ create_code_tables(dcodes, dcodes_sizes, DIST_LEN - DCODE_OFFSET,
+ dist_huff_table + DCODE_OFFSET);
+
+ create_code_tables(lit_table, lit_table_sizes, IGZIP_LIT_TABLE_SIZE, lit_huff_table);
+
+ create_packed_len_table(len_table, lit_huff_table);
+ create_packed_dist_table(dist_table, IGZIP_DIST_TABLE_SIZE, dist_huff_table);
+
+ set_buf(&header_bitbuf, deflate_hdr, sizeof(deflate_hdr));
+ init(&header_bitbuf);
+
+ hlit = max_lit_len_sym - 256;
+ hdist = max_dist_sym;
+
+ /* Run length encode the length and distance huffman codes */
+ memset(count_histogram, 0, sizeof(count_histogram));
+ for (i = 0; i < 257 + hlit; i++)
+ combined_table[i] = lit_huff_table[i].length;
+ for (i = 0; i < 1 + hdist; i++)
+ combined_table[i + hlit + 257] = dist_huff_table[i].length;
+ rl_huff_len =
+ rl_encode(combined_table, hlit + 257 + hdist + 1, count_histogram, rl_huff);
+
+ /* Create header */
+ bit_count =
+ create_header(&header_bitbuf, rl_huff, rl_huff_len,
+ count_histogram, hlit, hdist, LAST_BLOCK);
+ flush(&header_bitbuf);
+
+ hufftables->deflate_hdr_count = bit_count / 8;
+ hufftables->deflate_hdr_extra_bits = bit_count % 8;
+
+ return 0;
+}
+
+int isal_create_hufftables_subset(struct isal_hufftables *hufftables,
+ struct isal_huff_histogram *histogram)
+{
+ struct huff_code lit_huff_table[LIT_LEN], dist_huff_table[DIST_LEN];
+ uint64_t bit_count;
+ int max_dist = convert_dist_to_dist_sym(IGZIP_HIST_SIZE);
+ struct heap_tree heap_space;
+ uint32_t heap_size;
+ uint32_t code_len_count[MAX_HUFF_TREE_DEPTH + 1];
+ struct BitBuf2 header_bitbuf;
+ uint32_t max_lit_len_sym;
+ uint32_t max_dist_sym;
+ uint32_t hlit, hdist, i;
+ uint16_t combined_table[LIT_LEN + DIST_LEN];
+ uint64_t count_histogram[HUFF_LEN];
+ struct rl_code rl_huff[LIT_LEN + DIST_LEN];
+ uint32_t rl_huff_len;
+
+ uint32_t *dist_table = hufftables->dist_table;
+ uint32_t *len_table = hufftables->len_table;
+ uint16_t *lit_table = hufftables->lit_table;
+ uint16_t *dcodes = hufftables->dcodes;
+ uint8_t *lit_table_sizes = hufftables->lit_table_sizes;
+ uint8_t *dcodes_sizes = hufftables->dcodes_sizes;
+ uint8_t *deflate_hdr = hufftables->deflate_hdr;
+ uint64_t *lit_len_histogram = histogram->lit_len_histogram;
+ uint64_t *dist_histogram = histogram->dist_histogram;
+
+ memset(hufftables, 0, sizeof(struct isal_hufftables));
+
+ heap_size = init_heap64(&heap_space, lit_len_histogram, LIT_LEN);
+ gen_huff_code_lens(&heap_space, heap_size, code_len_count,
+ (struct huff_code *)lit_huff_table, LIT_LEN, MAX_DEFLATE_CODE_LEN);
+ max_lit_len_sym = set_huff_codes(lit_huff_table, LIT_LEN, code_len_count);
+
+ heap_size = init_heap64_complete(&heap_space, dist_histogram, DIST_LEN);
+ gen_huff_code_lens(&heap_space, heap_size, code_len_count,
+ (struct huff_code *)dist_huff_table, max_dist,
+ MAX_DEFLATE_CODE_LEN);
+ max_dist_sym = set_huff_codes(dist_huff_table, DIST_LEN, code_len_count);
+
+ if (are_hufftables_useable(lit_huff_table, dist_huff_table)) {
+ heap_size = init_heap64_complete(&heap_space, lit_len_histogram, LIT_LEN);
+ gen_huff_code_lens(&heap_space, heap_size, code_len_count,
+ (struct huff_code *)lit_huff_table, LIT_LEN,
+ MAX_SAFE_LIT_CODE_LEN);
+ max_lit_len_sym = set_huff_codes(lit_huff_table, LIT_LEN, code_len_count);
+
+ heap_size = init_heap64_complete(&heap_space, dist_histogram, DIST_LEN);
+ gen_huff_code_lens(&heap_space, heap_size, code_len_count,
+ (struct huff_code *)dist_huff_table, max_dist,
+ MAX_SAFE_DIST_CODE_LEN);
+ max_dist_sym = set_huff_codes(dist_huff_table, DIST_LEN, code_len_count);
+
+ }
+
+ create_code_tables(dcodes, dcodes_sizes, DIST_LEN - DCODE_OFFSET,
+ dist_huff_table + DCODE_OFFSET);
+
+ create_code_tables(lit_table, lit_table_sizes, IGZIP_LIT_TABLE_SIZE, lit_huff_table);
+
+ create_packed_len_table(len_table, lit_huff_table);
+ create_packed_dist_table(dist_table, IGZIP_DIST_TABLE_SIZE, dist_huff_table);
+
+ set_buf(&header_bitbuf, deflate_hdr, sizeof(deflate_hdr));
+ init(&header_bitbuf);
+
+ hlit = max_lit_len_sym - 256;
+ hdist = max_dist_sym;
+
+ /* Run length encode the length and distance huffman codes */
+ memset(count_histogram, 0, sizeof(count_histogram));
+ for (i = 0; i < 257 + hlit; i++)
+ combined_table[i] = lit_huff_table[i].length;
+ for (i = 0; i < 1 + hdist; i++)
+ combined_table[i + hlit + 257] = dist_huff_table[i].length;
+ rl_huff_len =
+ rl_encode(combined_table, hlit + 257 + hdist + 1, count_histogram, rl_huff);
+
+ /* Create header */
+ bit_count =
+ create_header(&header_bitbuf, rl_huff, rl_huff_len,
+ count_histogram, hlit, hdist, LAST_BLOCK);
+ flush(&header_bitbuf);
+
+ hufftables->deflate_hdr_count = bit_count / 8;
+ hufftables->deflate_hdr_extra_bits = bit_count % 8;
+
+ return 0;
+}
+
+void expand_hufftables_icf(struct hufftables_icf *hufftables)
+{
+ uint32_t i, eb, j, k, len, code;
+ struct huff_code orig[21], *p_code;
+ struct huff_code *lit_len_codes = hufftables->lit_len_table;
+ struct huff_code *dist_codes = hufftables->dist_table;
+
+ for (i = 0; i < 21; i++)
+ orig[i] = lit_len_codes[i + 265];
+
+ p_code = &lit_len_codes[265];
+
+ i = 0;
+ for (eb = 1; eb < 6; eb++) {
+ for (k = 0; k < 4; k++) {
+ len = orig[i].length;
+ code = orig[i++].code;
+ for (j = 0; j < (1u << eb); j++) {
+ p_code->code_and_extra = code | (j << len);
+ p_code->length = len + eb;
+ p_code++;
+ }
+ } // end for k
+ } // end for eb
+ // fix up last record
+ p_code[-1] = orig[i];
+
+ dist_codes[DIST_LEN].code_and_extra = 0;
+ dist_codes[DIST_LEN].length = 0;
+}
+
+void
+create_hufftables_icf(struct BitBuf2 *bb, struct hufftables_icf *hufftables,
+ struct isal_mod_hist *hist, uint32_t end_of_block)
+{
+ uint32_t bl_count[MAX_DEFLATE_CODE_LEN + 1];
+ uint32_t max_ll_code, max_d_code;
+ struct heap_tree heap_space;
+ uint32_t heap_size;
+ struct rl_code cl_tokens[LIT_LEN + DIST_LEN];
+ uint32_t num_cl_tokens;
+ uint64_t cl_counts[CODE_LEN_CODES];
+ uint16_t combined_table[LIT_LEN + DIST_LEN];
+ int i;
+ uint64_t compressed_len = 0;
+ uint64_t static_compressed_len = 3; /* The static header size */
+ struct BitBuf2 bb_tmp;
+
+ struct huff_code *ll_codes = hufftables->lit_len_table;
+ struct huff_code *d_codes = hufftables->dist_table;
+ uint32_t *ll_hist = hist->ll_hist;
+ uint32_t *d_hist = hist->d_hist;
+ struct huff_code *static_ll_codes = static_hufftables.lit_len_table;
+ struct huff_code *static_d_codes = static_hufftables.dist_table;
+
+ memcpy(&bb_tmp, bb, sizeof(struct BitBuf2));
+
+ flatten_ll(hist->ll_hist);
+
+ // make sure EOB is present
+ if (ll_hist[256] == 0)
+ ll_hist[256] = 1;
+
+ heap_size = init_heap32(&heap_space, ll_hist, LIT_LEN);
+ gen_huff_code_lens(&heap_space, heap_size, bl_count,
+ ll_codes, LIT_LEN, MAX_DEFLATE_CODE_LEN);
+ max_ll_code = set_huff_codes(ll_codes, LIT_LEN, bl_count);
+
+ heap_size = init_heap32(&heap_space, d_hist, DIST_LEN);
+ gen_huff_code_lens(&heap_space, heap_size, bl_count, d_codes,
+ DIST_LEN, MAX_DEFLATE_CODE_LEN);
+ max_d_code = set_dist_huff_codes(d_codes, bl_count);
+
+ assert(max_ll_code >= 256); // must be EOB code
+ assert(max_d_code != 0);
+
+ /* Run length encode the length and distance huffman codes */
+ memset(cl_counts, 0, sizeof(cl_counts));
+
+ for (i = 0; i <= 256; i++) {
+ combined_table[i] = ll_codes[i].length;
+ compressed_len += ll_codes[i].length * ll_hist[i];
+ static_compressed_len += static_ll_codes[i].length * ll_hist[i];
+ }
+
+ for (; i < max_ll_code + 1; i++) {
+ combined_table[i] = ll_codes[i].length;
+ compressed_len +=
+ (ll_codes[i].length + len_code_extra_bits[i - 257]) * ll_hist[i];
+ static_compressed_len +=
+ (static_ll_codes[i].length + len_code_extra_bits[i - 257]) * ll_hist[i];
+ }
+
+ for (i = 0; i < max_d_code + 1; i++) {
+ combined_table[i + max_ll_code + 1] = d_codes[i].length;
+ compressed_len += (d_codes[i].length + dist_code_extra_bits[i]) * d_hist[i];
+ static_compressed_len +=
+ (static_d_codes[i].length + dist_code_extra_bits[i]) * d_hist[i];
+ }
+
+ expand_hufftables_icf(hufftables);
+
+ num_cl_tokens =
+ rl_encode(combined_table, max_ll_code + max_d_code + 2, cl_counts, cl_tokens);
+
+ /* Create header */
+ create_header(bb, cl_tokens, num_cl_tokens, cl_counts, max_ll_code - 256, max_d_code,
+ end_of_block);
+ compressed_len += 8 * buffer_used(bb) + bb->m_bit_count;
+
+ if (static_compressed_len < compressed_len) {
+ memcpy(hufftables, &static_hufftables, sizeof(struct hufftables_icf));
+ expand_hufftables_icf(hufftables);
+ memcpy(bb, &bb_tmp, sizeof(struct BitBuf2));
+ end_of_block = end_of_block ? 1 : 0;
+ write_bits(bb, 0x2 | end_of_block, 3);
+ }
+}