summaryrefslogtreecommitdiffstats
path: root/epan/tvbuff_lz77.c
diff options
context:
space:
mode:
Diffstat (limited to '')
-rw-r--r--epan/tvbuff_lz77.c157
1 files changed, 157 insertions, 0 deletions
diff --git a/epan/tvbuff_lz77.c b/epan/tvbuff_lz77.c
new file mode 100644
index 00000000..08e711ca
--- /dev/null
+++ b/epan/tvbuff_lz77.c
@@ -0,0 +1,157 @@
+/*
+ * Decompression code for Plain LZ77. This encoding is used by
+ * Microsoft in various file formats and protocols including SMB3.
+ *
+ * See MS-XCA.
+ *
+ * Copyright (C) 2019 Aurélien Aptel
+ *
+ * SPDX-License-Identifier: GPL-2.0-or-later
+ */
+
+#include <glib.h>
+#include <epan/exceptions.h>
+#include <epan/tvbuff.h>
+#include <epan/wmem_scopes.h>
+
+#define MAX_INPUT_SIZE (16*1024*1024) /* 16MB */
+
+static gboolean do_uncompress(tvbuff_t *tvb, int offset, int in_size,
+ wmem_array_t *obuf)
+{
+ guint buf_flags = 0, buf_flag_count = 0;
+ int in_off = 0;
+ int last_length_half_byte = 0;
+ guint match_bytes, match_len, match_off;
+ guint i;
+
+ if (!tvb)
+ return FALSE;
+
+ if (!in_size || in_size > MAX_INPUT_SIZE)
+ return FALSE;
+
+ while (1) {
+ if (buf_flag_count == 0) {
+ buf_flags = tvb_get_letohl(tvb, offset+in_off);
+ in_off += 4;
+ buf_flag_count = 32;
+ }
+ buf_flag_count--;
+ if ((buf_flags & (1u << buf_flag_count)) == 0) {
+ guint8 v = tvb_get_guint8(tvb, offset+in_off);
+ wmem_array_append_one(obuf, v);
+ in_off++;
+ } else {
+ if (in_off == in_size)
+ return TRUE;
+ match_bytes = tvb_get_letohs(tvb, offset+in_off);
+ in_off += 2;
+ match_len = match_bytes % 8;
+ match_off = (match_bytes/8) + 1;
+ if (match_len == 7) {
+ if (last_length_half_byte == 0) {
+ match_len = tvb_get_guint8(tvb, offset+in_off);
+ match_len = match_len % 16;
+ last_length_half_byte = in_off;
+ in_off++;
+ } else {
+ match_len = tvb_get_guint8(tvb, offset+last_length_half_byte);
+ match_len = match_len / 16;
+ last_length_half_byte = 0;
+ }
+ if (match_len == 15) {
+ match_len = tvb_get_guint8(tvb, offset+in_off);
+ in_off++;
+ if (match_len == 255) {
+ match_len = tvb_get_letohs(tvb, offset+in_off);
+ in_off += 2;
+ if (match_len == 0) {
+ /* This case isn't documented */
+ match_len = tvb_get_letohs(tvb, offset+in_off);
+ in_off += 4;
+ }
+ if (match_len < 15+7)
+ return FALSE;
+ match_len -= (15 + 7);
+ }
+ match_len += 15;
+ }
+ match_len += 7;
+ }
+ match_len += 3;
+ for (i = 0; i < match_len; i++) {
+ guint8 byte;
+ if (match_off > wmem_array_get_count(obuf))
+ return FALSE;
+ if (wmem_array_try_index(obuf, wmem_array_get_count(obuf)-match_off, &byte))
+ return FALSE;
+ wmem_array_append_one(obuf, byte);
+ }
+ }
+ }
+
+ return TRUE;
+}
+
+tvbuff_t *
+tvb_uncompress_lz77(tvbuff_t *tvb, const int offset, int in_size)
+{
+ volatile gboolean ok = FALSE;
+ wmem_allocator_t *pool;
+ wmem_array_t *obuf;
+ tvbuff_t *out;
+
+ pool = wmem_allocator_new(WMEM_ALLOCATOR_SIMPLE);
+ obuf = wmem_array_sized_new(pool, 1, in_size*2);
+
+ TRY {
+ ok = do_uncompress(tvb, offset, in_size, obuf);
+ } CATCH_ALL {
+ ok = FALSE;
+ }
+ ENDTRY;
+
+ if (ok) {
+ /*
+ * Cannot pass a tvb free callback that frees the wmem
+ * pool, so we make an extra copy that uses bare
+ * pointers. This could be optimized if tvb API had a
+ * free pool callback of some sort.
+ */
+ guint size = wmem_array_get_count(obuf);
+ guint8 *p = (guint8 *)g_malloc(size);
+ memcpy(p, wmem_array_get_raw(obuf), size);
+ out = tvb_new_real_data(p, size, size);
+ tvb_set_free_cb(out, g_free);
+ } else {
+ out = NULL;
+ }
+
+ wmem_destroy_allocator(pool);
+
+ return out;
+}
+
+tvbuff_t *
+tvb_child_uncompress_lz77(tvbuff_t *parent, tvbuff_t *tvb, const int offset, int in_size)
+{
+ tvbuff_t *new_tvb = tvb_uncompress_lz77(tvb, offset, in_size);
+ if (new_tvb)
+ tvb_set_child_real_data_tvbuff(parent, new_tvb);
+ return new_tvb;
+}
+
+
+/*
+ * Editor modelines - https://www.wireshark.org/tools/modelines.html
+ *
+ * Local variables:
+ * c-basic-offset: 8
+ * tab-width: 8
+ * indent-tabs-mode: t
+ * End:
+ *
+ * vi: set shiftwidth=8 tabstop=8 noexpandtab:
+ * :indentSize=8:tabSize=8:noTabs=false:
+ */