summary refs log tree commit diff stats
path: root/lzcheck.c
diff options
context:
space:
mode:
Diffstat (limited to 'lzcheck.c')
-rw-r--r-- lzcheck.c 234
1 files changed, 234 insertions, 0 deletions
diff --git a/lzcheck.c b/lzcheck.c
new file mode 100644
index 0000000..19a1887
--- /dev/null
+++ b/lzcheck.c
@@ -0,0 +1,234 @@
+/* Lzcheck - A test program for the lzlib library
+ Copyright (C) 2009, 2010, 2011, 2012 Antonio Diaz Diaz.
+
+ This program is free software: you have unlimited permission
+ to copy, distribute and modify it.
+
+ Usage is:
+ lzcheck filename.txt
+
+ This program reads the specified text file and then compresses it,
+ line by line, to test the flushing mechanism and the member
+ restart/reset/sync functions.
+*/
+
+#define _FILE_OFFSET_BITS 64
+
+#include <stdbool.h>
+#include <stdint.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <unistd.h>
+
+#include "lzlib.h"
+
+#ifndef LLONG_MAX /* fallback limits: each is defined only if the headers included above did not already define it */
+#define LLONG_MAX 0x7FFFFFFFFFFFFFFFLL /* 2^63 - 1, i.e. assumes a 64-bit long long */
+#endif
+#ifndef LLONG_MIN /* not referenced in the visible part of this file */
+#define LLONG_MIN (-LLONG_MAX - 1LL)
+#endif
+#ifndef ULLONG_MAX /* not referenced in the visible part of this file */
+#define ULLONG_MAX 0xFFFFFFFFFFFFFFFFULL
+#endif
+
+#ifndef min /* min(x,y): the smaller of x and y; x is chosen when they are equal */
+ #define min(x,y) ((x) <= (y) ? (x) : (y)) /* function-like macro: the selected argument is evaluated twice, so pass expressions without side effects */
+#endif
+
+enum { buffer_size = 32768 }; /* number of bytes in each of the three work buffers below */
+uint8_t in_buffer[buffer_size]; /* bytes read from the input file */
+uint8_t mid_buffer[buffer_size]; /* encoder output on its way to the decoder (plus leading garbage in the second pass of main) */
+uint8_t out_buffer[buffer_size]; /* decoder output, compared against in_buffer */
+
+
+int main( const int argc, const char * const argv[] ) /* Test driver: compresses argv[1] chunk by chunk with an lzlib encoder, decodes each chunk right away and compares it with the input. */
+ { /* Returns 0 when every chunk matches, 1 on a usage, open or memory error or on a mismatch, 3 on a library error. */
+ if( argc < 2 ) /* a file name argument is required */
+ {
+ fprintf( stderr, "Usage: lzcheck filename.txt\n" );
+ return 1;
+ }
+
+ FILE *file = fopen( argv[1], "rb" ); /* binary mode: bytes are compared exactly as stored */
+ if( !file )
+ {
+ fprintf( stderr, "lzcheck: Can't open file '%s' for reading\n", argv[1] );
+ return 1;
+ }
+/* fprintf( stderr, "lzcheck: Testing file '%s'\n", argv[1] ); */
+
+ const int dictionary_size = 1 << 20; /* 1 << 20 == 1048576 */
+ const int match_len_limit = 36;
+ const long long member_size = LLONG_MAX; /* member size argument, also reused for every LZ_compress_restart_member call below */
+ struct LZ_Encoder * const encoder =
+ LZ_compress_open( dictionary_size, match_len_limit, member_size );
+ if( !encoder || LZ_compress_errno( encoder ) != LZ_ok )
+ {
+ const bool mem_error = ( LZ_compress_errno( encoder ) == LZ_mem_error ); /* read the error code before closing; NOTE(review): also reached with encoder == NULL - confirm LZ_compress_errno accepts NULL */
+ LZ_compress_close( encoder ); /* NOTE(review): 'file' is not closed on the two early returns below */
+ if( mem_error )
+ {
+ fprintf( stderr, "lzcheck: Not enough memory.\n" );
+ return 1;
+ }
+ fprintf( stderr, "lzcheck: internal error: Invalid argument to encoder.\n" );
+ return 3;
+ }
+
+ struct LZ_Decoder * const decoder = LZ_decompress_open();
+ if( !decoder || LZ_decompress_errno( decoder ) != LZ_ok ) /* any decoder open failure is reported as out of memory */
+ {
+ LZ_decompress_close( decoder ); /* NOTE(review): encoder and 'file' are not released on this early return */
+ fprintf( stderr, "lzcheck: Not enough memory.\n" );
+ return 1;
+ }
+
+ int retval = 0; /* exit status so far: 1 = a mismatch was seen (testing continues), 3 = library error (testing stops) */
+ while( retval <= 1 ) /* first pass: one buffer-full of input per iteration */
+ {
+ int i, l, r; /* [l, r) is the current chunk inside in_buffer; i is a print index */
+ const int read_size = fread( in_buffer, 1, buffer_size, file ); /* at most buffer_size, so the size_t result fits in int */
+ if( read_size <= 0 ) break; /* end of file (a read error also yields 0 and is not distinguished) */
+
+ for( l = 0, r = 1; r <= read_size; l = r, ++r ) /* one chunk per iteration; the next chunk starts where this one ended */
+ {
+ while( r < read_size && in_buffer[r-1] != '\n' ) ++r; /* grow the chunk until it ends with '\n' or reaches read_size */
+ const int in_size = LZ_compress_write( encoder, in_buffer + l, r - l ); /* number of bytes the encoder accepted */
+ if( in_size < r - l ) r = l + in_size; /* partial write: shrink the chunk to what was accepted; NOTE(review): a negative in_size is not checked for */
+ LZ_compress_sync_flush( encoder ); /* flush request; return value is not checked */
+ const int mid_size = LZ_compress_read( encoder, mid_buffer, buffer_size ); /* compressed bytes produced for this chunk */
+ if( mid_size < 0 )
+ {
+ fprintf( stderr, "lzcheck: LZ_compress_read error: %s.\n",
+ LZ_strerror( LZ_compress_errno( encoder ) ) );
+ retval = 3; break; /* leaves the for loop; the enclosing while then ends because retval > 1 */
+ }
+ LZ_decompress_write( decoder, mid_buffer, mid_size ); /* return value is not checked */
+ const int out_size = LZ_decompress_read( decoder, out_buffer, buffer_size ); /* decoded bytes available for this chunk */
+ if( out_size < 0 )
+ {
+ fprintf( stderr, "lzcheck: LZ_decompress_read error: %s.\n",
+ LZ_strerror( LZ_decompress_errno( decoder ) ) );
+ retval = 3; break;
+ }
+
+ if( out_size != in_size || memcmp( in_buffer + l, out_buffer, out_size ) ) /* decoded data must equal the bytes accepted by the encoder */
+ {
+ fprintf( stderr, "lzcheck: Sync error at pos %d. in_size = %d, out_size = %d\n",
+ l, in_size, out_size );
+ for( i = 0; i < in_size; ++i ) /* dump the expected bytes */
+ fputc( in_buffer[l+i], stderr );
+ if( in_buffer[l+in_size-1] != '\n' ) /* NOTE(review): the index is l - 1 when in_size is 0 */
+ fputc( '\n', stderr );
+ for( i = 0; i < out_size; ++i ) /* dump the bytes actually decoded */
+ fputc( out_buffer[i], stderr );
+ fputc( '\n', stderr );
+ retval = 1; /* record the mismatch but keep testing */
+ }
+ }
+ }
+
+ if( retval <= 1 ) /* between passes: close the first member and prepare the encoder for a new one */
+ {
+ rewind( file ); /* the second pass reads the file again from the start */
+ if( LZ_compress_finish( encoder ) < 0 || /* short-circuit chain: the first failing step skips the rest */
+ LZ_decompress_write( decoder, mid_buffer, LZ_compress_read( encoder, mid_buffer, buffer_size ) ) < 0 || /* the LZ_compress_read result is passed on as the size without a separate check */
+ LZ_decompress_read( decoder, out_buffer, buffer_size ) != 0 || /* any decoded output here counts as a failure */
+ LZ_compress_restart_member( encoder, member_size ) < 0 )
+ {
+ fprintf( stderr, "lzcheck: Can't finish member: %s.\n",
+ LZ_strerror( LZ_decompress_errno( decoder ) ) ); /* NOTE(review): only the decoder's errno is reported, even if an encoder call failed */
+ retval = 3;
+ }
+ }
+
+ while( retval <= 1 ) /* second pass: same per-chunk check, with garbage before the first chunk and member restarts after every read */
+ {
+ int i, l, r; /* same roles as in the first pass */
+ const int read_size = fread( in_buffer, 1, buffer_size / 2, file ); /* half a buffer per read */
+ if( read_size <= 0 ) break; /* end of file */
+
+ for( l = 0, r = 1; r <= read_size; l = r, ++r )
+ {
+ while( r < read_size && in_buffer[r-1] != '\n' ) ++r; /* grow the chunk until it ends with '\n' or reaches read_size */
+ const int leading_garbage = (l == 0) ? min( r, read_size / 2 ) : 0; /* only the first chunk of each read gets garbage: min(chunk length, read_size / 2) bytes */
+ const int in_size = LZ_compress_write( encoder, in_buffer + l, r - l );
+ if( in_size < r - l ) r = l + in_size; /* partial write: shrink the chunk to what was accepted */
+ LZ_compress_sync_flush( encoder ); /* return value is not checked */
+ if( leading_garbage )
+ memset( mid_buffer, in_buffer[0], leading_garbage ); /* the garbage is leading_garbage copies of the first input byte */
+ const int mid_size = LZ_compress_read( encoder,
+ mid_buffer + leading_garbage,
+ buffer_size - leading_garbage ); /* compressed data is stored right after the garbage */
+ if( mid_size < 0 )
+ {
+ fprintf( stderr, "lzcheck: LZ_compress_read error: %s.\n",
+ LZ_strerror( LZ_compress_errno( encoder ) ) );
+ retval = 3; break;
+ }
+ LZ_decompress_write( decoder, mid_buffer, mid_size + leading_garbage ); /* garbage and compressed data are written together; return value is not checked */
+ int out_size = LZ_decompress_read( decoder, out_buffer, buffer_size ); /* not const: may be replaced by the retry below */
+ if( out_size < 0 )
+ {
+ if( LZ_decompress_errno( decoder ) == LZ_header_error || /* only header and data errors trigger the resync-and-retry */
+ LZ_decompress_errno( decoder ) == LZ_data_error )
+ {
+ LZ_decompress_sync_to_member( decoder ); /* remove leading garbage */
+ out_size = LZ_decompress_read( decoder, out_buffer, buffer_size ); /* second attempt after the resync */
+ }
+ if( out_size < 0 ) /* still failing, or the error was of another kind */
+ {
+ fprintf( stderr, "lzcheck: LZ_decompress_read error: %s.\n",
+ LZ_strerror( LZ_decompress_errno( decoder ) ) );
+ retval = 3; break;
+ }
+ }
+
+ if( out_size != in_size || memcmp( in_buffer + l, out_buffer, out_size ) ) /* same comparison and dump as in the first pass */
+ {
+ fprintf( stderr, "lzcheck: Sync error at pos %d. in_size = %d, out_size = %d\n",
+ l, in_size, out_size );
+ for( i = 0; i < in_size; ++i )
+ fputc( in_buffer[l+i], stderr );
+ if( in_buffer[l+in_size-1] != '\n' ) /* NOTE(review): the index is l - 1 when in_size is 0 */
+ fputc( '\n', stderr );
+ for( i = 0; i < out_size; ++i )
+ fputc( out_buffer[i], stderr );
+ fputc( '\n', stderr );
+ retval = 1;
+ }
+ }
+ if( retval >= 3 ) break; /* the breaks above only left the for loop */
+
+ if( LZ_compress_finish( encoder ) < 0 || /* end of this read: finish the member, pass the remaining output to the decoder, */
+ LZ_decompress_write( decoder, mid_buffer, LZ_compress_read( encoder, mid_buffer, buffer_size ) ) < 0 ||
+ LZ_decompress_read( decoder, out_buffer, buffer_size ) != 0 || /* expect no more decoded data, */
+ LZ_decompress_reset( decoder ) < 0 || /* then reset the decoder and start a new member */
+ LZ_compress_restart_member( encoder, member_size ) < 0 )
+ {
+ fprintf( stderr, "lzcheck: Can't restart member: %s.\n",
+ LZ_strerror( LZ_decompress_errno( decoder ) ) ); /* NOTE(review): only the decoder's errno is reported, even if an encoder call failed */
+ retval = 3; break;
+ }
+
+ const int size = min( 100, read_size ); /* extra member built from at most the first 100 bytes of this read */
+ if( LZ_compress_write( encoder, in_buffer, size ) != size ||
+ LZ_compress_finish( encoder ) < 0 ||
+ LZ_decompress_write( decoder, mid_buffer, LZ_compress_read( encoder, mid_buffer, buffer_size ) ) < 0 ||
+ LZ_decompress_read( decoder, out_buffer, 0 ) != 0 || /* asks for 0 bytes, so no output is requested for the extra member */
+ LZ_decompress_sync_to_member( decoder ) < 0 || /* must succeed with that member still pending in the decoder */
+ LZ_compress_restart_member( encoder, member_size ) < 0 )
+ {
+ fprintf( stderr, "lzcheck: Can't seek to next member: %s.\n",
+ LZ_strerror( LZ_decompress_errno( decoder ) ) ); /* NOTE(review): only the decoder's errno is reported, even if an encoder call failed */
+ retval = 3; break;
+ }
+ }
+
+ LZ_decompress_close( decoder ); /* normal exit path: release decoder, encoder and input file */
+ LZ_compress_close( encoder );
+ fclose( file );
+ return retval;
+ }