summaryrefslogtreecommitdiffstats
path: root/gf16.cc
diff options
context:
space:
mode:
Diffstat (limited to 'gf16.cc')
-rw-r--r--gf16.cc308
1 files changed, 308 insertions, 0 deletions
diff --git a/gf16.cc b/gf16.cc
new file mode 100644
index 0000000..ee5bb30
--- /dev/null
+++ b/gf16.cc
@@ -0,0 +1,308 @@
+/* Lziprecover - Data recovery tool for the lzip format
+ Copyright (C) 2023-2024 Antonio Diaz Diaz.
+
+ This program is free software: you can redistribute it and/or modify
+ it under the terms of the GNU General Public License as published by
+ the Free Software Foundation, either version 2 of the License, or
+ (at your option) any later version.
+
+ This program is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ GNU General Public License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program. If not, see <http://www.gnu.org/licenses/>.
+*/
+
+#define _FILE_OFFSET_BITS 64
+
+#include <cstdio>
+#include <cstring>
+#include <list>
+#include <string>
+#include <vector>
+#include <stdint.h>
+#include <unistd.h> // STDERR_FILENO
+
+#include "lzip.h"
+#include "md5.h"
+#include "fec.h"
+
+namespace {
+
+const uint16_t u16_one = 1;
+const bool little_endian = *(const uint8_t *)&u16_one == 1;
+inline uint16_t swap_bytes( const uint16_t a )
+ { return ( a >> 8 ) | ( a << 8 ); }
+
+struct Galois16_table // addition/subtraction is exclusive or
+ {
+ enum { size = 1 << 16, poly = 0x1100B }; // generator polynomial
+ uint16_t * log, * ilog, * mul_tables;
+
+ Galois16_table() : log( 0 ), ilog( 0 ), mul_tables( 0 ) {}
+// ~Galois16_table() { delete[] mul_tables; delete[] ilog; delete[] log; }
+
+ void init() // fill log, inverse log, and multiplication tables
+ {
+ if( log ) return;
+ log = new uint16_t[size]; ilog = new uint16_t[size];
+ mul_tables = new uint16_t[3 * 256 * 256]; // LL, LH, HH
+ for( unsigned b = 1, i = 0; i < size - 1; ++i )
+ {
+ log[b] = i;
+ ilog[i] = b;
+ b <<= 1;
+ if( b & size ) b ^= poly;
+ }
+ log[0] = size - 1; // log(0) is not defined, so use a special value
+ ilog[size-1] = 1;
+
+ uint16_t * p = mul_tables;
+ for( int i = 0; i < 16; i += 8 )
+ for( int j = i; j < 16; j += 8 )
+ for( int a = 0; a < 256 << i; a += 1 << i )
+ for( int b = 0; b < 256 << j; b += 1 << j )
+ *p++ = mul( a, b );
+ }
+
+ uint16_t mul( const uint16_t a, const uint16_t b ) const
+ {
+ if( a == 0 || b == 0 ) return 0;
+ const unsigned sum = log[a] + log[b];
+ return ( sum >= size - 1 ) ? ilog[sum-(size-1)] : ilog[sum];
+// return ilog[(log[a] + log[b]) % (size-1)];
+ }
+
+ uint16_t inverse( const uint16_t a ) const { return ilog[size-1-log[a]]; }
+ } gf;
+
+
+inline bool check_element( const uint16_t * const A, const uint16_t * const B,
+ const unsigned k, const unsigned row, const unsigned col )
+ {
+ const uint16_t * pa = A + row * k;
+ const uint16_t * pb = B + col;
+ uint16_t sum = 0;
+ for( unsigned i = 0; i < k; ++i, ++pa, pb += k )
+ sum ^= gf.mul( *pa, *pb );
+ return sum == ( row == col );
+ }
+
+/* Check that A * B = I (A, B, I are square matrices of size k * k).
+ Check just the diagonals for matrices larger than 1024 x 1024. */
+bool check_inverse( const uint16_t * const A, const uint16_t * const B,
+ const unsigned k )
+ {
+ const bool print = verbosity >= 1 && k > max_k8 && isatty( STDERR_FILENO );
+ for( unsigned row = 0; row < k; ++row ) // multiply A * B
+ {
+ if( k <= 1024 )
+ for( unsigned col = 0; col < k; ++col )
+ { if( !check_element( A, B, k, row, col ) )
+ { if( print && row ) std::fputc( '\n', stderr ); return false; } }
+ else
+ if( !check_element( A, B, k, row, row ) ||
+ !check_element( A, B, k, row, k - 1 - row ) )
+ { if( print && row ) std::fputc( '\n', stderr ); return false; }
+ if( print ) std::fprintf( stderr, "\r%5u rows checked \r", row + 1 );
+ }
+ return true; // A * B == I
+ }
+
+
+/* Invert in place a matrix of size k * k.
+ This is like Gaussian elimination with a virtual identity matrix:
+ A --some_changes--> I, I --same_changes--> A^-1
+ Galois arithmetic is exact. Swapping rows or columns is not needed. */
+bool invert_matrix( uint16_t * const matrix, const unsigned k )
+ {
+ const bool print = verbosity >= 1 && k > max_k8 && isatty( STDERR_FILENO );
+ for( unsigned row = 0; row < k; ++row )
+ {
+ uint16_t * const pivot_row = matrix + row * k;
+ uint16_t pivot = pivot_row[row];
+ if( pivot == 0 )
+ { if( print && row ) std::fputc( '\n', stderr ); return false; }
+ if( pivot != 1 ) // scale the pivot_row
+ {
+ pivot = gf.inverse( pivot );
+ pivot_row[row] = 1;
+ for( unsigned col = 0; col < k; ++col )
+ pivot_row[col] = gf.mul( pivot_row[col], pivot );
+ }
+ // subtract pivot_row from the other rows
+ for( unsigned row2 = 0; row2 < k; ++row2 )
+ if( row2 != row )
+ {
+ uint16_t * const dst_row = matrix + row2 * k;
+ const uint16_t c = dst_row[row]; dst_row[row] = 0;
+ for( unsigned col = 0; col < k; ++col )
+ dst_row[col] ^= gf.mul( pivot_row[col], c );
+ }
+ if( print ) std::fprintf( stderr, "\r%5u rows inverted\r", row + 1 );
+ }
+ return true;
+ }
+
+
+// create dec_matrix containing only the rows needed and invert it in place
+const uint16_t * init_dec_matrix( const std::vector< unsigned > & bb_vector,
+ const std::vector< unsigned > & fbn_vector )
+ {
+ const unsigned bad_blocks = bb_vector.size();
+ uint16_t * const dec_matrix = new uint16_t[bad_blocks * bad_blocks];
+
+ // one row for each missing data block
+ for( unsigned row = 0; row < bad_blocks; ++row )
+ {
+ uint16_t * const dec_row = dec_matrix + row * bad_blocks;
+ const unsigned fbn = fbn_vector[row] | 0x8000;
+ for( unsigned col = 0; col < bad_blocks; ++col )
+ dec_row[col] = gf.inverse( fbn ^ bb_vector[col] );
+ }
+ if( !invert_matrix( dec_matrix, bad_blocks ) )
+ internal_error( "GF(2^16) matrix not invertible." );
+ return dec_matrix;
+ }
+
+#if 0
+/* compute dst[] += c * src[]
+ treat the buffers as arrays of 16-bit Galois values */
+inline void mul_add( const uint8_t * const src, uint8_t * const dst,
+ const unsigned long fbs, const uint16_t c )
+ {
+ if( c == 0 ) return; // nothing to add
+ const uint16_t * const src16 = (const uint16_t *)src;
+ uint16_t * const dst16 = (uint16_t *)dst;
+
+ if( little_endian )
+ for( unsigned long i = 0; i < fbs / 2; ++i )
+ dst16[i] ^= gf.mul( src16[i], c );
+ else // big endian
+ for( unsigned long i = 0; i < fbs / 2; ++i )
+ dst16[i] ^= swap_bytes( gf.mul( swap_bytes( src16[i] ), c ) );
+ }
+#else
+
+/* compute dst[] += c * src[]
+ treat the buffers as arrays of pairs of 16-bit Galois values */
+inline void mul_add( const uint8_t * const src, uint8_t * const dst,
+ const unsigned long fbs, const uint16_t c )
+ {
+ if( c == 0 ) return; // nothing to add
+ const int cl = c & 0xFF; // split factor c into low and high bytes
+ const int ch = c >> 8;
+ // pointers to the four multiplication tables (c.low/high * src.low/high)
+ const uint16_t * LL = &gf.mul_tables[cl * 256];
+ const uint16_t * LH = &gf.mul_tables[65536 + cl * 256];
+ const uint16_t * HL = &gf.mul_tables[65536 + ch]; // step 256
+ const uint16_t * HH = &gf.mul_tables[131072 + ch * 256];
+ uint16_t L[256]; // extract the two tables for factor c
+ uint16_t H[256];
+
+ if( little_endian )
+ for( int i = 0; i < 256; ++i )
+ { L[i] = *LL++ ^ *HL; HL+=256; H[i] = *LH++ ^ *HH++; }
+ else // big endian
+ for( int i = 0; i < 256; ++i )
+ { H[i] = swap_bytes( *LL++ ^ *HL ); HL+=256;
+ L[i] = swap_bytes( *LH++ ^ *HH++ ); }
+
+ const uint32_t * const src32 = (const uint32_t *)src;
+ uint32_t * const dst32 = (uint32_t *)dst;
+
+ for( unsigned long i = 0; i < fbs / 4; ++i )
+ { const uint32_t s = src32[i];
+ dst32[i] ^= L[s & 0xFF] ^ H[s >> 8 & 0xFF] ^
+ L[s >> 16 & 0xFF] << 16 ^ H[s >> 24] << 16; }
+ }
+#endif
+
+} // end namespace
+
+
+void gf16_init() { gf.init(); }
+
+bool gf16_check( const std::vector< unsigned > & fbn_vector, const unsigned k )
+ {
+ if( k == 0 ) return true;
+ gf.init();
+ bool good = true;
+ for( unsigned a = 1; a < gf.size; ++a )
+ if( gf.mul( a, gf.inverse( a ) ) != 1 )
+ { good = false;
+ std::fprintf( stderr, "%u * ( 1/%u ) != 1 in GF(2^16)\n", a, a ); }
+ uint16_t * const enc_matrix = new uint16_t[k * k];
+ uint16_t * const dec_matrix = new uint16_t[k * k];
+ const bool random = fbn_vector.size() == k;
+ for( unsigned row = 0; row < k; ++row )
+ {
+ const unsigned fbn = ( random ? fbn_vector[row] : row ) | 0x8000;
+ uint16_t * const enc_row = enc_matrix + row * k;
+ for( unsigned col = 0; col < k; ++col )
+ enc_row[col] = gf.inverse( fbn ^ col );
+ }
+ std::memcpy( dec_matrix, enc_matrix, k * k * sizeof (uint16_t) );
+ if( !invert_matrix( dec_matrix, k ) )
+ { good = false; show_error( "GF(2^16) matrix not invertible." ); }
+ else if( !check_inverse( enc_matrix, dec_matrix, k ) )
+ { good = false; show_error( "GF(2^16) matrix A * A^-1 != I" ); }
+ delete[] dec_matrix;
+ delete[] enc_matrix;
+ return good;
+ }
+
+
+void rs16_encode( const uint8_t * const buffer, const uint8_t * const lastbuf,
+ uint8_t * const fec_block, const unsigned long fbs,
+ const unsigned fbn, const unsigned k )
+ {
+ if( !gf.log ) internal_error( "GF(2^16) tables not initialized." );
+ /* The encode matrix is a Hilbert matrix of size k * k with one row per
+ fec block and one column per data block.
+ The value of each element is computed on the fly with inverse. */
+ const unsigned row = fbn | 0x8000;
+ std::memset( fec_block, 0, fbs );
+ for( unsigned col = 0; col < k; ++col )
+ {
+ const uint8_t * const src =
+ ( col < k - (lastbuf != 0) ) ? buffer + col * fbs : lastbuf;
+ mul_add( src, fec_block, fbs, gf.inverse( row ^ col ) );
+ }
+ }
+
+
+void rs16_decode( uint8_t * const buffer, uint8_t * const lastbuf,
+ const std::vector< unsigned > & bb_vector,
+ const std::vector< unsigned > & fbn_vector,
+ uint8_t * const fecbuf, const unsigned long fbs,
+ const unsigned k )
+ {
+ gf.init();
+ const unsigned bad_blocks = bb_vector.size();
+ for( unsigned col = 0, bi = 0; col < k; ++col ) // reduce
+ {
+ if( bi < bad_blocks && col == bb_vector[bi] ) { ++bi; continue; }
+ const uint8_t * const src =
+ ( col < k - (lastbuf != 0) ) ? buffer + col * fbs : lastbuf;
+ for( unsigned row = 0; row < bad_blocks; ++row )
+ {
+ const unsigned fbn = fbn_vector[row] | 0x8000;
+ mul_add( src, fecbuf + row * fbs, fbs, gf.inverse( fbn ^ col ) );
+ }
+ }
+ const uint16_t * const dec_matrix = init_dec_matrix( bb_vector, fbn_vector );
+ for( unsigned col = 0; col < bad_blocks; ++col ) // solve
+ {
+ const unsigned di = bb_vector[col];
+ uint8_t * const dst =
+ ( di < k - (lastbuf != 0) ) ? buffer + di * fbs : lastbuf;
+ std::memset( dst, 0, fbs );
+ const uint16_t * const dec_row = dec_matrix + col * bad_blocks;
+ for( unsigned row = 0; row < bad_blocks; ++row )
+ mul_add( fecbuf + row * fbs, dst, fbs, dec_row[row] );
+ }
+ delete[] dec_matrix;
+ }