summaryrefslogtreecommitdiffstats
path: root/delete_lz.cc
blob: 961645f596c92efbdd411cc0fe464a55fe58f249 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
/* Tarlz - Archiver with multimember lzip compression
   Copyright (C) 2013-2020 Antonio Diaz Diaz.

   This program is free software: you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation, either version 2 of the License, or
   (at your option) any later version.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with this program.  If not, see <http://www.gnu.org/licenses/>.
*/

#define _FILE_OFFSET_BITS 64

#include <cctype>
#include <cerrno>
#include <climits>
#include <cstdio>
#include <cstdlib>
#include <cstring>
#include <string>
#include <vector>
#include <pthread.h>
#include <stdint.h>
#include <unistd.h>
#include <lzlib.h>

#include "arg_parser.h"
#include "tarlz.h"
#include "lzip_index.h"


/* Fill 'buf' with exactly 'size' decompressed bytes from the archive.
   Compressed input is read from 'infd' at 'file_pos' and handed to
   'decoder' whenever the decoder accepts more data; 'file_pos' is advanced
   by the number of compressed bytes handed over. On failure '*msg' is set
   to a description of the problem.
   Return value: 0 = OK, 1 = damaged member, 2 = fatal error. */
int archive_read_lz( LZ_Decoder * const decoder, const int infd,
                     long long & file_pos, const long long member_end,
                     const long long cdata_size, uint8_t * const buf,
                     const int size, const char ** msg )
  {
  for( int filled = 0; filled < size; )
    {
    const int got = LZ_decompress_read( decoder, buf + filled, size - filled );
    if( got < 0 )
      {
      *msg = LZ_strerror( LZ_decompress_errno( decoder ) );
      return 1;
      }
    if( got == 0 && LZ_decompress_finished( decoder ) == 1 )
      {
      *msg = end_msg;
      return 2;
      }
    filled += got;
    // no feeding needed if the request is complete or no input is accepted
    if( filled >= size || LZ_decompress_write_size( decoder ) <= 0 ) continue;

    const long long ibuf_size = 16384;
    uint8_t ibuf[ibuf_size];
    // compressed bytes left up to the member end, or up to the end of the
    // compressed data once the member end has been reached
    long long avail = cdata_size - file_pos;
    if( file_pos < member_end ) avail = member_end - file_pos;
    const int chunk = std::min( LZ_decompress_write_size( decoder ),
                                (int)std::min( ibuf_size, avail ) );
    if( chunk <= 0 ) { LZ_decompress_finish( decoder ); continue; }

    const int fed = preadblock( infd, ibuf, chunk, file_pos );
    if( LZ_decompress_write( decoder, ibuf, fed ) != fed )
      internal_error( "library error (LZ_decompress_write)." );
    file_pos += fed;
    if( fed >= chunk ) continue;
    LZ_decompress_finish( decoder );	// short read: no more input follows
    if( errno ) { *msg = "Error reading archive"; return 2; }
    }
  return 0;
  }


/* Read and parse the extended records announced by 'header'.
   The record size is taken from the size field of 'header'; the padded
   records are read into 'rbuf' through archive_read_lz and then parsed
   into 'extended'. On success 'data_pos' is advanced by the padded size.
   Return value: 0 = OK, 1 = bad size, out of memory, or damaged member,
   2 = fatal read error or records that fail to parse. */
int parse_records_lz( LZ_Decoder * const decoder, const int infd,
                      long long & file_pos, const long long member_end,
                      const long long cdata_size, long long & data_pos,
                      Extended & extended, const Tar_header header,
                      Resizable_buffer & rbuf, const char ** msg,
                      const bool permissive )
  {
  const long long record_size = parse_octal( header + size_o, size_l );
  const long long padded_size = round_up( record_size );
  // reject missing extended data and sizes that would overflow
  const bool size_ok = record_size > 0 && record_size < ( 1LL << 33 ) &&
                       padded_size < INT_MAX;
  if( !size_ok || !rbuf.resize( padded_size ) ) return 1;

  const int status = archive_read_lz( decoder, infd, file_pos, member_end,
                                      cdata_size, (uint8_t *)rbuf(),
                                      padded_size, msg );
  if( status != 0 ) return status;
  if( !extended.parse( rbuf(), record_size, permissive ) ) return 2;
  data_pos += padded_size;
  return 0;
  }


/* Decompress and discard 'rest' bytes of archive data (the contents of a
   tar member), advancing 'data_pos' by the amount discarded.
   Return value: 0 = OK, else the nonzero status from archive_read_lz. */
int skip_member_lz( LZ_Decoder * const decoder, const int infd,
                    long long & file_pos, const long long member_end,
                    const long long cdata_size, long long & data_pos,
                    long long rest, const char ** msg )
  {
  const int chunk_max = 32 * header_size;
  uint8_t scratch[chunk_max];			// discarded data lands here

  while( rest > 0 )
    {
    int chunk = chunk_max;
    if( rest < chunk_max ) chunk = rest;	// last, partial chunk
    const int status = archive_read_lz( decoder, infd, file_pos, member_end,
                                        cdata_size, scratch, chunk, msg );
    if( status != 0 ) return status;
    rest -= chunk;
    data_pos += chunk;
    }
  return 0;
  }


/* Deleting from a corrupt archive must not worsen the corruption. Stop and
   tail-copy as soon as corruption is found.
*/
int delete_members_lz( const Cl_options & cl_opts,
                       const char * const archive_namep,
                       std::vector< char > & name_pending,
                       const Lzip_index & lzip_index,
                       const int infd, const int outfd )
  {
  Resizable_buffer rbuf;
  LZ_Decoder * const decoder = LZ_decompress_open();
  if( !rbuf.size() || !decoder || LZ_decompress_errno( decoder ) != LZ_ok )
    { show_error( mem_msg ); return 1; }

  long long istream_pos = 0;		// source of next data move
  const long long cdata_size = lzip_index.cdata_size();
  int retval = 0, retval2 = 0;
  for( long i = 0; i < lzip_index.members(); ++i )
    {
    const long long mdata_pos = lzip_index.dblock( i ).pos();
    long long data_pos = mdata_pos;
    const long long mdata_end = lzip_index.dblock( i ).end();
    if( data_pos >= mdata_end ) continue;		// empty lzip member
    const long long member_pos = lzip_index.mblock( i ).pos();
    long long file_pos = member_pos;
    const long long member_end = lzip_index.mblock( i ).end();

    long long member_begin = 0;		// first pos of current tar member
    Extended extended;			// metadata from extended records
    bool prev_extended = false;		// prev header was extended
    LZ_decompress_reset( decoder );	// prepare for new member
    if( !safe_seek( infd, member_pos ) ) { retval = 1; break; }
    while( true )			// process one tar header per iteration
      {
      if( data_pos >= mdata_end )
        {
        if( data_pos == mdata_end && !prev_extended ) break;
        // member end exceeded or ends in extended
        show_file_error( archive_namep, "Member misalignment found." );
        retval = 2; goto done;
        }
      if( !prev_extended ) member_begin = data_pos;
      Tar_header header;
      const char * msg = 0;
      retval = archive_read_lz( decoder, infd, file_pos, member_end,
                                cdata_size, header, header_size, &msg );
      if( retval != 0 ) { show_file_error( archive_namep, msg ); goto done; }
      data_pos += header_size;
      if( !verify_ustar_chksum( header ) )
        {
        if( block_is_zero( header, header_size ) )		// EOF
          {
          if( prev_extended && !cl_opts.permissive )
            { show_file_error( archive_namep, fv_msg1 ); retval = 2; }
          goto done;
          }
        show_file_error( archive_namep, ( data_pos > header_size ) ?
                         bad_hdr_msg : posix_lz_msg );
        retval = 2;
        goto done;
        }

      const Typeflag typeflag = (Typeflag)header[typeflag_o];
      if( typeflag == tf_global )
        {
        if( prev_extended && !cl_opts.permissive )
          { show_file_error( archive_namep, fv_msg2 ); retval = 2; goto done; }
        Extended dummy;		// global headers are parsed and ignored
        retval = parse_records_lz( decoder, infd, file_pos, member_end,
                                   cdata_size, data_pos, dummy, header,
                                   rbuf, &msg, true );
        if( retval == 0 ) continue;
        show_file_error( archive_namep, gblrec_msg );
        goto done;
        }
      if( typeflag == tf_extended )
        {
        if( prev_extended && !cl_opts.permissive )
          { msg = fv_msg3; retval = 2; }
        else retval = parse_records_lz( decoder, infd, file_pos, member_end,
                                        cdata_size, data_pos, extended, header,
                                        rbuf, &msg, cl_opts.permissive );
        if( retval == 0 && !extended.crc_present() && cl_opts.missing_crc )
          { msg = mcrc_msg; retval = 2; }
        if( retval == 0 ) { prev_extended = true; continue; }
        show_file_error( archive_namep, extrec_msg );
        goto done;
        }
      prev_extended = false;

      extended.fill_from_ustar( header );	// copy metadata from header

      long long rest = round_up( extended.file_size() );  // size + padding
      if( data_pos + rest >= mdata_end ) data_pos += rest;
      else						// skip tar member
        if( ( retval = skip_member_lz( decoder, infd, file_pos, member_end,
                         cdata_size, data_pos, rest, &msg ) ) != 0 )
          goto done;

      // delete tar member
      if( !check_skip_filename( cl_opts, name_pending, extended.path().c_str() ) )
        {
        // verify that members match
        if( member_begin != mdata_pos || data_pos != mdata_end )
          { show_file_error( extended.path().c_str(),
                             "Can't delete: not compressed individually." );
            retval2 = 2; extended.reset(); continue; }
        if( !show_member_name( extended, header, 1, rbuf ) )
          { retval = 1; goto done; }
        const long long size = member_pos - istream_pos;
        if( size > 0 )	// move pending data each time a member is deleted
          {
          if( istream_pos == 0 )
            { if( !safe_seek( outfd, size ) ) { retval = 1; goto done; } }
          else if( !safe_seek( infd, istream_pos ) ||
                   !copy_file( infd, outfd, size ) ) { retval = 1; goto done; }
          }
        istream_pos = member_end;
        }
      extended.reset();
      }
    }
done:
  if( retval < retval2 ) retval = retval2;
  if( LZ_decompress_close( decoder ) < 0 && !retval )
    { show_error( "LZ_decompress_close failed." ); retval = 1; }
  // tail copy keeps trailing data
  return tail_copy( archive_namep, cl_opts.parser, name_pending, lzip_index,
                    istream_pos, infd, outfd, retval );
  }