summaryrefslogtreecommitdiffstats
path: root/zgrep.cc
diff options
context:
space:
mode:
Diffstat (limited to 'zgrep.cc')
-rw-r--r--zgrep.cc159
1 files changed, 159 insertions, 0 deletions
diff --git a/zgrep.cc b/zgrep.cc
new file mode 100644
index 0000000..b1c18b4
--- /dev/null
+++ b/zgrep.cc
@@ -0,0 +1,159 @@
+/* Zgrep - search compressed files for a regular expression
+ Copyright (C) 2010 Antonio Diaz Diaz.
+
+ This program is free software: you can redistribute it and/or modify
+ it under the terms of the GNU General Public License as published by
+ the Free Software Foundation, either version 3 of the License, or
+ (at your option) any later version.
+
+ This program is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ GNU General Public License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program. If not, see <http://www.gnu.org/licenses/>.
+*/
+
+void show_zgrep_help() throw()
+ {
+ std::printf( "Zgrep is a front end to the grep program that allows transparent search\n" );
+ std::printf( "on any combination of compressed and non-compressed files. If any given\n" );
+ std::printf( "file is compressed, its uncompressed content is used. If a given file\n" );
+ std::printf( "does not exist, and its name does not end with one of the known\n" );
+ std::printf( "extensions, zgrep tries the compressed file names corresponding to the\n" );
+ std::printf( "supported compressors. If no files are specified, data is read from\n" );
+ std::printf( "standard input, decompressed if needed, and fed to grep. Data read from\n" );
+ std::printf( "standard input must be of the same type; all uncompressed or all\n" );
+ std::printf( "compressed with the same compressor.\n" );
+ std::printf( "The supported compressors are bzip2, gzip, lzip and xz.\n" );
+ std::printf( "\nUsage: zgrep [options] <pattern> [files]\n" );
+ std::printf( "\nExit status is 0 if match, 1 if no match, 2 if trouble.\n" );
+ std::printf( "\nOptions:\n" );
+ std::printf( " --help display this help and exit\n" );
+ std::printf( " -V, --version output version information and exit\n" );
+ std::printf( " -a, --text treat all files as text\n" );
+ std::printf( " -A, --after-context=<n> print <n> lines of trailing context\n" );
+ std::printf( " -b, --byte-offset print the byte offset of each line\n" );
+ std::printf( " -B, --before-context=<n> print <n> lines of leading context\n" );
+ std::printf( " -c, --count only print a count of matching lines per file\n" );
+ std::printf( " -C, --context=<n> print <n> lines of output context\n" );
+ std::printf( " -e, --regexp=<pattern> use <pattern> as the pattern to match\n" );
+ std::printf( " -E, --extended-regexp <pattern> is an extended regular expression\n" );
+ std::printf( " -f, --file=<file> obtain patterns from <file>\n" );
+ std::printf( " -F, --fixed-strings <pattern> is a set of newline-separated strings\n" );
+ std::printf( " -h, --no-filename suppress the prefixing filename on output\n" );
+ std::printf( " -H, --with-filename print the filename for each match\n" );
+ std::printf( " -i, --ignore-case ignore case distinctions\n" );
+ std::printf( " -I ignore binary files\n" );
+ std::printf( " -l, --files-with-matches only print names of files containing matches\n" );
+ std::printf( " -L, --files-without-match only print names of files containing no matches\n" );
+ std::printf( " -m, --max-count=<n> stop after <n> matches\n" );
+ std::printf( " -n, --line-number print the line number of each line\n" );
+ std::printf( " -o, --only-matching show only the part of a line matching <pattern>\n" );
+ std::printf( " -q, --quiet suppress all messages\n" );
+ std::printf( " -r, --recursive operate recursively on directories\n" );
+ std::printf( " -s, --no-messages suppress error messages\n" );
+ std::printf( " -v, --invert-match select non-matching lines\n" );
+ std::printf( " --verbose verbose mode (show error messages)\n" );
+ std::printf( " -w, --word-regexp match only whole words\n" );
+ std::printf( " -x, --line-regexp match only whole lines\n" );
+ show_help_addr();
+ }
+
+
+int zgrep_stdin( int infd, const std::vector< const char * > & grep_args )
+ {
+ pid_t pid;
+ if( !set_data_feeder( &infd, &pid ) ) return 2;
+ const pid_t grep_pid = fork();
+ if( grep_pid == 0 ) // child (grep)
+ {
+ if( dup2( infd, STDIN_FILENO ) >= 0 && close( infd ) == 0 )
+ {
+ const char ** const argv = new const char *[grep_args.size()+2];
+ argv[0] = "grep";
+ for( unsigned int i = 0; i < grep_args.size(); ++i )
+ argv[i+1] = grep_args[i];
+ argv[grep_args.size()+1] = 0;
+ execvp( argv[0], (char **)argv );
+ }
+ show_error( "Can't exec `grep'." );
+ _exit( 2 );
+ }
+ // parent
+ if( grep_pid < 0 )
+ { show_error( "Can't fork `grep'", errno ); return 2; }
+ int retval = 0;
+ if( pid && wait_for_child( pid, "data feeder" ) != 0 ) retval = 2;
+ if( wait_for_child( grep_pid, "grep" ) != 0 ) retval = 2;
+ if( close( infd ) != 0 )
+ { show_error( "Can't close output of data feeder", errno ); return 2; }
+ return retval;
+ }
+
+
+int zgrep_file( int infd, const std::string & input_filename,
+ const std::vector< const char * > & grep_args,
+ const bool grep_list, const bool grep_show_name )
+ {
+ pid_t pid;
+ if( !set_data_feeder( &infd, &pid ) ) return 2;
+ int fda[2]; // pipe from grep
+ if( pipe( fda ) < 0 )
+ { show_error( "Can't create pipe", errno ); return 2; }
+ const pid_t grep_pid = fork();
+ if( grep_pid == 0 ) // child (grep)
+ {
+ if( dup2( infd, STDIN_FILENO ) >= 0 &&
+ dup2( fda[1], STDOUT_FILENO ) >= 0 &&
+ close( infd ) == 0 && close( fda[0] ) == 0 && close( fda[1] ) == 0 )
+ {
+ const char ** const argv = new const char *[grep_args.size()+2];
+ argv[0] = "grep";
+ for( unsigned int i = 0; i < grep_args.size(); ++i )
+ argv[i+1] = grep_args[i];
+ argv[grep_args.size()+1] = 0;
+ execvp( argv[0], (char **)argv );
+ }
+ show_error( "Can't exec `grep'." );
+ _exit( 2 );
+ }
+ // parent
+ close( fda[1] );
+ if( grep_pid < 0 )
+ { show_error( "Can't fork `grep'", errno ); return 2; }
+ enum { buffer_size = 256 };
+ uint8_t buffer[buffer_size];
+ bool line_begin = true;
+ while( true )
+ {
+ const int size = readblock( fda[0], buffer, buffer_size );
+ if( size != buffer_size && errno )
+ { show_error( "Read error", errno ); return 2; }
+ if( size > 0 && !grep_list )
+ {
+ if( grep_show_name )
+ for( int i = 0; i < size; ++i )
+ {
+ if( line_begin )
+ { line_begin = false; std::printf( "%s:", input_filename.c_str() ); }
+ if( buffer[i] == '\n' ) line_begin = true;
+ putchar( buffer[i] );
+ }
+ else if( std::fwrite( buffer, 1, size, stdout ) != (unsigned int)size )
+ { show_error( "Write error", errno ); return 2; }
+ }
+ if( size < buffer_size ) break;
+ }
+ int retval = 0;
+ if( pid && wait_for_child( pid, "data feeder" ) != 0 ) retval = 2;
+ if( wait_for_child( grep_pid, "grep" ) != 0 ) retval = 2;
+ if( grep_list && retval == 0 )
+ std::printf( "%s\n", input_filename.c_str() );
+ if( close( infd ) != 0 )
+ { show_error( "Can't close output of data feeder", errno ); return 2; }
+ if( close( fda[0] ) != 0 )
+ { show_error( "Can't close output of grep", errno ); return 2; }
+ return retval;
+ }