diff options
Diffstat (limited to 'src/manconv_main.c')
-rw-r--r-- | src/manconv_main.c | 209 |
1 files changed, 209 insertions, 0 deletions
diff --git a/src/manconv_main.c b/src/manconv_main.c new file mode 100644 index 0000000..e0d9972 --- /dev/null +++ b/src/manconv_main.c @@ -0,0 +1,209 @@ +/* + * manconv_main.c: convert manual page from one encoding to another + * + * Copyright (C) 2007, 2008 Colin Watson. + * + * This file is part of man-db. + * + * man-db is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by + * the Free Software Foundation; either version 2 of the License, or + * (at your option) any later version. + * + * man-db is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with man-db; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + */ + +#ifdef HAVE_CONFIG_H +# include "config.h" +#endif /* HAVE_CONFIG_H */ + +#include <assert.h> +#include <stdbool.h> +#include <stdlib.h> +#include <string.h> +#include <unistd.h> + +#include "argp.h" +#include "error.h" +#include "gl_array_list.h" +#include "gl_xlist.h" +#include "progname.h" +#include "xalloc.h" + +#include "gettext.h" +#define _(String) gettext (String) +#define N_(String) gettext_noop (String) + +#include "manconfig.h" + +#include "appendstr.h" +#include "cleanup.h" +#include "debug.h" +#include "encodings.h" +#include "pipeline.h" +#include "glcontainers.h" +#include "sandbox.h" +#include "util.h" + +#include "decompress.h" +#include "manconv.h" + +int quiet = 0; +man_sandbox *sandbox; + +static const char *from_codes; +static char *to_code; +static gl_list_t from_code; +static const char *filename; + +static gl_list_t split_codes (const char *codestr) +{ + char *codestrtok, *codestrtok_ptr; + char *tok; + gl_list_t codelist = new_string_list (GL_ARRAY_LIST, true); + + if (!codestr) + return codelist; + + codestrtok = xstrdup (codestr); + codestrtok_ptr = codestrtok; + + for (tok = strsep (&codestrtok_ptr, ":"); tok; + tok = strsep (&codestrtok_ptr, ":")) { + if (!*tok) + continue; /* ignore empty fields */ + gl_list_add_last (codelist, xstrdup (tok)); + } + + free (codestrtok); + + return codelist; +} + +const char *argp_program_version = "manconv " PACKAGE_VERSION; +const char *argp_program_bug_address = PACKAGE_BUGREPORT; +error_t argp_err_exit_status = FAIL; + +static const char args_doc[] = N_("[-f CODE[:...]] -t CODE [FILENAME]"); + +static struct argp_option options[] = { + OPT ("from-code", 'f', N_("CODE[:...]"), + N_("possible encodings of original text")), + OPT ("to-code", 't', N_("CODE"), N_("encoding for output")), + OPT ("debug", 'd', 0, N_("emit debugging messages")), + OPT ("quiet", 'q', 0, N_("produce fewer warnings")), + OPT_HELP_COMPAT, + { 0 } +}; + +static error_t parse_opt (int key, char *arg, struct argp_state *state) +{ + switch (key) { + case 'f': + from_codes = arg; + return 0; + case 't': + to_code = xstrdup (arg); + if (!strstr (to_code, "//")) + to_code = appendstr (to_code, "//TRANSLIT", + (void *) 0); + return 0; + case 'd': + debug_level = true; + return 0; + case 'q': + quiet = 1; + return 0; + case 'h': + argp_state_help (state, state->out_stream, + ARGP_HELP_STD_HELP); + break; + case ARGP_KEY_ARG: + if (filename) + argp_usage (state); + filename = arg; + return 0; + case ARGP_KEY_SUCCESS: + if (!to_code) + argp_error (state, + _("must specify an output " + "encoding")); + from_code = split_codes (from_codes); + return 0; + } + return ARGP_ERR_UNKNOWN; +} + +static struct argp argp = { options, parse_opt, args_doc }; + +int main (int argc, char *argv[]) +{ + decompress *decomp; + + set_program_name (argv[0]); + + init_debug (); + pipeline_install_post_fork (pop_all_cleanups); + sandbox = sandbox_init (); + init_locale (); + + if (argp_parse (&argp, argc, argv, 0, 0, 0)) + exit (FAIL); + assert (from_code); + + if (filename) { + decomp = decompress_open (filename, 0); + if (!decomp) + error (FAIL, 0, _("can't open %s"), filename); + } else + decomp = decompress_fdopen (dup (STDIN_FILENO)); + decompress_start (decomp); + + if (!gl_list_size (from_code)) { + char *lang, *page_encoding; + + /* Note that we don't need to explicitly check the page's + * preprocessor encoding here, as the manconv function will + * do that itself and override the requested input encoding + * with it if it finds one. + */ + lang = lang_dir (filename); + page_encoding = get_page_encoding (lang); + if (STREQ (page_encoding, "UTF-8")) { + /* Steal memory. */ + gl_list_add_last (from_code, page_encoding); + debug ("guessed input encoding %s for %s\n", + page_encoding, filename); + } else { + gl_list_add_last (from_code, xstrdup ("UTF-8")); + /* Steal memory. */ + gl_list_add_last (from_code, page_encoding); + debug ("guessed input encodings UTF-8:%s for %s\n", + page_encoding, filename); + } + + free (lang); + } + + if (manconv (decomp, from_code, to_code, NULL) != 0) + /* manconv already wrote an error message to stderr. Just + * exit non-zero. + */ + exit (FATAL); + + free (to_code); + gl_list_free (from_code); + + decompress_wait (decomp); + + sandbox_free (sandbox); + + return 0; +} |