diff options
Diffstat (limited to 'src/ult_src.c')
-rw-r--r-- | src/ult_src.c | 379 |
1 files changed, 379 insertions, 0 deletions
diff --git a/src/ult_src.c b/src/ult_src.c new file mode 100644 index 0000000..43e7a9b --- /dev/null +++ b/src/ult_src.c @@ -0,0 +1,379 @@ +/* + * ult_src.c: Find the ultimate source of a page + * + * Copyright (C) 1994, 1995 Graeme W. Wilford. (Wilf.) + * Copyright (C) 2001, 2002, 2003, 2004, 2006, 2007, 2008, 2009, 2010, 2011, + * 2012 Colin Watson. + * + * This file is part of man-db. + * + * man-db is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by + * the Free Software Foundation; either version 2 of the License, or + * (at your option) any later version. + * + * man-db is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with man-db; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + * code to seek out the original (ultimate) source man file for + * any specified man file. Soft and hard links and .so inclusions + * are traced. Use: reduce amount of cat files to a minimum. + * + * Mon May 2 11:14:28 BST 1994 Wilf. (G.Wilford@ee.surrey.ac.uk) + */ + +#ifdef HAVE_CONFIG_H +# include "config.h" +#endif /* HAVE_CONFIG_H */ + +#include <string.h> +#include <stdlib.h> +#include <stdio.h> +#include <ctype.h> +#include <sys/types.h> +#include <sys/stat.h> +#include <errno.h> +#include <assert.h> +#include <dirent.h> +#include <unistd.h> + +#include "canonicalize.h" +#include "dirname.h" +#include "error.h" +#include "gl_xlist.h" +#include "xvasprintf.h" + +#include "gettext.h" +#define _(String) gettext (String) + +#include "manconfig.h" + +#include "pipeline.h" +#include "decompress.h" + +#include "globbing.h" +#include "ult_src.h" + +/* Find minimum value hard link filename for given file and inode. + * Returns a newly allocated string. + */ +static char *ult_hardlink (const char *fullpath, ino_t inode) +{ + DIR *mdir; + struct dirent *manlist; + char *base, *dir, *ret; + const char *slash; + + slash = strrchr (fullpath, '/'); + assert (slash); + dir = xstrndup (fullpath, slash - fullpath); + base = xstrdup (++slash); + + mdir = opendir (dir); + if (mdir == NULL) { + if (quiet < 2) + error (0, errno, _("can't search directory %s"), dir); + free (dir); + free (base); + return NULL; + } + + while ((manlist = readdir (mdir))) { + if (manlist->d_ino == inode && + strcmp (base, manlist->d_name) > 0) { + free (base); + base = xstrdup (manlist->d_name); + debug ("ult_hardlink: (%s)\n", base); + } + } + closedir (mdir); + + /* If we already are the link with the smallest name value */ + /* return NULL */ + + if (strcmp (base, slash) == 0) { + free (dir); + free (base); + return NULL; + } + + ret = xasprintf ("%s/%s", dir, base); + free (dir); + free (base); + return ret; +} + +/* Resolve all symbolic links within 'fullpath'. + * Returns a newly allocated string. + */ +static char *ult_softlink (const char *fullpath) +{ + char *resolved_path; + + resolved_path = canonicalize_file_name (fullpath); + if (!resolved_path) { + /* discard the unresolved path */ + if (quiet < 2) { + if (errno == ENOENT) + error (0, 0, + _("warning: %s is a dangling symlink"), + fullpath); + else + error (0, errno, _("can't resolve %s"), + fullpath); + } + return NULL; + } + + debug ("ult_softlink: (%s)\n", resolved_path); + + return resolved_path; +} + +/* Test 'buffer' to see if it contains a .so include. If so and it's not an + * absolute filename, return newly allocated string whose contents are the + * include. + */ +static char *test_for_include (const char *buffer) +{ + if (!buffer) + return NULL; + + /* strip out any leading whitespace (if any) */ + while (CTYPE (isspace, *buffer)) + buffer++; + + /* see if the `command' is a .so */ + if (strncmp (buffer, ".so", 3) == 0) { + buffer += 3; + + /* strip out any whitespace between the command and + it's argumant */ + while (CTYPE (isspace, *buffer)) + buffer++; + + /* If .so's argument is an absolute filename, it could be + * either (i) a macro inclusion, (ii) a non local manual page + * or (iii) a (somewhat bogus) reference to a local manual + * page. + * + * If (i) or (ii), we must not follow the reference. (iii) is + * a problem with the manual page, thus we don't want to + * follow any absolute inclusions in our quest for the + * ultimate source file */ + if (*buffer != '/') { + const char *end = buffer; + while (*end && !CTYPE (isspace, *end)) + ++end; + return xstrndup (buffer, end - buffer); + } + } + return NULL; +} + +static char *find_include (const char *name, const char *path, + const char *include) +{ + char *ret; + char *dirname; + char *temp_file; + + /* Restore the original path from before ult_softlink() etc., in + * case it went outside the mantree. + */ + ret = xasprintf ("%s/%s", path, include); + + /* If the original path from above doesn't exist, try to create new + * path as if the "include" was relative to the current man page. + */ + if (CAN_ACCESS (ret, F_OK)) + return ret; + + dirname = dir_name (name); + temp_file = xasprintf ("%s/%s", dirname, include); + free (dirname); + + if (CAN_ACCESS (temp_file, F_OK)) { + /* Just plain include. */ + free (ret); + ret = canonicalize_file_name (temp_file); + } else { + /* Try globbing - the file suffix might be missing. */ + char *temp_file_asterisk = xasprintf ("%s*", temp_file); + gl_list_t candidate_files = expand_path (temp_file_asterisk); + + free (temp_file_asterisk); + if (gl_list_size (candidate_files)) { + const char *candidate_file = gl_list_get_at + (candidate_files, 0); + if (CAN_ACCESS (candidate_file, F_OK)) { + free (ret); + ret = canonicalize_file_name (candidate_file); + } + } + gl_list_free (candidate_files); + } + free (temp_file); + + return ret; +} + +/* + * recursive function which finds the ultimate source file by following + * any ".so filename" directives in the first line of the man pages. + * Also (optionally) traces symlinks and hard links(!). + * + * name is full pathname, path is the MANPATH directory (/usr/man) + * flags is a combination of SO_LINK | SOFT_LINK | HARD_LINK + */ +const char *ult_src (const char *name, const char *path, + struct stat *buf, int flags, gl_list_t trace) +{ + static char *base; /* must be static */ + static short recurse; /* must be static */ + + /* initialise the function */ + + if (trace) + gl_list_add_last (trace, xstrdup (name)); + + /* as ult_softlink() & ult_hardlink() do all of their respective + * resolving in one call, only need to sort them out once + */ + + if (recurse == 0) { + struct stat new_buf; + free (base); + base = xstrdup (name); + + debug ("\nult_src: File %s in mantree %s\n", name, path); + + /* If we don't have a buf, allocate and assign one */ + if (!buf && ((flags & SOFT_LINK) || (flags & HARD_LINK))) { + buf = &new_buf; + if (lstat (base, buf) == -1) { + if (quiet < 2) + error (0, errno, _("can't resolve %s"), + base); + return NULL; + } + } + + /* Permit semi local (inter-tree) soft links */ + if (flags & SOFT_LINK) { + assert (buf); /* initialised above */ + if (S_ISLNK (buf->st_mode)) { + /* Is a symlink, resolve it. */ + char *softlink = ult_softlink (base); + if (softlink) { + free (base); + base = softlink; + } else + return NULL; + } + } + + /* Only deal with local (inter-dir) HARD links */ + if (flags & HARD_LINK) { + assert (buf); /* initialised above */ + if (buf->st_nlink > 1) { + /* Has HARD links, find least value */ + char *hardlink = ult_hardlink (base, + buf->st_ino); + if (hardlink) { + free (base); + base = hardlink; + } + } + } + } + + /* keep a check on recursion level */ + else if (recurse == 10) { + if (quiet < 2) + error (0, 0, _("%s is self referencing"), name); + return NULL; + } + + if (flags & SO_LINK) { + const char *buffer; + char *decomp_base; + pipeline *decomp; + char *include; + struct stat st; + + if (stat (base, &st) < 0) { + struct compression *comp = comp_file (base); + + if (comp) { + free (base); + base = comp->stem; + comp->stem = NULL; /* steal memory */ + } else { + if (quiet < 2) + error (0, errno, _("can't open %s"), + base); + return NULL; + } + } + + /* base may change for recursive calls to ult_src, but + * decompress_open doesn't keep its own copy. + */ + decomp_base = xstrdup (base); + decomp = decompress_open (decomp_base); + if (!decomp) { + if (quiet < 2) + error (0, errno, _("can't open %s"), base); + free (decomp_base); + return NULL; + } + pipeline_start (decomp); + + /* make sure that we skip over any comments */ + do { + buffer = pipeline_readline (decomp); + } while (buffer && STRNEQ (buffer, ".\\\"", 3)); + + include = test_for_include (buffer); + if (include) { + char *new_name; + const char *ult; + + free (base); + base = find_include (name, path, include); + free (include); + + debug ("ult_src: points to %s\n", base); + + recurse++; + /* Take a copy; it's unwise to pass base directly to + * a recursive call, as it may be freed. + */ + new_name = xstrdup (base); + ult = ult_src (new_name, path, NULL, flags, trace); + free (new_name); + recurse--; + + pipeline_wait (decomp); + pipeline_free (decomp); + free (decomp_base); + return ult; + } + + pipeline_wait (decomp); + pipeline_free (decomp); + free (decomp_base); + } + + /* We have the ultimate source */ + if (trace) + gl_list_add_last (trace, xstrdup (base)); + return base; +} |