# -*- perl -*- # Lintian::Index::Item -- Representation of path entry in a package # # Copyright (C) 2011 Niels Thykier # Copyright (C) 2020 Felix Lechner # # This program is free software; you can redistribute it and/or modify it # under the terms of the GNU General Public License as published by the Free # Software Foundation; either version 2 of the License, or (at your option) # any later version. # # This program is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for # more details. # # You should have received a copy of the GNU General Public License along with # this program. If not, see . package Lintian::Index::Item; use v5.20; use warnings; use utf8; use autodie qw(open); use Carp qw(croak confess); use Const::Fast; use Date::Parse qw(str2time); use List::SomeUtils qw(all); use Path::Tiny; use Syntax::Keyword::Try; use Text::Balanced qw(extract_delimited); use Unicode::UTF8 qw(valid_utf8 decode_utf8 encode_utf8); use Lintian::Pointer::Item; use Lintian::SlidingWindow; use Lintian::Util qw(normalize_link_target); use Moo; use namespace::clean; use constant { TYPE_FILE => 0x00_01_00_00, TYPE_HARDLINK => 0x00_02_00_00, TYPE_DIR => 0x00_04_00_00, TYPE_SYMLINK => 0x00_08_00_00, TYPE_BLOCK_DEV => 0x00_10_00_00, TYPE_CHAR_DEV => 0x00_20_00_00, TYPE_PIPE => 0x00_40_00_00, TYPE_OTHER => 0x00_80_00_00, TYPE_MASK => 0x00_ff_00_00, UNSAFE_PATH => 0x01_00_00_00, FS_PATH_IS_OK => 0x02_00_00_00, OPEN_IS_OK => 0x06_00_00_00, # Implies FS_PATH_IS_OK ACCESS_INFO => 0x07_00_00_00, # 0o6777 == 0xdff, which covers set[ug]id + sticky bit. Accordingly, # 0xffff should be more than sufficient for the foreseeable future. OPERM_MASK => 0x00_00_ff_ff, }; use overload ( q{""} => \&_as_string, 'qr' => \&_as_regex_ref, 'bool' => \&_bool, q{!} => \&_bool_not, q{.} => \&_str_concat, 'cmp' => \&_str_cmp, 'eq' => \&_str_eq, 'ne' => \&_str_ne, 'fallback' => 0, ); const my $EMPTY => q{}; const my $SPACE => q{ }; const my $SLASH => q{/}; const my $DOT => q{.}; const my $DOUBLE_DOT => q{..}; const my $DOUBLE_QUOTE => q{"}; const my $BACKSLASH => q{\\}; const my $HASHBANG => q{#!}; const my $MAXIMUM_LINK_DEPTH => 18; const my $BYTE_MAXIMUM => 255; const my $SINGLE_OCTAL_MASK => oct(7); const my $DUAL_OCTAL_MASK => oct(77); const my $ELF_MAGIC_SIZE => 4; const my $LINCITY_MAGIC_SIZE => 6; const my $SHELL_SCRIPT_MAGIC_SIZE => 2; const my $READ_BITS => oct(444); const my $WRITE_BITS => oct(222); const my $EXECUTABLE_BITS => oct(111); const my $SETUID => oct(4000); const my $SETGID => oct(2000); =head1 NAME Lintian::Index::Item - Lintian representation of a path entry in a package =head1 SYNOPSIS my ($name, $type, $dir) = ('lintian', 'source', '/path/to/entry'); =head1 INSTANCE METHODS =over 4 =item init_from_tar_output =item get_quoted_filename =item unescape_c_style =cut my $datepattern = qr/\d{4}-\d{2}-\d{2}/; my $timepattern = qr/\d{2}\:\d{2}(?:\:\d{2}(?:\.\d+)?)?/; my $symlinkpattern = qr/\s+->\s+/; my $hardlinkpattern = qr/\s+link\s+to\s+/; # adapted from https://www.perlmonks.org/?node_id=1056606 my %T = ( (map {chr() => chr} 0..$BYTE_MAXIMUM), (map {sprintf('%o',$_) => chr} 0..($BYTE_MAXIMUM & $SINGLE_OCTAL_MASK)), (map {sprintf('%02o',$_) => chr} 0..($BYTE_MAXIMUM & $DUAL_OCTAL_MASK)), (map {sprintf('%03o',$_) => chr} 0..$BYTE_MAXIMUM), (split //, "r\rn\nb\ba\af\ft\tv\013") ); sub unescape_c_style { my ($escaped) = @_; (my $result = $escaped) =~ s/\\([0-7]{1,3}|.)/$T{$1}/g; return $result; } sub get_quoted_filename { my ($unknown, $skip) = @_; # extract quoted file name my ($delimited, $extra) = extract_delimited($unknown, $DOUBLE_QUOTE, $skip, $BACKSLASH); return (undef, undef) unless defined $delimited; # drop quotes my $cstylename = substr($delimited, 1, (length $delimited) - 2); # convert c-style escapes my $name = unescape_c_style($cstylename); return ($name, $extra); } sub init_from_tar_output { my ($self, $line) = @_; chomp $line; # allow spaces in ownership and filenames (#895175 and #950589) my ($initial, $size, $date, $time, $remainder) = split(/\s+(\d+)\s+($datepattern)\s+($timepattern)\s+/, $line,2); die encode_utf8( $self->index->identifier . ": Cannot parse tar output: $line") unless all { defined } ($initial, $size, $date, $time, $remainder); $self->size($size); $self->date($date); $self->time($time); my ($permissions, $ownership) = split(/\s+/, $initial, 2); die encode_utf8($self->index->identifier .": Cannot parse permissions and ownership in tar output: $line") unless all { defined } ($permissions, $ownership); $self->perm($permissions); my ($owner, $group) = split(qr{/}, $ownership, 2); die encode_utf8($self->index->identifier . ": Cannot parse owner and group in tar output: $line") unless all { defined } ($owner, $group); $self->owner($owner); $self->group($group); my ($name, $extra) = get_quoted_filename($remainder, $EMPTY); die encode_utf8($self->index->identifier . ": Cannot parse file name in tar output: $line") unless all { defined } ($name, $extra); # strip relative prefix $name =~ s{^\./+}{}s; # slashes cannot appear in names but are sometimes doubled # as in emboss-explorer_2.2.0-10.dsc # better implemented in a Moo trigger on the attribute $name =~ s{/+}{/}g; # make sure directories end with a slash, except root $name .= $SLASH if length $name && $self->perm =~ / ^d /msx && $name !~ m{ /$ }msx; $self->name($name); # look for symbolic link target if ($self->perm =~ /^l/) { my ($linktarget, undef) = get_quoted_filename($extra, $symlinkpattern); die encode_utf8($self->index->identifier .": Cannot parse symbolic link target in tar output: $line") unless defined $linktarget; # do not remove multiple slashes from symlink targets # caught by symlink-has-double-slash, which is tested # leaves resolution of these links unsolved # do not strip relative prefix for symbolic links $self->link($linktarget); } # look for hard link target if ($self->perm =~ /^h/) { my ($linktarget, undef)= get_quoted_filename($extra, $hardlinkpattern); die encode_utf8($self->index->identifier . ": Cannot parse hard link target in tar output: $line") unless defined $linktarget; # strip relative prefix $linktarget =~ s{^\./+}{}s; # slashes cannot appear in names but are sometimes doubled # as in emboss-explorer_2.2.0-10.dsc # better implemented in a Moo trigger on the attribute, but requires # separate attributes for hard and symbolic link targets $linktarget =~ s{/+}{/}g; $self->link($linktarget); } return; } =item bytes_match(REGEX) Returns the matched string if REGEX matches the file's byte contents, or $EMPTY otherwise. =cut sub bytes_match { my ($self, $regex) = @_; return $EMPTY unless $self->is_file; return $EMPTY unless $self->is_open_ok; return $EMPTY unless length $regex; open(my $fd, '<:raw', $self->unpacked_path); my $sfd = Lintian::SlidingWindow->new; $sfd->handle($fd); my $match; while (my $block = $sfd->readwindow) { if ($block =~ /($regex)/) { $match = $1; last; } } close $fd; return $match // $EMPTY; } =item mentions_in_operation(REGEX) Returns the matched string if REGEX matches in a file location that is likely an operation (vs text), or $EMPTY otherwise. =cut sub mentions_in_operation { my ($self, $regex) = @_; # prefer strings(1) output (eg. for ELF) if we have it # may not work as expected on ELF due to ld's SHF_MERGE my $match; if (length $self->strings && $self->strings =~ /($regex)/) { $match = $1; } elsif ($self->is_script) { $match = $self->bytes_match($regex); } return $match // $EMPTY; } =item magic(COUNT) Returns the specified COUNT of magic bytes for the file. =cut sub magic { my ($self, $count) = @_; return $EMPTY if length $self->link; return $EMPTY if $self->size < $count; return $EMPTY unless $self->is_open_ok; my $magic; open(my $fd, '<', $self->unpacked_path); die encode_utf8($self->index->identifier . ": Could not read $count bytes from " . $self->name) unless read($fd, $magic, $count) == $count; close $fd; return $magic; } =item C Returns the C for the file if it is a script. =cut has hashbang => ( is => 'rw', lazy => 1, default => sub { my ($self) = @_; return $EMPTY unless $self->is_script; my $trimmed_bytes = $EMPTY; my $magic; open(my $fd, '<', $self->unpacked_path); if (read($fd, $magic, 2) && $magic eq $HASHBANG && !eof($fd)) { $trimmed_bytes = <$fd>; } close $fd; # decoding UTF-8 fails on magyarispell_1.6.1-2.dsc and ldc_1.24.0-1.dsc # remove comment, if any $trimmed_bytes =~ s/^([^#]*)/$1/; # trim both ends $trimmed_bytes =~ s/^\s+|\s+$//g; return $trimmed_bytes; } ); =item interpreter_with_options Returns the interpreter requested by a script with options after stripping C. =cut has interpreter_with_options => ( is => 'rw', lazy => 1, default => sub { my ($self) = @_; my $with_options = $self->hashbang; $with_options =~ s{^/usr/bin/env\s+}{}; return $with_options; } ); =item interpreter Returns the interpreter requested by a script but strips C. =cut has interpreter => ( is => 'rw', lazy => 1, default => sub { my ($self) = @_; my $interpreter = $self->interpreter_with_options; # keep base command without options $interpreter =~ s/^(\S+).*/$1/; return $interpreter; } ); =item C Returns true if file is a script that calls C. =cut has calls_env => ( is => 'rw', lazy => 1, default => sub { my ($self) = @_; # must return a boolean success value #943724 return 1 if $self->hashbang =~ m{^/usr/bin/env\s+}; return 0; } ); =item C Returns true if file is a script requesting a recognized shell interpreter. =cut has is_shell_script => ( is => 'rw', lazy => 1, default => sub { my ($self) = @_; my $interpreter = $self->interpreter; # keep basename my ($basename) = ($interpreter =~ m{([^/]*)/?$}s); return 1 if $basename =~ /^(?:[bd]?a|t?c|(?:pd|m)?k|z)?sh$/; return 0; } ); =item is_elf Returns true if file is an ELF executable, and false otherwise. =cut has is_elf => ( is => 'rw', lazy => 1, default => sub { my ($self) = @_; return 1 if $self->magic($ELF_MAGIC_SIZE) eq "\x7FELF"; return 0; } ); =item is_script Returns true if file is a script and false otherwise. =cut has is_script => ( is => 'rw', lazy => 1, default => sub { my ($self) = @_; # skip lincity data files; magic: #!#!#! return 0 if $self->magic($LINCITY_MAGIC_SIZE) eq '#!#!#!'; return 0 unless $self->magic($SHELL_SCRIPT_MAGIC_SIZE) eq $HASHBANG; return 1; } ); =item is_maintainer_script Returns true if file is a maintainer script and false otherwise. =cut has is_maintainer_script => ( is => 'rw', lazy => 1, default => sub { my ($self) = @_; return 1 if $self->name =~ /^ config | (?:pre|post)(?:inst|rm) $/x && $self->is_open_ok; return 0; } ); =item identity Returns the owner and group of the path, separated by a slash. NB: If only numerical owner information is available in the package, this may return a numerical owner (except uid 0 is always mapped to "root") =cut sub identity { my ($self) = @_; return $self->owner . $SLASH . $self->group; } =item operm Returns the file permissions of this object in octal (e.g. 0644). NB: This is only well defined for file entries that are subject to permissions (e.g. files). Particularly, the value is not well defined for symlinks. =cut sub operm { my ($self) = @_; return $self->path_info & OPERM_MASK; } =item octal_permissions =cut sub octal_permissions { my ($self) = @_; return sprintf('%04o', $self->operm); } =item children Returns a list of children (as Lintian::File::Path objects) of this entry. The list and its contents should not be modified. Only returns direct children of this directory. The entries are sorted by name. NB: Returns the empty list for non-dir entries. =cut sub children { my ($self) = @_; croak encode_utf8('No index in ' . $self->name) unless defined $self->index; my @names = values %{$self->childnames}; return map { $self->index->lookup($_) } @names; } =item descendants Returns a list of children (as Lintian::File::Path objects) of this entry. The list and its contents should not be modified. Descends recursively into subdirectories and return the descendants in breadth-first order. Children of a given directory will be sorted by name. NB: Returns the empty list for non-dir entries. =cut sub descendants { my ($self) = @_; my @descendants = $self->children; my @directories = grep { $_->is_dir } @descendants; push(@descendants, $_->descendants) for @directories; return @descendants; } =item timestamp Returns a Unix timestamp for the given path. This is a number of seconds since the start of Unix epoch in UTC. =cut sub timestamp { my ($self) = @_; my $timestamp = $self->date . $SPACE . $self->time; return str2time($timestamp, 'GMT'); } =item child(BASENAME) Returns the child named BASENAME if it is a child of this directory. Otherwise, this method returns C. Even for directories, BASENAME should not end with a slash. When invoked on non-dirs, this method always returns C. Example: $dir_entry->child('foo') => $entry OR undef =cut sub child { my ($self, $basename) = @_; croak encode_utf8('No index in ' . $self->name) unless defined $self->index; croak encode_utf8($self->index->identifier . ': Basename is required') unless length $basename; my $childname = $self->childnames->{$basename}; return undef unless $childname; return $self->index->lookup($childname); } =item is_symlink Returns a truth value if this entry is a symlink. =item is_hardlink Returns a truth value if this entry is a hardlink to a regular file. NB: The target of a hardlink is always a regular file (and not a dir etc.). =item is_dir Returns a truth value if this entry is a dir. NB: Unlike the "-d $dir" operator this will never return true for symlinks, even if the symlink points to a dir. =item is_file Returns a truth value if this entry is a regular file (or a hardlink to one). NB: Unlike the "-f $file" operator this will never return true for symlinks, even if the symlink points to a file (or hardlink). =item is_regular_file Returns a truth value if this entry is a regular file. This is eqv. to $path->is_file and not $path->is_hardlink. NB: Unlike the "-f $file" operator this will never return true for symlinks, even if the symlink points to a file. =cut sub is_symlink { my ($self) = @_; return $self->path_info & TYPE_SYMLINK ? 1 : 0; } sub is_hardlink { my ($self) = @_; return $self->path_info & TYPE_HARDLINK ? 1 : 0; } sub is_dir { my ($self) = @_; return $self->path_info & TYPE_DIR ? 1 : 0; } sub is_file { my ($self) = @_; return $self->path_info & (TYPE_FILE | TYPE_HARDLINK) ? 1 : 0; } sub is_regular_file { my ($self) = @_; return $self->path_info & TYPE_FILE ? 1 : 0; } =item link_normalized Returns the target of the link normalized against it's directory name. If the link cannot be normalized or normalized path might escape the package root, this method returns C. NB: This method will return the empty string for links pointing to the root dir of the package. Only available on "links" (i.e. symlinks or hardlinks). On non-links this will croak. I: If you want the symlink target as a L object, use the L method with no arguments instead. =cut has link_normalized => ( is => 'rw', lazy => 1, default => sub { my ($self) = @_; my $name = $self->name; my $link = $self->link; croak encode_utf8($self->index->identifier . ": $name is not a link") unless length $link; my $dir = $self->dirname; # hardlinks are always relative to the package root $dir = $SLASH if $self->is_hardlink; my $target = normalize_link_target($dir, $link); return $target; } ); =item is_readable Returns a truth value if the permission bits of this entry have at least one bit denoting readability set (bitmask 0444). =item is_writable Returns a truth value if the permission bits of this entry have at least one bit denoting writability set (bitmask 0222). =item is_executable Returns a truth value if the permission bits of this entry have at least one bit denoting executability set (bitmask 0111). =cut sub is_readable { my ($self) = @_; return $self->path_info & $READ_BITS; } sub is_writable { my ($self) = @_; return $self->path_info & $WRITE_BITS; } sub is_executable { my ($self) = @_; return $self->path_info & $EXECUTABLE_BITS; } =item all_bits_set =cut sub all_bits_set { my ($self, $bits) = @_; return ($self->operm & $bits) == $bits; } =item is_setuid =cut sub is_setuid { my ($self) = @_; return $self->operm & $SETUID; } =item is_setgid =cut sub is_setgid { my ($self) = @_; return $self->operm & $SETGID; } =item unpacked_path Returns the path to this object on the file system, which must be a regular file, a hardlink or a directory. This method may fail if: =over 4 =item * The object is neither a directory or a file-like object (e.g. a named pipe). =item * If the object is dangling symlink or the path traverses a symlink outside the package root. =back To test if this is safe to call, if the target is (supposed) to be a: =over 4 =item * file or hardlink then test with L. =item * dir then assert L returns a defined entry, for which L returns a truth value. =back =cut sub unpacked_path { my ($self) = @_; $self->_check_access; croak encode_utf8('No index in ' . $self->name) unless defined $self->index; my $basedir = $self->index->basedir; croak encode_utf8($self->index->identifier . ': No base directory') unless length $basedir; my $unpacked = path($basedir)->child($self->name)->stringify; # bug in perl, file operator should not care but does # https://github.com/Perl/perl5/issues/10550 # also, https://github.com/Perl/perl5/issues/9674 utf8::downgrade $unpacked; return $unpacked; } =item is_open_ok Returns a truth value if it is safe to attempt open a read handle to the underlying file object. Returns a truth value if the path may be opened. =cut sub is_open_ok { my ($self) = @_; my $path_info = $self->path_info; return 1 if ($path_info & OPEN_IS_OK) == OPEN_IS_OK; return 0 if $path_info & ACCESS_INFO; try { $self->_check_open; } catch { return 0; # perlcritic 1.140-1 requires the semicolon on the next line }; return 1; } sub _check_access { my ($self) = @_; my $path_info = $self->path_info; return 1 if ($path_info & FS_PATH_IS_OK) == FS_PATH_IS_OK; return 0 if $path_info & ACCESS_INFO; my $resolvable = $self->resolve_path; unless ($resolvable) { $self->path_info($self->path_info | UNSAFE_PATH); # NB: We are deliberately vague here to avoid suggesting # whether $path exists. In some cases (e.g. lintian.d.o) # the output is readily available to wider public. confess encode_utf8($self->index->identifier .': Attempt to access through broken or unsafe symlink: ' . $self->name); } $self->path_info($self->path_info | FS_PATH_IS_OK); return 1; } sub _check_open { my ($self) = @_; $self->_check_access; # Symlinks can point to a "non-file" object inside the # package root # Leave "_path_access" here as _check_access marks it either as # "UNSAFE_PATH" or "FS_PATH_IS_OK" confess encode_utf8($self->index->identifier .': Opening of irregular file not supported: ' . $self->name) unless $self->is_file || ($self->is_symlink && -e $self->unpacked_path); $self->path_info($self->path_info | OPEN_IS_OK); return 1; } =item follow Return dereferenced link if applicable =cut sub follow { my ($self, $maxlinks) = @_; return $self unless length $self->link; return $self->dereferenced if defined $self->dereferenced; # set limit $maxlinks //= $MAXIMUM_LINK_DEPTH; # catch recursive links return undef if $maxlinks <= 0; # reduce counter $maxlinks--; my $reference; croak encode_utf8('No index in ' . $self->name) unless defined $self->index; if ($self->is_hardlink) { # hard links are resolved against package root $reference = $self->index->lookup; } else { # otherwise resolve against the parent $reference = $self->parent_dir; } croak encode_utf8($self->index->identifier . ': No parent reference for link in ' . $self->name) unless defined $reference; # follow link my $dereferenced = $reference->resolve_path($self->link, $maxlinks); $self->dereferenced($dereferenced); return $self->dereferenced; } =item resolve_path([PATH]) Resolve PATH relative to this path entry. If PATH starts with a slash and the file hierarchy has a well-defined root directory, then PATH will instead be resolved relatively to the root dir. If the file hierarchy does not have a well-defined root dir (e.g. for source packages), this method will return C. If PATH is omitted, then the entry is resolved and the target is returned if it is valid. Except for symlinks, all entries always resolve to themselves. NB: hardlinks also resolve as themselves. It is an error to attempt to resolve a PATH against a non-directory and non-symlink entry - as such resolution would always fail (i.e. foo/../bar is an invalid path unless foo is a directory or a symlink to a dir). The resolution takes symlinks into account and following them provided that the target path is valid (and can be followed safely). If the path is invalid or circular (symlinks), escapes the root directory or follows an unsafe symlink, the method returns C. Otherwise, it returns the path entry that denotes the target path. If PATH contains at least one path segment and ends with a slash, then the resolved path will end in a directory (or fail). Otherwise, the resolved PATH can end in any entry I a symlink. Examples: $symlink_entry->resolve_path => $nonsymlink_entry OR undef $x->resolve_path => $x For directory or symlink entries (dol), you can also resolve a path: $dol_entry->resolve_path('some/../where') => $nonsymlink_entry OR undef # Note the trailing slash $dol_entry->resolve_path('some/../where/') => $dir_entry OR undef =cut sub resolve_path { my ($self, $request, $maxlinks) = @_; croak encode_utf8('No index in ' . $self->name) unless defined $self->index; croak encode_utf8( $self->index->identifier . ': Can only resolve string arguments') if defined $request && ref($request) ne $EMPTY; $request //= $EMPTY; if (length $self->link) { # follow the link my $dereferenced = $self->follow($maxlinks); return undef unless defined $dereferenced; # and use that to resolve the request return $dereferenced->resolve_path($request, $maxlinks); } my $reference; # check for absolute reference; remove slash if ($request =~ s{^/+}{}s) { # require anchoring for absolute references return undef unless $self->index->anchored; # get root entry $reference = $self->index->lookup; } elsif ($self->is_dir) { # directories are their own starting point $reference = $self; } else { # otherwise, use parent directory $reference = $self->parent_dir; } return undef unless defined $reference; # read first segment; strip all trailing slashes for recursive use if ($request =~ s{^([^/]+)/*}{}) { my $segment = $1; # single dot, or two slashes in a row return $reference->resolve_path($request, $maxlinks) if $segment eq $DOT || !length $segment; # for double dot, go up a level if ($segment eq $DOUBLE_DOT) { my $parent = $reference->parent_dir; return undef unless defined $parent; return $parent->resolve_path($request, $maxlinks); } # look for child otherwise my $child = $reference->child($segment); return undef unless defined $child; return $child->resolve_path($request, $maxlinks); } croak encode_utf8($self->index->identifier . ": Cannot parse path resolution request: $request") if length $request; # nothing else to resolve return $self; } =item name Returns the name of the file (relative to the package root). NB: It will never have any leading "./" (or "/") in it. =item basename Returns the "filename" part of the name, similar basename(1) or File::Basename::basename (without passing a suffix to strip in either case). NB: Returns the empty string for the "root" dir. =item dirname Returns the "directory" part of the name, similar to dirname(1) or File::Basename::dirname. The dirname will end with a trailing slash (except the "root" dir - see below). NB: Returns the empty string for the "root" dir. =item link If this is a link (i.e. is_symlink or is_hardlink returns a truth value), this method returns the target of the link. If this is not a link, then this returns undef. If the path is a symlink this method can be used to determine if the symlink is relative or absolute. This is I true for hardlinks, where the link target is always relative to the root. NB: Even for symlinks, a leading "./" will be stripped. =item normalized =item faux Returns a truth value if this entry absent in the package. This can happen if a package does not include all intermediate directories. =item size Returns the size of the path in bytes. NB: Only regular files can have a non-zero file size. =item date Return the modification date as YYYY-MM-DD. =item time =item perm =item path_info =item owner Returns the owner of the path entry as a username. NB: If only numerical owner information is available in the package, this may return a numerical owner (except uid 0 is always mapped to "root") =item group Returns the group of the path entry as a username. NB: If only numerical owner information is available in the package, this may return a numerical group (except gid 0 is always mapped to "root") =item uid Returns the uid of the owner of the path entry. NB: If the uid is not available, 0 will be returned. This usually happens if the numerical data is not collected (e.g. in source packages) =item gid Returns the gid of the owner of the path entry. NB: If the gid is not available, 0 will be returned. This usually happens if the numerical data is not collected (e.g. in source packages) =item file_type Return the data from L if it has been collected. Note this is only defined for files as Lintian only runs L on files. =item java_info =item strings =item C =item index =item parent_dir =item child_table =item sorted_children Returns the parent directory entry of this entry as a L. NB: Returns C for the "root" dir. =item C =item parent_dir Return the parent dir entry of this the path entry. =item dereferenced =cut has name => ( is => 'rw', lazy => 1, coerce => sub { my ($string) = @_; return $string // $EMPTY;}, trigger => sub { my ($self, $name) = @_; my ($basename) = ($name =~ m{([^/]*)/?$}s); $self->basename($basename); # allow newline in names; need /s for dot matching (#929729) my ($dirname) = ($name =~ m{^(.+/)?(?:[^/]+/?)$}s); $self->dirname($dirname); }, default => $EMPTY ); has basename => ( is => 'rw', lazy => 1, coerce => sub { my ($string) = @_; return $string // $EMPTY;}, default => $EMPTY ); has dirname => ( is => 'rw', lazy => 1, coerce => sub { my ($string) = @_; return $string // $EMPTY;}, default => $EMPTY ); has link => ( is => 'rw', coerce => sub { my ($string) = @_; return $string // $EMPTY;}, default => $EMPTY ); has normalized => ( is => 'rw', coerce => sub { my ($string) = @_; return $string // $EMPTY;}, default => $EMPTY ); has faux => (is => 'rw', default => 0); has size => (is => 'rw', default => 0); has date => ( is => 'rw', default => sub { my ($sec,$min,$hour,$mday,$mon,$year,$wday,$yday,$isdst) = gmtime; return sprintf('%04d-%02d-%02d', $year, $mon, $mday); } ); has time => ( is => 'rw', default => sub { my ($sec,$min,$hour,$mday,$mon,$year,$wday,$yday,$isdst) = gmtime; return sprintf('%02d:%02d:%02d', $hour, $min, $sec); } ); has perm => (is => 'rw'); has path_info => (is => 'rw'); has owner => ( is => 'rw', coerce => sub { my ($string) = @_; return $string // 'root'; }, default => 'root' ); has group => ( is => 'rw', coerce => sub { my ($string) = @_; return $string // 'root'; }, default => 'root' ); has uid => ( is => 'rw', coerce => sub { my ($value) = @_; return int($value // 0); }, default => 0 ); has gid => ( is => 'rw', coerce => sub { my ($value) = @_; return int($value // 0); }, default => 0 ); has md5sum => ( is => 'rw', coerce => sub { my ($checksum) = @_; return ($checksum // 0); }, default => 0 ); has file_type => ( is => 'rw', coerce => sub { my ($text) = @_; return ($text // $EMPTY); }, default => $EMPTY ); has java_info => ( is => 'rw', coerce => sub { my ($hashref) = @_; return ($hashref // {}); }, default => sub { {} } ); has strings => ( is => 'rw', coerce => sub { my ($text) = @_; return ($text // $EMPTY); }, default => $EMPTY ); has ar_info => ( is => 'rw', coerce => sub { my ($hashref) = @_; return ($hashref // {}); }, default => sub { {} } ); has index => (is => 'rw'); has childnames => (is => 'rw', default => sub { {} }); has parent_dir => ( is => 'rw', lazy => 1, default => sub { my ($self) = @_; # do not return root as its own parent return if $self->name eq $EMPTY; croak encode_utf8('No index in ' . $self->name) unless defined $self->index; # returns root by default return $self->index->lookup($self->dirname); } ); has dereferenced => (is => 'rw'); =item elf =cut sub elf { my ($self, @args) = @_; if (@args) { $self->index->elf_storage->{$self->name} = $args[0]; return (); } my %copy = %{$self->index->elf_storage->{$self->name} // {} }; return \%copy; } =item elf_by_member =cut sub elf_by_member { my ($self, @args) = @_; if (@args) { my $object_name = $args[0]; my $by_object = $args[1]; my $tmp = $self->index->elf_storage_by_member->{$self->name} // {}; $tmp->{$object_name} = $by_object; $self->index->elf_storage_by_member->{$self->name} = $tmp; return (); } my %copy = %{$self->index->elf_storage_by_member->{$self->name} // {} }; return \%copy; } =item pointer =cut sub pointer { my ($self, $position) = @_; my $pointer = Lintian::Pointer::Item->new; $pointer->item($self); $pointer->position($position); return $pointer; } =item bytes Returns verbatim file contents as a scalar. =item is_valid_utf8 Boolean true if file contents are valid UTF-8. =item decoded_utf8 Returns a decoded, wide-character string if file contents are valid UTF-8. =cut sub bytes { my ($self) = @_; return $EMPTY unless $self->is_open_ok; my $bytes = path($self->unpacked_path)->slurp; return $bytes; } sub is_valid_utf8 { my ($self) = @_; my $bytes = $self->bytes; return 0 unless defined $bytes; return valid_utf8($bytes); } sub decoded_utf8 { my ($self) = @_; return $EMPTY unless $self->is_valid_utf8; return decode_utf8($self->bytes); } ### OVERLOADED OPERATORS ### # overload apparently does not like the mk_ro_accessor, so use a level # of indirection sub _as_regex_ref { my ($self) = @_; my $name = $self->name; return qr{ \Q$name\E }xsm; } sub _as_string { my ($self) = @_; return $self->name; } sub _bool { # Always true (used in "if ($info->index('some/path')) {...}") return 1; } sub _bool_not { my ($self) = @_; return !$self->_bool; } sub _str_cmp { my ($self, $str, $swap) = @_; return $str cmp $self->name if $swap; return $self->name cmp $str; } sub _str_concat { my ($self, $str, $swap) = @_; return $str . $self->name if $swap; return $self->name . $str; } sub _str_eq { my ($self, $str) = @_; return $self->name eq $str; } sub _str_ne { my ($self, $str) = @_; return $self->name ne $str; } =back =head1 AUTHOR Originally written by Niels Thykier for Lintian. =head1 SEE ALSO lintian(1) =cut 1; # Local Variables: # indent-tabs-mode: nil # cperl-indent-level: 4 # End: # vim: syntax=perl sw=4 sts=4 sr et