=head1 NAME Module::List - module `directory' listing =head1 SYNOPSIS use Module::List qw(list_modules); $id_modules = list_modules("Data::ID::", { list_modules => 1}); $prefixes = list_modules("", { list_prefixes => 1, recurse => 1 }); =head1 DESCRIPTION This module deals with the examination of the namespace of Perl modules. The contents of the module namespace is split across several physical directory trees, but this module hides that detail, providing instead a view of the abstract namespace. =cut package Module::List; { use 5.006; } use warnings; use strict; use Carp qw(croak); use File::Spec; use IO::Dir 1.03; our $VERSION = "0.004"; use parent "Exporter"; our @EXPORT_OK = qw(list_modules); =head1 FUNCTIONS =over =item list_modules(PREFIX, OPTIONS) This function generates a listing of the contents of part of the module namespace. The part of the namespace under the module name prefix PREFIX is examined, and information about it returned as specified by OPTIONS. Module names are handled by this function in standard bareword syntax. They are always fully-qualified; isolated name components are never used. A module name prefix is the part of a module name that comes before a component of the name, and so either ends with "::" or is the empty string. OPTIONS is a reference to a hash, the elements of which specify what is to be returned. The options are: =over =item list_modules Truth value, default false. If true, return names of modules in the relevant part of the namespace. =item list_prefixes Truth value, default false. If true, return module name prefixes in the relevant part of the namespace. Note that prefixes are returned if the corresponding directory exists, even if there is nothing in it. =item list_pod Truth value, default false. If true, return names of POD documentation files that are in the module namespace. =item trivial_syntax Truth value, default false. If false, only valid bareword names are permitted. If true, bareword syntax is ignored, and any "::"-separated name that can be turned into a correct filename by interpreting name components as filename components is permitted. This is of no use in listing actual Perl modules, because the illegal names can't be used in Perl, but some programs such as B use a "::"-separated name for the sake of appearance without really using bareword syntax. The loosened syntax applies both to the names returned and to the I parameter. Precisely, the `trivial syntax' is that each "::"-separated component cannot be "." or "..", cannot contain "::" or "/", and (except for the final component of a leaf name) cannot end with ":". This is precisely what is required to achieve a unique interconvertible "::"-separated path syntax on Unix. This criterion might change in the future on non-Unix systems, where the filename syntax differs. =item recurse Truth value, default false. If false, only names at the next level down from PREFIX (having one more component) are returned. If true, names at all lower levels are returned. =item use_pod_dir Truth value, default false. If false, POD documentation files are expected to be in the same directory that the corresponding module file would be in. If true, POD files may also be in a subdirectory of that named "C". (Any POD files in such a subdirectory will therefore be visible under two module names, one treating the "C" subdirectory level as part of the module name.) =item return_path Truth value, default false. If false, only the existence of requested items is reported. If true, the pathnames of the files in which they exist are reported. =back Note that the default behaviour, if an empty options hash is supplied, is to return nothing. You I specify what kind of information you want. The function returns a reference to a hash, the keys of which are the names of interest. By default, the value associated with each of these keys is undef. If additional information about each item was requested, the value for each item is a reference to a hash, containing some subset of these items: =over =item module_path Pathname of the module of this name. Specifically, this identifies the file that would be read in order to load the module. This may be a C<.pmc> file if one is available. Absent if there is no module. =item pod_path Pathname of the POD document of this name. Absent if there is no discrete POD document. (POD in a module file doesn't constitute a discrete POD document.) =item prefix_paths Reference to an array of the pathnames of the directories referenced by this prefix. The directories are listed in the order corresponding to @INC. Absent if this is not a prefix. =back =cut sub list_modules($$) { my($prefix, $options) = @_; my $trivial_syntax = $options->{trivial_syntax}; my($root_leaf_rx, $root_notleaf_rx); my($notroot_leaf_rx, $notroot_notleaf_rx); if($trivial_syntax) { $root_leaf_rx = $notroot_leaf_rx = qr#:?(?:[^/:]+:)*[^/:]+:?#; $root_notleaf_rx = $notroot_notleaf_rx = qr#:?(?:[^/:]+:)*[^/:]+#; } else { $root_leaf_rx = $root_notleaf_rx = qr/[a-zA-Z_][0-9a-zA-Z_]*/; $notroot_leaf_rx = $notroot_notleaf_rx = qr/[0-9a-zA-Z_]+/; } croak "bad module name prefix `$prefix'" unless $prefix =~ /\A(?:${root_notleaf_rx}:: (?:${notroot_notleaf_rx}::)*)?\z/x && $prefix !~ /(?:\A|[^:]::)\.\.?::/; my $list_modules = $options->{list_modules}; my $list_prefixes = $options->{list_prefixes}; my $list_pod = $options->{list_pod}; my $use_pod_dir = $options->{use_pod_dir}; return {} unless $list_modules || $list_prefixes || $list_pod; my $recurse = $options->{recurse}; my $return_path = $options->{return_path}; my @prefixes = ($prefix); my %seen_prefixes; my %results; while(@prefixes) { my $prefix = pop(@prefixes); my @dir_suffix = split(/::/, $prefix); my $module_rx = $prefix eq "" ? $root_leaf_rx : $notroot_leaf_rx; my $pmc_rx = qr/\A($module_rx)\.pmc\z/; my $pm_rx = qr/\A($module_rx)\.pm\z/; my $pod_rx = qr/\A($module_rx)\.pod\z/; my $dir_rx = $prefix eq "" ? $root_notleaf_rx : $notroot_notleaf_rx; $dir_rx = qr/\A$dir_rx\z/; foreach my $incdir (@INC) { my $dir = File::Spec->catdir($incdir, @dir_suffix); my $dh = IO::Dir->new($dir) or next; my @entries = $dh->read; $dh->close; if($list_modules) { foreach my $pmish_rx ($pmc_rx, $pm_rx) { foreach my $entry (@entries) { if($entry =~ $pmish_rx) { my $name = $prefix.$1; if($return_path) { my $path = File::Spec->catfile($dir, $entry); $results{$name} ||= {}; $results{$name}->{module_path} = $path unless exists($results{$name}->{module_path}); } else { $results{$name} = undef; } } } } } if($list_pod) { my @poddirs = [ $dir, \@entries ]; if($use_pod_dir) { my $pdir = File::Spec->catdir($dir, "pod"); my $pdh = IO::Dir->new($pdir); if($pdh) { push @poddirs, [ $pdir, [$pdh->read] ]; $pdh->close; } } foreach(@poddirs) { my($dir, $entries) = @$_; foreach my $entry (@$entries) { if($entry =~ $pod_rx) { my $name = $prefix.$1; if($return_path) { my $path = File::Spec->catfile($dir, $entry); $results{$name} ||= {}; $results{$name}->{pod_path} = $path unless exists($results{$name}->{pod_path}); } else { $results{$name} = undef; } } } } } if($list_prefixes || $recurse) { foreach my $entry (@entries) { if(File::Spec->no_upwards($entry) && $entry =~ $dir_rx && -d File::Spec->catdir($dir, $entry)) { my $newpfx = $prefix.$entry."::"; if($recurse && !exists($seen_prefixes{$newpfx})) { push @prefixes, $newpfx; $seen_prefixes{$newpfx} = undef; } if($list_prefixes) { if($return_path) { $results{$newpfx} ||= { prefix_paths => [] }; push @{$results{$newpfx}->{prefix_paths}}, File::Spec->catfile($dir, $entry); } else { $results{$newpfx} = undef; } } } } } } } return \%results; } =back =head1 SEE ALSO L =head1 AUTHOR Andrew Main (Zefram) =head1 COPYRIGHT Copyright (C) 2004, 2006, 2009, 2011, 2017 Andrew Main (Zefram) =head1 LICENSE This module is free software; you can redistribute it and/or modify it under the same terms as Perl itself. =cut 1;