From 4a6ceffb98a0b785494f680d3776c4bfc4052f9e Mon Sep 17 00:00:00 2001 From: "berkeviktor@aol.com" Date: Thu, 24 Feb 2011 04:14:30 +0100 Subject: add xchat r1489 --- plugins/perl/lib/Pod/Html.pm | 2399 ++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 2399 insertions(+) create mode 100644 plugins/perl/lib/Pod/Html.pm (limited to 'plugins/perl/lib/Pod/Html.pm') diff --git a/plugins/perl/lib/Pod/Html.pm b/plugins/perl/lib/Pod/Html.pm new file mode 100644 index 00000000..3695564b --- /dev/null +++ b/plugins/perl/lib/Pod/Html.pm @@ -0,0 +1,2399 @@ +package Pod::Html; +use strict; +require Exporter; + +use vars qw($VERSION @ISA @EXPORT @EXPORT_OK); +$VERSION = 1.08; +@ISA = qw(Exporter); +@EXPORT = qw(pod2html htmlify); +@EXPORT_OK = qw(anchorify); + +use Carp; +use Config; +use Cwd; +use File::Spec; +use File::Spec::Unix; +use Getopt::Long; + +use locale; # make \w work right in non-ASCII lands + +=head1 NAME + +Pod::Html - module to convert pod files to HTML + +=head1 SYNOPSIS + + use Pod::Html; + pod2html([options]); + +=head1 DESCRIPTION + +Converts files from pod format (see L) to HTML format. It +can automatically generate indexes and cross-references, and it keeps +a cache of things it knows how to cross-reference. + +=head1 FUNCTIONS + +=head2 pod2html + + pod2html("pod2html", + "--podpath=lib:ext:pod:vms", + "--podroot=/usr/src/perl", + "--htmlroot=/perl/nmanual", + "--libpods=perlfunc:perlguts:perlvar:perlrun:perlop", + "--recurse", + "--infile=foo.pod", + "--outfile=/perl/nmanual/foo.html"); + +pod2html takes the following arguments: + +=over 4 + +=item backlink + + --backlink="Back to Top" + +Adds "Back to Top" links in front of every C heading (except for +the first). By default, no backlinks are generated. + +=item cachedir + + --cachedir=name + +Creates the item and directory caches in the given directory. + +=item css + + --css=stylesheet + +Specify the URL of a cascading style sheet. Also disables all HTML/CSS +C + + + +$block +END_OF_HEAD + + # load/reload/validate/cache %Pages and %Items + get_cache( $Dircache, $Itemcache, \@Podpath, $Podroot, $Recurse ); + + # scan the pod for =item directives + scan_items( \%Local_Items, "", @poddata ); + + # put an index at the top of the file. note, if $Doindex is 0 we + # still generate an index, but surround it with an html comment. + # that way some other program can extract it if desired. + $index =~ s/--+/-/g; + + my $hr = ( $Doindex and $index ) ? qq(

) : ""; + + unless ($Doindex) { + $index = qq(\n); + } + + print HTML << "END_OF_INDEX"; + + +

+$index +$hr +

+ + +END_OF_INDEX + + # now convert this file + my $after_item; # set to true after an =item + my $need_dd = 0; + warn "Converting input file $Podfile\n" if $Verbose; + foreach my $i ( 0 .. $#poddata ) { + $_ = $poddata[$i]; + $Paragraph = $i + 1; + if (/^(=.*)/s) { # is it a pod directive? + $Ignore = 0; + $after_item = 0; + $need_dd = 0; + $_ = $1; + if (/^=begin\s+(\S+)\s*(.*)/si) { # =begin + process_begin( $1, $2 ); + } elsif (/^=end\s+(\S+)\s*(.*)/si) { # =end + process_end( $1, $2 ); + } elsif (/^=cut/) { # =cut + process_cut(); + } elsif (/^=pod/) { # =pod + process_pod(); + } else { + next if @Begin_Stack && $Begin_Stack[-1] ne 'html'; + + if (/^=(head[1-6])\s+(.*\S)/s) { # =head[1-6] heading + process_head( $1, $2, $Doindex && $index ); + } elsif (/^=item\s*(.*\S)?/sm) { # =item text + $need_dd = process_item($1); + $after_item = 1; + } elsif (/^=over\s*(.*)/) { # =over N + process_over(); + } elsif (/^=back/) { # =back + process_back($need_dd); + } elsif (/^=for\s+(\S+)\s*(.*)/si) { # =for + process_for( $1, $2 ); + } else { + /^=(\S*)\s*/; + warn "$0: $Podfile: unknown pod directive '$1' in " + . "paragraph $Paragraph. ignoring.\n" + unless $Quiet; + } + } + $Top = 0; + } else { + next if $Ignore; + next if @Begin_Stack && $Begin_Stack[-1] ne 'html'; + print HTML and next if @Begin_Stack && $Begin_Stack[-1] eq 'html'; + print HTML "

\n" if $need_dd; + my $text = $_; + if ( $text =~ /\A\s+/ ) { + process_pre( \$text ); + print HTML "

\n$text

\n"; + + } else { + process_text( \$text ); + + # experimental: check for a paragraph where all lines + # have some ...\t...\t...\n pattern + if ( $text =~ /\t/ ) { + my @lines = split( "\n", $text ); + if ( @lines > 1 ) { + my $all = 2; + foreach my $line (@lines) { + if ( $line =~ /\S/ && $line !~ /\t/ ) { + $all--; + last if $all == 0; + } + } + if ( $all > 0 ) { + $text =~ s/\t+//g; + $text =~ s/^//gm; + $text = + '' + . $text + . '

'; + } + } + } + ## end of experimental + + if ($after_item) { + $After_Lpar = 1; + } + print HTML "

$text

\n"; + } + print HTML "

\n" if $need_dd; + $after_item = 0; + } + } + + # finish off any pending directives + finish_list(); + + # link to page index + print HTML "

$Backlink

\n" + if $Doindex + and $index + and $Backlink; + + print HTML < + + +END_OF_TAIL + + # close the html file + close(HTML); + + warn "Finished\n" if $Verbose; +} + +############################################################################## + +sub usage { + my $podfile = shift; + warn "$0: $podfile: @_\n" if @_; + die < --infile= --outfile= + --podpath=:...: --podroot= + --libpods=:...: --recurse --verbose --index + --netscape --norecurse --noindex --cachedir= + + --backlink - set text for "back to top" links (default: none). + --cachedir - directory for the item and directory cache files. + --css - stylesheet URL + --flush - flushes the item and directory caches. + --[no]header - produce block header/footer (default is no headers). + --help - prints this message. + --hiddendirs - search hidden directories in podpath + --htmldir - directory for resulting HTML files. + --htmlroot - http-server base directory from which all relative paths + in podpath stem (default is /). + --[no]index - generate an index at the top of the resulting html + (default behaviour). + --infile - filename for the pod to convert (input taken from stdin + by default). + --libpods - colon-separated list of pages to search for =item pod + directives in as targets of C<> and implicit links (empty + by default). note, these are not filenames, but rather + page names like those that appear in L<> links. + --outfile - filename for the resulting html file (output sent to + stdout by default). + --podpath - colon-separated list of directories containing library + pods (empty by default). + --podroot - filesystem base directory from which all relative paths + in podpath stem (default is .). + --[no]quiet - suppress some benign warning messages (default is off). + --[no]recurse - recurse on those subdirectories listed in podpath + (default behaviour). + --title - title that will appear in resulting html file. + --[no]verbose - self-explanatory (off by default). + --[no]netscape - deprecated, has no effect. for backwards compatibility only. + +END_OF_USAGE + +} + +sub parse_command_line { + my ( + $opt_backlink, $opt_cachedir, $opt_css, $opt_flush, + $opt_header, $opt_help, $opt_htmldir, $opt_htmlroot, + $opt_index, $opt_infile, $opt_libpods, $opt_netscape, + $opt_outfile, $opt_podpath, $opt_podroot, $opt_quiet, + $opt_recurse, $opt_title, $opt_verbose, $opt_hiddendirs + ); + + unshift @ARGV, split ' ', $Config{pod2html} if $Config{pod2html}; + my $result = GetOptions( + 'backlink=s' => \$opt_backlink, + 'cachedir=s' => \$opt_cachedir, + 'css=s' => \$opt_css, + 'flush' => \$opt_flush, + 'header!' => \$opt_header, + 'help' => \$opt_help, + 'hiddendirs!' => \$opt_hiddendirs, + 'htmldir=s' => \$opt_htmldir, + 'htmlroot=s' => \$opt_htmlroot, + 'index!' => \$opt_index, + 'infile=s' => \$opt_infile, + 'libpods=s' => \$opt_libpods, + 'netscape!' => \$opt_netscape, + 'outfile=s' => \$opt_outfile, + 'podpath=s' => \$opt_podpath, + 'podroot=s' => \$opt_podroot, + 'quiet!' => \$opt_quiet, + 'recurse!' => \$opt_recurse, + 'title=s' => \$opt_title, + 'verbose!' => \$opt_verbose, + ); + usage( "-", "invalid parameters" ) if not $result; + + usage("-") if defined $opt_help; # see if the user asked for help + $opt_help = ""; # just to make -w shut-up. + + @Podpath = split( ":", $opt_podpath ) if defined $opt_podpath; + @Libpods = split( ":", $opt_libpods ) if defined $opt_libpods; + + $Backlink = $opt_backlink if defined $opt_backlink; + $Cachedir = $opt_cachedir if defined $opt_cachedir; + $Css = $opt_css if defined $opt_css; + $Header = $opt_header if defined $opt_header; + $Htmldir = $opt_htmldir if defined $opt_htmldir; + $Htmlroot = $opt_htmlroot if defined $opt_htmlroot; + $Doindex = $opt_index if defined $opt_index; + $Podfile = $opt_infile if defined $opt_infile; + $HiddenDirs = $opt_hiddendirs if defined $opt_hiddendirs; + $Htmlfile = $opt_outfile if defined $opt_outfile; + $Podroot = $opt_podroot if defined $opt_podroot; + $Quiet = $opt_quiet if defined $opt_quiet; + $Recurse = $opt_recurse if defined $opt_recurse; + $Title = $opt_title if defined $opt_title; + $Verbose = $opt_verbose if defined $opt_verbose; + + warn "Flushing item and directory caches\n" + if $opt_verbose && defined $opt_flush; + $Dircache = "$Cachedir/pod2htmd.tmp"; + $Itemcache = "$Cachedir/pod2htmi.tmp"; + if ( defined $opt_flush ) { + 1 while unlink( $Dircache, $Itemcache ); + } +} + +my $Saved_Cache_Key; + +sub get_cache { + my ( $dircache, $itemcache, $podpath, $podroot, $recurse ) = @_; + my @cache_key_args = @_; + + # A first-level cache: + # Don't bother reading the cache files if they still apply + # and haven't changed since we last read them. + + my $this_cache_key = cache_key(@cache_key_args); + + return if $Saved_Cache_Key and $this_cache_key eq $Saved_Cache_Key; + + # load the cache of %Pages and %Items if possible. $tests will be + # non-zero if successful. + my $tests = 0; + if ( -f $dircache && -f $itemcache ) { + warn "scanning for item cache\n" if $Verbose; + $tests = load_cache( $dircache, $itemcache, $podpath, $podroot ); + } + + # if we didn't succeed in loading the cache then we must (re)build + # %Pages and %Items. + if ( !$tests ) { + warn "scanning directories in pod-path\n" if $Verbose; + scan_podpath( $podroot, $recurse, 0 ); + } + $Saved_Cache_Key = cache_key(@cache_key_args); +} + +sub cache_key { + my ( $dircache, $itemcache, $podpath, $podroot, $recurse ) = @_; + return join( '!', + $dircache, $itemcache, $recurse, @$podpath, $podroot, stat($dircache), + stat($itemcache) ); +} + +# +# load_cache - tries to find if the caches stored in $dircache and $itemcache +# are valid caches of %Pages and %Items. if they are valid then it loads +# them and returns a non-zero value. +# +sub load_cache { + my ( $dircache, $itemcache, $podpath, $podroot ) = @_; + my ($tests); + local $_; + + $tests = 0; + + open( CACHE, "<$itemcache" ) + || die "$0: error opening $itemcache for reading: $!\n"; + $/ = "\n"; + + # is it the same podpath? + $_ = ; + chomp($_); + $tests++ if ( join( ":", @$podpath ) eq $_ ); + + # is it the same podroot? + $_ = ; + chomp($_); + $tests++ if ( $podroot eq $_ ); + + # load the cache if its good + if ( $tests != 2 ) { + close(CACHE); + return 0; + } + + warn "loading item cache\n" if $Verbose; + while () { + /(.*?) (.*)$/; + $Items{$1} = $2; + } + close(CACHE); + + warn "scanning for directory cache\n" if $Verbose; + open( CACHE, "<$dircache" ) + || die "$0: error opening $dircache for reading: $!\n"; + $/ = "\n"; + $tests = 0; + + # is it the same podpath? + $_ = ; + chomp($_); + $tests++ if ( join( ":", @$podpath ) eq $_ ); + + # is it the same podroot? + $_ = ; + chomp($_); + $tests++ if ( $podroot eq $_ ); + + # load the cache if its good + if ( $tests != 2 ) { + close(CACHE); + return 0; + } + + warn "loading directory cache\n" if $Verbose; + while () { + /(.*?) (.*)$/; + $Pages{$1} = $2; + } + + close(CACHE); + + return 1; +} + +# +# scan_podpath - scans the directories specified in @podpath for directories, +# .pod files, and .pm files. it also scans the pod files specified in +# @Libpods for =item directives. +# +sub scan_podpath { + my ( $podroot, $recurse, $append ) = @_; + my ( $pwd, $dir ); + my ( $libpod, $dirname, $pod, @files, @poddata ); + + unless ($append) { + %Items = (); + %Pages = (); + } + + # scan each directory listed in @Podpath + $pwd = getcwd(); + chdir($podroot) + || die "$0: error changing to directory $podroot: $!\n"; + foreach $dir (@Podpath) { + scan_dir( $dir, $recurse ); + } + + # scan the pods listed in @Libpods for =item directives + foreach $libpod (@Libpods) { + + # if the page isn't defined then we won't know where to find it + # on the system. + next unless defined $Pages{$libpod} && $Pages{$libpod}; + + # if there is a directory then use the .pod and .pm files within it. + # NOTE: Only finds the first so-named directory in the tree. + # if ($Pages{$libpod} =~ /([^:]*[^(\.pod|\.pm)]):/) { + if ( $Pages{$libpod} =~ /([^:]*(?; + close(POD); + clean_data( \@poddata ); + + scan_items( \%Items, "$dirname/$pod", @poddata ); + } + + # use the names of files as =item directives too. +### Don't think this should be done this way - confuses issues.(WL) +### foreach $pod (@files) { +### $pod =~ /^(.*)(\.pod|\.pm)$/; +### $Items{$1} = "$dirname/$1.html" if $1; +### } + } elsif ( $Pages{$libpod} =~ /([^:]*\.pod):/ + || $Pages{$libpod} =~ /([^:]*\.pm):/ ) + { + + # scan the .pod or .pm file for =item directives + $pod = $1; + open( POD, "<$pod" ) + || die "$0: error opening $pod for input: $!\n"; + @poddata = ; + close(POD); + clean_data( \@poddata ); + + scan_items( \%Items, "$pod", @poddata ); + } else { + warn "$0: shouldn't be here (line " . __LINE__ . "\n" unless $Quiet; + } + } + @poddata = (); # clean-up a bit + + chdir($pwd) + || die "$0: error changing to directory $pwd: $!\n"; + + # cache the item list for later use + warn "caching items for later use\n" if $Verbose; + open( CACHE, ">$Itemcache" ) + || die "$0: error open $Itemcache for writing: $!\n"; + + print CACHE join( ":", @Podpath ) . "\n$podroot\n"; + foreach my $key ( keys %Items ) { + print CACHE "$key $Items{$key}\n"; + } + + close(CACHE); + + # cache the directory list for later use + warn "caching directories for later use\n" if $Verbose; + open( CACHE, ">$Dircache" ) + || die "$0: error open $Dircache for writing: $!\n"; + + print CACHE join( ":", @Podpath ) . "\n$podroot\n"; + foreach my $key ( keys %Pages ) { + print CACHE "$key $Pages{$key}\n"; + } + + close(CACHE); +} + +# +# scan_dir - scans the directory specified in $dir for subdirectories, .pod +# files, and .pm files. notes those that it finds. this information will +# be used later in order to figure out where the pages specified in L<> +# links are on the filesystem. +# +sub scan_dir { + my ( $dir, $recurse ) = @_; + my ( $t, @subdirs, @pods, $pod, $dirname, @dirs ); + local $_; + + @subdirs = (); + @pods = (); + + opendir( DIR, $dir ) + || die "$0: error opening directory $dir: $!\n"; + while ( defined( $_ = readdir(DIR) ) ) { + if ( -d "$dir/$_" + && $_ ne "." + && $_ ne ".." + && ( $HiddenDirs || !/^\./ ) ) + { # directory + $Pages{$_} = "" unless defined $Pages{$_}; + $Pages{$_} .= "$dir/$_:"; + push( @subdirs, $_ ); + } elsif (/\.pod\z/) { # .pod + s/\.pod\z//; + $Pages{$_} = "" unless defined $Pages{$_}; + $Pages{$_} .= "$dir/$_.pod:"; + push( @pods, "$dir/$_.pod" ); + } elsif (/\.html\z/) { # .html + s/\.html\z//; + $Pages{$_} = "" unless defined $Pages{$_}; + $Pages{$_} .= "$dir/$_.pod:"; + } elsif (/\.pm\z/) { # .pm + s/\.pm\z//; + $Pages{$_} = "" unless defined $Pages{$_}; + $Pages{$_} .= "$dir/$_.pm:"; + push( @pods, "$dir/$_.pm" ); + } elsif ( -T "$dir/$_" ) { # script(?) + local *F; + if ( open( F, "$dir/$_" ) ) { + my $line; + while ( defined( $line = ) ) { + if ( $line =~ /^=(?:pod|head1)/ ) { + $Pages{$_} = "" unless defined $Pages{$_}; + $Pages{$_} .= "$dir/$_.pod:"; + last; + } + } + close(F); + } + } + } + closedir(DIR); + + # recurse on the subdirectories if necessary + if ($recurse) { + foreach my $subdir (@subdirs) { + scan_dir( "$dir/$subdir", $recurse ); + } + } +} + +# +# scan_headings - scan a pod file for head[1-6] tags, note the tags, and +# build an index. +# +sub scan_headings { + my ( $sections, @data ) = @_; + my ( $tag, $which_head, $otitle, $listdepth, $index ); + + local $Ignore = 0; + + $listdepth = 0; + $index = ""; + + # scan for =head directives, note their name, and build an index + # pointing to each of them. + foreach my $line (@data) { + if ( $line =~ /^=(head)([1-6])\s+(.*)/ ) { + ( $tag, $which_head, $otitle ) = ( $1, $2, $3 ); + + my $title = depod($otitle); + my $name = anchorify($title); + $$sections{$name} = 1; + $title = process_text( \$otitle ); + + while ( $which_head != $listdepth ) { + if ( $which_head > $listdepth ) { + $index .= "\n" + . ( "\t" x ($listdepth) ) + . ( $listdepth > 0 ? qq{

\n} + . "\t"x($listdepth + 1): "" ) + . "

"; + $listdepth++; + } elsif ( $which_head < $listdepth ) { + $listdepth--; + $index .= "\n" + . ( "\t" x $listdepth ) + . ( $listdepth > 0 ? "\t" : "" ) + . "" + . ( $listdepth >= 0 ? "\n" . ("\t"x$listdepth) + . "

" : "" ) + . "\n"; + } + } + + $index .= "\n" + . ( "\t" x $listdepth ) . "

" + . "" + . $title + . "

"; + } + } + + # finish off the lists + while ( $listdepth-- ) { + $index .= "\n" . ( "\t" x $listdepth ) + . ($listdepth > 0 ? "\t" : "") + ."\n" + . ($listdepth > 0 ? ("\t" x $listdepth) . "" : "" ); + } + + # get rid of bogus lists + $index =~ s,\t*

\s*\n,,g; + + return $index; +} + +# +# scan_items - scans the pod specified by $pod for =item directives. we +# will use this information later on in resolving C<> links. +# +sub scan_items { + my ( $itemref, $pod, @poddata ) = @_; + my ( $i, $item ); + local $_; + + $pod =~ s/\.pod\z//; + $pod .= ".html" if $pod; + + foreach $i ( 0 .. $#poddata ) { + my $txt = depod( $poddata[$i] ); + + # figure out what kind of item it is. + # Build string for referencing this item. + if ( $txt =~ /\A=item\s+\*\s*(.*)\Z/s ) { # bullet + next unless $1; + $item = $1; + } elsif ( $txt =~ /\A=item\s+(?>\d+\.?)\s*(.*)\Z/s ) { # numbered list + $item = $1; + } elsif ( $txt =~ /\A=item\s+(.*)\Z/s ) { # plain item + $item = $1; + } else { + next; + } + my $fid = fragment_id($item); + $$itemref{$fid} = "$pod" if $fid; + } +} + +# +# process_head - convert a pod head[1-6] tag and convert it to HTML format. +# +sub process_head { + my ( $tag, $heading, $hasindex ) = @_; + + # figure out the level of the =head + $tag =~ /head([1-6])/; + my $level = $1; + + if ($Listlevel) { + warn +"$0: $Podfile: unterminated list at =head in paragraph $Paragraph. ignoring.\n" + unless $Quiet; + while ($Listlevel) { + process_back(); + } + } + + print HTML "

\n"; + if ( $level == 1 && !$Top ) { + print HTML "$Backlink\n" + if $hasindex and $Backlink; + print HTML "

\n"; + } else { + print HTML "

\n"; + } + + my $name = anchorify( depod($heading) ); + my $convert = process_text( \$heading ); + $convert =~ s{]+>}{}g; + print HTML "$convert\n"; +} + +# +# emit_item_tag - print an =item's text +# Note: The global $EmittedItem is used for inhibiting self-references. +# +my $EmittedItem; + +sub emit_item_tag($$$) { + my ( $otext, $text, $compact ) = @_; + my $item = fragment_id( depod($text), -generate ); + Carp::confess( "Undefined fragment '$text' (" + . depod($text) + . ") from fragment_id() in emit_item_tag() in $Podfile" ) + if !defined $item; + $EmittedItem = $item; + ### print STDERR "emit_item_tag=$item ($text)\n"; + + print HTML ''; + if ( $Items_Named{$item}++ ) { + print HTML process_text( \$otext ); + } else { + my $name = $item; + $name = anchorify($name); + print HTML +#qq{}, + process_text( \$otext ), + # '' + ; + } + print HTML "\n"; + undef($EmittedItem); +} + +sub emit_li { + my ($tag) = @_; + if ( $Items_Seen[$Listlevel]++ == 0 ) { + push( @Listend, "" ); + print HTML "<$tag>\n"; + } + my $emitted = $tag eq 'dl' ? 'dt' : 'li'; + print HTML "<$emitted>"; + return $emitted; +} + +# +# process_item - convert a pod item tag and convert it to HTML format. +# +sub process_item { + my ($otext) = @_; + my $need_dd = 0; # set to 1 if we need a

after an item + + # lots of documents start a list without doing an =over. this is + # bad! but, the proper thing to do seems to be to just assume + # they did do an =over. so warn them once and then continue. + if ( $Listlevel == 0 ) { + warn +"$0: $Podfile: unexpected =item directive in paragraph $Paragraph. ignoring.\n" + unless $Quiet; + process_over(); + } + + # formatting: insert a paragraph if preceding item has >1 paragraph + if ($After_Lpar) { + print HTML $need_dd ? "\n" : "\n" if $After_Lpar; + $After_Lpar = 0; + } + + # remove formatting instructions from the text + my $text = depod($otext); + + my $emitted; # the tag actually emitted, used for closing + + # all the list variants: + if ( $text =~ /\A\*/ ) { # bullet + $emitted = emit_li('ul'); + if ( $text =~ /\A\*\s+(\S.*)\Z/s ) { # with additional text + my $tag = $1; + $otext =~ s/\A\*\s+//; + emit_item_tag( $otext, $tag, 1 ); + } + print HTML "" + } elsif ( $text =~ /\A\d+/ ) { # numbered list + $emitted = emit_li('ol'); + if ( $text =~ /\A(?>\d+\.?)\s*(\S.*)\Z/s ) { # with additional text + my $tag = $1; + $otext =~ s/\A\d+\.?\s*//; + emit_item_tag( $otext, $tag, 1 ); + } + print HTML ""; + } else { # definition list + $emitted = emit_li('dl'); + if ( $text =~ /\A(.+)\Z/s ) { # should have text + emit_item_tag( $otext, $text, 1 ); + } + $need_dd = 1; + } + print HTML "\n"; + return $need_dd; +} + +# +# process_over - process a pod over tag and start a corresponding HTML list. +# +sub process_over { + + # start a new list + $Listlevel++; + push( @Items_Seen, 0 ); + $After_Lpar = 0; +} + +# +# process_back - process a pod back tag and convert it to HTML format. +# +sub process_back { + my $need_dd = shift; + if ( $Listlevel == 0 ) { + warn +"$0: $Podfile: unexpected =back directive in paragraph $Paragraph. ignoring.\n" + unless $Quiet; + return; + } + + # close off the list. note, I check to see if $Listend[$Listlevel] is + # defined because an =item directive may have never appeared and thus + # $Listend[$Listlevel] may have never been initialized. + $Listlevel--; + if ( defined $Listend[$Listlevel] ) { + print HTML $need_dd ? "\n" : "\n" if $After_Lpar; + print HTML $Listend[$Listlevel]; + print HTML "\n"; + pop(@Listend); + } + $After_Lpar = 0; + + # clean up item count + pop(@Items_Seen); +} + +# +# process_cut - process a pod cut tag, thus start ignoring pod directives. +# +sub process_cut { + $Ignore = 1; +} + +# +# process_pod - process a pod tag, thus stop ignoring pod directives +# until we see a corresponding cut. +# +sub process_pod { + + # no need to set $Ignore to 0 cause the main loop did it +} + +# +# process_for - process a =for pod tag. if it's for html, spit +# it out verbatim, if illustration, center it, otherwise ignore it. +# +sub process_for { + my ( $whom, $text ) = @_; + if ( $whom =~ /^(pod2)?html$/i ) { + print HTML $text; + } elsif ( $whom =~ /^illustration$/i ) { + 1 while chomp $text; + for my $ext (qw[.png .gif .jpeg .jpg .tga .pcl .bmp]) { + $text .= $ext, last if -r "$text$ext"; + } + print HTML +qq{

$text illustration

}; + } +} + +# +# process_begin - process a =begin pod tag. this pushes +# whom we're beginning on the begin stack. if there's a +# begin stack, we only print if it us. +# +sub process_begin { + my ( $whom, $text ) = @_; + $whom = lc($whom); + push( @Begin_Stack, $whom ); + if ( $whom =~ /^(pod2)?html$/ ) { + print HTML $text if $text; + } +} + +# +# process_end - process a =end pod tag. pop the +# begin stack. die if we're mismatched. +# +sub process_end { + my ( $whom, $text ) = @_; + $whom = lc($whom); + if ( !defined $Begin_Stack[-1] or $Begin_Stack[-1] ne $whom ) { + Carp::confess( + "Unmatched begin/end at chunk $Paragraph in pod $Podfile\n"); + } + pop(@Begin_Stack); +} + +# +# process_pre - indented paragraph, made into

+# +sub process_pre { + my ($text) = @_; + my ($rest); + return if $Ignore; + + $rest = $$text; + + # insert spaces in place of tabs + $rest =~ s#(.+)# + my $line = $1; + 1 while $line =~ s/(\t+)/' ' x ((length($1) * 8) - $-[0] % 8)/e; + $line; + #eg; + + # convert some special chars to HTML escapes + $rest = html_escape($rest); + + # try and create links for all occurrences of perl.* within + # the preformatted text. + $rest =~ s{ + (\s*)(perl\w+) + }{ + if ( defined $Pages{$2} ){ # is a link + qq($1$2); + } elsif (defined $Pages{dosify($2)}) { # is a link + qq($1$2); + } else { + "$1$2"; + } + }xeg; + $rest =~ s{ + (' + | # or: + [$punc]* # 0 or more punctuation + (?: # followed + [^$any] # by a non-url char + | # or + $ # end of the string + ) # + | # or else + $ # then end of the string + ) + }{$1}igox; + + # text should be as it is (verbatim) + $$text = $rest; +} + +# +# pure text processing +# +# pure_text/inIS_text: differ with respect to automatic C<> recognition. +# we don't want this to happen within IS +# +sub pure_text($) { + my $text = shift(); + process_puretext( $text, 1 ); +} + +sub inIS_text($) { + my $text = shift(); + process_puretext( $text, 0 ); +} + +# +# process_puretext - process pure text (without pod-escapes) converting +# double-quotes and handling implicit C<> links. +# +sub process_puretext { + my ( $text, $notinIS ) = @_; + + ## Guessing at func() or [\$\@%&]*var references in plain text is destined + ## to produce some strange looking ref's. uncomment to disable: + ## $notinIS = 0; + + my ( @words, $lead, $trail ); + + # keep track of leading and trailing white-space + $lead = ( $text =~ s/\A(\s+)//s ? $1 : "" ); + $trail = ( $text =~ s/(\s+)\Z//s ? $1 : "" ); + + # split at space/non-space boundaries + @words = split( /(?<=\s)(?=\S)|(?<=\S)(?=\s)/, $text ); + + # process each word individually + foreach my $word (@words) { + + # skip space runs + next if $word =~ /^\s*$/; + + # see if we can infer a link or a function call + # + # NOTE: This is a word based search, it won't automatically + # mark "substr($var, 1, 2)" because the 1st word would be "substr($var" + # User has to enclose those with proper C<> + + if ( + $notinIS + && $word =~ m/ + ^([a-z_]{2,}) # The function name + $ + ([0-9][a-z]* # Manual page(1) or page(1M) + |[^)]*[\$\@\%][^)]+ # ($foo), (1, @foo), (%hash) + | # () + ) + $ + ([.,;]?)$ # a possible punctuation follows + /xi + ) + { + + # has parenthesis so should have been a C<> ref + ## try for a pagename (perlXXX(1))? + my ( $func, $args, $rest ) = ( $1, $2, $3 || '' ); + if ( $args =~ /^\d+$/ ) { + my $url = page_sect( $word, '' ); + if ( defined $url ) { + $word = +qq(the $word manpage$rest); + next; + } + } + ## try function name for a link, append tt'ed argument list + $word = emit_C( $func, '', "($args)" ) . $rest; + +#### disabled. either all (including $\W, $\w+{.*} etc.) or nothing. +## } elsif( $notinIS && $word =~ /^[\$\@%&*]+\w+$/) { +## # perl variables, should be a C<> ref +## $word = emit_C( $word ); + + } elsif ( $word =~ m,^\w+://\w, ) { + + # looks like a URL + # Don't relativize it: leave it as the author intended + $word = qq($word); + } elsif ( $word =~ /[\w.-]+\@[\w-]+\.\w/ ) { + + # looks like an e-mail address + my ( $w1, $w2, $w3 ) = ( "", $word, "" ); + ( $w1, $w2, $w3 ) = ( "(", $1, ")$2" ) if $word =~ /^$(.*?)$(,?)/; + ( $w1, $w2, $w3 ) = ( "<", $1, ">$2" ) + if $word =~ /^<(.*?)>(,?)/; + $word = qq($w1$w2$w3); + } else { + $word = html_escape($word) if $word =~ /["&<>]/; + } + } + + # put everything back together + return $lead . join( '', @words ) . $trail; +} + +# +# process_text - handles plaintext that appears in the input pod file. +# there may be pod commands embedded within the text so those must be +# converted to html commands. +# + +sub process_text1($$;$$); +sub pattern ($) { $_[0] ? '\s+' . ( '>' x ( $_[0] + 1 ) ) : '>' } +sub closing ($) { local ($_) = shift; ( defined && s/\s+\z// ) ? length : 0 } + +sub process_text { + return if $Ignore; + my ($tref) = @_; + my $res = process_text1( 0, $tref ); + $res =~ s/\s+$//s; + $$tref = $res; +} + +sub process_text_rfc_links { + my $text = shift; + + # For every "RFCnnnn" or "RFC nnn", link it to the authoritative + # ource. Do not use the /i modifier here. Require "RFC" to be written in + # in capital letters. + + $text =~ s{ + (?<=[^<>[:alpha:]]) # Make sure this is not an URL already + (RFC\s*([0-9]{1,5}))(?![0-9]) # max 5 digits + } + {$1}gx; + + $text; +} + +sub process_text1($$;$$) { + my ( $lev, $rstr, $func, $closing ) = @_; + my $res = ''; + + unless ( defined $func ) { + $func = ''; + $lev++; + } + + if ( $func eq 'B' ) { + + # B - boldface + $res = '' . process_text1( $lev, $rstr ) . ''; + + } elsif ( $func eq 'C' ) { + + # C

 - can be a ref or 
+		# need to extract text
+		my $par = go_ahead( $rstr, 'C', $closing );
+
+		## clean-up of the link target
+		my $text = depod($par);
+
+		### my $x = $par =~ /[BI]call emit_C($par) lev=$lev, par with BI=$x\n";
+
+		$res = emit_C( $text, $lev > 1 || ( $par =~ /[BI] - convert to character
+		$$rstr =~ s/^([^>]*)>//;
+		my $escape = $1;
+		$escape =~ s/^(\d+|X[\dA-F]+)$/#$1/i;
+		$res = "&$escape;";
+
+	} elsif ( $func eq 'F' ) {
+
+		# F - italicize
+		$res = '' . process_text1( $lev, $rstr ) . '';
+
+	} elsif ( $func eq 'I' ) {
+
+		# I - italicize
+		$res = '' . process_text1( $lev, $rstr ) . '';
+
+	} elsif ( $func eq 'L' ) {
+
+		# L - link
+		## L => produce text, use cross-ref for linking
+		## L => make text from cross-ref
+		## need to extract text
+		my $par = go_ahead( $rstr, 'L', $closing );
+
+		# some L<>'s that shouldn't be:
+		# a) full-blown URL's are emitted as-is
+		if ( $par =~ m{^\w+://}s ) {
+			return make_URL_href($par);
+		}
+
+		# b) C<...> is stripped and treated as C<>
+		if ( $par =~ /^C<(.*)>$/ ) {
+			my $text = depod($1);
+			return emit_C( $text, $lev > 1 || ( $par =~ /[BI] L<$par> to page $page, ident $ident\n";
+
+		} elsif ( $par =~ m{^(.*?)/"?(.*?)"?$} ) {    # [name]/"section"
+			    # even though this should be a "section", we go for ident first
+			( $page, $ident ) = ( $1, $2 );
+			### print STDERR "--> L<$par> to page $page, section $section\n";
+
+		} elsif ( $par =~ /\s/ ) {  # this must be a section with missing quotes
+			( $page, $section ) = ( '', $par );
+			### print STDERR "--> L<$par> to void page, section $section\n";
+
+		} else {
+			( $page, $section ) = ( $par, '' );
+			### print STDERR "--> L<$par> to page $par, void section\n";
+		}
+
+		# now, either $section or $ident is defined. the convoluted logic
+		# below tries to resolve L<> according to what the user specified.
+		# failing this, we try to find the next best thing...
+		my ( $url, $ltext, $fid );
+
+	RESOLVE: {
+			if ( defined $ident ) {
+				## try to resolve $ident as an item
+				( $url, $fid ) = coderef( $page, $ident );
+				if ($url) {
+					if ( !defined($linktext) ) {
+						$linktext = $ident;
+						$linktext .= " in " if $ident && $page;
+						$linktext .= "the $page manpage" if $page;
+					}
+					###  print STDERR "got coderef url=$url\n";
+					last RESOLVE;
+				}
+				## no luck: go for a section (auto-quoting!)
+				$section = $ident;
+			}
+			## now go for a section
+			my $htmlsection = htmlify($section);
+			$url = page_sect( $page, $htmlsection );
+			if ($url) {
+				if ( !defined($linktext) ) {
+					$linktext = $section;
+					$linktext .= " in " if $section && $page;
+					$linktext .= "the $page manpage" if $page;
+				}
+				### print STDERR "got page/section url=$url\n";
+				last RESOLVE;
+			}
+			## no luck: go for an ident
+			if ($section) {
+				$ident = $section;
+			} else {
+				$ident = $page;
+				$page  = undef();
+			}
+			( $url, $fid ) = coderef( $page, $ident );
+			if ($url) {
+				if ( !defined($linktext) ) {
+					$linktext = $ident;
+					$linktext .= " in " if $ident && $page;
+					$linktext .= "the $page manpage" if $page;
+				}
+				### print STDERR "got section=>coderef url=$url\n";
+				last RESOLVE;
+			}
+
+			# warning; show some text.
+			$linktext = $opar unless defined $linktext;
+			warn
+"$0: $Podfile: cannot resolve L<$opar> in paragraph $Paragraph.\n"
+				unless $Quiet;
+		}
+
+		# now we have a URL or just plain code
+		$$rstr = $linktext . '>' . $$rstr;
+		if ( defined($url) ) {
+			$res = "" . process_text1( $lev, $rstr ) . '';
+		} else {
+			$res = '' . process_text1( $lev, $rstr ) . '';
+		}
+
+	} elsif ( $func eq 'S' ) {
+
+		# S - non-breaking spaces
+		$res = process_text1( $lev, $rstr );
+		$res =~ s/ / /g;
+
+	} elsif ( $func eq 'X' ) {
+
+		# X<> - ignore
+		warn "$0: $Podfile: invalid X<> in paragraph $Paragraph.\n"
+			unless $$rstr =~ s/^[^>]*>//
+				or $Quiet;
+	} elsif ( $func eq 'Z' ) {
+
+		# Z<> - empty
+		warn "$0: $Podfile: invalid Z<> in paragraph $Paragraph.\n"
+			unless $$rstr =~ s/^>//
+				or $Quiet;
+
+	} else {
+		my $term = pattern $closing;
+		while ( $$rstr =~ s/\A(.*?)(([BCEFILSXZ])<(<+[^\S\n]+)?|$term)//s ) {
+
+			# all others: either recurse into new function or
+			# terminate at closing angle bracket(s)
+			my $pt = $1;
+			$pt .= $2 if !$3 && $lev == 1;
+			$res .= $lev == 1 ? pure_text($pt) : inIS_text($pt);
+			return $res if !$3 && $lev > 1;
+			if ($3) {
+				$res .= process_text1( $lev, $rstr, $3, closing $4 );
+			}
+		}
+		if ( $lev == 1 ) {
+			$res .= pure_text($$rstr);
+		} elsif ( !$Quiet ) {
+			my $snippet = substr( $$rstr, 0, 60 );
+			warn
+"$0: $Podfile: undelimited $func<> in paragraph $Paragraph: '$snippet'.\n"
+
+		}
+		$res = process_text_rfc_links($res);
+	}
+	return $res;
+}
+
+#
+# go_ahead: extract text of an IS (can be nested)
+#
+sub go_ahead($$$) {
+	my ( $rstr, $func, $closing ) = @_;
+	my $res     = '';
+	my @closing = ($closing);
+	while ( $$rstr =~
+		s/\A(.*?)(([BCEFILSXZ])<(<+\s+)?|@{[pattern $closing[0]]})//s )
+	{
+		$res .= $1;
+		unless ($3) {
+			shift @closing;
+			return $res unless @closing;
+		} else {
+			unshift @closing, closing $4;
+		}
+		$res .= $2;
+	}
+	unless ($Quiet) {
+		my $snippet = substr( $$rstr, 0, 60 );
+		warn
+"$0: $Podfile: undelimited $func<> in paragraph $Paragraph (go_ahead): '$snippet'.\n";
+	}
+	return $res;
+}
+
+#
+# emit_C - output result of C
+#    $text is the depod-ed text
+#
+sub emit_C($;$$) {
+	my ( $text, $nocode, $args ) = @_;
+	$args = '' unless defined $args;
+	my $res;
+	my ( $url, $fid ) = coderef( undef(), $text );
+
+	# need HTML-safe text
+	my $linktext = html_escape("$text$args");
+
+	if ( $text !~ /^[\$@%]/
+		&& defined($url)
+		&& ( !defined($EmittedItem) || $EmittedItem ne $fid ) )
+	{
+		$res = "$linktext";
+	} elsif ( 0 && $nocode ) {
+		$res = $linktext;
+	} else {
+		$res = "$linktext";
+	}
+	return $res;
+}
+
+#
+# html_escape: make text safe for HTML
+#
+sub html_escape {
+	my $rest = $_[0];
+	$rest =~ s/&/&/g;
+	$rest =~ s//>/g;
+	$rest =~ s/"/"/g;
+
+	# ' is only in XHTML, not HTML4.  Be conservative
+	#$rest   =~ s/'/'/g;
+	return $rest;
+}
+
+#
+# dosify - convert filenames to 8.3
+#
+sub dosify {
+	my ($str) = @_;
+	return lc($str) if $^O eq 'VMS';    # VMS just needs casing
+	if ($Is83) {
+		$str = lc $str;
+		$str =~ s/(\.\w+)/substr ($1,0,4)/ge;
+		$str =~ s/(\w+)/substr ($1,0,8)/ge;
+	}
+	return $str;
+}
+
+#
+# page_sect - make a URL from the text of a L<>
+#
+sub page_sect($$) {
+	my ( $page, $section ) = @_;
+	my ( $linktext, $page83, $link );    # work strings
+
+	# check if we know that this is a section in this page
+	if ( !defined $Pages{$page} && defined $Sections{$page} ) {
+		$section = $page;
+		$page    = "";
+		### print STDERR "reset page='', section=$section\n";
+	}
+
+	$page83 = dosify($page);
+	$page = $page83 if ( defined $Pages{$page83} );
+	if ( $page eq "" ) {
+		$link = "#" . anchorify($section);
+	} elsif ( $page =~ /::/ ) {
+		$page =~ s,::,/,g;
+
+		# Search page cache for an entry keyed under the html page name,
+		# then look to see what directory that page might be in.  NOTE:
+		# this will only find one page. A better solution might be to produce
+		# an intermediate page that is an index to all such pages.
+		my $page_name = $page;
+		$page_name =~ s,^.*/,,s;
+		if ( defined( $Pages{$page_name} )
+			&& $Pages{$page_name} =~ /([^:]*$page)\.(?:pod|pm):/ )
+		{
+			$page = $1;
+		} else {
+
+			# NOTE: This branch assumes that all A::B pages are located in
+			# $Htmlroot/A/B.html . This is often incorrect, since they are
+			# often in $Htmlroot/lib/A/B.html or such like. Perhaps we could
+			# analyze the contents of %Pages and figure out where any
+			# cousins of A::B are, then assume that.  So, if A::B isn't found,
+			# but A::C is found in lib/A/C.pm, then A::B is assumed to be in
+			# lib/A/B.pm. This is also limited, but it's an improvement.
+			# Maybe a hints file so that the links point to the correct places
+			# nonetheless?
+
+		}
+		$link = "$Htmlroot/$page.html";
+		$link .= "#" . anchorify($section) if ($section);
+	} elsif ( !defined $Pages{$page} ) {
+		$link = "";
+	} else {
+		$section = anchorify($section) if $section ne "";
+		### print STDERR "...section=$section\n";
+
+		# if there is a directory by the name of the page, then assume that an
+		# appropriate section will exist in the subdirectory
+		#	if ($section ne "" && $Pages{$page} =~ /([^:]*[^(\.pod|\.pm)]):/) {
+		if ( $section ne "" && $Pages{$page} =~ /([^:]*(?, Foo.(pod|pm) is preferred to A/Foo.(pod|pm)
+			if ( $Pages{$page} =~ /([^:]*)\.(?:pod|pm):/ ) {
+				$link = "$Htmlroot/$1.html$section";
+			} else {
+				$link = "";
+			}
+		}
+	}
+
+	if ($link) {
+
+		# Here, we take advantage of the knowledge that $Htmlfileurl ne ''
+		# implies $Htmlroot eq ''. This means that the link in question
+		# needs a prefix of $Htmldir if it begins with '/'. The test for
+		# the initial '/' is done to avoid '#'-only links, and to allow
+		# for other kinds of links, like file:, ftp:, etc.
+		my $url;
+		if ( $Htmlfileurl ne '' ) {
+			$link = "$Htmldir$link" if $link =~ m{^/}s;
+			$url = relativize_url( $link, $Htmlfileurl );
+
+			# print( "  b: [$link,$Htmlfileurl,$url]\n" );
+		} else {
+			$url = $link;
+		}
+		return $url;
+
+	} else {
+		return undef();
+	}
+}
+
+#
+# relativize_url - convert an absolute URL to one relative to a base URL.
+# Assumes both end in a filename.
+#
+sub relativize_url {
+	my ( $dest, $source ) = @_;
+
+	my ( $dest_volume, $dest_directory, $dest_file ) =
+		File::Spec::Unix->splitpath($dest);
+	$dest = File::Spec::Unix->catpath( $dest_volume, $dest_directory, '' );
+
+	my ( $source_volume, $source_directory, $source_file ) =
+		File::Spec::Unix->splitpath($source);
+	$source =
+		File::Spec::Unix->catpath( $source_volume, $source_directory, '' );
+
+	my $rel_path = '';
+	if ( $dest ne '' ) {
+		$rel_path = File::Spec::Unix->abs2rel( $dest, $source );
+	}
+
+	if (   $rel_path ne ''
+		&& substr( $rel_path, -1 ) ne '/'
+		&& substr( $dest_file, 0, 1 ) ne '#' )
+	{
+		$rel_path .= "/$dest_file";
+	} else {
+		$rel_path .= "$dest_file";
+	}
+
+	return $rel_path;
+}
+
+#
+# coderef - make URL from the text of a C<>
+#
+sub coderef($$) {
+	my ( $page, $item ) = @_;
+	my ($url);
+
+	my $fid = fragment_id($item);
+
+	if ( defined($page) && $page ne "" ) {
+
+		# we have been given a $page...
+		$page =~ s{::}{/}g;
+
+		Carp::confess(
+"Undefined fragment '$item' from fragment_id() in coderef() in $Podfile"
+		) if !defined $fid;
+
+		# Do we take it? Item could be a section!
+		my $base = $Items{$fid} || "";
+		$base =~ s{[^/]*/}{};
+		if ( $base ne "$page.html" ) {
+			###   print STDERR "coderef( $page, $item ): items{$fid} = $Items{$fid} = $base => discard page!\n";
+			$page = undef();
+		}
+
+	} else {
+
+		# no page - local items precede cached items
+		if ( defined($fid) ) {
+			if ( exists $Local_Items{$fid} ) {
+				$page = $Local_Items{$fid};
+			} else {
+				$page = $Items{$fid};
+			}
+		}
+	}
+
+	# if there was a pod file that we found earlier with an appropriate
+	# =item directive, then create a link to that page.
+	if ( defined $page ) {
+		if ($page) {
+			if ( exists $Pages{$page} and $Pages{$page} =~ /([^:.]*)\.[^:]*:/ )
+			{
+				$page = $1 . '.html';
+			}
+			my $link = "$Htmlroot/$page#" . anchorify($fid);
+
+			# Here, we take advantage of the knowledge that $Htmlfileurl
+			# ne '' implies $Htmlroot eq ''.
+			if ( $Htmlfileurl ne '' ) {
+				$link = "$Htmldir$link";
+				$url = relativize_url( $link, $Htmlfileurl );
+			} else {
+				$url = $link;
+			}
+		} else {
+			$url = "#" . anchorify($fid);
+		}
+
+		confess "url has space: $url" if $url =~ /"[^"]*\s[^"]*"/;
+	}
+	return ( $url, $fid );
+}
+
+#
+# Adapted from Nick Ing-Simmons' PodToHtml package.
+sub relative_url {
+	my $source_file      = shift;
+	my $destination_file = shift;
+
+	my $source = URI::file->new_abs($source_file);
+	my $uo = URI::file->new( $destination_file, $source )->abs;
+	return $uo->rel->as_string;
+}
+
+#
+# finish_list - finish off any pending HTML lists.  this should be called
+# after the entire pod file has been read and converted.
+#
+sub finish_list {
+	while ( $Listlevel > 0 ) {
+		print HTML "\n";
+		$Listlevel--;
+	}
+}
+
+#
+# htmlify - converts a pod section specification to a suitable section
+# specification for HTML. Note that we keep spaces and special characters
+# except ", ? (Netscape problem) and the hyphen (writer's problem...).
+#
+sub htmlify {
+	my ($heading) = @_;
+	$heading =~ s/(\s+)/ /g;
+	$heading =~ s/\s+\Z//;
+	$heading =~ s/\A\s+//;
+
+	# The hyphen is a disgrace to the English language.
+	# $heading =~ s/[-"?]//g;
+	$heading =~ s/["?]//g;
+	$heading = lc($heading);
+	return $heading;
+}
+
+#
+# similar to htmlify, but turns non-alphanumerics into underscores
+#
+sub anchorify {
+	my ($anchor) = @_;
+	$anchor =~ s/\([^)]*\)//;
+	$anchor = htmlify($anchor);
+	$anchor =~ s/\W/_/g;
+	$anchor =~ tr/_/_/s;
+	return $anchor;
+}
+
+#
+# depod - convert text by eliminating all interior sequences
+# Note: can be called with copy or modify semantics
+#
+my %E2c;
+$E2c{lt}     = '<';
+$E2c{gt}     = '>';
+$E2c{sol}    = '/';
+$E2c{verbar} = '|';
+$E2c{amp}    = '&';    # in Tk's pods
+
+sub depod1($;$$);
+
+sub depod($) {
+	my $string;
+	if ( ref( $_[0] ) ) {
+		$string = ${ $_[0] };
+		${ $_[0] } = depod1( \$string );
+	} else {
+		$string = $_[0];
+		depod1( \$string );
+	}
+}
+
+sub depod1($;$$) {
+	my ( $rstr, $func, $closing ) = @_;
+	my $res = '';
+	return $res unless defined $$rstr;
+	if ( !defined($func) ) {
+
+		# skip to next begin of an interior sequence
+		while ( $$rstr =~ s/\A(.*?)([BCEFILSXZ])<(<+[^\S\n]+)?//s ) {
+
+			# recurse into its text
+			$res .= $1 . depod1( $rstr, $2, closing $3);
+		}
+		$res .= $$rstr;
+	} elsif ( $func eq 'E' ) {
+
+		# E - convert to character
+		$$rstr =~ s/^([^>]*)>//;
+		$res .= $E2c{$1} || "";
+	} elsif ( $func eq 'X' ) {
+
+		# X<> - ignore
+		$$rstr =~ s/^[^>]*>//;
+	} elsif ( $func eq 'Z' ) {
+
+		# Z<> - empty
+		$$rstr =~ s/^>//;
+	} else {
+
+		# all others: either recurse into new function or
+		# terminate at closing angle bracket
+		my $term = pattern $closing;
+		while ( $$rstr =~ s/\A(.*?)(([BCEFILSXZ])<(<+[^\S\n]+)?|$term)//s ) {
+			$res .= $1;
+			last unless $3;
+			$res .= depod1( $rstr, $3, closing $4 );
+		}
+		## If we're here and $2 ne '>': undelimited interior sequence.
+		## Ignored, as this is called without proper indication of where we are.
+		## Rely on process_text to produce diagnostics.
+	}
+	return $res;
+}
+
+{
+	my %seen;    # static fragment record hash
+
+	sub fragment_id_readable {
+		my $text     = shift;
+		my $generate = shift;    # optional flag
+
+		my $orig = $text;
+
+		# leave the words for the fragment identifier,
+		# change everything else to underbars.
+		$text =~
+			s/[^A-Za-z0-9_]+/_/g;    # do not use \W to avoid locale dependency.
+		$text =~ s/_{2,}/_/g;
+		$text =~ s/\A_//;
+		$text =~ s/_\Z//;
+
+		unless ($text) {
+
+			# Nothing left after removing punctuation, so leave it as is
+			# E.g. if option is named: "=item -#"
+
+			$text = $orig;
+		}
+
+		if ($generate) {
+			if ( exists $seen{$text} ) {
+
+				# This already exists, make it unique
+				$seen{$text}++;
+				$text = $text . $seen{$text};
+			} else {
+				$seen{$text} = 1;    # first time seen this fragment
+			}
+		}
+
+		$text;
+	}
+}
+
+my @HC;
+
+sub fragment_id_obfuscated {         # This was the old "_2d_2d__"
+	my $text     = shift;
+	my $generate = shift;            # optional flag
+
+	# text? Normalize by obfuscating the fragment id to make it unique
+	$text =~ s/\s+/_/sg;
+
+	$text =~ s{(\W)}{
+        defined( $HC[ord($1)] ) ? $HC[ord($1)]
+        : ( $HC[ord($1)] = sprintf( "%%%02X", ord($1) ) ) }gxe;
+	$text = substr( $text, 0, 50 );
+
+	$text;
+}
+
+#
+# fragment_id - construct a fragment identifier from:
+#   a) =item text
+#   b) contents of C<...>
+#
+
+sub fragment_id {
+	my $text     = shift;
+	my $generate = shift;    # optional flag
+
+	$text =~ s/\s+\Z//s;
+	if ($text) {
+
+		# a method or function?
+		return $1 if $text =~ /(\w+)\s*\(/;
+		return $1 if $text =~ /->\s*(\w+)\s*\(?/;
+
+		# a variable name?
+		return $1 if $text =~ /^([\$\@%*]\S+)/;
+
+		# some pattern matching operator?
+		return $1 if $text =~ m|^(\w+/).*/\w*$|;
+
+		# fancy stuff... like "do { }"
+		return $1 if $text =~ m|^(\w+)\s*{.*}$|;
+
+		# honour the perlfunc manpage: func [PAR[,[ ]PAR]...]
+		# and some funnies with ... Module ...
+		return $1 if $text =~ m{^([a-z\d_]+)(\s+[A-Z,/& ][A-Z\d,/& ]*)?$};
+		return $1 if $text =~ m{^([a-z\d]+)\s+Module(\s+[A-Z\d,/& ]+)?$};
+
+		return fragment_id_readable( $text, $generate );
+	} else {
+		return;
+	}
+}
+
+#
+# make_URL_href - generate HTML href from URL
+# Special treatment for CGI queries.
+#
+sub make_URL_href($;$) {
+	my ($url) = shift;
+	my $linktext = shift || $url;
+	if ( $url !~ s{^(http:[-\w/#~:.+=&%@!]+)(\?.*)$}{$1}i ) {
+		$url = "$linktext";
+	}
+	return $url;
+}
+
+1;
-- 
cgit 1.4.1