m3
/
cross-reference


			
				
					
						
						
							12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301
							#!/usr/bin/perl
# $Id: Local.pm,v 1.9 2006/12/07 04:59:38 reed%reedloden.com Exp $
# Local.pm -- Subroutines that need to be customized for each installation
#
#	Dawn Endico <endico@mozilla.org>
#
######################################################################
# This package is for placing subroutines that are likely to need
# to be customized for each installation. In particular, the file
# and directory description snarfing mechanism is likely to be
# different for each project.

package Local;

require Exporter;
@ISA = qw(Exporter);
@EXPORT = qw(&fdescexpand &descexpand &dirdesc &convertwhitespace
             &localexpandtemplate
	     &isForce &isImage &isHTML &isCSS &getMimeType
            );

use lib 'lib';
use LXR::Common;
use File::Basename;
use File::Glob qw(bsd_glob :globally :nocase);

# dme: Create descriptions for a file in a directory listing
# If no description, return the string "\&nbsp\;" to keep the
# table looking pretty.
#
# In mozilla search the beginning of a source file for a short
# description. Not all files have them and the ones that do use
# many different formats. Try to find as many of these without
# printing gobbledygook or something silly like a file name or a date.
#
# Read in the beginning of the file into a string. I chose 60 because the
# Berkeley copyright notice is around 40 lines long so we need a bit more
# than this.
#
# It's common for file descriptions to be delimited by the file name or
# the word "Description" which precedes the description. Search the entire
# string for these. Sometimes they're put in odd places such as inside
# the copyright notice or after the code begins. The file name should be
# followed by a colon or some pattern of dashes.
#
# If no such description is found then use the contents of the "first"
# comment as the description. First, strip off the copyright notice plus
# anything before it. Remove rcs comments. Search for the first bit of
# code (usually #include) and remove it plus anything after it. In what's
# left, find the contents of the first comment, and get the first paragraph.
# If that's too long, use only the first sentence up to a period. If that's
# still too long then we probably have a list or something that will look
# strange if we print it out so give up and return null.
#
# Yes, this is a lot of trouble to go through but its easier than getting
# people to use the same format and re-writing thousands of comments. Not
# everything printed will really be a summary of the file, but still the
# signal/noise ratio seems pretty high.
#
# Yea, though I walk through the valley of the shadow of pattern
# matching, I shall fear no regex.
sub fdescexpand {
    # use global vars here because the expandtemplate subroutine makes
    # passing parameters impossible. Use $filename from source and
    # $Path from Common.pm
    my $filename = $main::filename;
    my $copy= "";
    local $desc= "";
    my $lic_length = 40;
    my $lic_start;
    my $maxlines = 20; #only look at the beginning of the file
    my $excessivelines = 200; #sometimes people are too verbose for our own good
    my $inlicense = 0;

    #for broken symlinks list their target
    my $realf = $Path->{'real'}.'/'.$filename;
    if (!-e $realf && -l $realf) {
        $desc = readlink $realf;
        $desc =~ s/\&/&amp;/g;
        $desc = '<tt>'.$desc.'</tt>';
        return $desc;
    }
    #handle man pages
    if ($filename =~ /\.\d+\w?(?:\.in|)$/) {
        return descmanfile($realf);
    }
    #ignore files that are neither source code nor html
    return ("\&nbsp\;") unless
	    ($filename =~ /\.(?:[chr](?:p?p?|c)|mm?|idl|java|p[lm]|(?:pl|vb|j|c|re)s|vb|html?)$/) ||
	    0;

    if (open(FILE, $realf)) {
        while(<FILE>){
            my $descline = $_;
	    $desc .= $descline ;
            if (defined $lic_start && $descline =~ /END.*LICENSE/) {
                my $lic_delta = $. - $lic_start;
                $lic_length = $lic_delta if $lic_delta > $lic_length;
                $inlicense = 0;
            }
            if (!defined $lic_start && $descline =~ /BEGIN.*LICENSE/) {
                $lic_start = $.;
                $inlicense = 1;
            }
            if($. > $excessivelines) {
                last;
            }
	    if(!$inlicense && $. > $lic_length + $maxlines) {
		last;
	    }
	}
	close(FILE);
    }
    if ($filename =~ /\.html?$/) {
        if ($desc =~ m{<title[^>]*>(.*?)</title}is) {
            $desc = $1;
            $desc =~ s/<[^>].*>//g;
            return $desc;
        }
    }

    # sanity check: if there's no description then stop
    if (!($desc =~ /\w/)){
	return("\&nbsp\;");
    }

    # save a copy for later
    $copy = $desc;

    # Look for well behaved <filename><separator> formatted
    # descriptions before we go to the trouble of looking for
    # one in the first comment. The whitespace between the
    # delimiter and the description may include a newline.
    if (($desc =~ s/(?:.*?\Q$filename\E\s*?- ?-*\s*)([^\n]*)(?:.*)/$1/sgi) ||
        ($desc =~ s/(?:.*?\Q$filename\E\s*?:\s*)([^\n]*)(?:.*)/$1/sgi) ||
        ($desc =~ s/(?:.*?Description:\s*)([^\n]*)(?:.*)/$1/sgi)
	){
        # if the description is non-empty then clean it up and return it
        if ($desc =~ /\w/) {
            #strip trailing asterisks and "*/"
            $desc =~ s#\*/?\s*$##;
            $desc =~ s#^[^\S]*\**[^\S]*#\n#gs;

            # Strip beginning and trailing whitespace
            $desc =~ s/^\s+//;
            $desc =~ s/\s+$//;

            # Strip junk from the beginning
            $desc =~ s#[^\w]*##ms;

            #htmlify the comments making links to symbols and files
            $desc = markupstring($desc, $Path->{'virt'});
            return($desc);
        }
    }

    # we didn't find any well behaved descriptions above so start over
    # and look for one in the first comment
    $desc = $copy;

    # Strip off code from the end, starting at the first cpp directive
    $desc =~ s/\n#.*//s;

    # Strip off code from the end, starting at typedef
    $desc =~ s/\ntypedef.*//s;

    # Strip off license
    $desc =~ s#(?:/\*.*license.*?\*/)(.*)#$1#is;

    # Strip off copyright notice
    $desc =~ s#(?:/\*.*copyright.*?\*/)(.*)#$1#is;

    # Strip off emacs line
    $desc =~ s#(/\*.*tab-width.*?\*/)(.*)#$2#isg;

    # excise rcs crud
    $desc =~ s#Id: \Q$filename\E.*?Exp \$##g;

    # Yuck, nuke these silly comments in js/jsj /* ** */
    $desc =~ s#\n\s*/\*+[\s\*]+\*/\n#\n#sg;

    # Don't bother to continue if there aren't any comments here
    if(!($desc =~ m#/\*#)) {
	return("&nbsp;");
    }

    # Remove lines generated by jmc
    $desc =~ s#\n.*?Source date:.*\n#\n#;
    $desc =~ s#\n.*?Generated by jmc.*\n#\n#;

    # Extract the first comment
    $desc =~ s#(?:.*?/\*+)(.*?)(?:(?:\*+/.*)|(?:$))#$1#s;

    # Strip silly borders
    $desc =~ s#\n\s*[\*\=\-\s]+#\n#sg;

    # Strip beginning and trailing whitespace
    $desc =~ s/^\s+//;
    $desc =~ s/\s+$//;

    # Strip out file name
    $desc =~ s#$filename##i;

    # Strip By line
    $desc =~ s#By [^\n]*##;

    # Strip out dates
    $desc =~ s#\d{1,2}/\d{1,2}/\d\d\d\d##;
    $desc =~ s#\d{1,2}/\d{1,2}/\d\d##;
    $desc =~ s#\d{1,2} \w\w\w \d\d\d\d##;

    # Strip junk from the beginning
    $desc =~ s#[^\w]*##;

    # Extract the first paragraph
    $desc =~ s#(\n\s*?\n.*)##s;

    # If the description is too long then just use the first sentence
    # this will fail if no period was used.
    if (length($desc) > 200 ) {
        $desc =~ s#([^\.]+\.)\s.*#$1#s;
    }

    # If the description is still too long then assume it will look
    # like gobbledygook and give up
    if (length($desc) > 200 ) {
	return("&nbsp;");
    }

    # htmlify the comments, making links to symbols and files
    $desc = markupstring($desc, $Path->{'virt'});

    if ($desc) {
	return($desc);
    }else{
	return("\&nbsp\;");
    }
}

sub get_readable_file {
    my ($path, $glob) = @_;
    my @files = bsd_glob($path.$glob);
    foreach (@files) {
        next unless -f;
        next unless -r;
        return $_;
    }
    return '';
}

# dme: create a short description for a subdirectory in a directory listing
# If no description, return the string "\&nbsp\;" to keep the
# table looking pretty.
#
# In Mozilla, if the directory has a README file look in it for lines
# like the ones used in source code: "directoryname --- A short description"
sub descexpand {
    # use global vars here because the expandtemplate subroutine makes
    # passing parameters impossible. Use $filename from source and
    # $Path from Common.pm
    my $filename = $main::filename;
    $filename .= '/' unless $filename =~ m{/$};
    my $linecount=0;
    local $desc= "";

    my $rpath = $Path->{'real'};
    my $readme = get_readable_file($rpath . $filename, '{README,ReadMe}{.html,.htm,.txt,.TXT,.markdown,}');
    if ($readme =~ /\.html?$/ && open(DESC, $readme)) {
        undef $/;
        $desc = <DESC>;
        $/ = "\n";
        close(DESC);

        # Make sure there is no <span> embedded in our string. If so
        # then we've matched against the wrong /span and this string is junk
        # so we'll throw it away and refrain from writing a description.
        # Disallowing embedded spans theoretically removes some flexibility
        # but this seems to be a little used tag and doing this makes lxr
        # a lot faster.
        if ($desc =~ /<span class=\"?lxrshortdesc\"?>(.*?)<\/span>/is) {
            $short = $1;
            if (!($short =~ /\<span/is)) {
                return ($short);
            }
        }
    }

    $desc = "";
    if (open(FILE, $readme)) {
	$path = $Path->{'virt'}.$filename;
	$path =~ s#/(.+)/#$1#;
        while (<FILE>){
            if ($linecount++ > 10) {
                last;
            } elsif (/\s*\Q$path\E\s*-\s*-*\s*/i){
                $desc = (split(/\s*\Q$path\E\s*-\s*-*\s*/i))[1];
                if ($desc) {last};
            } elsif (/\s*\Q$filename\E\s*-\s*-*\s*/i){
                $desc = (split(/\s*\Q$filename\E\s*-\s*-*\s*/i))[1];
                if ($desc) {last};
            } elsif (/\Q$path\E\s*:\s*/i){
                $desc = (split(/ \Q$path\E\s*:\s*/i))[1];
                if ($desc) {last};
            } elsif (/\Q$filename\E\s*:\s*/i){
                $desc = (split(/ \Q$filename\E\s*:\s*/i))[1];
                if ($desc) {last};
            } elsif (/^[A-Z ]+$/) {
                my $i = 0;
                while ($i++ < 5 && <FILE>) {
                    $linecount++;
                    $desc = $_ if /[a-z]{4}/;
                }
                if ($desc) {last};
            }
        }
        close(FILE);
    }
    $desc = descmakefilepl($rpath, $Path->{'virt'}, $filename, 0) || $desc;
    $desc ||= descdebcontrol2($rpath, $Path->{'virt'}, $filename, 0);
    if ($filename =~ m%^debian/$%i) {
        $desc ||= descdebcontrol2($rpath, $Path->{'virt'}, './', 0);
    }
    $desc ||= descrpmspec($rpath, $Path->{'virt'}, $filename, 0);
# git would be one of the following, but it doesn't work
# because the file {git}/description or {git}/.git/description
# doesn't seem to actually appear in checkouts...
=broken
    if (!$desc && open(FILE, $rpath.$filename.'description')) {
        $desc = <FILE>;
        close(FILE);
    }
=cut
    if (!$desc && open(FILE, $rpath.$filename.'README')) {
        $desc = <FILE>;
        close(FILE);
    }
    $desc ||= descmozrdf($rpath, $Path->{'virt'}, $filename, 0);

    #strip trailing asterisks and "*/"
    $desc =~ s{\*/?\s*$}{};

    if ($desc){
        #htmlify the comments making links to symbols and files
        my $tail = ($filename =~ m!/!) ? $filename : '';
        $desc = markupstring($desc, $Path->{'virt'}.$tail);

        return($desc);
    } else {
        return("\&nbsp\;");
    }
}

# dme: Print a descriptive blurb in directory listings between
# the document heading and the table containing the actual listing.
#
# For Mozilla, we extract this information from the README file if
# it exists. If the file is short then just print the whole thing.
# For longer files print the first paragraph or so. As much as
# possible make this work for randomly formatted files rather than
# inventing strict rules which create gobbledygook when they're broken.
sub dirdesc {
    my ($path) = @_;
    my $rpath = $Path->{'real'};
    if ($rpath =~ m{_files/$}) {
        return if deschtmlfilesfolder($path);
    }
    if (-f $rpath."/README.html") {
        return if descreadmehtml($path);
    }
    if (-f $rpath."/README" ||
        -f $rpath."/ReadMe" ||
        -f $rpath."/README.TXT") {
        return if descreadme($path);
    }
    if (-f $rpath.'/DEBIAN/control' ||
        -f $rpath.'/debian/control') {
        return if descdebcontrol($path);
    }
}

sub deschtmlfilesfolder {
    my ($path) = @_;
    my $rpath = $Path->{'real'};
    my $base = $rpath;
    # chomp off the directory special bit
    $base =~ s{_files/}{};
    # try file.htm
    my $file = "$base.htm";
    unless (-f $file) {
      # try file.html
      $file .= 'l';
      return undef unless -f $file;
    }
    if (!(open(DESC, $file))) {
        return undef;
    }
    # we'll want the file name later
    $file =~ s{^.*/}{};
    my $line;
    my $result;
    while ($line = <DESC>) {
        if ($line =~ m{<title>(.*)</title>}i) {
            $result = $1;
            last;
        }
    }
    close(DESC);
    return undef unless $result;
    # we don't know if the content will be good or bad, it's easier to assume it's good for a bit
    # convert it to bad
    $result =~ s/\&lt;/</g;
    $result =~ s/\&gt;/>/g;
    $result =~ s/\&amp;/&/g;
    # and now know that all content is bad, and convert it to good
    $result =~ s/</&lt;/g;
    $result =~ s/>/&gt;/g;
    $result =~ s/\&/&amp;/g;
    print "<p><h2><a href='../$file'>$result</a></h2><p>";
    return 1;
}

sub descreadmehtml {
    my ($path, $readme) = @_;

    my $string = "";
    my $rpath = $Path->{'real'};
    $readme = get_readable_file($rpath, $readme) || get_readable_file($rpath, 'README{.html,.htm}');
    if (!$readme || !open(DESC, $readme)) {
	return;
    }
    undef $/;
    $string = <DESC>;
    $/ = "\n";
    close(DESC);

    # if the README is 0 length then give up
    if (!$string) {
        return;
    }

    # check if there's a short desc nested inside the long desc. If not, do
    # a non-greedy search for a long desc. assume there are no other stray
    # spans within the description.
    my $shortname = basename $readme;
    if ($string =~ /<span class=\"?lxrlongdesc\"?>(.*?<span class=\"?lxrshortdesc\"?>.*?<\/span>.*?)<\/span>/is) {
        $long = $1;
        if (!($long =~ m{<span.*?</span}is)) {
            $long .= "<p>\nSEE ALSO: ./$shortname\n";
        }
    } elsif ($string =~ m{<span class=['"]?lxrlongdesc['"]?>(.*?)</span>}is) {
        $long = $1;
        if (!($long =~ m{<span}is)) {
            $long .= "<p>\nSEE ALSO: ./$shortname\n";
        }
    } elsif ($string =~ m{<pre>(.*?)</pre>}is) {
        $long = $1;
        $long =~ s{^\s*$}{}g;
        $long =~ s/\n{2,}/\n/sg;
        $long =~ s{^((?:[^\n]*\n){1,10})(.*)$}{$1}s;
        $long = "<pre>" . $long;
	if ($2) {
            $readme =~ s{^.*/}{./};
            $long .= "<p>SEE ALSO: $$shortname\n";
        }
        $long .= "\n</pre>";
    }
    return 0 unless $long;
    print $long;
    return 1;
}

sub descreadme {
    my ($path, $readme) = @_;

    my $string = "";
#    $string =~ s#(</?([^>^\s]+[^>]*)>.*$)#($2~/B|A|IMG|FONT|BR|EM|I|TT/i)?$1:""#sg;
    my $n;
    my $count;
    my $temp;

    my $maxlines = 20;  # If file is less than this then just print it all
    my $minlines = 5;   # Too small. Go back and add another paragraph.
    my $chopto = 10;    # Truncate long READMEs to this length

    my $rpath = $Path->{'real'};
    $readme = get_readable_file($rpath, $readme) || get_readable_file($rpath, '{README,ReadMe}{.txt,.TXT,.markdown,}');

    if (!(open(DESC, $readme))) {
	return;
    }

    undef $/;
    $string = <DESC>;
    $/ = "\n";
    close(DESC);

    # if the README is 0 length then give up
    if (!$string){
	return;
    }
    # strip the emacs tab line
    $string =~ s/.*tab-width:[ \t]*([0-9]+).*\n//;

    # strip the npl
    $string =~ s/.*The contents of this .* All Rights.*Reserved\.//s;

    # strip the short description from the beginning
    $path =~ s#/(.+)/#$1#;
    $string =~ s/.*\Q$path\E\/*\s+--- .*//;

    # strip away junk
    $string =~ s/#+\s*\n/\n/;
    $string =~ s/---+\s*\n/\n/g;
    $string =~ s/===+\s*\n/\n/g;

    # strip blank lines at beginning and end of file.
    $string =~ s/^\s*\n//gs;
    $string =~ s/\s*\n$//gs;
    chomp($string);
    $_ = $string;
    $count = tr/\n//;

    # If the file is small there's not much use splitting it up.
    # Just print it all
    if ($count > $maxlines) {
        # grab the first n paragraphs, with n decreasing until the
        # string is 10 lines or shorter or until we're down to
	# one paragraph.
	$n = 6;
	$temp = $string;
	while ( ($count > $chopto) && ($n-- > 1) ) {
            $string =~ s/^((?:(?:[\S\t ]*?\n)+?[\t ]*\n){$n}?)(.*)/$1/s;
	    $_ = $string;
	    $string =~ s/\s*\n$//gs;
	    $count = tr/\n//;
	}

	# if we have too few lines then back up and grab another paragraph
	$_ = $string;
	$count = tr/\n//;
	if ($count < $minlines) {
	    $n = $n+1;
	    $temp =~ s/^((?:(?:[\S\t ]*?\n)+?[\t ]*\n){$n}?)(.*)/$1/s;
	    $string = $temp;
	}

	# if we have more than $maxlines then truncate to $chopto
	# and add an ellipsis.
	if ($count > $maxlines) {
	    $string =~ s/^((?:[\S \t]*\n){$chopto}?)(.*)/$1/s;
	    chomp($string);
	    $string = $string . "\n...";
	}

        # since not all of the README is displayed here,
        # add a link to it.
        chomp($string);
        my $shortname = basename $readme;
        if ($string =~ /SEE ALSO/) {
            $string = $string . ", $shortname";
        } else {
            $string = $string . "\n\nSEE ALSO: ./$shortname";
        }
    }

    $string = markupstring($string, $Path->{'virt'});
    $string = convertwhitespace($string, 1);
    $string =~ s/(SEE ALSO:)/\n$1/g;

    # strip blank lines at beginning and end of file again
    $string =~ s/^\s*\n//gs;
    $string =~ s/\s*\n$//gs;
    chomp($string);

    print("<pre>\n" . $string . "</pre>\n<p>\n");
}

sub descdebcontrol {
    my ($path) = @_;

    if (!(open(DESC, $Path->{'real'}.'/DEBIAN/control')) &&
        !(open(DESC, $Path->{'real'}.'/debian/control'))) {
        return;
    }

    my $line;
    while ($line = <DESC>) {
        if ($line =~ /^Description:\s*(.*)/) {
            $string = $1;
            last;
        }
        next if /^\w+:/;
        $string .= $line;
    }
    close(DESC);
    my $string = descdebcontrol2($Path->{'real'}, $Path->{'virt'}, './', 1);
    chomp($string);
    $string = markupstring($string, $Path->{'virt'});
    $string = convertwhitespace($string, 1);
    # strip blank lines at beginning and end of file again
    $string =~ s/^\s*\n//gs;
    $string =~ s/\s*\n$//gs;
    chomp($string);

    print("<pre>" . $string . "</pre>\n<p>\n");
}

sub descdebcontrol2 {
    my $line;
    my $package;
    my %collection;
    my %descriptions;
    my ($rpath, $directory, $filename, $multiline) = @_;
    return '' unless open(FILE, $rpath.$filename.'DEBIAN/control') ||
                     open(FILE, $rpath.$filename.'debian/control');
    while ($filename eq '../') {
        $directory =~ m{^(.*)/+([^/]+)};
        ($directory, $filename) = ($1, $2.'/');
    }
    $directory =~ s{/+$}{};
    $directory =~ s{^.*/}{};
    while ($line = <FILE>) {
    restart:
        next unless $line =~ /^(Source|Package|Description):\s*(.*)\s*$/;
        my ($kind, $value) = ($1, $2);
        $collection{$kind} = $value;
	if ($kind eq 'Package') {
            if ($package =~ /^$|-d(?:ev|bg)$/) {
	        $package = $value;
            }
        }
        next unless $kind eq 'Description';
        if ($multiline) {
            my $accum;
            while ($line = <FILE>) {
                last unless $line =~ /\S/;
                last if $line =~ /^\S+:/;
                $accum .= $line;
            }
            $value = $accum if $accum =~ /\S/;
        }
        $descriptions{$collection{'Package'}} = $value;
        if ($multiline) {
            goto restart if $line =~ /^\w+:/;
        }
    }
    close(FILE);
    return $descriptions{$collection{Source}}
        || $descriptions{$directory}
        || $descriptions{$package};
}

sub descrpmspec {
    my ($rpath, $directory, $filename, $multiline) = @_;
    my $path = $rpath . $filename;
    my $desc;
    foreach my $spec (<$path/*.spec>) {
        open SPEC, '<', $spec;
        while (<SPEC>) {
            next unless /^Summary:\s+(\S.*)/;
            $desc = $1;
            last;
        }
        close SPEC;
        next unless defined $desc;
        return $desc;
    }
    return undef;
}

sub descmakefilepl {
    my ($rpath, $directory, $filename, $multiline) = @_;
    my $path = $rpath . $filename;
    my $desc;
    if (open(SPEC, '<', "$path/Makefile.PL")) {
        while (<SPEC>) {
            next unless /^\s*['"]?ABSTRACT['"]?\s+=>['"](.*)['"](?:,|$)/;
            $desc = $1;
        }
        close SPEC;
    }
    return $desc;
}

sub descmozrdf {
    my ($line, $description, $name, $displayName);
    my ($rpath, $directory, $filename, $multiline) = @_;
    my (@descs, $descre, @display, $dispre, @names, $namere);

    foreach my $file (qw(install.rdf contents.rdf)) {
        next unless open(FILE, '<', $rpath.$filename.$file);
        $line = <FILE>;
        unless ($line) {
            close FILE;
            next;
        }
        my $wide;
        if ($line =~ /^(?:(\xFE\xFF)|(\xFF\xFE))/) {
if (1) {
            $wide = 1;
} else {
            # this requires a working version of Encode and Encode::LocalConfig
            # given all i want is to not have null characters, it's overkill.
            close FILE;
            next unless open(FILE, '<:encoding(UTF-16)', $rpath.$filename.$file);
}
        }
        do {
            $line =~ s/\x00//g if $wide;
            while ($line =~ /xmlns(?::(\S+)|)=(?:"([^"]*)"|'([^']*)')/g) {
                my $ns = $2.$3;
                if ($ns eq 'http://www.mozilla.org/rdf/chrome#' ||
                    $ns eq 'http://www.mozilla.org/2004/em-rdf#') {
                    my $prefix = ($1 ? "$1:" : '');
                    push @descs, $prefix . 'description';
                    push @display, $prefix . 'displayName';
                    push @names, $prefix . 'name';
                    $descre = "(?:" . join('|', @descs) . ')\s*';
                    $dispre = "(?:" . join('|', @display) . ')\s*';
                    $namere = "(?:" . join('|', @names) . ')\s*';
                }
            }
            if ($descre) {
                unless ($description) {
                    if ($line =~ /$descre=(?:"([^"]*)"|'([^']*)')/) {
                        $description = "$1$2";
                    }
                    if ($line =~ m{<$descre>(.*)}) {
                        my $frag = $1;
                        my $newline;
                        unless ($frag =~ m{(.*?)</$descre}s) {
                            while ($newline = <FILE>) {
                                 $line .= $newline;
                                 $frag .= $newline;
                                 $frag =~ m{(.*?)</$descre}s;
                            }
                        }
                        $description = $1;
                        $description =~ s/<!\[CDATA\[(.*?)\]\]>/$1/g;
                        $description =~ s/\s+/ /msg;
                    }
                }
                unless ($displayName) {
                    if ($line =~ /$dispre=(?:"([^"]*)"|'([^']*)')/) {
                        $displayName = "$1$2";
                    }
                    if ($line =~ m{<$dispre>(.*)</$dispre}) {
                        $displayName = $1;
                        $displayName =~ s/<!\[CDATA\[(.*?)\]\]>/$1/g;
                    }
                }
                unless ($name) {
                    if ($line =~ /$namere=(?:"([^"]*)"|'([^']*)')/) {
                        $name = "$1$2";
                    }
                    if ($line =~ m{<$namere>(.*)</$namere}) {
                        $name = $1;
                        $name =~ s/<!\[CDATA\[(.*?)\]\]>/$1/g;
                    }
                }
            }
        } while ($line = <FILE>);
        close(FILE);
    }
    return $description || $displayName || $name;
}

sub readman {
    my $string = <DESC>;
    while ($string =~ /\\$/) {
        chop($string);
        $string .= <DESC>;
    }
    return $string;
}

sub descmanfile {
    my ($path) = @_;
    if (!(open(DESC, $path))) {
        return;
    }

    my ($line, $string);
    while ($line = readman()) {
        if ($line =~ m{^\.so (?:man\d+\.*/|)(.*)$}) {
            my $file = $1;
            my $dir = $path;
            $dir =~ s{/[^/]+$}{/$file};
            if (-f $dir) {
                close(DESC);
                return descmanfile($dir);
            }
        }
        if ($line =~ /^\..*SH \S/) {
            $string = $line;
            $string = readman() while ($string =~ /^\.\\"/);
            $string = readman() while ($string =~ /^\./);
            $string = readman() while ($string =~ /^\.\\"/);
            last;
        }
        if ($line =~ /^\.\\" .SH (?:"|'|)NAME(?:"|'|)\s*$/) {
            (undef, $string) = (readman(), readman());
            last;
        }
        if ($line =~ /^(?:|.\\" ).SH (?:"|'|)(?:NAME|\x540D\x79F0)(?:"|'|)\s*$/) {
            $string = <DESC>;
            last;
        }
    }
    close(DESC);
    chomp($string);
    $string =~ s/\\//g;
    $string = markupstring($string, $Path->{'virt'});
    $string = convertwhitespace($string);
    # strip blank lines at beginning and end of file again
    $string =~ s/^\s*\n//gs;
    $string =~ s/\s*\n$//gs;
    chomp($string);

    return $string;
}

# dme: substitute carriage returns and spaces in original text
# for html equivalent so we don't need to use <pre> and can
# use variable width fonts but preserve the formatting
sub convertwhitespace {
    my ($string, $pre) = @_;
    my $p = $pre ? '' : '<p>';

    # handle ascii bulleted lists
    $string =~ s/<p>\n\s+o\s/<p>\n\&nbsp\;\&nbsp\;o /sg;
    $string =~ s/\n\s+o\s/&nbsp\;\n<br>\&nbsp\;\&nbsp\;o /sg;

    #find paragraph breaks and replace with <P>
    $string =~ s/\n\s*\n/$p\n/sg;

    return($string);
}

my $skip;
sub beginskip
{
    $skip = 1;
    return '<![MXR[';
}

sub endskip
{
    return '' unless $skip;
    $skip = undef;
    return ']]>';
}

sub isForce {
my $force = $HTTP->{'param'}->{'force'};
$force = (defined $force && $force =~ /1|on|yes/ ? 1 : 0);
return $force;
}

sub isImage {
    return 0 if isForce();
my ($file, $ignore) = @_;
    return 0 unless (defined $ignore || $ENV{HTTP_ACCEPT} !~ 'text/html');
    return ($file =~ /\.(p?[jmp][pnm]e?g|gif|x[bp]m|svg|ico|ani|bmp)$/i);
}

sub isHTML {
    return 0 if isForce();
my $file = shift;
    return ($file =~ /\.html?$/);
}

sub isCSS {
    return 0 if isForce();
my $file = shift;
    return ($file =~ /stylesheet\.(css)$/) ||
          (($file =~ /\.(css)$/) && $ENV{HTTP_ACCEPT} !~ 'text/html');
}

sub getMimeType
{
    my ($file) = @_;
    my ($cat, $kind) = ('application', 'octet-stream');
    if (isHTML($file)) {
        $cat = 'text';
        $kind = 'html';
    } elsif (isCSS($file)) {
        $cat = 'text';
        $kind = 'css';
    } elsif (isImage($file)) {
        $kind = 'x-unknown';
        $cat = 'image';
        $kind = 'jpeg' if $file =~ /\.jpe?g$/i;
        $kind = 'pjepg' if $file =~ /\.pjpe?g$/i;
        $kind = 'gif' if $file =~ /\.gif$/i;
        $kind = 'png' if $file =~ /\.[jp]ng$/i;
        $kind = 'bitmap' if $file =~ /\.bmp$/i;
        $kind = 'svg+xml' if $file =~ /\.svg$/i;
        $kind = 'x-icon' if $file =~ /\.(ico|ani|xpm)$/i;
    }
    return "$cat/$kind";
}

sub localexpandtemplate
{
    my $template = shift;
    return LXR::Common::expandtemplate($template,
                          ('bonsaihost',        \&bonsaihost),
                          ('beginbonsai',       \&beginbonsai),
                          ('endbonsai',         \&endbonsai),
                          ('bonsaihghost',      \&bonsaihghost),
                          ('beginbonsaihg',     \&beginbonsaihg),
                          ('endbonsaihg',       \&endbonsaihg),
                          ('trachost',          \&trachost),
                          ('begintrac',         \&begintrac),
                          ('endtrac',           \&endtrac),
                          ('viewvctail',        \&viewvctail),
                          ('viewvchost',        \&viewvchost),
                          ('beginviewvc',       \&beginviewvc),
                          ('endviewvc',         \&endviewvc),
                          ('begincvsweb',       \&begincvsweb),
                          ('endcvsweb',         \&endcvsweb),
                          ('cvswebhost',        \&cvswebhost),
                          ('websvnhost',        \&websvnhost),
                          ('beginwebsvn',       \&beginwebsvn),
                          ('endwebsvn',         \&endwebsvn),
                          ('webhghost',         \&webhghost),
                          ('beginwebhg',        \&beginwebhg),
                          ('endwebhg',          \&endwebhg),
                          ('gitorioushost',     \&gitorioushost),
                          ('gitrev',            \&gitrev),
                          ('gitpath',           \&gitpath),
                          ('begingitorious',    \&begingitorious),
                          ('endgitorious',      \&endgitorious),
                          ('githubrepo',        \&githubrepo),
                          ('begingithub',       \&begingithub),
                          ('endgithub',         \&endgithub),
                          ('oghghost',          \&oghghost),
                          ('beginoghg',         \&beginoghg),
                          ('endoghg',           \&endoghg),
                          ('ogroot',            \&ogroot),
                          ('loggerheadhost',        \&loggerheadhost),
                          ('beginloggerhead',       \&beginwebzr),
                          ('endloggerhead',         \&endloggerhead)
);
};

my $bonsai_host;
sub bonsaihost
{
    return $bonsai_host if defined $bonsai_host;
    my $bonsai_not_found = 'http://error.bonsai-not-found.tld';
    $bonsai_host = $bonsai_not_found;
    my $cvsrootfile = $Path->{'real'}.'/CVS/Root';
    return $bonsai_not_found unless -f $cvsrootfile;
    return $bonsai_not_found unless open(CVSROOT,'<',$cvsrootfile);
    my $cvsroot = <CVSROOT>;
    close(CVSROOT);
    if ($cvsroot =~ m{mozilla\.org:/www}) {
        $bonsai_host = 'http://bonsai-www.mozilla.org';
    } elsif ($cvsroot =~ m{mozilla\.org:/l10n}) {
        $bonsai_host = 'http://bonsai-l10n.mozilla.org';
    } elsif ($cvsroot =~ /mozilla\.org:/) {
        $bonsai_host = 'http://bonsai.mozilla.org';
    } elsif ($cvsroot =~ /gnome\.org:/) {
        $bonsai_host = 'http://cvs.gnome.org/bonsai';
    } elsif ($cvsroot =~ /freedesktop\.org:/) {
        $bonsai_host = 'http://bonsai.freedesktop.org';
    }
    return $bonsai_host;
}

sub beginbonsai
{
    return &beginskip unless &bonsaihost !~ /bonsai-not-found/;
    return &beginskip if $Path->{'svnrepo'};# =~ /songbird/;
    return '';
}

sub endbonsai
{
    return &endskip;
}

sub bonsaihghost
{
    return "http://bonsai-hg.example.com";
}

sub beginbonsaihg
{
    return &beginskip unless checkhg($Path->{'virt'}, $Path->{'real'});
    return '';
}

sub endbonsaihg
{
    return &endskip;
}

sub trachost
{
    my $trac_not_found = 'http://error.trac-not-found.tld/ '.$Path->{'svnrepo'};
    return 'https://projects.maemo.org/trac' if $Path->{'svnrepo'} =~ /projects\.maemo\.org/;
    return 'http://publicsvn.songbirdnest.com/trac' if $Path->{'svnrepo'} =~ /songbird/;
    return 'http://trac.webkit.org/projects/webkit' if $Path->{'svnrepo'} =~ /webkit/;
    return 'http://svn-mirror.flock.com/trac/flock' if $Path->{'svnrepo'} =~ /flock/;
    return $trac_not_found;
}

sub begintrac
{
    return &beginskip unless $Path->{'svnrepo'} =~ /flock|songbird|webkit/;
    return '';
}

sub endtrac
{
    return &endskip;
}

sub viewvctail
{
    if ($Path->{'svnrepo'} =~ m{\Qgarage.maemo.org/svn/\E([^/]+)}) {
        return "?root=$1";
    }
    return '?';
}

sub viewvchost
{
    return 'https://garage.maemo.org/plugins/scmsvn/viewcvs.php' if $Path->{'svnrepo'} =~ /garage/;
    return 'https://garage.maemo.org/plugins/scmsvn/viewcvs.php/' if $Path->{'svnrepo'} =~ /garage/;
    return 'https://stage.maemo.org/viewcvs.cgi/maemo/' if $Path->{'svnrepo'} =~ /stage/;
    return 'http://viewvc.svn.mozilla.org/vc' if $Path->{'svnrepo'} =~ /mozilla\.org/;
    return '';
}

sub beginviewvc
{
    return &beginskip unless $Path->{'svnrepo'} =~ /stage|garage|mozilla\.org/;
    return '';
}

sub endviewvc
{
    return &endskip;
}

sub begincvsweb
{
    return '' if &cvswebhost !~ /not-found/;
    return &beginskip;
}

sub endcvsweb
{
    return &endskip;
}

my $cvsweb_host;
sub cvswebhost
{
    return $cvsweb_host if defined $cvsweb_host;
    my $cvsweb_not_found = 'http://error.cvsweb-not-found.tld';
    $cvsweb_host = $cvsweb_not_found;
    my $cvsrootfile = $Path->{'real'}.'/CVS/Root';
    return $cvsweb_not_found unless -f $cvsrootfile;
    return $cvsweb_not_found unless open(CVSROOT,'<',$cvsrootfile);
    my $cvsroot = <CVSROOT>;
    close(CVSROOT);
    if ($cvsroot =~ m{mozdev\.org:/cvs}) {
        $cvsweb_host = 'http://www.mozdev.org/source/browse';
    }
    return $cvsweb_host;
}

sub websvnhost
{
    return '';
}

sub beginwebsvn
{
    return &beginskip unless 0;
    return '';
}

sub endwebsvn
{
    return &endskip;
}

my %hghostcache = ();
sub hgcachehost {
  my ($key, $val) = @_;
  return $hghostcache{$key} = $val;
}

sub rawhghost
{
    my $hg_not_found = 'http://error.hg-not-found.tld';
    my ($virt, $real) = ($Path->{'virt'}, $Path->{'real'});
    my $key = "$virt\n$real";
    my $hgroot = $hghostcache{$key};
    return $hgroot if defined $hgroot;
    my $path = checkhg($virt, $real);
    return hgcachehost($key, $hg_not_found) unless $path =~ /^(\d+)/;
    my $i = $1;
    while ($i--) {
      $virt =~ s{/[^/]+/?$}{};
      $real =~ s{/[^/]+/?$}{};
    }
    my $hgpath = checkhg($virt, $real);
    return hgcachehost($key, $hg_not_found) unless ($hgpath =~ m{^0 (\S+)/store/data$});
    my $hgrc = "$1/hgrc";
    return hgcachehost($key, $hg_not_found) unless open (HGRC, '<', $hgrc);
    my $line;
    my $scanstate = 0;
#[paths]
#default = http://hg.mozilla.org/mozilla-central
    while ($line = <HGRC>) {
      if ($scanstate == 0) {
        $scanstate = 1 if $line =~ /^\[paths\]/;
      } elsif ($scanstate == 1) {
        if ($line =~ /^\s*\[([^]])*\]/) {
          if ($1 ne 'paths') {
            $scanstate = 0;
            next;
          }
        }
        if ($line =~ m{^\s*default\s*=\s*(\S+?)/?(#.*|)$}) {
          $hgroot = $1;
          last;
        }
      }
    }
    close HGRC;
    return hgcachehost($key, $hgroot || $hg_not_found);
}

sub webhghost
{
    my $host = rawhghost();
    my $gitorious_hg_not_found = 'http://error.gitorious-hg-not-found.tld';
    my $git_hg_host = $gitorious_hg_not_found;
    $host =~ s!git://gitorious\.org/[^/]+/(.*)\.git!$git_hg_host/hgweb.cgi/$1!;
    return $host;
}

sub beginwebhg
{
    return &beginskip unless checkhg($Path->{'virt'}, $Path->{'real'});
    return &beginskip if oghghost() eq 'http://src.opensolaris.org';
    return '';
}

sub endwebhg
{
    return &endskip;
}

sub gitorioushost
{
    my $host = rawhghost();
    $host =~ s!^git://(.*gitorious\.org.*)\.git!http://$1!;
    return $host;
}

sub gitrev
{
    my $git_rev_unknown = 'master';
    my $hgrev = bigexpandtemplate('$hgversion');
    return 'master' if $hgrev eq 'tip';
    my ($virt, $real) = ($Path->{'virt'}, $Path->{'real'});
    my $path = checkhg($virt, $real);
    return $git_rev_unknown unless $path =~ m{^\d+ (.+)/store/data(.*)};
    my $gitmap = "$1/git-mapfile";
    return $git_rev_unknown unless open (GITMAP, '<', $gitmap);
    my $line;
    my $gitrev;
    local $/ = "\n";
    while ($line = <GITMAP>) {
      next unless $line =~ /(\w+) \Q$hgrev\E/;
      $gitrev = $1;
    }
    close GITMAP;
    return $gitrev || $git_rev_unknown.$hgrev;
}

sub gitpath
{
    my ($virt, $real) = ($Path->{'virt'}, $Path->{'real'});
    my $path = checkhg($virt, $real);
    return $hg_not_found unless $path =~ m{^\d+ (.+)/store/data(.*)};
    return $2;
}

sub begingitorious
{
    return &beginskip unless rawhghost() =~ /gitorious\.org/;
    return '';
}

sub endgitorious
{
    return &endskip;
}

sub githubrepo
{
    return 'https://github.com/mozilla-b2g/gaia' if $Path->{'real'} =~ /gaia/;
    return 'https://github.com/mozilla/rust' if $Path->{'real'} =~ /rust/;
    return 'https://github.com/mozilla/servo' if $Path->{'real'} =~ /servo/;
    return '';
}

sub begingithub
{
    return &beginskip unless githubrepo();
    return '';
}

sub endgithub
{
    return &endskip;
}

sub ogroot
{
    my ($virt, $real) = ($Path->{'virt'}, $Path->{'real'});
    my $path = checkhg($virt, $real);
    return '' unless $path =~ /^(\d+)/;
    my $i = $1;
    while ($i--) {
      $real =~ s{/[^/]+/?$}{};
    }
    $real =~ m{repo.opensolaris.org/(.*)};
    return $1;
}

sub oghghost
{
    my $og_not_found = 'http://error.opengrok-not-found.tld';
    my $host = webhghost();
    if ($host =~ /hg\.opensolaris\.org/) {
        return 'http://src.opensolaris.org';
    }
    return $og_not_found;
}

sub beginoghg
{
    my $host = oghghost();
    return '' if ($host eq 'http://src.opensolaris.org');
    return &beginskip;
}

sub endoghg
{
    return &endskip;
}

sub loggerheadhost
{
    my $bzrbranch = $Path->{'real'}.'/.bzr/branch';
    my $bzr_not_found = 'http://error.bzr-not-found.tld';
    return $bzr_not_found unless -d $bzrbranch;
    my ($bzrroot, $bzrrootfile);
    if (-f "$bzrbranch/bound") {
        $bzrrootfile = "$bzrbranch/bound";
        return $bzr_not_found unless open(BZRROOT,'<',$bzrrootfile);
        $bzrroot = <BZRROOT>;
        close(BZRROOT);
    } elsif (-f "$bzrbranch/branch.conf") {
        $bzrrootfile = "$bzrbranch/branch.conf";
        return $bzr_not_found unless open(BZRROOT,'<',$bzrrootfile);
        my $location;
        while ($location = <BZRROOT>) {
#-parent_location = http://dm-bugstage01.mozilla.org/bmo/3.0/
#+bound_location = http://dm-bugstage01.mozilla.org/bmo/3.0/
#+bound = True
            next unless $location =~ /^\s*(?:parent|bound)_location\s*=\s*(\S+)/;
            $bzrroot = $location;
            last;
        }
        close(BZRROOT);
    }
    return $bzrroot || $bzr_not_found;
}

sub beginloggerhead
{
    return &beginskip;
}

sub endloggerhead
{
    return &endskip;
}
1;