#!/usr/bin/perl

use strict;
use warnings;
use TUWF ':html', 'html_escape', ':xml';
use JSON::XS;
use Cwd 'abs_path';

# $ROOT is the absolute path of this script with the trailing "/www/index.pl"
# removed. It has to be computed at compile time because the "use lib" line
# below interpolates it.
our $ROOT;
BEGIN { ($ROOT = abs_path $0) =~ s{/www/index\.pl$}{}; }
use lib "$ROOT/lib/ManUtils/inst/lib/perl5";
use ManUtils;


TUWF::set(
  logfile => $ENV{TUWF_LOG},
  db_login => [undef, undef, undef],
  debug => 0,
  xml_pretty => 0,
  log_slow_pages => 500,

  # Cache the system information on the TUWF object the first time a request
  # comes in: {systems} is the list as returned by dbSystemGet (each row gets
  # an extra {full} "name release" field), {sysbyid} and {sysbyshort} index
  # the same rows by id and by short name.
  pre_request_handler => sub {
    my $self = shift;
    if(!$self->{systems}) {
      $self->{systems} = $self->dbSystemGet;
      $_->{full} = $_->{name}.($_->{release}?' '.$_->{release}:'') for(@{$self->{systems}});
      $self->{sysbyid}    = { map +($_->{id},    $_), @{$self->{systems}} };
      $self->{sysbyshort} = { map +($_->{short}, $_), @{$self->{systems}} };
    }
    1;
  },

  # 404 page, rendered in the site layout.
  error_404_handler => sub {
    my $self = shift;
    $self->resStatus(404);
    my $title = 'No manual entry for '.$self->reqPath;
    $self->htmlHeader(title => $title);
    h1 $title;
    p 'That is, the page you were looking for doesn\'t exist.';
    $self->htmlFooter;
  },
);


TUWF::register(
  qr// => \&home,
  qr{info/about} => \&about,
  qr{browse/search} => \&browsesearch,

  # These have to go before the other mappings, to ensure that links work for
  # man pages called 'pkg' or 'man'. This also means that we can't have a
  # system named 8 hex digits, but at least that's easy to guarantee. :)
  qr{([^/]+)/([0-9a-f]{8})} => \&man,
  qr{([^/]+)/([0-9a-f]{8})/src} => \&src,

  # We don't have any other single-component paths
  qr{([^/]+)} => \&man,

  qr{pkg/([^/]+)} => \&pkg_list,
  # pkg/$system/$category/$name (/$version); $category may contain a slash, too.
  qr{pkg/([^/]+)/(.+)} => \&pkg_info,

  # Redirects for canonical URLs
  qr{man/([^/]+)/(.+)} => \&man_redir,

  # Redirects for old URLs.
  # /browse/ has been moved to /pkg/ with the package category added to the path
  qr{browse/([^/]+)} => sub { $_[0]->resRedirect("/pkg/$_[1]", 'perm'); },
  qr{browse/([^/]+)/([^/]+)(?:/([^/]+))?} => sub {
    my($self, $sys, $name, $ver) = @_;
    $sys = $self->{sysbyshort}{$sys};
    return $self->resNotFound if !$sys;
    my $pkgs = $self->dbPackageGet(sysid => $sys->{id}, name => $name, results => 1);
    return $self->resNotFound if !@$pkgs;
    $self->resRedirect("/pkg/$sys->{short}/$pkgs->[0]{category}/$name".($ver ? "/$ver" :''), 'perm');
  },

  # Redirect for a specific language for a man page.
  # I'm not a fan of this solution; might drop it in the future.
  qr{lang/([^/]+)/([^/]+)} => sub {
    my($s, $l, $n) = @_;
    $n = _normalizename($n);
    my($m, undef) = $s->dbManPrefName($n, language => $l);
    return $s->resNotFound if !$m;
    $s->resRedirect("/$m->{name}/".substr($m->{hash}, 0, 8), 'temp');
  },

  qr{xml/search\.xml} => \&xmlsearch,
  qr{json/tree\.json} => \&jsontree,
);


TUWF::run();


# Front page: index statistics, the list of indexed systems (grouped by system
# name, with one link per release) and a list of other man page sites.
sub home {
  my $self = shift;
  my $stats = $self->dbStats;

  # Insert thousands separators into a number ("1234567" -> "1,234,567").
  my $fn = sub { local $_=shift; 1 while(s/(\d)(\d{3})($|,)/$1,$2/); $_ };

  $self->htmlHeader(title => 'Man Pages Archive');
  h1 'Man Pages Archive';
  p;
   lit sprintf <<' _', map $fn->($stats->{$_}), qw|hashes mans files packages|;
Indexing %s versions of %s manual pages found in %s files of %s packages.

Manned.org aims to index all manual pages from a variety of systems, both old and new, and provides a convenient interface for looking up and viewing the various versions of each man page. About manned.org » 
 _
  end;

  h2 'Browse the manuals';
  ul id => 'systems';
    # Group the releases by system name; {systems} is already ordered by
    # name and release order.
    my %sys;
    push @{$sys{$_->{name}}}, $_ for(@{$self->{systems}});

    for my $sysname (sort keys %sys) {
      my $rels = $sys{$sysname};
      # Icon name is the short name without its "-release" suffix.
      (my $img = $rels->[0]{short}) =~ s/^(.+)-.+$/$1/;
      li;
       # A system with a single release is one big link; otherwise each
       # release gets its own link and only the first three are visible.
       a href => "/pkg/$rels->[0]{short}" if @$rels == 1;
       span style => "background-image: url('images/$img.png')", '';
       b $rels->[0]{name};
       if(@$rels > 1) {
         my $i = 0;
         for(reverse @$rels) {
           a href => "/pkg/$_->{short}", ++$i > 3 ? (class => 'hidden') : (), $_->{release};
           lit ' ';
         }
         a href => "#", class => 'more', 'more...' if $i > 3;
       }
       end 'a' if @$rels == 1;
      end;
    }
  end;

  h2 'Other sites';
  ul id => 'external';
    li; a href => 'http://man7.org/linux/man-pages/index.html', 'man7.org'; txt ' - Linux man pages from several upstream projects.'; end;
    li; a href => 'http://man.cx/', 'man.cx'; txt ' - Man pages extracted from Debian testing.'; end;
    li; a href => 'http://man.he.net/', 'man.he.net'; txt ' - Also seems to be from a Debian-like system.'; end;
    li; a href => 'http://linux.die.net/man/', 'die.net'; txt ' - Seems to be based on an RPM-based Linux distribution.'; end;
    li; a href => 'http://manpages.org/', 'manpages.org'; txt ' - Lots of mostly-nicely formatted man pages, no clue about source.'; end;
    li; a href => 'http://www.manpagez.com/', 'manpagez.com'; txt ' - Mac OS X, has some GTK-html and texinfo documentation as well.'; end;
    li; a href => 'https://www.dragonflybsd.org/cgi/web-man', 'DragonFlyBSD Man Pages'; end;
    li; a href => 'http://www.freebsd.org/cgi/man.cgi', 'FreeBSD.org Man Pages'; end;
    li; a href => 'http://www.openbsd.org/cgi-bin/man.cgi', 'OpenBSD Man Pages'; end;
    li; a href => 'http://netbsd.gw.com/cgi-bin/man-cgi', 'NetBSD Man Pages'; end;
    li; a href => 'http://manpages.ubuntu.com/', 'Ubuntu Manuals'; end;
  end;

  $self->htmlFooter;
}


# Static "about" page. All text is emitted verbatim with lit(), i.e. without
# HTML escaping.
sub about {
  my $self = shift;
  $self->htmlHeader(title => 'About');
  h1 'About Manned.org';

  div id => 'about';

  h2 'Goal';
  p; lit <<' _';
The state of online indices of manual pages is a sad one. Existing sites only offer you a single version of a man page: From one origin, and often only in a single language. Most don't even tell you where the manual actually originated from, making it very hard to determine whether the manual you found actually applies to your situation and even harder to find a manual from a specific system. Additionally, some sites render the manuals in an unreadable way, don't correctly handle special formatting - like tables - or don't correctly display non-ASCII characters.

Manned.org was created in order to improve this situation. This site aims to index the manual pages from a variety of systems, both old and new, and allows you to browse through the various versions of a manual page to find out how each system behaves. The manuals are stored in the database as UTF-8, and are passed through groff to render them in (mostly) the same way as they are displayed in your terminal. 
 _
  end;

  h2 'URL format';
  lit <<' _';

You can link to specific packages and man pages with several URL formats. These URLs will keep working in the future, so you should not have to worry about eventual dead links.

Man pages

The following URLs are available to refer to an individual man page:

/<name>/<8-hex-digits>
This is the permalink format for a specific man page (e.g. /ls/910be0ed).
/<name>[.<section>]
Will try to get the latest and most-close-to-upstream version of a man page (e.g. /socket or /socket.7). Note that this may fetch the man page from any available system, so may result in confusing scenarios for system-specific documentation.
/man/<system>/<name>[.<section>]
Will get the latest version of a man page from the given system (e.g. /man/ubuntu-xenial/rsync)
/man/<system>/<category>/<package>/<name>[.<section>]
Will get the latest version of a man page from the given package (e.g. /man/ubuntu-xenial/net/rsync/rsync)
/man/<system>/<category>/<package>/<version>/<name>[.<section>]
Will get the man page from a specific package version (e.g. /man/ubuntu-xenial/net/rsync/3.1.1-3ubuntu1/rsync)

Currently, the last three URLs will perform a redirect to the appropriate permalink URL, but this may change in the future.
In all URLs where an optional .<section> can be provided, the search is performed as a prefix match. For example, /cat.3 will provide the cat.3tcl man page if no exact cat.3 version is available. Linking to the full section name is also possible: /cat.3tcl. If no section is given and multiple sections are available, the lowest section number is chosen.

Packages

Linking to individual packages is also possible. These pages will show a listing of all manual pages available in the given package.

/pkg/<system>/<category>/<package>
For the latest version of a package (e.g. /pkg/arch/core/coreutils).
/pkg/<system>/<category>/<package>/<version>
For a particular version of a package (e.g. /pkg/arch/core/coreutils/8.25-2).

Note that this site only indexes packages that actually have manual pages; Linking to a package that doesn't have any will result in a 404 page.

 _

  h2 'The indexing process';
  p; lit <<' _';
All man pages are fetched right from the (binary) packages available on the public repositories of Linux distributions. In particular:
Arch Linux
The core, extra and community repositories are fetched from a local Arch mirror. Indexing started around begin June 2012.
Debian
Historical releases were fetched from http://archive.debian.org/debian/ and http://snapshot.debian.org/. For buzz, rex and bo, only the 'main' component has been indexed, and we're missing a few man pages because some packages were missing from the repository archives. For the other releases, all components (main, contrib and non-free) from the $release and $release-updates (where available) repositories are indexed.
FreeBSD
Historical releases were fetched from http://ftp-archive.freebsd.org/mirror/FreeBSD-Archive/. The base installation tarballs are included in the database as packages prefixed with core-. The package repositories have also been indexed, except for 2.0.5 - 2.2.7 and 3.0 - 3.3 because those were not available on the ftp archive. Only the -RELEASE repositories have been included, which is generally a snapshot of the ports directory around the time of the release. A few packages are missing because the indexing script was unable to determine the package name and version for everything. Additionally, the dates indicated for many packages is a bit off, and the site doesn't handle this very well yet. :-(
Ubuntu
Historical releases were fetched from http://old-releases.ubuntu.com/ubuntu/, supported releases from a local mirror. All components (main, universe, restricted and multiverse) from the $release, $release-updates and $release-security repositories are indexed. Backports are not included at the moment. Indexing started around mid June 2012.
Only packages for a single architecture (i386 or i686) are scanned. To my knowledge, packages that come with different manuals for different architectures either don't exist or are extremely rare. It does happen that some packages are not available for all architectures. Usually, though, every package is at least available for i386/i686, so hopefully we're not missing out on much.

The repositories are scanned for new packages on a daily basis. 
 _
  end;

  h2 'Other systems';
  p; lit <<' _';
Although further development of this site is a bit stalled at the moment, I'd love to index the manuals of most major Linux distributions in the future. Fedora and OpenSUSE, in particular, are interesting targets to index.

It would also be great to index a few more non-Linux systems such as other BSDs, Solaris/Illumos and Mac OS X. Unfortunately, those don't always follow a binary package based approach, or are otherwise less easy to properly index.

In general, systems that follow an entirely source-based distribution approach can't be indexed without compiling everything. Since that is both very resource-heavy and open to security issues, there are no plans to include manuals from such systems at the moment. So unless someone comes with a solution I hadn't thought of yet, there won't be any Gentoo manuals here. :-( 
 _
  end;

  h2 'Future plans';
  p; lit <<' _';
This site isn't nearly as awesome yet as it could be. Here's some ideas that would be nice to have in the future: 
 _
  end;

  h2 'Copyright';
  p; lit <<' _';
All manual pages are copyrighted by their respective authors. The manuals have been fetched from publically available repositories of free and (primarily) open source software. The distributors of said software have put in efforts to only include software and documentation that allows free distribution. Nonetheless, if a manual that does not allow to be redistributed has been inadvertently included in our index, please let me know and I will have it removed as soon as possible. 
 _
  end;

  end;
  $self->htmlFooter;
}


# /browse/search?q=...: prefix search on man page names. A single hit redirects
# straight to that man page, otherwise a result list (max 150) is shown.
sub browsesearch {
  my $self = shift;

  my $q = $self->reqGet('q')||'';
  my $man = $self->dbSearch($q, 150);

  return $self->resRedirect("/$man->[0]{name}.$man->[0]{section}", 'temp') if @$man == 1;

  $self->htmlHeader(title => 'Search results for '.$q);
  h1 'Search results for '.$q;
  # The line break inside the text is kept as it appears in the original literal.
  p 'Note: This is just a simple case-insensitive prefix match on the man names. In the future we\'ll have more powerful search functionality. '
   ."\nHopefully.";

  if(@$man) {
    ul id => 'searchres';
    for(@$man) {
      li;
       a href => "/$_->{name}.$_->{section}", $_->{name};
       i " $_->{section}";
      end;
    }
    end;
  } else {
    br; br;
    b 'No results :-(';
  }
  $self->htmlFooter;
}


# /pkg/$system: paginated (200 per page) list of packages that have man pages.
# Query parameters: c = first-character filter ('all', '0' for non-letters, or
# a..z), s = name to start after (used by the "next" link).
sub pkg_list {
  my($self, $short) = @_;

  my $sys = $self->{sysbyshort}{$short};
  return $self->resNotFound if !$sys;

  my $f = $self->formValidate(
    { get => 'c', required => 0, enum => [ '0', 'all', 'a'..'z' ], default => 'all' },
    { get => 's', required => 0, regex => qr/^[a-zA-Z0-9_+.-]+$/i },
  );
  return $self->resNotFound if $f->{_err};

  # Fetch one row more than we display to find out whether there is a next page.
  my $pkg = $self->dbPackageGet(
    hasman => 1,
    sysid => $sys->{id},
    char => $f->{c} eq 'all' ? undef : $f->{c},
    start => $f->{s},
    results => 201,
  );
  my $more = @$pkg > 200 && pop @$pkg;

  # TODO: A "previous" link would be nice...
  my $next = sub {
    use utf8;
    if($more) {
      p class => 'pagination';
       # The name must be percent-encoded: a literal '+' in a query string is
       # read back as a space, which would fail the 's' validation above.
       a href => "/pkg/$short?c=$f->{c};s="._uri_escape($pkg->[199]{name}), 'next »';
      end;
    }
  };

  my $title = "Packages for $sys->{name}".($sys->{release}?" $sys->{release}":"");
  $self->htmlHeader(title => $title);
  h1 $title;

  p id => 'charselect';
   for('all', 0, 'a'..'z') {
     a href => "/pkg/$short?c=$_", $_?uc$_:'#' if $_ ne $f->{c};
     b $_?uc$_:'#' if $_ eq $f->{c};
   }
  end;
  p 'Note: Packages without man pages are not listed.';

  $next->();
  ul id => 'packages';
   for(@$pkg) {
     li;
      a href => "/pkg/$short/$_->{category}/$_->{name}", $_->{name};
      i ' '.$_->{category};
     end;
   }
  end;
  $next->();
  $self->htmlFooter;
}


# Resolve a URL path to a package of system id $sys.
# Returns ($package_row, $version); $version is '' when the path carries no
# version, and the result is (undef, '') when nothing matched.
sub pkg_frompath {
  my($self, $sys, $path) = @_;

  # $path should be "$category/$name" or "$category/$name/$version", since
  # $category may contain a slash, let's try both options.

  # $category/$name
  # e.g. contrib/games/alien
  if($path =~ m{^(.+)/([^/]+)$}) {
    my($category, $name) = ($1, $2);
    my $pkg = $self->dbPackageGet(sysid => $sys, category => $category, name => $name, hasman => 1)->[0];
    return ($pkg, '') if $pkg;
  }

  # $category/$name/$version
  # e.g. contrib/games/alien/10.2
  if($path =~ m{^(.+)/([^/]+)/([^/]+)$}) {
    my($category, $name, $version) = ($1, $2, $3);
    my $pkg = $self->dbPackageGet(sysid => $sys, category => $category, name => $name, hasman => 1)->[0];
    return ($pkg, $version) if $pkg;
  }

  (undef, '');
}


# /pkg/$system/$category/$name[/$version]: lists the versions of a package and
# the man pages (200 per page) of the selected version. Without a version in
# the path, the first row returned by dbPackageVersions is selected.
sub pkg_info {
  my($self, $short, $path) = @_;

  my $sys = $self->{sysbyshort}{$short};
  return $self->resNotFound if !$sys;

  my($pkg, $ver) = pkg_frompath($self, $sys->{id}, $path);
  return $self->resNotFound if !$pkg;

  my $vers = $self->dbPackageVersions($pkg->{id});
  my $sel = $ver ? (grep $_->{version} eq $ver, @$vers)[0] : $vers->[0];
  return $self->resNotFound if !$sel;

  my $f = $self->formValidate({ get => 's', required => 0});
  return $self->resNotFound if $f->{_err};

  # One extra row tells us whether a "next" link is needed.
  my $mans = $self->dbManInfo(package => $sel->{id}, results => 201, start => $f->{s}, sort => 'syspkgname');
  my $more = @$mans > 200 && pop @$mans;

  # Latest version of this package determines last modification date of the page.
  $self->setLastMod($vers->[0]{released});

  my $title = "$sys->{name}".($sys->{release}?" $sys->{release}":"")." / $pkg->{category} / $pkg->{name}";
  $self->htmlHeader(title => "$title $sel->{version}");
  h1 $title;

  div id => 'pkgversions';
   h2 'Versions';
   ul;
    for(@$vers) {
      li;
       # $sel is one of the rows in @$vers, so comparing the references
       # identifies the selected version.
       a href => "/pkg/$sys->{short}/$pkg->{category}/$pkg->{name}/$_->{version}", $_->{version} if $_ != $sel;
       b " $_->{version}" if $_ == $sel;
       i " $_->{released}";
      end;
    }
   end;
  end;

  div id => 'pkgmans';
   h2 "Manuals for version $sel->{version}";
   ul;
    for(@$mans) {
      li;
       a href => "/$_->{name}/".substr($_->{hash},0,8), "$_->{name}($_->{section})";
       b " $_->{locale}" if $_->{locale};
       i " $_->{filename}";
      end;
    }
   end;
   if($more) {
     use utf8;
     p class => 'pagination';
      # Percent-encode the man name so characters such as '+', '&' or ';'
      # survive the round trip through the query string.
      a href => "/pkg/$sys->{short}/$pkg->{category}/$pkg->{name}/$sel->{version}?s="._uri_escape($mans->[199]{name}), 'next »';
     end;
   }
  end;

  $self->htmlFooter;
}


# /man/$system/...: redirect a canonical URL to the permalink of the preferred
# man page.
sub man_redir {
  my($self, $sys, $path) = @_;

  # Path can be:
  # 1. <name>
  # 2. <category>/<package>/<name>
  # 3. <category>/<package>/<version>/<name>
  # (<category> may itself contain slashes, see pkg_frompath.)

  $sys = $self->{sysbyshort}{$sys};
  return $self->resNotFound if !$sys;

  my $man;
  if($path !~ m{/}) { # (1)
    ($man) = $self->dbManPrefName($path, sysid => $sys->{id});

  } else {
    # Split off the man page name; the remainder identifies the package.
    $path =~ s{/([^/]+)$}{};
    my $name = $1;
    my($pkg, $ver) = pkg_frompath($self, $sys->{id}, $path); # Handles (2) and (3)
    return $self->resNotFound if !$pkg;

    my $verid = $ver && $self->dbPackageVersions($pkg->{id}, $ver)->[0]{id};
    return $self->resNotFound if $ver && !$verid;

    # dbManPref() reads the package id from the 'package' option; passing it
    # under any other key silently drops the package filter.
    ($man) = $self->dbManPrefName($name, sysid => $sys->{id}, package => $pkg->{id}, pkgver => $verid);
  }
  return $self->resNotFound if !$man;
  $self->resRedirect("/$man->{name}/".substr($man->{hash}, 0, 8), 'temp');
}


# Emit the (initially hidden) section and language selectors for a man page.
# Each selector is only emitted when there is more than one choice.
sub _man_langsect {
  my($self, $man) = @_;

  # TODO: This is ugly, especially because clicking on a translation or
  # section, you can end up with a man page that is nowhere close to the man
  # page you're currently reading. Opening a version selector box might be a
  # better alternative.

  my @sect = $self->dbManSections($man->{name});
  if(@sect > 1) {
    div id => 'sectionselect', class => 'hidden';
     for (@sect) {
       if($man->{section} eq $_) {
         i $_;
       } else {
         a href => "/$man->{name}.$_", $_;
       }
       txt ' ';
     }
    end;
  }

  my @lang = $self->dbManLanguages($man->{name}, $man->{section});
  if(@lang > 1) {
    div id => 'langselect', class => 'hidden';
     # Language of the current page: its locale with everything from the
     # first '.' on removed.
     (my $cur = $man->{locale}||'') =~ s/\..*//;
     for (@lang) {
       if(($_||'') eq $cur) {
         i $_ || 'default';
       } else {
         a href => $_ ? "/lang/$_/$man->{name}.$man->{section}" : "/$man->{name}.$man->{section}", $_ || 'default';
       }
       txt ' ';
     }
    end;
  }
}


# Undo a few percent-escapes that may still be present in a man page name
# taken from the URL path.
sub _normalizename {
  local $_ = shift;
  # Firefox seems to escape [ and ] in URLs. It doesn't really have to...
  s/%5b/[/ig;
  s/%5d/]/ig;
  # Man pages with spaces in the path, eww
  s/%20/ /g;
  $_;
}


# Percent-encode a string for use as a query string value. The string is
# encoded to UTF-8 first and every byte outside the RFC 3986 "unreserved" set
# is escaped. Returns '' for undef.
sub _uri_escape {
  my $str = shift;
  return '' if !defined $str;
  utf8::encode($str);
  $str =~ s/([^A-Za-z0-9._~-])/sprintf '%%%02X', ord $1/eg;
  $str;
}


# /$name and /$name/$shorthash: render a man page. With a hash the exact
# version is shown, otherwise the preferred version for that name.
sub man {
  my($self, $name, $hash) = @_;
  $name = _normalizename($name);

  my $man;
  if($hash) {
    $man = $self->dbManInfo(name => $name, shorthash => $hash)->[0];
  } else {
    ($man, undef) = $self->dbManPrefName($name);
  }
  return $self->resNotFound() if !$man;

  $self->setLastMod($man->{released});
  $self->htmlHeader(title => $name);

  div id => 'manbuttons';
   h1 $man->{name};
   # The data-* attributes carry the identity of this page for the
   # client-side script (presumably /man.js - it is not part of this file).
   ul 'data-hash' => $man->{hash},
      'data-name' => $man->{name},
      'data-section' => $man->{section},
      'data-locale' => $man->{locale}||'',
      'data-hasversions' => $self->dbManHasVersions($man->{name}, $man->{section}, $man->{locale}, $man->{hash});
    li; a href => "/$man->{name}/".substr($man->{hash}, 0, 8).'/src', 'source'; end;
    li; a href => "/$man->{name}/".substr($man->{hash}, 0, 8), 'permalink'; end;
   end;
  end;

  div id => 'manres', class => 'hidden';
   _man_langsect($self, $man);
  end;

  div id => 'contents';
   my $c = $self->dbManContent($man->{hash});
   pre; lit ManUtils::html(ManUtils::fmt_block $c); end;
  end;

  $self->htmlFooter();
}


# /$name/$shorthash/src: the unformatted source of a man page as text/plain.
sub src {
  my($self, $name, $hash) = @_;
  $name = _normalizename($name);

  my $m = $self->dbManInfo(name => $name, shorthash => $hash);
  return $self->resNotFound if !@$m;

  $self->setLastMod($m->[0]{released});
  $self->resHeader('Content-Type', 'text/plain; charset=UTF-8');

  # Content-Disposition requires a disposition type before its parameters;
  # 'inline' keeps the page viewable in the browser while still suggesting a
  # file name. Characters that could terminate the quoted string or the header
  # line are replaced.
  (my $filename = "$m->[0]{name}.$m->[0]{section}") =~ s/["\\\r\n]/_/g;
  $self->resHeader('Content-Disposition', sprintf 'inline; filename="%s"', $filename);

  my $c = $self->dbManContent($m->[0]{hash});
  lit $c;
}


# /xml/search.xml?q=...: search results (max 20) as XML.
sub xmlsearch {
  my $self = shift;

  my $q = $self->reqGet('q')||'';
  my $man = $self->dbSearch($q, 20);

  # The JS dropdown search expects this particular format.
  $self->resHeader('Content-Type' => 'text/xml; charset=UTF-8');
  xml;
  tag 'results';
   tag 'item', id => "$_->{name}.$_->{section}", %$_, undef for(@$man);
  end 'results';
}


# /json/tree.json: all locations of a man page as a
# system -> release -> package -> table-of-versions tree, encoded as JSON.
# Either 'hash' (all locations of that exact content) or 'name' + 'section'
# (+ optional 'locale') must be given; 'cur' is the hash of the page currently
# being viewed, which is listed without a link.
sub jsontree {
  my $self = shift;

  my $f = $self->formValidate(
    { get => 'name',    required => 0, maxlength => 256 },
    { get => 'section', required => 0, maxlength => 32 },
    { get => 'locale',  required => 0, default => '', maxlength => 32 },
    { get => 'cur',     required => 0, default => '', regex => qr/^[a-fA-F0-9]{40}$/ },
    { get => 'hash',    required => 0, default => '', regex => qr/^[a-fA-F0-9]{40}$/ },
  );
  return $self->resNotFound() if $f->{_err} || (!$f->{hash} && !($f->{section} && $f->{name}));

  my $mans = $self->dbManInfo(sort => 'syspkgname',
    $f->{hash} ? (hash => $f->{hash}) : (name => $f->{name}, section => $f->{section}, locale => $f->{locale}));

  # Convert the list into a tree. This relies on the 'syspkgname' ordering:
  # a new node is started whenever the system, release or package changes.
  my $tree = [];
  my($sys, $sysver, $pkg, $pkgver);
  for my $m (@$mans) {
    my $sysname = $self->{sysbyid}{$m->{system}}{name};
    if(!$sys || $sysname ne $sys->{name}) {
      $sys = { name => $sysname, childs => [] };
      $sysver = undef;
      push @$tree, $sys;
    }

    my $sysversion = $self->{sysbyid}{$m->{system}}{release} || '';
    if(!$sysver || $sysversion ne $sysver->{name}) {
      $sysver = { name => $sysversion, childs => [] };
      $pkg = undef;
      push @{$sys->{childs}}, $sysver;
    }

    if(!$pkg || $m->{package} ne $pkg->{name}) {
      $pkg = { name => $m->{package}, i => $m->{category}, table => [] };
      $pkgver = undef;
      push @{$sysver->{childs}}, $pkg;
    }

    # No link to the man page when listing by hash or when this row is the
    # page currently being viewed.
    my @manlink = $f->{hash} || lc($m->{hash}) eq lc($f->{cur})
      ? () : (href => sprintf('/%s/%s', $m->{name}, substr $m->{hash}, 0, 8));

    push @{$pkg->{table}}, [
      # The version is only named on the first row of each package version.
      $pkgver && $pkgver eq $m->{version} ? {name=>''} : {name => $m->{version}, href => "/pkg/$self->{sysbyid}{$m->{system}}{short}/$m->{category}/$m->{package}/$m->{version}"},
      { name => "$m->{name}($m->{section})", @manlink },
      { name => substr($m->{hash}, 0, 8), @manlink },
      { name => $m->{filename} }
    ];
    $pkgver = $m->{version};
  }

  # Determine which elements to show/hide by default.
  # It might make more sense to do this in JS, but since I am utterly
  # incapable of writing maintainable JS I'm doing it here in order to keep the
  # JS stupid and simple.
  # TODO: Highlight systems/packages where the 'current' man page is?
  for my $sys (@$tree) {
    $sys->{expand} = 1 if $sys->{childs}[0]{name}; # Expand all systems that have named versions
    $sys->{expand} = 1 if $f->{hash}; # Expand everything on 'location'
    my $i = 0;
    for my $sysver (@{$sys->{childs}}) {
      $i++;
      $sysver->{expand} = 1 if !$sysver->{name}; # Expand unnamed versions (since you can't click them)
      $sysver->{expand} = 1 if $f->{hash}; # Expand everything on 'location'
      $sysver->{hide} = 1 if $i > 3 && @{$sys->{childs}} > 5; # Show only the first 3 versions
      for my $pkg (@{$sysver->{childs}}) {
        $pkg->{expand} = 1 if @{$sysver->{childs}} <= 3; # Expand everything if there's not too many things to expand
        $pkg->{expand} = 1 if $f->{hash}; # Expand everything on 'location'
        # TODO: Show/Hide duplicate hashes?
      }
    }
  }

  # Why JSON? Because TUWF::XML is pretty slow with many nodes
  $self->resHeader('Content-Type' => 'application/json; charset=UTF-8');
  lit(JSON::XS->new->ascii->encode($tree));
}


# Everything below is added to TUWF::Object, so these subs are callable as
# methods on the $self object that the handlers above receive.
package TUWF::Object;

use TUWF ':html', 'html_escape';
use Time::Local 'timegm';


# Escape a string for literal use inside an SQL LIKE pattern. Besides the
# wildcards '_' and '%', the backslash itself is escaped: it is the escape
# character used here, so an unescaped one in the input would swallow the
# escape of a following wildcard.
sub escape_like {
  (my $v = shift) =~ s/([_%\\])/\\$1/g;
  $v;
}


# Open the page: <head>, site header with the search form, and the (still
# open) body div. Options: title.
sub htmlHeader {
  my $self = shift;
  my %o = @_;

  html;
   head;
    Link rel => 'stylesheet', type => 'text/css', href => '/man.css?2';
    # The line break inside the suffix is kept as it appears in the original literal.
    title $o{title}." \n- manned.org";
   end 'head';
   body;

    div id => 'header';
     a href => '/', 'manned.org';
     form action => '/browse/search', method => 'get';
      input type => 'text', name => 'q', id => 'q', tabindex => 1;
      input type => 'submit', value => ' ';
     end;
    end;

    div id => 'body';
}


# Close everything htmlHeader() left open and emit the footer and script tag.
sub htmlFooter {
  my($self, %o) = @_;

     br style => 'clear: both';
    end; # div#body
    div id => 'footer';
     lit 'All manual pages are copyrighted by their respective authors. | About manned.org | Contact | Source';
    end;
    script type => 'text/javascript', src => '/man.js', '';
   end; # body
  end 'html';

  # write the SQL queries as a HTML comment when debugging is enabled
  # (stolen from VNDB code)
  if($self->debug) {
    lit "\n\n";
  }
}


# Set the last modification time from a string in yyyy-mm-dd format.
# Strings that do not start with such a date are silently ignored.
sub setLastMod {
  my($s, $d) = @_;
  return if $d !~ /^(\d{4})-(\d{2})-(\d{2})/;
  # Round trip through timegm/gmtime to obtain the day of the week.
  my @t = gmtime timegm 0,0,0,$3,$2-1,$1;
  $s->resHeader('Last-Modified', sprintf '%s, %02d %s %04d %02d:%02d:%02d GMT',
    (qw|Sun Mon Tue Wed Thu Fri Sat|)[$t[6]], $t[3],
    (qw|Jan Feb Mar Apr May Jun Jul Aug Sep Oct Nov Dec|)[$t[4]],
    $t[5]+1900, $t[2], $t[1], $t[0]);
}


# Returns the stored contents for the given hex-encoded hash.
sub dbManContent {
  my($s, $hash) = @_;
  return $s->dbRow(q{SELECT content FROM contents WHERE hash = decode(?, 'hex')}, $hash)->{content};
}


# Returns an arrayref of man page rows (system, category, package, version,
# released, name, section, filename, locale, hash).
# Options: name, package, section, locale, shorthash, hash, start, results, sort
#   package:   id of a package_versions row
#   locale:    a defined but empty value selects rows without a locale
#   shorthash: first 8 hex digits of the hash; hash: the full hex hash
#   start:     only names sorting after this one (pagination)
#   results:   row limit (default 10000)
#   sort:      'syspkgname' or unset (no ORDER BY)
sub dbManInfo {
  my $s = shift;
  my %o = @_;

  # name and start are compared by length rather than truth, so that a value
  # of "0" is not mistaken for "no filter".
  my %where = (
    defined($o{name}) && length($o{name}) ? ('m.name = ?' => $o{name}) : (),
    $o{package} ? ('m.package = ?' => $o{package}) : (),
    defined($o{section}) ? ('m.section = ?' => $o{section}) : (),
    $o{locale} ? ('m.locale = ?' => $o{locale}) : (),
    defined($o{locale}) && !$o{locale} ? ('m.locale IS NULL' => 1) : (),
    $o{shorthash} ? (q{substring(m.hash from 1 for 4) = decode(?, 'hex')} => $o{shorthash}) : (),
    $o{hash} ? (q{m.hash = decode(?, 'hex')} => $o{hash}) : (),
    defined($o{start}) && length($o{start}) ? ('m.name > ?' => $o{start}) : (),
  );

  $o{sort} ||= '';
  my $order = $o{sort} eq 'syspkgname'
    ? 'ORDER BY s.name, s.relorder DESC, p.name, v.released DESC, m.name, m.locale NULLS FIRST, m.filename'
    : '';

  return $s->dbAll(q{
    SELECT p.system, p.category, p.name AS package, v.version, v.released, m.name, m.section, m.filename, m.locale, encode(m.hash, 'hex') AS hash
      FROM man m
      JOIN package_versions v ON v.id = m.package
      JOIN packages p ON p.id = v.package
      JOIN systems s ON s.id = p.system
      !W
      !s
      LIMIT ?
  }, \%where, $order, $o{results}||10000);
}


# Very simple (and fast) prefix match.
# The query may carry a section, either as a leading digit ("3 printf") or as
# a trailing "(section)" ("printf(3)"). Returns an arrayref of {name, section}
# rows; an empty one if the query does not start with a usable name.
sub dbSearch {
  my($s, $q, $limit) = @_;

  my $sect = $q =~ s/^([0-9])\s+// || $q =~ s/\(([a-zA-Z0-9]+)\)$// ? $1 : '';
  my $name = $q =~ s/^([a-zA-Z0-9,.:_-]+)// ? $1 : '';

  return !$name ? [] : $s->dbAll(
    'SELECT name, section FROM man_index !W ORDER BY name, section LIMIT ?',
    {
      'lower(name) LIKE ?' => escape_like(lc $name).'%',
      $sect ? ('section ILIKE ?' => escape_like(lc $sect).'%') : (),
    },
    $limit
  );
}


# Get the preferred man page for the given filters. Returns a row with the same fields as dbManInfo().
# $section is matched as a prefix; pass '' for "any section".
# Options: sysid (systems.id), package (packages.id), pkgver
# (package_versions.id), language (locale without its ".encoding" part).
sub dbManPref {
  my($s, $name, $section, %o) = @_;

  my %where = (
    'm.name = ?' => $name,
    $section     ? ('m.section LIKE ?' => escape_like($section).'%') : (),
    $o{sysid}    ? ('p.system = ?' => $o{sysid}) : (),
    $o{package}  ? ('p.id = ?' => $o{package}) : (),
    $o{pkgver}   ? ('v.id = ?' => $o{pkgver}) : (),
    $o{language} ? (q{substring(locale from '^[^.]+') = ?} => $o{language}) : (),
  );

  # Criteria to determine a "preferred" man page:
  # 1. english:  English versions of a man page have preference over other locales
  # 2. pkgver:   Newer versions of the same package have preference over older versions
  # 3. stdloc:   Prefer man pages in standard locations
  # 4. secmatch: Prefer an exact section match
  # 5. arch:     Prefer Arch over other systems (because it tends to be the most up-to-date, and closest to upstreams)
  # 6. sysrel:   Prefer a later system release over an older release
  # 7. secorder: Lower sections before higher sections (because man does it this way, for some reason)
  # 8. Fall back on hash comparison, to ensure the result is stable
  #
  # Each f_* step keeps only the rows satisfying its criterion, unless no row
  # does, in which case all rows are passed on.
  $s->dbAll(q{
    WITH unfiltered AS (
      SELECT s AS sys, p AS pkg, v AS ver, m AS man
        FROM man m
        JOIN package_versions v ON v.id = m.package
        JOIN packages p ON p.id = v.package
        JOIN systems s ON s.id = p.system
        !W
    ), f_english AS(
      SELECT * FROM unfiltered WHERE NOT EXISTS(SELECT 1 FROM unfiltered WHERE is_english_locale((man).locale)) OR is_english_locale((man).locale)
    ), f_pkgver AS(
      SELECT * FROM f_english a WHERE NOT EXISTS(SELECT 1 FROM f_english b WHERE (a.ver).package = (b.ver).package AND (a.ver).released < (b.ver).released)
    ), f_stdloc AS(
      SELECT * FROM f_pkgver WHERE NOT EXISTS(SELECT 1 FROM f_pkgver WHERE is_standard_man_location((man).filename)) OR is_standard_man_location((man).filename)
    ), f_secmatch AS(
      SELECT * FROM f_stdloc WHERE NOT EXISTS(SELECT 1 FROM f_stdloc WHERE (man).section = ?) OR (man).section = ?
    ), f_arch AS(
      SELECT * FROM f_secmatch WHERE NOT EXISTS(SELECT 1 FROM f_secmatch WHERE (sys).id = 1) OR (sys).id = 1
    ), f_sysrel AS(
      SELECT * FROM f_arch a WHERE NOT EXISTS(SELECT 1 FROM f_arch b WHERE (a.sys).name = (b.sys).name AND (a.sys).relorder < (b.sys).relorder)
    ), f_secorder AS(
      SELECT * FROM f_sysrel a WHERE NOT EXISTS(SELECT 1 FROM f_sysrel b WHERE (a.man).section > (b.man).section)
    )
    SELECT (pkg).system, (pkg).category, (pkg).name AS package, (ver).version, (ver).released, (man).name, (man).section, (man).filename, (man).locale, encode((man).hash, 'hex') AS hash
      FROM f_secorder
     ORDER BY (man).hash
     LIMIT 1
  }, \%where, $section, $section)->[0];
}


# Given the name of a man page with optional section, find out the actual name
# and section prefix of the man page and the preferred version.
sub dbManPrefName {
  my($s, $name, %o) = @_;

  # Arguments: the requested name (possibly "name.section") and the filter
  # options understood by dbManPref(), which are passed through unchanged.
  # Returns ($man_row, $section_prefix); (undef, '') when nothing was found.

  # First try the full string as a name, so that man pages whose name contains
  # a dot are found as-is.
  my $man = $s->dbManPref($name, '', %o);
  return ($man, '') if $man;

  # Otherwise treat whatever follows the last dot as a section prefix.
  return (undef, '') if $name !~ s/\.([^.]+)$//;
  my $section = $1;
  $man = $s->dbManPref($name, $section, %o);
  return ($man, $section) if $man;
  return (undef, '');
}


# Returns 1 if there are alternative versions of the given man page, i.e. rows
# with the same name, section and locale (NULL-safe comparison) but a
# different hash. Returns 0 otherwise.
sub dbManHasVersions {
  my($s, $name, $section, $locale, $hash) = @_;
  return $s->dbRow(
    q{SELECT 1 AS ok FROM man WHERE name = ? AND section = ? AND locale IS NOT DISTINCT FROM ? AND hash <> decode(?, 'hex') LIMIT 1},
    $name, $section, $locale, $hash
  )->{ok}||0;
}


# Returns all available languages for a man page, as a list. The language is
# the locale up to (not including) the first '.'; man pages without a locale
# yield an undef entry, which sorts first.
sub dbManLanguages {
  my($s, $name, $section) = @_;
  return map $_->{lang}, @{$s->dbAll(q{
    SELECT DISTINCT substring(locale from '^[^.]+') AS lang
      FROM man
     WHERE name = ? AND section = ?
     ORDER BY substring(locale from '^[^.]+') NULLS FIRST
  }, $name, $section)};
}


# Returns all available sections for a man page name, as a sorted list.
sub dbManSections {
  my($s, $name) = @_;
  return map $_->{section}, @{$s->dbAll(q{SELECT DISTINCT section FROM man WHERE name = ? ORDER BY section}, $name)};
}


# Returns an arrayref with all systems, ordered by name and release order.
sub dbSystemGet {
  return shift->dbAll('SELECT id, name, release, short, relorder FROM systems ORDER BY name, relorder');
}


# Returns an arrayref of package rows (id, system, name, category), ordered by
# name.
# Options: sysid category name char hasman start results
#   char:    first letter of the name (a..z); a defined but false value ('0')
#            selects names that do not start with an ASCII letter
#   hasman:  true = only packages with man pages, defined-but-false = only
#            packages without, undef = no filter
#   start:   only names sorting after this one (pagination)
#   results: row limit (default 10)
sub dbPackageGet {
  my $s = shift;
  my %o = (results => 10, @_);

  # category, name and start come straight from the URL. Test them by length
  # rather than truth: a plain truth test would treat "0" as "no filter" and
  # make e.g. a lookup of a package named "0" return an unrelated package.
  my $given = sub { defined $_[0] && length $_[0] };

  my @where = (
    $o{sysid} ? ('system = ?' => $o{sysid}) : (),
    $given->($o{category}) ? ('category = ?' => $o{category}) : (),
    $given->($o{name})     ? ('name = ?'     => $o{name})     : (),
    $given->($o{start})    ? ('name > ?'     => $o{start})    : (),
    # This seems slow, perhaps cache?
    defined($o{hasman}) ? ('!s EXISTS(SELECT 1 FROM package_versions pv WHERE pv.package = p.id AND EXISTS(SELECT 1 FROM man m WHERE m.package = pv.id))' => $o{hasman}?'':'NOT') : (),
    $o{char} ? ( 'LOWER(SUBSTR(name, 1, 1)) = ?' => $o{char} ) : (),
    defined($o{char}) && !$o{char} ? ( '(ASCII(name) < 97 OR ASCII(name) > 122) AND (ASCII(name) < 65 OR ASCII(name) > 90)' => 1 ) : (),
  );

  return $s->dbAll(q{
    SELECT id, system, name, category
      FROM packages p
      !W
     ORDER BY name
     LIMIT ?},
    \@where, $o{results});
}


# Returns an arrayref of the versions (id, version, released) of package $id
# that have at least one man page, newest release first. With $version given,
# only that version is returned.
sub dbPackageVersions {
  my($s, $id, $version) = @_;

  my %where = (
    'package = ?' => $id,
    $version ? ('version = ?' => $version) : (),
    'EXISTS(SELECT 1 FROM man m WHERE m.package = v.id)' => 1,
  );

  return $s->dbAll(q{
    SELECT id, version, released
      FROM package_versions v
      !W
     ORDER BY released DESC},
    \%where);
}


# Returns the single row of the stats_cache table.
sub dbStats {
  return $_[0]->dbRow('SELECT * FROM stats_cache');
}