#!/usr/bin/perl
# $Id$
use CGI qw/:standard/;
use lib qw/./;
use LocalVars;
use DB_File;
use strict;
use Data::Dumper;
use Template;
use OurNet::FuzzyIndex;
use Data::Serializer;
use Time::HiRes qw/gettimeofday tv_interval/;
use b2g;
use POSIX;
use vars qw/%db $brdname $fpath $isgb %b2g/;
sub main
{
my($tmpl, $rh, $key);
if( !(($brdname, $fpath) = $ENV{PATH_INFO} =~ m|^/([\w\-]+?)(/.*)|) ||
!(tie %db, 'DB_File',
"$MANDATA/$brdname.db", O_RDONLY, 0666, $DB_HASH) ){
return redirect("/man.pl/$1/")
if( $ENV{PATH_INFO} =~ m|^/([\w\-]+?)$| );
print header(-status => 404);
return;
}
charset('');
print header();
$isgb = (param('gb') ? 1 : 0);
if( ($key = param('key')) ){
$rh = search($key);
}
else{
$rh = (($fpath =~ m|/$|) ? dirmode($fpath) : articlemode($fpath));
}
$rh->{brdname} = $brdname;
$tmpl = Template->new({INCLUDE_PATH => '.',
ABSOLUTE => 0,
RELATIVE => 0,
RECURSION => 0,
EVAL_PERL => 0,
COMPILE_EXT => '.tmpl',
COMPILE_DIR => $MANCACHE,
});
if( $rh->{gb} = $isgb ){
$rh->{encoding} = 'gb2312';
$rh->{lang} = 'zh_CN';
$rh->{charset} = 'gb2312';
}
else{
$rh->{encoding} = 'Big5';
$rh->{lang} = 'zh_TW';
$rh->{charset} = 'big5';
}
$tmpl->process($rh->{tmpl}, $rh);
untie %db;
}
sub dirmode
{
my(%th, $isdir);
my $serial = Data::Serializer->new(serializer => 'Storable',
digester => 'MD5',
compress => 0,
);
foreach( @{$serial->deserialize($db{$fpath})} ){
$_->[1] =~ s/([\xA1-\xF9].)/$b2g{$1}/eg if( $isgb );
#Encode::from_to($_->[1], 'big5', 'gbk') if( $isgb );
$isdir = (($_->[0] =~ m|/$|) ? 1 : 0);
push @{$th{dat}}, {isdir => $isdir,
fn => "man.pl/$brdname$_->[0]",
title => $_->[1]};
}
$th{tmpl} = 'dir.html';
$th{isroot} = ($fpath eq '/') ? 1 : 0;
$th{buildtime} = POSIX::ctime($db{_buildtime} || 0);
return \%th;
}
sub articlemode
{
my(%th);
$th{tmpl} = 'article.html';
$th{content} = $db{$fpath};
$th{content} =~ s/\033\[.*?m//g;
$th{content} =~ s|(http://[\w\-\.\:\/\,@\?=~]+)|<a href="$1">$1</a>|gs;
$th{content} =~ s|(ftp://[\w\-\.\:\/\,@~]+)|<a href="$1">$1</a>|gs;
$th{content} =~
s|批踢踢兔|<a href="http://blog.ptt2.cc">批踢踢兔</a>|gs;
$th{content} =~
s|發信站: 批踢踢實業坊|發信站: <a href="http://blog.ptt.cc">批踢踢實業坊</a>|gs;
$th{content} =~
s|ptt\.csie\.ntu\.edu\.tw|<a href="telnet://ptt.csie.ntu.edu.tw">ptt.csie.ntu.edu.tw</a>|gs;
$th{content} =~
s|ptt\.twbbs\.org|<a href="telnet://ptt.csie.ntu.edu.tw">ptt.twbbs.org</a>|gs;
$th{content} =~ s/([\xA1-\xF9].)/$b2g{$1}/eg if( $isgb );
#Encode::from_to($th{content}, 'big5', 'gbk') if( $isgb );
return \%th;
}
sub search($)
{
my($key) = @_;
my(%th, $idx, $k, $t0);
$t0 = [gettimeofday()];
$idx = OurNet::FuzzyIndex->new("$MANDATA/$brdname.idx");
my %result = $idx->query($th{key} = $key, MATCH_FUZZY);
foreach my $t (sort { $result{$b} <=> $result{$a} } keys(%result)) {
$k = $idx->getkey($t);
push @{$th{search}}, {title => $db{"title-$k"},
fn => $k,
score => $result{$t} / 10};
}
$th{elapsed} = tv_interval($t0);
$th{key} = $key;
$th{tmpl} = 'search.html';
undef $idx;
return \%th;
}
main();
1;