1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
|
#!/usr/bin/perl
# $Id$
use lib '/home/bbs/bin/';
use strict;
use OurNet::FuzzyIndex;
use Getopt::Std;
use DB_File;
use BBSFileHeader;
use Data::Serializer;
use Compress::Zlib;
my(%db, $idx, $serial);
sub main
{
die usage() unless( getopts('nz') || !@ARGV );
$serial = Data::Serializer->new(serializer => 'Storable',
digester => 'MD5',
compress => 0,
);
foreach( @ARGV ){
if( /\.db$/ ){
next if( $Getopt::Std::opt_n );
print "building idx for $_\n";
tie %db, 'DB_File', $_, O_RDONLY, 0666, $DB_HASH;
$idx = OurNet::FuzzyIndex->new(substr($_, 0, -3). '.idx');
buildidx();
}
else{
tie %db, 'DB_File', "$_.db", O_CREAT | O_RDWR, 0666, $DB_HASH;
$idx = OurNet::FuzzyIndex->new("$_.idx")
if( !$Getopt::Std::opt_n );
build("/home/bbs/man/boards/".substr($_, 0, 1)."/$_", '');
$db{_buildtime} = time();
$db{_gzip} = 1 if( $Getopt::Std::opt_z );
untie %db;
}
}
}
sub buildidx
{
my $gzipped = $db{_gzip};
foreach( keys %db ){
next if( /^title/ || /\/$/ ); # 是 title 或目錄的都跳過
$idx->insert($_,
($db{"title-$_"}. "\n".
($gzipped ? Compress::Zlib::memGunzip($db{$_}) :
$db{$_})));
}
}
sub build($$)
{
my($basedir, $doffset) = @_;
my(%bfh, $fn, @tdir);
print "building $basedir\n";
tie %bfh, 'BBSFileHeader', $basedir;
foreach( 0..($bfh{num} - 1) ){
next if( $bfh{"$_.filemode"} & 32 ); # skip HIDDEN
next if( !($fn = $bfh{"$_.filename"}) ); # skip empty filename
if( $bfh{"$_.isdir"} ){
push @tdir, ["$doffset/$fn/", # 目錄結尾要加 /
$db{"title-$doffset/$fn/"} = $bfh{"$_.title"}];
build("$basedir/$fn", "$doffset/$fn");
}
else{
push @tdir, ["$doffset/$fn",
$db{"title-$doffset/$fn"} = $bfh{"$_.title"}];
my $c = $bfh{"$_.content"};
$idx->insert("$doffset/$fn", $bfh{"$_.title"}. "\n$c")
if( !$Getopt::Std::opt_n );
$db{"$doffset/$fn"} = ($Getopt::Std::opt_z ?
Compress::Zlib::memGzip($c) : $c);
}
}
$db{"$doffset/"} = $serial->serialize(\@tdir);
}
sub usage
{
print ("$0 [-n] boardname ...\n".
"\t -n for .db only (no .idx)\n");
exit(0);
}
main();
1;
|