Namazu-devel-ja(旧)

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

Re: 一太郎(5〜10)用のフィルタ

From: Yukio USUDA <usuda@xxxxxxxxxx>
Date: Wed, 12 Mar 2003 02:48:02 +0900
X-ml-name: namazu-devel-ja
X-mail-count: 02734
References: <200302281101.UAA22928@x81002.hsba.go.jp>

臼田です

(Bdoccat$BITMW!"0lB@O:$d(BWord$B$N(BOLE$B8F$S=P$7ITMW$H$$$&(Bfilter$B$,(B
$B?tG/A0$KM_$7$+$C$?$N$r;W$$=P$7$D$D:n6H$r$7$F$$$^$9!#(B
(B
$B$=$b$=$b%K!<%:$,$I$l$[$I$"$k$N$+$o$+$i$J$$$3$H$H!"(B
$BF0$1$P$h$$$H$$$&;Q@*$G=q$$$F$$$k%=!<%9$G$b$"$j$*CQ$:$+$7$$$N(B
$B$G$9$,!";HMQ$G$-$k%l%Y%k$K$J$C$?$i(BNamazuProject$B$K4sB#$7$?$$$H(B
$B;W$C$F$*$j$^$9!#(B
$B$=$N:]$K$O!"$J$K$+/!9=$@5$r$7$F$_$^$7$?$N$G!":FEYAwIU$7$F$*$-$^$9!#(B
$B!&%U%!%$%k$N:n@.$i$7$-%G!<%?NN0h$r8+$D$1$?$N$G(BAuthor$B$r(B
$B!!=PNO$G$-$k$h$&$K$7$F$_$^$7$?!#(B
$B!&%?!<%2%C%H$H$J$k%U%!%$%k$rJQ?t$KFI$_9~$s$G(Bfilter$B8F$S=P$7;~(B
$B!!$KEO$5$l$F$$$k$3$H$K5$$E$$$?$?$a%U%!%$%k$NFI$_9~$_$r8:$i$7(B
$B!!$^$7$?!#(B
(B
$BE:IU$7$F$$$k0lB@O:#7!A#1#0$N%U%#%k%?$K$O(B
(BUTF-16$B$r(BEUC$B$KJQ49$9$k%W%m%0%i%`$H$7$F2<5-$N%5%$%H$N(Bunicode.pl
$B$r;H$o$;$FD:$$$F$$$k$?$a!"$3$A$i$bI,MW$K$J$j$^$9!#(B
(Bhttp://www.onicos.com/staff/iz/release/
(B
(BUTF-16$B$+$i(BEUC$B$KJQ49$9$kB>$NNI$$J}K!$r$4B8CN$N$+$?$*65$($/$@$5$$!#(B
(B
$B11ED9,@8(B
(B---------------------------------------------------------------
(Btaro7_10.pl
(B
(B
# Namazu filter module for Ichitaro documents (.jtd / .jfw, media type
# application/x-js-taro).
#
# Depends on three Perl libraries that are loaded by file name at run time:
#   util.pl, gfilter.pl - helper libraries called as util::* and gfilter::*
#   unicode.pl          - third-party converter providing unicode::u2e()
#                         (distributed at http://www.onicos.com/staff/iz/release/)
#
# NOTE(review): File::Copy does not appear to be used by the code in this
# module; the import is kept so nothing that relies on it breaks.
package taro7_10;
use strict;
use File::Copy;
require 'util.pl';
require 'gfilter.pl';
require 'unicode.pl';

# Report the media type this filter handles.
#
# Returns a one-element list containing 'application/x-js-taro', the same
# type that add_magic() registers for the .jtd and .jfw extensions.
sub mediatype() {
    return ('application/x-js-taro');
}

# Report whether this filter can be used.
#
# Returns 'yes' when util::checklib('unicode.pl') reports the library as
# available, 'no' otherwise.
#
# The result of util::checklib() is tested for truth rather than with
# defined(): util::checklib is not visible here, and a plain truth test gives
# the right answer both for a "path or undef" convention and for a "1 or 0"
# convention (with defined(), a 0 result would wrongly count as "found").
sub status() {
    return util::checklib('unicode.pl') ? 'yes' : 'no';
}

# Filter capability flag: always returns 0.
#
# NOTE(review): presumably tells the indexer that the output of this filter
# does not need to be run through further filters - confirm against the
# caller, which is not visible here.
sub recursive() {
    return 0;
}

# Filter capability flag: always returns 0.
#
# NOTE(review): presumably means no character-code conversion is wanted
# before filter() runs (filter() works on the raw document bytes) - confirm
# against the caller, which is not visible here.
sub pre_codeconv() {
    return 0;
}

# Filter capability flag: always returns 0.
#
# NOTE(review): presumably means no character-code conversion is wanted after
# filter() runs (filter() already produces EUC text via unicode::u2e) -
# confirm against the caller, which is not visible here.
sub post_codeconv () {
    return 0;
}

# Register the file-name patterns of Ichitaro documents with a magic object.
#
# $magic - object providing an addFileExts(pattern, media_type) method.
#
# Both the .jtd and .jfw extensions (matched case-insensitively through the
# inline (?i) flag) are mapped to 'application/x-js-taro'.  Returns nothing.
#
# NOTE(review): the patterns are not anchored to the end of the name, so a
# name such as "foo.jtd.bak" would presumably match as well; left unchanged
# because how addFileExts applies the pattern is not visible here.
sub add_magic ($) {
    my ($magic) = @_;
    for my $ext_pattern ('(?i)\\.jtd', '(?i)\\.jfw') {
        $magic->addFileExts($ext_pattern, 'application/x-js-taro');
    }
    return;
}

# Convert an Ichitaro document into plain EUC text for indexing.
#
# Arguments:
#   $orig_cfile   - reference to the original file name (may be undef); only
#                   used to derive a title
#   $cont         - reference to the raw document bytes; on return it holds
#                   the extracted text instead
#   $weighted_str - passed on to the gfilter helpers
#   $headings     - passed on to gfilter::show_filter_debug_info
#   $fields       - hash reference; 'author' is set when an author record is
#                   found, 'title' is filled in when it is still empty
#
# Returns undef.  The explicit "return undef" of the original is kept because
# the caller's expectations are not visible here.
#
# The text is assembled in memory.  Earlier revisions round-tripped it through
# two temporary files opened without error checks; those files (and the
# failure modes that came with them) are gone.
sub filter ($$$$$) {
    my ($orig_cfile, $cont, $weighted_str, $headings, $fields) = @_;
    my $cfile = defined $orig_cfile ? $$orig_cfile : '';

    # Stage 1: pull the UTF-16BE text chunks (and the author) out of the file.
    my $utf16be = _taro_collect_text($cont, $fields);

    # Stage 2: UTF-16 code units -> EUC via the external unicode.pl library.
    my @code_units = unpack('n*', $utf16be);
    my $eucstring  = unicode::u2e(@code_units);

    # Stage 3: keep only the characters the index should see.
    $$cont = _taro_compact_euc($eucstring);

    gfilter::line_adjust_filter($cont);
    gfilter::line_adjust_filter($weighted_str);
    gfilter::white_space_adjust_filter($cont);
    $fields->{'title'} = gfilter::filename_to_title($cfile, $weighted_str)
      unless $fields->{'title'};
    gfilter::show_filter_debug_info($cont, $weighted_str,
               $fields, $headings);
    return undef;
}

# Scan the document bytes in $$cont for text chunks and the author record.
#
# Text chunk:    "TextV.01", a 4-byte big-endian count N, then N 16-bit
#                big-endian code units.  Each chunk is appended to the result
#                followed by a 16-bit line feed (0x000A).
# Author record: the 10-byte signature 04 00 00 31 5c 4f 10 62 05 80; the
#                byte at offset 80 from the signature, minus 2, is the byte
#                length of the name, which starts at offset 96 as 16-bit
#                little-endian code units.  The last record found wins.
#
# Lengths are clamped to the data that is really there, so a corrupt size
# field can no longer cause reads beyond the end of the document.
# Returns the concatenated UTF-16BE text as a byte string.
sub _taro_collect_text {
    my ($cont, $fields) = @_;
    my $len = defined $$cont ? length $$cont : 0;
    return '' unless $len;

    my $signature = qr/(TextV\.01|\x04\x00\x00\x31\x5c\x4f\x10\x62\x05\x80)/;
    my $utf16be   = '';

    pos($$cont) = 0;
    while ($$cont =~ /$signature/g) {
        my $start = $-[1];
        my $resume;

        if (substr($$cont, $start, 1) eq 'T') {
            my $body_at = $start + 12;
            last if $body_at > $len;    # size field itself is truncated

            my $nbytes = 2 * unpack('N', substr($$cont, $start + 8, 4));
            my $avail  = $len - $body_at;
            # Clamp to whole 16-bit units that actually exist in the file.
            $nbytes = $avail - ($avail % 2) if $nbytes > $avail;

            $utf16be .= substr($$cont, $body_at, $nbytes) . pack('n', 10);
            # Text data is skipped entirely, so signatures that happen to
            # occur inside it are not interpreted.
            $resume = $body_at + $nbytes;
        }
        else {
            my $size_at = $start + 80;
            my $name_at = $start + 96;
            if ($size_at < $len) {
                my $nbytes = ord(substr($$cont, $size_at, 1)) - 2;
                if ($nbytes > 0 and $name_at + $nbytes <= $len) {
                    my @code_units = unpack('v*', substr($$cont, $name_at, $nbytes));
                    my $authorname = unicode::u2e(@code_units);
                    $authorname =~ s/\x00//g;
                    $fields->{'author'} = $authorname;
                }
            }
            # Author records do not skip anything: keep scanning from the
            # byte after the signature start.
            $resume = $start + 1;
        }

        pos($$cont) = $resume;
    }
    return $utf16be;
}

# Reduce the byte string returned by unicode::u2e to indexable text.
#
# Walking the string left to right:
#   * 0x00 followed by 0x20-0x7f or 0x0a  -> the second byte alone
#     (NOTE(review): presumably unicode::u2e emits single-byte characters
#     with a leading 0x00 pad - confirm against unicode.pl)
#   * lead byte 0xa1-0xa8 or 0xb0-0xf4 followed by 0xa1-0xfe -> both bytes
#   * anything else -> one byte is dropped and scanning continues
# Returns the filtered byte string ('' for undef or empty input).
sub _taro_compact_euc {
    my ($euc) = @_;
    return '' unless defined $euc;

    my $len = length $euc;
    my $out = '';
    my $i   = 0;
    while ($i < $len) {
        my $hi = ord substr($euc, $i, 1);
        my $lo = $i + 1 < $len ? ord substr($euc, $i + 1, 1) : -1;

        if ($hi == 0x00
            and (($lo >= 0x20 and $lo <= 0x7f) or $lo == 0x0a)) {
            $out .= pack('C', $lo);
            $i += 2;
        }
        elsif ((($hi >= 0xa1 and $hi <= 0xa8) or ($hi >= 0xb0 and $hi <= 0xf4))
            and $lo > 0xa0 and $lo < 0xff) {
            $out .= pack('CC', $hi, $lo);
            $i += 2;
        }
        else {
            $i++;
        }
    }
    return $out;
}

1;

Follow-Ups:
- Re: 一太郎(5 〜 10) 用のフィルタ
  - From: NOKUBI Takatsugu
- Re: 一太郎(5〜10)用のフィルタ
  - From: Tadamasa Teranishi

References:
- 一太郎(5〜10)用のフィルタ
  - From: Yukio USUDA

Prev by Date: Re: NMZ.i のスコア値
Next by Date: Re: 一太郎(5〜10)用のフィルタ
Previous by thread: 一太郎(5〜10)用のフィルタ
Next by thread: Re: 一太郎(5〜10)用のフィルタ
Index(es):
- Date
- Thread

Namazu-devel-ja(旧)

Re: 一太郎(5〜10)用のフィルタ

Namazu-devel-ja(旧)

Re: 一太郎(5〜10)用のフィルタ