Namazu-users-ja($B5l(B)

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

Re: ms-word $B%I%-%e%a%s%H$N%X%C(B$B%@!"%U%C%?$O8!:wBP>]$K$J$k$N$+(B ( $B%=!<%9$,$D$$$FD9J8$G$9!#(B)

From: Amuro Ray <gundam@xxxxxxxxxxxxxxxx>
Date: Thu, 31 Jan 2002 23:47:38 +0900
X-ml-name: namazu-users-ja
X-mail-count: 02420
References: <3C56E6BE.D50F26BE@asahi-net.or.jp>

Amuro Ray$B$G$9!#(B
(B
(BTadamasa Teranishi <yw3t-trns@xxxxxxxxxxxxxxx> wrote:
(B
(B> 
(B> filter/word.pl $B$@$C$?$+$NCf$G!"(BwvWare $B$r8F$S=P$7$F$$$kItJ,$N(B
(B> $B=hM}$,$I$&$J$C$F$$$k$+$G$9$M!#(B
(B> 
(B> $B$=$&$$$($P!"(Bhtml $B$G$O$J$/!"(Btext $B=PNO$7$F=hM}$7$F$$$k$N$+$b(B
(B> $B$7$l$^$;$s!#(B
(B> 
(B
$B$4;XE&$N(BwvWare$B$N(Btext$B=PNO$G$9$,!"(Bman$B$H(B--help$B$r$_$k$H%*%W(B
$B%7%g%sIU$1$G$O$J$/!"(BwvText$B$H$$$&%9%/%j%W%H$G9T$&$h$&$G$9!#(B
(B
$B7k2L$G$9$,!"(BwvText$B$G(BHTML$B$r:n@.$7$?$iLdBj$J$/!"%X%C%@!"%U(B
$B%C%?$,4^$^$l$F$$$^$7$?!#(B
(B
$B%U%#%k%?$NJ}$G$9$,!"(BPerl$B$r$^$C$?$/CN$i$J$$$N$G!"K\20$GN)(B
$B$AFI$_$J$s$>$7$F8+$?$j$7$?$N$G$9$,!"(B
(B	
(Bsystem("$wordconvpath $tmpfile | $utfconvpath -Iu8 -Oej 
(B> $tmpfile2");
(B
$B$3$N9T$G(BwvHtml + lv$B$r9T$C$F$$$k$h$&$G$9!#(B
$B@5$7$1$l$P!"(Bword$B$NJQ49$O(BHTML$B$K$J$C$F$$$k$h$&$G$9!#(B
(B(msword.pl$B$C$FB>$N(Bperl$B$rFI$_9~$s$@$j!"$I$3$+$i8F$P$l$F$$(B
$B$k%5%V%k!<%A%s$+$^$C$?$/(B???)
(B
(B
$B2r7h$N80$K$J$k$+$o$+$j$^$;$s$,!":#$N4D6-$N(BWord$B%U%#%k%?$N(B
$B%9%/%j%W%H%U%!%$%k$rE:IU$7$^$9$N$G!"0z$-B3$-$4=u8@$r$*4j(B
$B$$$7$^$9!#(B
(B
(B
$B!V(Bmsword.pl$B!W(B
(B
(Bpackage msword;
(Buse strict;
(Buse File::Copy;
(Brequire 'util.pl';
(Brequire 'gfilter.pl';
(Brequire 'html.pl';
(B
(Bmy $wordconvpath  = undef;
(Bmy $utfconvpath   = undef;
(Bmy $wvversionpath = undef;
(B
(Bsub mediatype() {
(B    return ('application/msword');
(B}
(B
(Bsub status() {
(B    $wordconvpath = util::checkcmd('wvWare');
(B    if (defined $wordconvpath) {
(B	my $libpath = `wv-libconfig |sed -e 's/^-L//' -e 's/ .*\$//'`;
(B	chomp $libpath;
(B	if (defined $libpath) {
(B	    $wordconvpath .= " --config $libpath/wv/wvHtml.xml";
(B	} else {
(B	    $wordconvpath = undef;
(B	}
(B    } else {
(B	$wordconvpath = util::checkcmd('wvHtml');
(B    }
(B    if (defined $wordconvpath) {
(B	if (!util::islang("ja")) {
(B	    return 'yes';
(B	} else {
(B	    $utfconvpath   = util::checkcmd('lv');
(B	    $wvversionpath = util::checkcmd('wvVersion');
(B	    if ((defined $utfconvpath) && (defined $wvversionpath)) {
(B		return 'yes';
(B	    } else {
(B		return 'no';
(B	    }
(B	}
(B    } else {
(B        $wordconvpath = util::checkcmd('doccat');
(B        return 'yes' if defined $wordconvpath;
(B	return 'no';
(B    }
(B}
(B
(Bsub recursive() {
(B    return 0;
(B}
(B
(Bsub pre_codeconv() {
(B    return 0;
(B}
(B
(Bsub post_codeconv () {
(B    return 0;
(B}
(B
(Bsub add_magic ($) {
(B    return;
(B}
(B
(Bsub filter ($$$$$) {
(B    my ($orig_cfile, $cont, $weighted_str, $headings, $fields)
(B      = @_;
(B    my $err = undef;
(B 
(B    if (util::checkcmd('wvHtml')) {
(B    $err = filter_wv($orig_cfile, $cont, $weighted_str, $headings, $fields);
(B    } else { 
(B    $err = filter_doccat($orig_cfile, $cont, $weighted_str, $headings, $fields);
(B    }
(B    return $err;
(B}   
(B
(Bsub filter_wv ($$$$$) {
(B    my ($orig_cfile, $cont, $weighted_str, $headings, $fields)
(B      = @_;
(B    my $cfile = defined $orig_cfile ? $$orig_cfile : '';
(B
(B    my $tmpfile  = util::tmpnam('NMZ.word');
(B    my $tmpfile2 = util::tmpnam('NMZ.word2');
(B
(B
(B    if (util::islang("ja")) {
(B    }
(B
(B    util::vprint("Processing ms-word file ... (using  '$wordconvpath')\n");
(B
(B    { 
(B	my $fh = util::efopen("> $tmpfile");
(B	print $fh $$cont;
(B    }
(B
(B    if (!util::islang("ja")) {
(B	system("$wordconvpath $tmpfile > $tmpfile2");
(B    } else {
(B	my $version = "unknown";
(B	my $supported = undef;
(B	my $fh_cmd = util::efopen("$wvversionpath $tmpfile |");
(B	while (<$fh_cmd>) {
(B	    if (/^Version: (word\d+),/i) {
(B		$version = $1;
(B		#
(B		# Only word8 format is supported for Japanese.
(B		#
(B		if ($version =~ /^word8$/) {
(B		    $supported = 1;
(B		}
(B	    }
(B	}
(B	return _("Unsupported format: ") .  $version unless $supported;
(B	system("$wordconvpath $tmpfile | $utfconvpath -Iu8 -Oej > $tmpfile2");
(B    }
(B
(B    {
(B	my $fh = util::efopen("< $tmpfile2");
(B	$$cont = util::readfile($fh);
(B
(B	# Exclude wvHtml's footer becaues it has no good index terms.
(B	$$cont =~ s/<!--Section Ends-->.*$//s;
(B    }
(B
(B    unlink($tmpfile);
(B    unlink($tmpfile2);
(B
(B    html::html_filter($cont, $weighted_str, $fields, $headings);
(B
(B    gfilter::line_adjust_filter($cont);
(B    gfilter::line_adjust_filter($weighted_str);
(B    gfilter::white_space_adjust_filter($cont);
(B    $fields->{'title'} = gfilter::filename_to_title($cfile, $weighted_str)
(B      unless $fields->{'title'};
(B    gfilter::show_filter_debug_info($cont, $weighted_str,
(B			   $fields, $headings);
(B    return undef;
(B}
(B
(Bsub filter_doccat ($$$$$) {
(B    my ($orig_cfile, $cont, $weighted_str, $headings, $fields)
(B      = @_;
(B    my $cfile = defined $orig_cfile ? $$orig_cfile : '';
(B 
(B    my $tmpfile  = util::tmpnam('NMZ.word');
(B    my $tmpfile2 = util::tmpnam('NMZ.word2');   
(B    copy("$cfile", "$tmpfile2");
(B
(B    system("$wordconvpath -o e $tmpfile2 > $tmpfile");
(B
(B    {
(B        my $fh = util::efopen("< $tmpfile");
(B        $$cont = util::readfile($fh);
(B    }
(B
(B    unlink($tmpfile);
(B    unlink($tmpfile2);
(B
(B    gfilter::line_adjust_filter($cont);
(B    gfilter::line_adjust_filter($weighted_str);
(B    gfilter::white_space_adjust_filter($cont);
(B    $fields->{'title'} = gfilter::filename_to_title($cfile, $weighted_str)
(B	unless $fields->{'title'};
(B    gfilter::show_filter_debug_info($cont, $weighted_str,
(B               $fields, $headings);
(B    return undef;
(B}
(B
(B1;
(B
(B"$B!z!#!"(B::$B!#(B.::$B!&(B'$B!,!y!#(B.::$B!&(B'$B!,!z!#!"(B::$B!#(B.::$B!&(B'$B!,(B
(B
(BName   $B!'(B   Amuro Ray
(BE-Mail  $B!'(B  gundam@xxxxxxxxxxxxxxxx
(B
(B"$B!z!#!"(B::$B!#(B.::$B!&(B'$B!,!y!#(B.::$B!&(B'$B!,!z!#!"(B::$B!#(B.::$B!&(B'$B!,(B

Follow-Ups:
- Re: ms-word $B%I%-%e%a%s%H$N%X%C(B$B%@!"%U%C%?$O8!:wBP>]$K$J$k$N$+(B ( $B%=!<%9$,$D$$$FD9J8$G$9!#(B)
  - From: Tadamasa Teranishi

References:
- Re: ms-word $B%I%-%e%a%s%H$N%X%C(B$B%@!"%U%C%?$O8!:wBP>]$K$J$k$N$+(B
  - From: Tadamasa Teranishi

Prev by Date: Re: mknmz $BCf$K%U%!%$%k%7%9%F%`$N(B$BMFNL$,$J$/$J$k!#(B
Next by Date: Re: ms-word $B%I%-%e%a%s%H$N%X%C(B$B%@!"%U%C%?$O8!:wBP>]$K$J$k$N$+(B ( $B%=!<%9$,$D$$$FD9J8$G$9!#(B)
Previous by thread: Re: ms-word $B%I%-%e%a%s%H$N%X%C(B$B%@!"%U%C%?$O8!:wBP>]$K$J$k$N$+(B
Next by thread: Re: ms-word $B%I%-%e%a%s%H$N%X%C(B$B%@!"%U%C%?$O8!:wBP>]$K$J$k$N$+(B ( $B%=!<%9$,$D$$$FD9J8$G$9!#(B)
Index(es):
- Date
- Thread

Namazu-users-ja($B5l(B)

Re: ms-word $B%I%-%e%a%s%H$N%X%C(B$B%@!"%U%C%?$O8!:wBP>]$K$J$k$N$+(B ( $B%=!<%9$,$D$$$FD9J8$G$9!#(B)

Namazu-users-ja($B5l(B)

Re: ms-word $B%I%-%e%a%s%H$N%X%C(B$B%@!"%U%C%?$O8!:wBP>]$K$J$k$N$+(B ( $B%=!<%9$,$D$$$FD9J8$G$9!#(B)