namazu-dev(ring)

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]
htmlmail - a filter to convert mail/news to HTML

From: Satoru Takabayashi <satoru-t@xxxxxxxxxxxxxxxxxx>
Date: Sat, 05 Feb 2000 20:32:51 +0900
ふと思い立って、Mail/News のファイルを HTML に変換するフィル
タを作りました。

使い方:

  % htmlmail < ~/Mail/inbox/123 > foo.html
  % lynx foo.html

htmlmail は CGI としても使えます。(こっちが本当の目的 :-)
<http://home.jp.FreeBSD.org/cgi-bin/showmail> の真似ができま
す。References: を辿ったり、スレッドを生成したり、といった高
機能はありませんが。

(BMail/News$B$r(B CGI$B$GA4J88!:w$7$?$$$1$I!"(BMHonArc$B$r;H$&$[$I%G%#%9(B
$B%/$KM>M5$O$J$$(B($B$"$k$$$OLLE](B)$B!"$H$$$&>u67$G;H$($^$9!#(B
(B
$B4JC1$J(B perl$B%9%/%j%W%H$G$9!#E,Ev$K=$@5$7$F;H$C$F$/$@$5$$$^$;!#(B
(B
-- Satoru Takabayashi

#! /usr/bin/perl -wT
#
# htmlmail - a filter to convert mail/news to HTML.
#            It works as CGI if $ENV{SCRIPT_NAME} is defined.
#
# Copyright (C) 2000 Satoru Takabayashi <satoru-t@xxxxxxxxxxxxxxxxxx>
#     All rights reserved.
#     This is free software with ABSOLUTELY NO WARRANTY.
#
# You can redistribute it and/or modify it under the terms of
# the GNU General Public License version 2.
#


require 5.004;
use strict;
use FileHandle;
use NKF;        # <ftp://ftp.ie.u-ryukyu.ac.jp/pub/software/kono/>

# Directory that CGI requests are resolved against: the request's
# PATH_INFO is appended to it to form the path of the message to show.
my $maildir  = "/foo/bar/Mail";  # for CGI mode.

# Header fields that are displayed, written as a regex alternation.
# The order of the alternatives is also the order in which the fields
# are listed on the generated page.
my $fieldpat = "To:|Cc:|Newsgroups:|Subject:|From:|Date:" .
               "|X-Mailer:|User-Agent:|Message-Id:";

# Page prologue.  Every literal ${subject} is replaced with the
# (already entity-encoded) Subject: value before printing.  The heredoc
# is single-quoted so that ${subject} is NOT interpolated here.
# The charset is declared because the message text is passed through
# nkf with the -e option (EUC-JP output) before it is printed.
my $Header = <<'EOS';
<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01//EN"
        "http://www.w3.org/TR/html4/strict.dtd">
<html>
<head>
<meta http-equiv="Content-Type" content="text/html; charset=EUC-JP">
<title>${subject}</title>
</head>
<body>
<h1>${subject}</h1>
<hr>
EOS

# Page epilogue.
my $Footer = <<'EOS';
</body>
</html>
EOS

main();

# Entry point.
#
# Filter mode: converts the file named by $ARGV[0], or standard input
# ("-") when no argument is given.
# CGI mode (selected when $ENV{SCRIPT_NAME} is defined): prints the CGI
# header and converts the message found at $maildir . $ENV{PATH_INFO}.
#
# PATH_INFO comes straight from the HTTP request, so it is checked
# against a whitelist before it is turned into a file name.  Each path
# component must start with a letter, digit or underscore, which rules
# out "..", hidden files, and characters that have a special meaning to
# open() such as "|", "<", ">" and whitespace.
#
# No prototype is declared: main() is called before this definition is
# seen, so a prototype could never be checked and only triggers a
# "called too early to check prototype" warning under -w.
sub main {
    my $mail = "-";  # default is STDIN

    if (defined $ENV{SCRIPT_NAME}) { # CGI mode
        print "Content-type: text/html\n\n";

        my $path_info = $ENV{"PATH_INFO"};
        if (!defined $path_info || $path_info eq "") {
            print "No mail specified.";
            exit 1;
        }

        # The character classes cannot match "\n", so even though "$"
        # tolerates a trailing newline, $1 never contains one.  Using
        # the capture (not the raw variable) also untaints the value
        # when running under -T.
        unless ($path_info =~ m!^((?:/[A-Za-z0-9_][A-Za-z0-9_.+,\-]*)+)$!) {
            print "Invalid mail specified.";
            exit 1;
        }
        $mail = $maildir . $1;
    } else {
        $mail = $ARGV[0] if defined $ARGV[0];
    }

    show_mail($mail);
}

# Read one mail/news message and print it to STDOUT as an HTML page.
#
#   $mail - path of the message file, or "-" to read standard input.
#
# Prints nothing and returns if the input is empty.  Dies with
# "<path>: <errno text>" if the file cannot be opened.
sub show_mail {
    my ($mail) = @_;

    # "-" is handled explicitly so the file name never has to go through
    # the one-argument (magic) form of open, where leading or trailing
    # "<", ">", "|" and whitespace in the name are interpreted.
    my $fh;
    if ($mail eq "-") {
        $fh = \*STDIN;
    } else {
        $fh = FileHandle->new;
        # An explicit mode makes FileHandle treat $mail as a plain name.
        $fh->open($mail, "r") || die "$mail: $!";
    }

    # Strip the line terminator and run every line through nkf.
    my @lines = map { chomp; nkf("-emXZ1", $_) } <$fh>;
    $fh->close unless $mail eq "-";
    return if @lines == 0;

    # Remove very first "From " line.
    shift @lines if $lines[0] =~ /^From /i;

    # handle_headers() consumes the header lines (and the blank
    # separator) from @lines, leaving only the body behind.
    my ($subject, $headers, $boundary) = handle_headers(\@lines);

    # Fill in a copy so that the shared template keeps its placeholders.
    my $page_header = $Header;
    $page_header =~ s/\$\{subject\}/$subject/g;
    print $page_header;

    print "<ul>\n";
    print $headers;
    print "</ul>\n";
    print "<hr>\n";

    my $body = handle_body(\@lines, $boundary);

    print "<pre>\n";
    print $body;
    print "</pre>\n";

    print $Footer;
}

# Parse the header section of a message.
#
#   $lines_ref - reference to the array of message lines (no line
#                terminators).  The header lines and the blank line that
#                ends them are shifted off; the body lines are left.
#
# Returns a three-element list:
#   - the entity-encoded Subject: value ("" if there is none),
#   - an HTML fragment with one <li> per displayed field, in the order
#     the fields appear in $fieldpat,
#   - the multipart boundary from Content-Type: ("" if there is none).
#
# Field names are compared case-insensitively, so "Message-ID:" and
# "Content-type:" are recognised as well.  A field with an empty value
# (nothing after the colon) is accepted.  Dies, after echoing the
# offending line to STDERR, on a line that is not a header field at all.
sub handle_headers {
    my ($lines_ref) = @_;

    my $subject  = "";
    my %headers  = ();   # lower-cased field name => encoded value
    my $boundary = "";
    while (@$lines_ref) {
        my $line = shift @$lines_ref;

        # A blank (or whitespace-only) line ends the header section.
        last if $line =~ /^\s*$/;

        # Connect if the next line has leading spaces.  The line must
        # also carry some text, so a whitespace-only separator line is
        # never swallowed as a continuation.
        while (defined($$lines_ref[0]) && $$lines_ref[0] =~ /^[ \t]+\S/) {
            my $nextline = shift @$lines_ref;
            # Drop the folding whitespace next to a byte in the
            # \xa1-\xfe range; otherwise the fold's whitespace is kept.
            $line =~ s/([\xa1-\xfe])\s+$/$1/;
            $nextline =~ s/^\s+([\xa1-\xfe])/$1/;
            $line .= $nextline;
        }

        # "Name:" followed by optional whitespace and the value.  The
        # name may not contain a colon, so only the first one splits.
        unless ($line =~ /^([^\s:]+:)[ \t]*(.*)/) {
            print STDERR ">> $line\n";
            die;
        }
        my $field = $1;
        my $raw   = $2;
        my $value = encode_entity($raw);
        my $key   = lc $field;

        if ($field =~ /^(?:$fieldpat)$/i) {
            $headers{$key} = $value;
            $subject = $value if $key eq "subject:";
        }

        # The boundary is taken from the raw (unencoded) value and may be
        # quoted or bare.  The quoted form stops at the first closing
        # quote, so later parameters are not captured with it.
        if ($key eq "content-type:" && $raw =~ /multipart/i) {
            if ($raw =~ /boundary="([^"]*)"/i) {
                $boundary = $1;
            } elsif ($raw =~ /boundary=([^\s;"]+)/i) {
                $boundary = $1;
            }
        }
    }

    # Sort by $fieldpat order; the label shown is the spelling used in
    # $fieldpat, whatever capitalisation the message used.
    my $headers = "";
    for my $field (split /\|/, $fieldpat) {
        my $value = $headers{lc $field};
        next unless defined $value;
        $headers .= "<li><em>$field</em> " . $value . "\n";
    }

    return ($subject, $headers, $boundary);
}

# Turn the body of a message into an HTML fragment suitable for <pre>.
#
#   $lines_ref - reference to the array of remaining (body) lines, without
#                line terminators.  The array is emptied.
#   $boundary  - MIME multipart boundary, or "" for a single-part message.
#
# For a multipart message only the text/plain parts are kept.  A part
# without any Content-Type header is treated as text/plain, which is the
# default RFC 2046 assigns to such a part.  The preamble before the first
# delimiter and the epilogue after the closing delimiter are discarded.
# Nested multipart parts are not descended into.
#
# Returns the entity-encoded text with URLs turned into hyperlinks.
sub handle_body {
    my ($lines_ref, $boundary) = @_;

    # Take every remaining line and give each one its "\n" back.
    my $body = join "", map { "$_\n" } splice(@$lines_ref, 0);

    # Handle MIME multipart message.
    if (defined $boundary && $boundary ne "") {
        # Cut the closing delimiter line and everything after it.
        $body =~ s/^--\Q$boundary\E--[ \t]*\n.*//ms;

        # Split on delimiter lines.  They are matched as whole lines so
        # that "--boundary" in the middle of a line, or a longer nested
        # boundary that merely starts the same way, is left alone.
        my @parts = split /^--\Q$boundary\E[ \t]*\n/m, $body;
        shift @parts;   # text before the first delimiter is the preamble

        $body = "";
        for my $part (@parts) {
            # Header lines (possibly none), a blank line, then content.
            next unless $part =~ /^((?:[^\n]+\n)*)\n(.*)/s;
            my ($head, $content) = ($1, $2);

            my $is_plain = $head !~ /^content-type:/mi
                        || $head =~ m!^content-type:.*text/plain!mi;
            $body .= $content if $is_plain;
        }
    }
    $body = encode_entity($body);
    $body = hyperlink($body);

    return $body;
}

# Escape the characters that are special in HTML text.
#
#   $str - the text to escape.
#
# Returns a copy with "&" replaced by "&amp;", "<" by "&lt;" and ">" by
# "&gt;".  "&" is rewritten first so the entities produced for "<" and
# ">" are not escaped a second time.  Quote characters are passed
# through unchanged.  An undefined argument yields "".
#
# No prototype is declared: the former empty prototype "()" stated that
# the function takes no arguments at all, which contradicts its use.
sub encode_entity {
    my ($str) = @_;
    return "" unless defined $str;

    $str =~ s/&/&amp;/g;
    $str =~ s/</&lt;/g;
    $str =~ s/>/&gt;/g;

    return $str;
}


#  hyperlink() subroutine uses code from MHonArc's mhtxtplain.pl.
#  <http://www.oac.uci.edu/indiv/ehood/mhonarc.html>

##---------------------------------------------------------------------------##
##  File:
##	@(#) mhtxtplain.pl 2.8 99/08/15 22:19:04
##  Author:
##      Earl Hood       mhonarc@xxxxxxxxx
##  Description:
##	Library defines routine to filter text/plain body parts to HTML
##	for MHonArc.
##	Filter routine can be registered with the following:
##              <MIMEFILTERS>
##              text/plain:m2h_text_plain'filter:mhtxtplain.pl
##              </MIMEFILTERS>
##---------------------------------------------------------------------------##
##    MHonArc -- Internet mail-to-HTML converter
##    Copyright (C) 1995-1999	Earl Hood, mhonarc@xxxxxxxxx
##
##    This program is free software; you can redistribute it and/or modify
##    it under the terms of the GNU General Public License as published by
##    the Free Software Foundation; either version 2 of the License, or
##    (at your option) any later version.
##
##    This program is distributed in the hope that it will be useful,
##    but WITHOUT ANY WARRANTY; without even the implied warranty of
##    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
##    GNU General Public License for more details.
##
##    You should have received a copy of the GNU General Public License
##    along with this program; if not, write to the Free Software
##    Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA
##    02111-1307, USA
##---------------------------------------------------------------------------##

# Wrap every URL found in entity-encoded text in an <a href="..."> tag.
#
#   $str - text that has already been HTML-escaped, so "&" introduces
#          an entity.
#
# Returns the text with each URL replaced by a hyperlink to itself.
#
# A URL is one of the listed schemes followed by a run of characters
# that ends before whitespace, quotes, brackets, "|" or an "&lt;"/"&gt;"
# entity.  Any other "&" (such as "&amp;" in a query string) is part of
# the URL.  The last character may not be sentence punctuation, so the
# "." in "see http://host/path." stays outside the link.
sub hyperlink {
    my ($str) = @_;

    my $scheme = '(?:http://|https://|ftp://|afs://|wais://|telnet://|ldap://' .
                 '|gopher://|news:|nntp:|mid:|cid:|mailto:|prospero:)';
    my $url    = $scheme .
                 q%(?:&(?![gl]t;)|[^\s\(\)\|<>"'\&])+% .
                 q%[^\.?!;,"'\|\[\]\(\)\s<>\&]%;

    ## Convert URLs to hyperlinks
    $str =~ s{($url)}{<a href="$1">$1</a>}gi;

    return $str;
}
Prev by Date: 月刊ネットランナー収録のお願い
Next by Date: Re: lisp/*.el problem
Previous by thread: Re: 月刊ネットランナー収録のお願い
Next by thread: filters
Index(es):
- Date
- Thread