#!/usr/bin/perl # # "Beautify" quoted message and make it "ready-to-reply" by Michael Velten use utf8; # keep quotes nested up to 3rd level my $ind_max = 4; my $name = '[[:alpha:]]+([\'`-][[:alpha:]]+|[.])*'; my $fullname = '\b(' . $name . '[,]?\s+)*' . $name . '\b'; # Possible reply greetings (regexes) (note that '> ' will be prefixed) my @greetings = ( 'Dear\s+' . $fullname . '([,.]|\s*!)?', '[Hh](ello|i|ey)' . '(\s+' . $fullname . ')?' . '([,.]|\s*!)?', 'Sehr geehrter?\s+' . $fullname . '([,.]|\s*!)?', 'Lieber?\s+' . $fullname . '([,.]|\s*!)?', 'Guten Tag' . '(\s+' . $fullname . ')?' . '([,.]|\s*!)?', '[Hh]allo' . '(\s+' . $fullname . ')?' . '([,.]|\s*!)?', '[Mm]oin' . '(\s+' . $fullname . ')?' . '([,.]|\s*!)?', '[Mm]esdames(,| et) [Mm]essieurs([,.]|\s*!)?', 'M(adame)\s+' . $fullname . '([,.]|\s*!)?', 'M(onsieur)\s+' . $fullname . '([,.]|\s*!)?', '[Cc]her\s+' . $fullname . '([,.]|\s*!)?', '[Cc]h[eè]re\s+' . $fullname . '([,.]|\s*!)?', '[Bb]onjour' . '(\s+' . $fullname . ')?' . '([,.]|\s*!)?', '[Ss]alut' . '(\s+' . $fullname . ')?' . '([,.]|\s*!)?', 'Senhor(ita|a)?' . '(\s+' . $fullname . ')?' . '([,.]|\s*!)?', 'Sra?\.?' . '(\s+' . $fullname . ')?' . '([,.]|\s*!)?', 'Car([ií]ssim)?[ao]s?' . '(\s+' . $fullname . ')?' . '([,.]|\s*!)?', 'Prezad([ií]ssim)?[ao]s?' . '(\s+' . $fullname . ')?' . '([,.]|\s*!)?', 'Estimad([ií]ssim)?[ao]s?' . '(\s+' . $fullname . ')?' . '([,.]|\s*!)?', '[Bb]om [Dd]ia' . '(\s+' . $fullname . ')?' . '([,.]|\s*!)?', '[Bb]oa ([Tt]arde|[Nn]oite)' . '(\s+' . $fullname . ')?' . '([,.]|\s*!)?', '[Oo](i|l[aá])' . '(\s+' . $fullname . ')?' . '([,.]|\s*!)?', '[Aa]l[ôo]' . '(\s+' . $fullname . ')?' . '([,.]|\s*!)?', '[Hh]ola' . '(\s+' . $fullname . ')?' . '([,.]|\s*!)?', 'Se[nñ]or(ita|a)?' . '(\s+' . $fullname . ')?' . '([,.]|\s*!)?', ); # Possible reply "greetouts" (regexes) (note that '> ' will be prefixed) my @greetouts = ( '([Ww]ith )?(([Kk]ind|[Bb]est|[Ww]arm) )?([Rr]egards|[Ww]ishes)([,.]|\s*!)?', '[Bb]est([,.]|\s*!)?', '[Cc]heers([,.]|\s*!)?', '[Mm]it ([Vv]iel|[Bb]est|[Ll]ieb|[Ff]reundlich)en [Gg]r([ü]|ue)([ß]|ss)en([,.]|\s*!)?', '(([Vv]iel|[Bb]est|[Ll]ieb|[Ff]reundlich)e )?[Gg]r([ü]|ue)([ß]|ss)e([,.]|\s*!)?', '(([[Bb]est|[Ll]ieb|[Ff]reundlich)e[rn] )?[Gg]ru([ß]|ss)([,.]|\s*!)?', '[Mm]it (([[Bb]est|[Ll]ieb|[Ff]reundlich)em )?[Gg]ru([ß]|ss)([,.]|\s*!)?', '([LV]|MF)G([,.]|\s*!)?', '(([Tt]r[eè]s|[Bb]ien) )?([Cc]ordi|[Aa]mic)alement([,.]|\s*!)?', '[Aa]miti[eé]s?([,.]|\s*!)?', '[Aa]tenciosamente([,.]|\s*!)?', '[Aa]tt([,.]|\s*!)?', '[Aa]bra[cç]os?([,.]|\s*!)?', '[Aa]tentamente([,.]|\s*!)?', '[Cc]ordialmente([,.]|\s*!)?', ); my $word = '[[:alpha:]]+([\'`-][[:alpha:]]+)*'; # my $saw_greeting = 0; # my $saw_greetout = 0; my $saw_own_sig = 0; my $saw_blank_line = 0; my $inds_other_sig = 0; my $quote_header = 0; my $extra_pref = ''; my (@mail, @purged_mail); my $msg = shift; die "Usage: $0 MAIL" unless $msg; open(MAIL, "+<:encoding(UTF-8)", $msg) or die "$0: Can't open $msg: $!"; push(@mail, $_) while ; # Read whole mail # Process whole mail LINE: foreach my $line (@mail) { # Treat non-quoted lines as is if ($line !~ /^>/) { push(@purged_mail, $line); next LINE; } # Keep all lines after my own signature unmodified if ($line =~ /^--\s?$/ || $saw_own_sig) { $saw_own_sig = 1; push(@purged_mail, $line); next LINE; } # $line =~ tr/\xA0/ /; # tighten "> > " to ">> " my ($pref, $suff) = $line =~ /^([>[:space:]]+)(.*)$/; $pref =~ s/(>\s*(?!$))/>/g; # reduce multiple pre- and post-blanks to one post-blank $pref =~ s/^\s*(>+)\s*/$1 /; $line = $pref . $suff . "\n"; # prepend additional '>' for each Outlook quote header if ($line =~ /^>+ [-_=]{3,}\s*$word(\s+$word)*\s*[-_=]{3,}$/) { $quote_header = 1; next LINE; } # first line after Outlook quote header that does not start with ...: if ($quote_header == 1 && $line !~ /^>+ ([-*]\s*)?$word(\s+$word)*\s*:\s+/) { $extra_pref = '>' . $extra_pref; $quote_header = 0; } $pref = $extra_pref . $pref; $line = $pref . $suff . "\n"; # skip line if number of '>'s is greater than $ind_max my $inds = $pref =~ tr/>//; next LINE if $inds > $ind_max; # Remove other signatures if ($line =~ /^>+ --\s?$/) { $inds_other_sig = $inds; } if ($inds == $inds_other_sig) { next LINE; } else { $inds_other_sig = 0; } # Remove quoted greeting # unless ($saw_greeting) { foreach my $greeting (@greetings) { if ($line =~ /^>+ $greeting$/) { # $saw_greeting = 1; next LINE; } } # } # Remove quoted "greetout" # unless ($saw_greetout) { foreach my $greetout (@greetouts) { if ($line =~ /^>+ $greetout$/) { # $saw_greetout = 1; next LINE; } } # } # Remove quoted filler lines if ($line =~ /^>+ \s*(-*|_*|=*|\+*|#*|\**)$/) { next LINE; } # Save purged line push(@purged_mail, $line); } # Overwrite original mail with purged mail truncate(MAIL, 0); seek(MAIL, 0, 0); print MAIL @purged_mail; close(MAIL);