Mercurial > emacs
annotate lib-src/b2m.pl @ 106256:9be41d3d415d
* international/isearch-x.el, international/ja-dic-cnv.el,
international/ja-dic-utl.el, international/kkc.el,
international/robin.el: Add "Keywords: i18n", so they can be
reached from finder-by-keyword.
author | Kevin Ryde <user42@zip.com.au> |
---|---|
date | Thu, 26 Nov 2009 00:04:08 +0000 |
parents | a9f7e446141d |
children | 1d1d5d9bd884 |
rev | line source |
---|---|
46032 | 1 #!/usr/bin/perl |
2 | |
3 # b2m.pl - Script to convert a Babyl file to an mbox file | |
4 | |
100958 | 5 # Copyright (C) 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009 |
75458
9f287ea4800c
Add missing Copyright header. Years from date of installation in
Glenn Morris <rgm@gnu.org>
parents:
64083
diff
changeset
|
6 # Free Software Foundation, Inc. |
9f287ea4800c
Add missing Copyright header. Years from date of installation in
Glenn Morris <rgm@gnu.org>
parents:
64083
diff
changeset
|
7 |
94828
3a4bc081639c
Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents:
79748
diff
changeset
|
8 # Maintainer: Jonathan Kamens <jik@kamens.brookline.ma.us> |
46032 | 9 |
94828
3a4bc081639c
Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents:
79748
diff
changeset
|
10 # This program is free software: you can redistribute it and/or modify |
3a4bc081639c
Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents:
79748
diff
changeset
|
11 # it under the terms of the GNU General Public License as published by |
3a4bc081639c
Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents:
79748
diff
changeset
|
12 # the Free Software Foundation, either version 3 of the License, or |
3a4bc081639c
Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents:
79748
diff
changeset
|
13 # (at your option) any later version. |
3a4bc081639c
Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents:
79748
diff
changeset
|
14 |
3a4bc081639c
Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents:
79748
diff
changeset
|
15 # This program is distributed in the hope that it will be useful, |
3a4bc081639c
Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents:
79748
diff
changeset
|
16 # but WITHOUT ANY WARRANTY; without even the implied warranty of |
3a4bc081639c
Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents:
79748
diff
changeset
|
17 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
3a4bc081639c
Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents:
79748
diff
changeset
|
18 # GNU General Public License for more details. |
46032 | 19 |
20 # You should have received a copy of the GNU General Public License | |
94828
3a4bc081639c
Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents:
79748
diff
changeset
|
21 # along with this program. If not, see <http://www.gnu.org/licenses/>. |
46032 | 22 |
23 | |
24 # Requires CPAN modules: MailTools (for Mail::Address), TimeDate (for | |
25 # Date::Parse). | |
26 | |
27 use warnings; | |
28 use strict; | |
29 use File::Basename; | |
30 use Getopt::Long; | |
31 use Mail::Address; | |
32 use Date::Parse; | |
33 | |
34 my($whoami) = basename $0; | |
64083 | 35 my($version) = '$Revision$'; |
46032 | 36 my($usage) = "Usage: $whoami [--help] [--version] [--[no]full-headers] [Babyl-file] |
37 \tBy default, full headers are printed.\n"; | |
38 | |
39 my($opt_help, $opt_version); | |
40 my($opt_full_headers) = 1; | |
41 | |
42 die $usage if (! GetOptions( | |
43 'help' => \$opt_help, | |
44 'version' => \$opt_version, | |
45 'full-headers!' => \$opt_full_headers, | |
46 )); | |
47 | |
48 if ($opt_help) { | |
49 print $usage; | |
50 exit; | |
51 } | |
52 elsif ($opt_version) { | |
53 print "$whoami version: $version\n"; | |
54 exit; | |
55 } | |
56 | |
57 die $usage if (@ARGV > 1); | |
58 | |
59 $/ = "\n\037"; | |
60 | |
61 if (<> !~ /^BABYL OPTIONS:/) { | |
62 die "$whoami: $ARGV is not a Babyl file\n$usage"; | |
63 } | |
64 | |
65 while (<>) { | |
66 my($msg_num) = $. - 1; | |
46184
81235cad75cb
Obey the rmail file and use the unpruned header properly.
Pavel Janík <Pavel@Janik.cz>
parents:
46032
diff
changeset
|
67 my($labels, $pruned, $full_header, $header); |
46032 | 68 my($from_line, $from_addr); |
69 my($time); | |
70 | |
71 # This will strip the initial form feed, any whitespace that may | |
72 # be following it, and then a newline | |
73 s/^\s+//; | |
74 # This will strip the ^_ off of the end of the message | |
75 s/\037$//; | |
76 | |
77 if (! s/(.*)\n//) { | |
78 malformatted: | |
79 warn "$whoami: message $msg_num in $ARGV is malformatted\n"; | |
80 next; | |
81 } | |
82 $labels = $1; | |
83 | |
46184
81235cad75cb
Obey the rmail file and use the unpruned header properly.
Pavel Janík <Pavel@Janik.cz>
parents:
46032
diff
changeset
|
84 # Strip the integer indicating whether the header is pruned |
49600
23a1cea22d13
Trailing whitespace deleted.
Juanma Barranquero <lekktu@gmail.com>
parents:
48810
diff
changeset
|
85 $labels =~ s/^(\d+)[,\s]*//; |
46184
81235cad75cb
Obey the rmail file and use the unpruned header properly.
Pavel Janík <Pavel@Janik.cz>
parents:
46032
diff
changeset
|
86 $pruned = $1; |
81235cad75cb
Obey the rmail file and use the unpruned header properly.
Pavel Janík <Pavel@Janik.cz>
parents:
46032
diff
changeset
|
87 |
81235cad75cb
Obey the rmail file and use the unpruned header properly.
Pavel Janík <Pavel@Janik.cz>
parents:
46032
diff
changeset
|
88 s/(?:((?:.+\n)+)\n*)?\*\*\* EOOH \*\*\*\n+// || goto malformatted; |
46032 | 89 $full_header = $1; |
90 | |
91 if (s/((?:.+\n)+)\n+//) { | |
92 $header = $1; | |
93 } | |
94 else { | |
95 # Message has no body | |
96 $header = $_; | |
97 $_ = ''; | |
98 } | |
99 | |
46184
81235cad75cb
Obey the rmail file and use the unpruned header properly.
Pavel Janík <Pavel@Janik.cz>
parents:
46032
diff
changeset
|
100 # "$pruned eq '0'" is different from "! $pruned". We want to make |
81235cad75cb
Obey the rmail file and use the unpruned header properly.
Pavel Janík <Pavel@Janik.cz>
parents:
46032
diff
changeset
|
101 # sure that we found a valid label line which explicitly indicated |
81235cad75cb
Obey the rmail file and use the unpruned header properly.
Pavel Janík <Pavel@Janik.cz>
parents:
46032
diff
changeset
|
102 # that the header was not pruned. |
81235cad75cb
Obey the rmail file and use the unpruned header properly.
Pavel Janík <Pavel@Janik.cz>
parents:
46032
diff
changeset
|
103 if ((! $full_header) || ($pruned eq '0')) { |
46032 | 104 $full_header = $header; |
105 } | |
106 | |
48810
1626973bdb2b
Make sure every message ends with a blank line, because some mbox parsers
Pavel Janík <Pavel@Janik.cz>
parents:
46737
diff
changeset
|
107 # End message with two newlines (some mbox parsers require a blank |
1626973bdb2b
Make sure every message ends with a blank line, because some mbox parsers
Pavel Janík <Pavel@Janik.cz>
parents:
46737
diff
changeset
|
108 # line before the next "From " line). |
1626973bdb2b
Make sure every message ends with a blank line, because some mbox parsers
Pavel Janík <Pavel@Janik.cz>
parents:
46737
diff
changeset
|
109 s/\s+$/\n\n/; |
46032 | 110 |
111 # Quote "^From " | |
112 s/(^|\n)From /$1>From /g; | |
113 | |
114 # Strip extra commas and whitespace from the end | |
115 $labels =~ s/[,\s]+$//; | |
116 # Now collapse extra commas and whitespace in the remaining label string | |
117 $labels =~ s/[,\s]+/, /g; | |
49600
23a1cea22d13
Trailing whitespace deleted.
Juanma Barranquero <lekktu@gmail.com>
parents:
48810
diff
changeset
|
118 |
46032 | 119 foreach my $rmail_header qw(summary-line x-coding-system) { |
120 $full_header =~ s/(^|\n)$rmail_header:.*\n/$1/i; | |
121 } | |
122 | |
123 if ($full_header =~ s/(^|\n)mail-from:\s*(From .*)\n/$1/i) { | |
124 ($from_line = $2) =~ s/\s*$/\n/; | |
125 } | |
126 else { | |
127 foreach my $addr_header qw(return-path from really-from sender) { | |
46737
7c794ace9e1a
Fix regexp for finding return address fields.
Pavel Janík <Pavel@Janik.cz>
parents:
46184
diff
changeset
|
128 if ($full_header =~ /(?:^|\n)$addr_header:\s*(.*\n(?:\B.*\n)*)/i) { |
46032 | 129 my($addr) = Mail::Address->parse($1); |
130 $from_addr = $addr->address($addr); | |
131 last; | |
132 } | |
133 } | |
134 | |
135 if (! $from_addr) { | |
136 $from_addr = "Babyl_to_mail_by_$whoami\@localhost"; | |
137 } | |
138 | |
139 if ($full_header =~ /(?:^|\n)date:\s*(\S.*\S)/i) { | |
140 $time = str2time($1); | |
141 } | |
142 | |
143 if (! $time) { | |
144 # No Date header or we failed to parse it | |
145 $time = time; | |
146 } | |
147 | |
148 $from_line = "From " . $from_addr . " " . localtime($time) . "\n"; | |
149 } | |
150 | |
151 print($from_line, ($opt_full_headers ? $full_header : $header), | |
152 ($labels ? "X-Babyl-Labels: $labels\n" : ""), "\n", | |
153 $_) || die "$whoami: error writing to stdout: $!\n"; | |
154 } | |
155 | |
156 close(STDOUT) || die "$whoami: Error closing stdout: $!\n"; | |
52401 | 157 |
158 # arch-tag: 8c7c8ab0-721c-46d7-ba3e-139801240aa8 |