1 /*@ S-nail - a mail user agent derived from Berkeley Mail.
2 *@ Routines for processing and detecting headlines.
4 * Copyright (c) 2000-2004 Gunnar Ritter, Freiburg i. Br., Germany.
5 * Copyright (c) 2012 - 2013 Steffen "Daode" Nurpmeso <sdaoden@users.sf.net>.
8 * Copyright (c) 1980, 1993
9 * The Regents of the University of California. All rights reserved.
11 * Redistribution and use in source and binary forms, with or without
12 * modification, are permitted provided that the following conditions
14 * 1. Redistributions of source code must retain the above copyright
15 * notice, this list of conditions and the following disclaimer.
16 * 2. Redistributions in binary form must reproduce the above copyright
17 * notice, this list of conditions and the following disclaimer in the
18 * documentation and/or other materials provided with the distribution.
19 * 3. All advertising materials mentioning features or use of this software
20 * must display the following acknowledgement:
21 * This product includes software developed by the University of
22 * California, Berkeley and its contributors.
23 * 4. Neither the name of the University nor the names of its contributors
24 * may be used to endorse or promote products derived from this software
25 * without specific prior written permission.
27 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
28 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
29 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
30 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
31 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
32 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
33 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
34 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
35 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
36 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
44 # include <stringprep.h>
48 size_t tlen
; /* Length of .tdata */
49 char const *tdata
; /* Template date - see _cmatch_data[] */
53 * Template characters for cmatch_data.tdata:
54 * 'A' An upper case char
55 * 'a' A lower case char
58 * 'O' An optional digit or space
60 * '+' Either a plus or a minus sign
62 static struct cmatch_data
const _cmatch_data
[] = {
63 { 24, "Aaa Aaa O0 00:00:00 0000" }, /* BSD/ISO C90 ctime */
64 { 28, "Aaa Aaa O0 00:00:00 AAA 0000" }, /* BSD tmz */
65 { 21, "Aaa Aaa O0 00:00 0000" }, /* SysV ctime */
66 { 25, "Aaa Aaa O0 00:00 AAA 0000" }, /* SysV tmz */
68 * RFC 822-alike From_ lines do not conform to RFC 4155, but seem to
69 * be used in the wild by UW-imap
71 { 30, "Aaa Aaa O0 00:00:00 0000 +0000" },
72 /* RFC 822 with zone spec; 1. military, 2. UT, 3. north america time
73 * zone strings; note that 1. is strictly speaking not correct as some
74 * letters are not used, and 2. is not because only "UT" is defined */
75 #define __reuse "Aaa Aaa O0 00:00:00 0000 AAA"
76 { 28 - 2, __reuse
}, { 28 - 1, __reuse
}, { 28 - 0, __reuse
},
79 #define _DATE_MINLEN 21
81 /* Skip over "word" as found in From_ line */
82 static char const * _from__skipword(char const *wp
);
84 /* Match the date string against the date template (tp), return if match.
85 * See _cmatch_data[] for template character description */
86 static int _cmatch(size_t len
, char const *date
, char const *tp
);
88 /* Check whether date is a valid 'From_' date.
89 * (Rather ctime(3) generated dates, according to RFC 4155) */
90 static int _is_date(char const *date
);
92 /* Convert the domain part of a skinned address to IDNA.
93 * If an error occurs before Unicode information is available, revert the IDNA
94 * error to a normal CHAR one so that the error message doesn't talk Unicode */
96 static struct addrguts
* _idna_apply(struct addrguts
*agp
);
99 /* Classify and check a (possibly skinned) header body according to RFC
100 * *addr-spec* rules; if it (is assumed to have been) skinned it may however be
101 * also a file or a pipe command, so check that first, then.
102 * Otherwise perform content checking and isolate the domain part (for IDNA) */
103 static int _addrspec_check(int doskin
, struct addrguts
*agp
);
105 static int gethfield(FILE *f
, char **linebuf
, size_t *linesize
, int rem
,
107 static int msgidnextc(const char **cp
, int *status
);
108 static int charcount(char *str
, int c
);
111 _from__skipword(char const *wp
)
116 while ((c
= *wp
++) != '\0' && ! blankchar(c
)) {
118 while ((c
= *wp
++) != '\0' && c
!= '"')
124 for (; blankchar(c
); c
= *wp
++)
127 return (c
== 0 ? NULL
: wp
- 1);
131 _cmatch(size_t len
, char const *date
, char const *tp
)
155 if (c
!= ' ' && ! digitchar(c
))
163 if (c
!= '+' && c
!= '-')
174 _is_date(char const *date
)
176 struct cmatch_data
const *cmdp
;
177 size_t dl
= strlen(date
);
180 if (dl
>= _DATE_MINLEN
)
181 for (cmdp
= _cmatch_data
; cmdp
->tdata
!= NULL
; ++cmdp
)
182 if (dl
== cmdp
->tlen
&&
183 (ret
= _cmatch(dl
, date
, cmdp
->tdata
)))
189 static struct addrguts
*
190 _idna_apply(struct addrguts
*agp
)
192 char *idna_utf8
, *idna_ascii
, *cs
;
194 int strict
= (value("idna-strict-checks") != NULL
);
196 sz
= agp
->ag_slen
- agp
->ag_sdom_start
;
198 idna_utf8
= ac_alloc(sz
+ 1);
199 memcpy(idna_utf8
, agp
->ag_skinned
+ agp
->ag_sdom_start
, sz
);
200 idna_utf8
[sz
] = '\0';
202 /* GNU Libidn settles on top of iconv(3) without having any fallback,
203 * so let's just let it perform the charset conversion, if any should
206 char const *tcs
= charset_get_lc();
207 idna_ascii
= idna_utf8
;
208 idna_utf8
= stringprep_convert(idna_ascii
, "UTF-8", tcs
);
209 i
= (idna_utf8
== NULL
&& errno
== EINVAL
);
211 if (idna_utf8
== NULL
) {
213 fprintf(stderr
, tr(179,
214 "Cannot convert from %s to %s\n"),
216 agp
->ag_n_flags
^= NAME_ADDRSPEC_ERR_IDNA
|
217 NAME_ADDRSPEC_ERR_CHAR
;
222 if (idna_to_ascii_8z(idna_utf8
, &idna_ascii
,
223 strict
? IDNA_USE_STD3_ASCII_RULES
: 0)
225 agp
->ag_n_flags
^= NAME_ADDRSPEC_ERR_IDNA
|
226 NAME_ADDRSPEC_ERR_CHAR
;
230 /* Replace the domain part of .ag_skinned with IDNA version */
231 sz
= strlen(idna_ascii
);
232 i
= agp
->ag_sdom_start
;
233 cs
= salloc(agp
->ag_slen
- i
+ sz
+ 1);
234 memcpy(cs
, agp
->ag_skinned
, i
);
235 memcpy(cs
+ i
, idna_ascii
, sz
);
239 agp
->ag_skinned
= cs
;
241 NAME_ADDRSPEC_ERR_SET(agp
->ag_n_flags
,
242 NAME_NAME_SALLOC
|NAME_SKINNED
|NAME_IDNA
, 0);
256 _addrspec_check(int skinned
, struct addrguts
*agp
)
258 char *addr
, *p
, in_quote
, in_domain
, hadat
;
259 union {char c
; unsigned char u
;} c
;
261 uc_it use_idna
= ! boption("idna-disable");
264 agp
->ag_n_flags
|= NAME_ADDRSPEC_CHECKED
;
265 addr
= agp
->ag_skinned
;
267 if (agp
->ag_iaddr_aend
- agp
->ag_iaddr_start
== 0) {
268 NAME_ADDRSPEC_ERR_SET(agp
->ag_n_flags
, NAME_ADDRSPEC_ERR_EMPTY
,
273 /* If the field is not a recipient, it cannot be a file or a pipe */
278 * Excerpt from nail.1:
280 * Recipient address specifications
281 * The rules are: Any name which starts with a `|' character specifies
282 * a pipe, the command string following the `|' is executed and
283 * the message is sent to its standard input; any other name which
284 * contains a `@' character is treated as a mail address; any other
285 * name which starts with a `+' character specifies a folder name; any
286 * other name which contains a `/' character but no `!' or `%'
287 * character before also specifies a folder name; what remains is
288 * treated as a mail address.
291 agp
->ag_n_flags
|= NAME_ADDRSPEC_ISPIPE
;
294 if (memchr(addr
, '@', agp
->ag_slen
) == NULL
) {
297 for (p
= addr
; (c
.c
= *p
); ++p
) {
298 if (c
.c
== '!' || c
.c
== '%')
301 jisfile
: agp
->ag_n_flags
|= NAME_ADDRSPEC_ISFILE
;
308 in_quote
= in_domain
= hadat
= 0;
310 for (p
= addr
; (c
.c
= *p
++) != '\0';) {
312 in_quote
= ! in_quote
;
313 } else if (c
.u
< 040 || c
.u
>= 0177) {
315 if (in_domain
&& use_idna
) {
317 NAME_ADDRSPEC_ERR_SET(agp
->ag_n_flags
,
318 NAME_ADDRSPEC_ERR_IDNA
, c
.u
);
323 } else if (in_domain
== 2) {
324 if ((c
.c
== ']' && *p
!= '\0') || c
.c
== '\\' ||
327 } else if (in_quote
&& in_domain
== 0) {
329 } else if (c
.c
== '\\' && *p
!= '\0') {
331 } else if (c
.c
== '@') {
333 NAME_ADDRSPEC_ERR_SET(agp
->ag_n_flags
,
334 NAME_ADDRSPEC_ERR_ATSEQ
, c
.u
);
337 agp
->ag_sdom_start
= (size_t)(p
- addr
);
338 in_domain
= (*p
== '[') ? 2 : 1;
340 } else if (c
.c
== '(' || c
.c
== ')' ||
341 c
.c
== '<' || c
.c
== '>' ||
342 c
.c
== ',' || c
.c
== ';' || c
.c
== ':' ||
343 c
.c
== '\\' || c
.c
== '[' || c
.c
== ']')
349 NAME_ADDRSPEC_ERR_SET(agp
->ag_n_flags
, NAME_ADDRSPEC_ERR_CHAR
,
356 agp
= _idna_apply(agp
);
360 return ((agp
->ag_n_flags
& NAME_ADDRSPEC_INVALID
) != 0);
364 myaddrs(struct header
*hp
)
369 if (hp
!= NULL
&& (np
= hp
->h_from
) != NULL
) {
370 if ((rv
= np
->n_fullname
) != NULL
)
372 if ((rv
= np
->n_name
) != NULL
)
376 if ((rv
= voption("from")) != NULL
)
379 /* When invoking *sendmail* directly, it's its task
380 * to generate an otherwise undeterminable From: address.
381 * However, if the user sets *hostname*, accept his desire */
382 if (voption("smtp") != NULL
|| voption("hostname") != NULL
) {
383 char *hn
= nodename(1);
384 size_t sz
= strlen(myname
) + strlen(hn
) + 2;
386 snprintf(rv
, sz
, "%s@%s", myname
, hn
);
393 myorigin(struct header
*hp
)
395 char const *ret
= NULL
, *ccp
;
398 if ((ccp
= myaddrs(hp
)) != NULL
&&
399 (np
= lextract(ccp
, GEXTRA
|GFULL
)) != NULL
)
400 ret
= np
->n_flink
!= NULL
? value("sender") : ccp
;
405 is_head(char const *linebuf
, size_t linelen
) /* XXX verbose WARN */
407 char date
[FROM_DATEBUF
];
409 return ((linelen
<= 5 || memcmp(linebuf
, "From ", 5) != 0 ||
410 ! extract_date_from_from_(linebuf
, linelen
, date
) ||
411 ! _is_date(date
)) ? 0 : 1);
415 extract_date_from_from_(char const *line
, size_t linelen
,
416 char datebuf
[FROM_DATEBUF
])
419 char const *cp
= line
;
422 cp
= _from__skipword(cp
);
426 cp
= _from__skipword(cp
);
429 if (cp
[0] == 't' && cp
[1] == 't' && cp
[2] == 'y') {
430 cp
= _from__skipword(cp
);
435 linelen
-= (size_t)(cp
- line
);
436 if (linelen
< _DATE_MINLEN
)
438 if (cp
[linelen
- 1] == '\n') {
440 /* (Rather IMAP/POP3 only) */
441 if (cp
[linelen
- 1] == '\r')
443 if (linelen
< _DATE_MINLEN
)
446 if (linelen
>= FROM_DATEBUF
)
450 jleave
: memcpy(datebuf
, cp
, linelen
);
451 datebuf
[linelen
] = '\0';
454 jerr
: cp
= tr(213, "<Unknown date>");
455 linelen
= strlen(cp
);
456 if (linelen
>= FROM_DATEBUF
)
457 linelen
= FROM_DATEBUF
;
462 extract_header(FILE *fp
, struct header
*hp
) /* XXX no header occur-cnt check */
464 struct header nh
, *hq
= &nh
;
465 char *linebuf
= NULL
, *colon
;
467 int seenfields
= 0, lc
, c
;
468 char const *val
, *cp
;
470 memset(hq
, 0, sizeof *hq
);
471 for (lc
= 0; readline_restart(fp
, &linebuf
, &linesize
, 0) > 0; lc
++)
474 while ((lc
= gethfield(fp
, &linebuf
, &linesize
, lc
, &colon
)) >= 0) {
475 if ((val
= thisfield(linebuf
, "to")) != NULL
) {
477 hq
->h_to
= cat(hq
->h_to
, checkaddrs(
478 lextract(val
, GTO
|GFULL
)));
479 } else if ((val
= thisfield(linebuf
, "cc")) != NULL
) {
481 hq
->h_cc
= cat(hq
->h_cc
, checkaddrs(
482 lextract(val
, GCC
|GFULL
)));
483 } else if ((val
= thisfield(linebuf
, "bcc")) != NULL
) {
485 hq
->h_bcc
= cat(hq
->h_bcc
, checkaddrs(
486 lextract(val
, GBCC
|GFULL
)));
487 } else if ((val
= thisfield(linebuf
, "from")) != NULL
) {
489 hq
->h_from
= cat(hq
->h_from
, checkaddrs(
490 lextract(val
, GEXTRA
|GFULL
)));
491 } else if ((val
= thisfield(linebuf
, "reply-to")) != NULL
) {
493 hq
->h_replyto
= cat(hq
->h_replyto
, checkaddrs(
494 lextract(val
, GEXTRA
|GFULL
)));
495 } else if ((val
= thisfield(linebuf
, "sender")) != NULL
) {
497 hq
->h_sender
= cat(hq
->h_sender
, checkaddrs(
498 lextract(val
, GEXTRA
|GFULL
)));
499 } else if ((val
= thisfield(linebuf
,
500 "organization")) != NULL
) {
502 for (cp
= val
; blankchar(*cp
); cp
++)
504 hq
->h_organization
= hq
->h_organization
?
505 save2str(hq
->h_organization
, cp
) :
507 } else if ((val
= thisfield(linebuf
, "subject")) != NULL
||
508 (val
= thisfield(linebuf
, "subj")) != NULL
) {
510 for (cp
= val
; blankchar(*cp
); cp
++)
512 hq
->h_subject
= hq
->h_subject
?
513 save2str(hq
->h_subject
, cp
) :
516 fprintf(stderr
, tr(266,
517 "Ignoring header field \"%s\"\n"),
521 * In case the blank line after the header has been edited out.
522 * Otherwise, fetch the header separator.
525 if (linebuf
[0] != '\0') {
526 for (cp
= linebuf
; *(++cp
) != '\0'; );
527 fseek(fp
, (long)-(1 + cp
- linebuf
), SEEK_CUR
);
529 if ((c
= getc(fp
)) != '\n' && c
!= EOF
)
536 hp
->h_bcc
= hq
->h_bcc
;
537 hp
->h_from
= hq
->h_from
;
538 hp
->h_replyto
= hq
->h_replyto
;
539 hp
->h_sender
= hq
->h_sender
;
540 hp
->h_organization
= hq
->h_organization
;
541 hp
->h_subject
= hq
->h_subject
;
543 fprintf(stderr
, tr(267, "Restoring deleted header lines\n"));
549 * Return the desired header line from the passed message
550 * pointer (or NULL if the desired header field is not available).
551 * If mult is zero, return the content of the first matching header
552 * field only, the content of all matching header fields else.
555 hfield_mult(char const *field
, struct message
*mp
, int mult
)
560 char *linebuf
= NULL
, *colon
, *oldhfield
= NULL
;
563 if ((ibuf
= setinput(&mb
, mp
, NEED_HEADER
)) == NULL
)
565 if ((lc
= mp
->m_lines
- 1) < 0)
568 if ((mp
->m_flag
& MNOFROM
) == 0 &&
569 readline_restart(ibuf
, &linebuf
, &linesize
, 0) < 0)
572 if ((lc
= gethfield(ibuf
, &linebuf
, &linesize
, lc
, &colon
)) < 0)
574 if ((hfield
= thisfield(linebuf
, field
)) != NULL
) {
575 oldhfield
= save2str(hfield
, oldhfield
);
588 * Return the next header field found in the given message.
589 * Return >= 0 if something found, < 0 otherwise.
590 * "colon" is set to point to the colon in the header.
591 * Must deal with \ continuations & other such fraud.
594 gethfield(FILE *f
, char **linebuf
, size_t *linesize
, int rem
, char **colon
)
597 size_t line2size
= 0;
601 if (*linebuf
== NULL
)
602 *linebuf
= srealloc(*linebuf
, *linesize
= 1);
607 if ((c
= readline_restart(f
, linebuf
, linesize
, 0)) <= 0)
609 for (cp
= *linebuf
; fieldnamechar(*cp
& 0377); cp
++);
611 while (blankchar(*cp
& 0377))
613 if (*cp
!= ':' || cp
== *linebuf
)
616 * I guess we got a headline.
617 * Handle wraparounding
623 while (--cp
>= *linebuf
&& blankchar(*cp
& 0377));
627 if (cp
-8 >= *linebuf
&& cp
[-1] == '=' && cp
[-2] == '?')
629 ungetc(c
= getc(f
), f
);
632 c
= readline_restart(f
, &line2
, &line2size
, 0);
636 for (cp2
= line2
; blankchar(*cp2
& 0377); cp2
++);
638 if (cp2
[0] == '=' && cp2
[1] == '?' && c
> 8)
640 if (cp
+ c
>= *linebuf
+ *linesize
- 2) {
641 size_t diff
= cp
- *linebuf
;
642 size_t colondiff
= *colon
- *linebuf
;
643 *linebuf
= srealloc(*linebuf
,
645 cp
= &(*linebuf
)[diff
];
646 *colon
= &(*linebuf
)[colondiff
];
662 * Check whether the passed line is a header line of
663 * the desired breed. Return the field body, or 0.
666 thisfield(char const *linebuf
, char const *field
)
668 while (lowerconv(*linebuf
) == lowerconv(*field
)) {
674 while (blankchar(*linebuf
))
676 if (*linebuf
++ != ':')
678 while (blankchar(*linebuf
))
684 * Get sender's name from this message. If the message has
685 * a bunch of arpanet stuff in it, we may have to skin the name
686 * before returning it.
689 nameof(struct message
*mp
, int reptype
)
693 cp
= skin(name1(mp
, reptype
));
694 if (reptype
!= 0 || charcount(cp
, '!') < 2)
696 cp2
= strrchr(cp
, '!');
698 while (cp2
> cp
&& *cp2
!= '!')
706 * Start of a "comment".
710 skip_comment(char const *cp
)
714 for (; nesting
> 0 && *cp
; cp
++) {
732 * Return the start of a route-addr (address in angle brackets),
736 routeaddr(char const *name
)
738 char const *np
, *rp
= NULL
;
740 for (np
= name
; *np
; np
++) {
743 np
= skip_comment(&np
[1]) - 1;
749 if (*np
== '\\' && np
[1])
764 * Check if a name's address part contains invalid characters.
767 is_addr_invalid(struct name
*np
, int putmsg
)
769 char cbuf
[sizeof "'\\U12340'"], *name
= np
->n_name
;
770 int f
= np
->n_flags
, ok8bit
= 1;
772 char const *fmt
= "'\\x%02X'", *cs
;
774 if ((f
& NAME_ADDRSPEC_INVALID
) == 0 || ! putmsg
||
775 (f
& NAME_ADDRSPEC_ERR_EMPTY
) != 0)
778 if (f
& NAME_ADDRSPEC_ERR_IDNA
)
779 cs
= tr(284, "Invalid domain name: \"%s\", character %s\n"),
782 else if (f
& NAME_ADDRSPEC_ERR_ATSEQ
)
783 cs
= tr(142, "\"%s\" contains invalid %s sequence\n");
785 cs
= tr(143, "\"%s\" contains invalid character %s\n");
787 c
= NAME_ADDRSPEC_ERR_GETWC(f
);
788 if (ok8bit
&& c
>= 040 && c
<= 0177)
789 snprintf(cbuf
, sizeof cbuf
, "'%c'", c
);
791 snprintf(cbuf
, sizeof cbuf
, fmt
, c
);
793 fprintf(stderr
, cs
, name
, cbuf
);
795 return ((f
& NAME_ADDRSPEC_INVALID
) != 0);
799 skin(char const *name
)
805 (void)addrspec_with_guts(1, name
, &ag
);
807 if ((ag
.ag_n_flags
& NAME_NAME_SALLOC
) == 0)
808 ret
= savestrbuf(ret
, ag
.ag_slen
);
813 /* TODO addrspec_with_guts: RFC 5322 */
815 addrspec_with_guts(int doskin
, char const *name
, struct addrguts
*agp
)
818 char *cp2
, *bufend
, *nbuf
, c
;
819 char gotlt
, gotaddr
, lastsp
;
821 memset(agp
, 0, sizeof *agp
);
823 if ((agp
->ag_input
= name
) == NULL
|| /* XXX ever? */
824 (agp
->ag_ilen
= strlen(name
)) == 0) {
825 agp
->ag_skinned
= UNCONST(""); /* ok: NAME_SALLOC is not set */
827 agp
->ag_n_flags
|= NAME_ADDRSPEC_CHECKED
;
828 NAME_ADDRSPEC_ERR_SET(agp
->ag_n_flags
, NAME_ADDRSPEC_ERR_EMPTY
,
833 if (! doskin
|| ! anyof(name
, "(< ")) {
834 /*agp->ag_iaddr_start = 0;*/
835 agp
->ag_iaddr_aend
= agp
->ag_ilen
;
836 agp
->ag_skinned
= UNCONST(name
); /* (NAME_SALLOC not set) */
837 agp
->ag_slen
= agp
->ag_ilen
;
838 agp
->ag_n_flags
= NAME_SKINNED
;
839 return _addrspec_check(doskin
, agp
);
842 /* Something makes us think we have to perform the skin operation */
843 nbuf
= ac_alloc(agp
->ag_ilen
+ 1);
844 /*agp->ag_iaddr_start = 0;*/
846 gotlt
= gotaddr
= lastsp
= 0;
848 for (cp
= name
++; (c
= *cp
++) != '\0'; ) {
851 cp
= skip_comment(cp
);
856 * Start of a "quoted-string".
857 * Copy it in its entirety.
858 * XXX RFC: quotes are "semantically invisible"
859 * XXX But it was explicitly added (Changelog.Heirloom,
860 * XXX [9.23] released 11/15/00, "Do not remove quotes
861 * XXX when skinning names"? No more info..
864 while ((c
= *cp
) != '\0') { /* TODO improve */
872 else if ((c
= *cp
) != '\0') {
883 agp
->ag_iaddr_aend
= (size_t)(cp
- name
);
885 if (cp
[0] == 'a' && cp
[1] == 't' && blankchar(cp
[2]))
886 cp
+= 3, *cp2
++ = '@';
887 else if (cp
[0] == '@' && blankchar(cp
[1]))
888 cp
+= 2, *cp2
++ = '@';
893 agp
->ag_iaddr_start
= (size_t)(cp
- (name
- 1));
900 /* (_addrspec_check() verifies these later!) */
901 agp
->ag_iaddr_aend
= (size_t)(cp
- name
);
903 while ((c
= *cp
) != '\0' && c
!= ',') {
906 cp
= skip_comment(cp
);
908 while ((c
= *cp
) != '\0') {
912 if (c
== '\\' && *cp
)
930 for (; blankchar(*cp
); ++cp
)
935 } else if (! gotaddr
) {
937 agp
->ag_iaddr_start
= (size_t)(cp
- name
);
941 agp
->ag_slen
= (size_t)(cp2
- nbuf
);
942 if (agp
->ag_iaddr_aend
== 0)
943 agp
->ag_iaddr_aend
= agp
->ag_ilen
;
945 agp
->ag_skinned
= savestrbuf(nbuf
, agp
->ag_slen
);
947 agp
->ag_n_flags
= NAME_NAME_SALLOC
| NAME_SKINNED
;
948 return _addrspec_check(doskin
, agp
);
952 * Fetch the real name from an internet mail address field.
955 realname(char const *name
)
957 char const *cp
, *cq
, *cstart
= NULL
, *cend
= NULL
;
960 int quoted
, good
, nogood
;
964 for (cp
= UNCONST(name
); *cp
; cp
++) {
969 * More than one comment in address, doesn't
970 * make sense to display it without context.
971 * Return the entire field,
973 return mime_fromaddr(name
);
975 cp
= skip_comment(cp
);
978 cend
= cstart
= NULL
;
984 if (*cp
== '\\' && cp
[1])
996 * More than one address. Just use the first one.
1001 brk
: if (cstart
== NULL
) {
1004 * If name contains only a route-addr, the
1005 * surrounding angle brackets don't serve any
1006 * useful purpose when displaying, so they
1009 return prstr(skin(name
));
1010 return mime_fromaddr(name
);
1012 rp
= rname
= ac_alloc(cend
- cstart
+ 1);
1014 * Strip quotes. Note that quotes that appear within a MIME-
1015 * encoded word are not stripped. The idea is to strip only
1016 * syntactical relevant things (but this is not necessarily
1017 * the most sensible way in practice).
1020 for (cp
= cstart
; cp
< cend
; cp
++) {
1021 if (*cp
== '(' && !quoted
) {
1022 cq
= skip_comment(++cp
);
1026 if (*cp
== '\\' && &cp
[1] < cq
)
1030 } else if (*cp
== '\\' && &cp
[1] < cend
)
1032 else if (*cp
== '"') {
1041 mime_fromhdr(&in
, &out
, TD_ISPR
|TD_ICONV
);
1043 rname
= savestr(out
.s
);
1045 while (blankchar(*rname
& 0377))
1047 for (rp
= rname
; *rp
; rp
++);
1048 while (--rp
>= rname
&& blankchar(*rp
& 0377))
1051 return mime_fromaddr(name
);
1053 * mime_fromhdr() has converted all nonprintable characters to
1054 * question marks now. These and blanks are considered uninteresting;
1055 * if the displayed part of the real name contains more than 25% of
1056 * them, it is probably better to display the plain email address
1061 for (rp
= rname
; *rp
&& rp
< &rname
[20]; rp
++)
1062 if (*rp
== '?' || blankchar(*rp
& 0377))
1066 if (good
*3 < nogood
)
1067 return prstr(skin(name
));
1072 * Fetch the sender's name from the passed message.
1074 * 0 -- get sender's name for display purposes
1075 * 1 -- get sender's name for reply
1076 * 2 -- get sender's name for Reply
1079 name1(struct message
*mp
, int reptype
)
1083 char *linebuf
= NULL
;
1084 size_t linesize
= 0;
1089 if ((cp
= hfield1("from", mp
)) != NULL
&& *cp
!= '\0')
1091 if (reptype
== 0 && (cp
= hfield1("sender", mp
)) != NULL
&&
1094 namebuf
= smalloc(namesize
= 1);
1096 if (mp
->m_flag
& MNOFROM
)
1098 if ((ibuf
= setinput(&mb
, mp
, NEED_HEADER
)) == NULL
)
1100 if (readline_restart(ibuf
, &linebuf
, &linesize
, 0) < 0)
1103 if (namesize
<= linesize
)
1104 namebuf
= srealloc(namebuf
, namesize
= linesize
+ 1);
1105 for (cp
= linebuf
; *cp
&& *cp
!= ' '; cp
++)
1107 for (; blankchar(*cp
& 0377); cp
++);
1108 for (cp2
= &namebuf
[strlen(namebuf
)];
1109 *cp
&& !blankchar(*cp
& 0377) && cp2
< namebuf
+ namesize
- 1;)
1112 if (readline_restart(ibuf
, &linebuf
, &linesize
, 0) < 0)
1114 if ((cp
= strchr(linebuf
, 'F')) == NULL
)
1116 if (strncmp(cp
, "From", 4) != 0)
1118 if (namesize
<= linesize
)
1119 namebuf
= srealloc(namebuf
, namesize
= linesize
+ 1);
1120 while ((cp
= strchr(cp
, 'r')) != NULL
) {
1121 if (strncmp(cp
, "remote", 6) == 0) {
1122 if ((cp
= strchr(cp
, 'f')) == NULL
)
1124 if (strncmp(cp
, "from", 4) != 0)
1126 if ((cp
= strchr(cp
, ' ')) == NULL
)
1130 strncpy(namebuf
, cp
, namesize
);
1133 cp2
=strrchr(namebuf
, '!')+1;
1134 strncpy(cp2
, cp
, (namebuf
+namesize
)-cp2
);
1136 namebuf
[namesize
- 2] = '!';
1137 namebuf
[namesize
- 1] = '\0';
1143 if (*namebuf
!= '\0' || ((cp
= hfield1("return-path", mp
))) == NULL
||
1145 cp
= savestr(namebuf
);
1153 msgidnextc(const char **cp
, int *status
)
1173 *cp
= skip_comment(&(*cp
)[1]);
1188 c
= *(*cp
)++ & 0377;
1189 return *status
& 02 ? lowerconv(c
) : c
;
1195 msgidcmp(const char *s1
, const char *s2
)
1201 c1
= msgidnextc(&s1
, &q1
);
1202 c2
= msgidnextc(&s2
, &q2
);
1210 * Count the occurrences of c in str
1213 charcount(char *str
, int c
)
1218 for (i
= 0, cp
= str
; *cp
; cp
++)
1225 * See if the given header field is supposed to be ignored.
1228 is_ign(char const *field
, size_t fieldlen
, struct ignoretab ignoret
[2])
1233 if (ignoret
== NULL
)
1235 if (ignoret
== allignore
)
1238 * Lower-case the string, so that "Status" and "status"
1239 * will hash to the same place.
1241 realfld
= ac_alloc(fieldlen
+ 1);
1242 i_strcpy(realfld
, field
, fieldlen
+ 1);
1243 if (ignoret
[1].i_count
> 0)
1244 ret
= !member(realfld
, ignoret
+ 1);
1246 ret
= member(realfld
, ignoret
);
1252 member(char const *realfield
, struct ignoretab
*table
)
1256 for (igp
= table
->i_head
[hash(realfield
)]; igp
!= 0; igp
= igp
->i_link
)
1257 if (*igp
->i_field
== *realfield
&&
1258 strcmp(igp
->i_field
, realfield
) == 0)
1264 * Fake Sender for From_ lines if missing, e. g. with POP3.
1267 fakefrom(struct message
*mp
)
1271 if (((name
= skin(hfield1("return-path", mp
))) == NULL
||
1273 ((name
= skin(hfield1("from", mp
))) == NULL
||
1276 * XXX MAILER-DAEMON is what an old MBOX manual page says.
1277 * RFC 4155 however requires an RFC 5322 (2822) conforming
1278 * "addr-spec", but we simply can't provide that
1280 name
= "MAILER-DAEMON";
1290 for (cq
= cp
; *cq
&& *cq
!= '\n'; ++cq
)
1297 nexttoken(char const *cp
)
1305 while (*cp
!= '\0') {
1317 } else if (blankchar(*cp
) || *cp
== ',')
1326 * From username Fri Jan 2 20:13:51 2004
1331 unixtime(char const *fromline
)
1336 int i
, year
, month
, day
, hour
, minute
, second
;
1340 for (fp
= fromline
; *fp
&& *fp
!= '\n'; fp
++);
1342 if (fp
- fromline
< 7)
1347 if (strncmp(&fp
[4], month_names
[i
], 3) == 0)
1349 if (month_names
[++i
][0] == '\0')
1355 day
= strtol(&fp
[8], &xp
, 10);
1356 if (*xp
!= ' ' || xp
!= &fp
[10])
1358 hour
= strtol(&fp
[11], &xp
, 10);
1359 if (*xp
!= ':' || xp
!= &fp
[13])
1361 minute
= strtol(&fp
[14], &xp
, 10);
1362 if (*xp
!= ':' || xp
!= &fp
[16])
1364 second
= strtol(&fp
[17], &xp
, 10);
1365 if (*xp
!= ' ' || xp
!= &fp
[19])
1367 year
= strtol(&fp
[20], &xp
, 10);
1370 if ((t
= combinetime(year
, month
, day
, hour
, minute
, second
)) ==
1373 tzdiff
= t
- mktime(gmtime(&t
));
1374 tmptr
= localtime(&t
);
1375 if (tmptr
->tm_isdst
> 0)
1385 rfctime(char const *date
)
1387 char const *cp
= date
;
1390 int i
, year
, month
, day
, hour
, minute
, second
;
1392 if ((cp
= nexttoken(cp
)) == NULL
)
1394 if (alphachar(cp
[0]) && alphachar(cp
[1]) && alphachar(cp
[2]) &&
1396 if ((cp
= nexttoken(&cp
[4])) == NULL
)
1399 day
= strtol(cp
, &x
, 10); /* XXX strtol */
1400 if ((cp
= nexttoken(x
)) == NULL
)
1403 if (strncmp(cp
, month_names
[i
], 3) == 0)
1405 if (month_names
[++i
][0] == '\0')
1409 if ((cp
= nexttoken(&cp
[3])) == NULL
)
1413 * Where a two or three digit year occurs in a date, the year is to be
1414 * interpreted as follows: If a two digit year is encountered whose
1415 * value is between 00 and 49, the year is interpreted by adding 2000,
1416 * ending up with a value between 2000 and 2049. If a two digit year
1417 * is encountered with a value between 50 and 99, or any three digit
1418 * year is encountered, the year is interpreted by adding 1900.
1420 year
= strtol(cp
, &x
, 10); /* XXX strtol */
1422 if (i
== 2 && year
>= 0 && year
<= 49)
1424 else if (i
== 3 || (i
== 2 && year
>= 50 && year
<= 99))
1426 if ((cp
= nexttoken(x
)) == NULL
)
1428 hour
= strtol(cp
, &x
, 10); /* XXX strtol */
1432 minute
= strtol(cp
, &x
, 10);
1435 second
= strtol(cp
, &x
, 10);
1438 if ((t
= combinetime(year
, month
, day
, hour
, minute
, second
)) ==
1441 if ((cp
= nexttoken(x
)) != NULL
) {
1452 if (digitchar(cp
[0]) && digitchar(cp
[1]) && digitchar(cp
[2]) &&
1457 t
+= strtol(buf
, NULL
, 10) * sign
* 3600;/*XXX strtrol*/
1460 t
+= strtol(buf
, NULL
, 10) * sign
* 60; /* XXX strtol*/
1462 /* TODO WE DO NOT YET PARSE (OBSOLETE) ZONE NAMES
1463 * TODO once again, Christos Zoulas and NetBSD Mail have done
1464 * TODO a really good job already, but using strptime(3), which
1465 * TODO is not portable. Nonetheless, WE must improve, not
1466 * TODO least because we simply ignore obsolete timezones!!
1467 * TODO See RFC 5322, 4.3! */
1474 #define is_leapyear(Y) ((((Y) % 100 ? (Y) : (Y) / 100) & 3) == 0)
1477 combinetime(int year
, int month
, int day
, int hour
, int minute
, int second
)
1481 if (second
< 0 || minute
< 0 || hour
< 0 || day
< 1)
1483 t
= second
+ minute
* 60 + hour
* 3600 + (day
- 1) * 86400;
1487 t
+= 86400 * (is_leapyear(year
) ? 29 : 28);
1507 t
+= (year
- 70) * 31536000 + ((year
- 69) / 4) * 86400 -
1508 ((year
- 1) / 100) * 86400 + ((year
+ 299) / 400) * 86400;
1513 substdate(struct message
*m
)
1518 * Determine the date to print in faked 'From ' lines. This is
1519 * traditionally the date the message was written to the mail
1520 * file. Try to determine this using RFC message header fields,
1521 * or fall back to current time.
1523 if ((cp
= hfield1("received", m
)) != NULL
) {
1524 while ((cp
= nexttoken(cp
)) != NULL
&& *cp
!= ';') {
1527 while (alnumchar(*cp
));
1530 m
->m_time
= rfctime(cp
);
1532 if (m
->m_time
== 0 || m
->m_time
> time_current
.tc_time
) {
1533 if ((cp
= hfield1("date", m
)) != NULL
)
1534 m
->m_time
= rfctime(cp
);
1536 if (m
->m_time
== 0 || m
->m_time
> time_current
.tc_time
)
1537 m
->m_time
= time_current
.tc_time
;
1541 check_from_and_sender(struct name
*fromfield
, struct name
*senderfield
)
1543 if (fromfield
&& fromfield
->n_flink
&& senderfield
== NULL
) {
1544 fprintf(stderr
, "A Sender: field is required with multiple "
1545 "addresses in From: field.\n");
1548 if (senderfield
&& senderfield
->n_flink
) {
1549 fprintf(stderr
, "The Sender: field may contain "
1550 "only one address.\n");
1557 getsender(struct message
*mp
)
1562 if ((cp
= hfield1("from", mp
)) == NULL
||
1563 (np
= lextract(cp
, GEXTRA
|GSKIN
)) == NULL
)
1565 return np
->n_flink
!= NULL
? skin(hfield1("sender", mp
)) : np
->n_name
;
1569 grab_headers(struct header
*hp
, enum gfield gflags
, int subjfirst
)
1571 /* TODO grab_headers: again, check counts etc. against RFC;
1572 * TODO (now assumes check_from_and_sender() is called afterwards ++ */
1577 comma
= (value("bsdcompat") || value("bsdmsgs")) ? 0 : GCOMMA
;
1580 hp
->h_to
= grab_names("To: ", hp
->h_to
, comma
, GTO
|GFULL
);
1582 if (subjfirst
&& (gflags
& GSUBJECT
))
1583 hp
->h_subject
= readstr_input("Subject: ", hp
->h_subject
);
1586 hp
->h_cc
= grab_names("Cc: ", hp
->h_cc
, comma
, GCC
|GFULL
);
1589 hp
->h_bcc
= grab_names("Bcc: ", hp
->h_bcc
, comma
, GBCC
|GFULL
);
1591 if (gflags
& GEXTRA
) {
1592 if (hp
->h_from
== NULL
)
1593 hp
->h_from
= lextract(myaddrs(hp
), GEXTRA
|GFULL
);
1594 hp
->h_from
= grab_names("From: ", hp
->h_from
, comma
,
1596 if (hp
->h_replyto
== NULL
)
1597 hp
->h_replyto
= lextract(value("replyto"),
1599 hp
->h_replyto
= grab_names("Reply-To: ", hp
->h_replyto
, comma
,
1601 if (hp
->h_sender
== NULL
)
1602 hp
->h_sender
= extract(value("sender"), GEXTRA
|GFULL
);
1603 hp
->h_sender
= grab_names("Sender: ", hp
->h_sender
, comma
,
1605 if (hp
->h_organization
== NULL
)
1606 hp
->h_organization
= value("ORGANIZATION");
1607 hp
->h_organization
= readstr_input("Organization: ",
1608 hp
->h_organization
);
1611 if (! subjfirst
&& (gflags
& GSUBJECT
))
1612 hp
->h_subject
= readstr_input("Subject: ", hp
->h_subject
);