/* * rfc822.c -- code for slicing and dicing RFC822 mail headers * * Copyright 1997 by Eric S. Raymond * For license terms, see the file COPYING in this directory. */ #include #include #include #if defined(STDC_HEADERS) #include #endif #include "fetchmail.h" #define HEADER_END(p) ((p)[0] == '\n' && ((p)[1] != ' ' && (p)[1] != '\t')) #ifdef TESTMAIN static int verbose; #endif /* TESTMAIN */ char *reply_hack(buf, host) /* hack message headers so replies will work properly */ char *buf; /* header to be hacked */ const char *host; /* server hostname */ { char *from, *cp, last_nws = '\0'; int parendepth, state, has_bare_name_part, has_host_part; int addresscount = 1; if (strncasecmp("From: ", buf, 6) && strncasecmp("To: ", buf, 4) && strncasecmp("Reply-To: ", buf, 10) && strncasecmp("Return-Path: ", buf, 13) && strncasecmp("Cc: ", buf, 4) && strncasecmp("Bcc: ", buf, 5)) { return(buf); } #ifndef TESTMAIN /* make room to hack the address; buf must be malloced */ for (cp = buf; *cp; cp++) if (*cp == ',' || isspace(*cp)) addresscount++; buf = (char *)xrealloc(buf, strlen(buf) + addresscount * strlen(host) + 1); #endif /* TESTMAIN */ parendepth = state = 0; has_host_part = has_bare_name_part = FALSE; for (from = buf; *from; from++) { #ifdef TESTMAIN if (verbose) { printf("state %d: %s", state, buf); printf("%*s^\n", from - buf + 10, " "); } #endif /* TESTMAIN */ if (state != 2) if (*from == '(') ++parendepth; else if (*from == ')') --parendepth; if (!parendepth && !has_host_part) switch (state) { case 0: /* before header colon */ if (*from == ':') state = 1; break; case 1: /* we've seen the colon, we're looking for addresses */ if (!isspace(*from)) last_nws = *from; if (*from == '<') state = 3; else if (*from == '@') has_host_part = TRUE; else if (*from == '"') state = 2; /* * Not expanding on last non-WS == ';' deals with groupnames, * an obscure misfeature described in sections * 6.1, 6.2.6, and A.1.5 of the RFC822 standard. */ else if ((*from == ',' || HEADER_END(from) || from[1] == '(') && has_bare_name_part && !has_host_part && last_nws != ';' && last_nws != ')') { int hostlen; while (isspace(*from) || (*from == ',')) --from; from++; hostlen = strlen(host); for (cp = from + strlen(from); cp >= from; --cp) cp[hostlen+1] = *cp; *from++ = '@'; memcpy(from, host, hostlen); from += hostlen; has_host_part = TRUE; } else if (!isspace(*from)) has_bare_name_part = TRUE; break; case 2: /* we're in a string */ if (*from == '"') state = 1; break; case 3: /* we're in a <>-enclosed address */ if (*from == '@') has_host_part = TRUE; else if (*from == '>') { state = 1; if (!has_host_part) { int hostlen; hostlen = strlen(host); for (cp = from + strlen(from); cp >= from; --cp) cp[hostlen+1] = *cp; *from++ = '@'; memcpy(from, host, hostlen); from += hostlen; has_host_part = TRUE; } } break; } /* * If we passed a comma, reset everything. */ if (from[-1] == ',' && !parendepth) { has_host_part = has_bare_name_part = FALSE; } } return(buf); } char *nxtaddr(hdr) /* parse addresses in succession out of a specified RFC822 header */ const char *hdr; /* header to be parsed, NUL to continue previous hdr */ { static char *tp, address[POPBUFSIZE+1]; static const char *hp; static int state, oldstate; #ifdef TESTMAIN static const char *orighdr; #endif /* TESTMAIN */ int parendepth = 0; #define START_HDR 0 /* before header colon */ #define SKIP_JUNK 1 /* skip whitespace, \n, and junk */ #define BARE_ADDRESS 2 /* collecting address without delimiters */ #define INSIDE_DQUOTE 3 /* inside double quotes */ #define INSIDE_PARENS 4 /* inside parentheses */ #define INSIDE_BRACKETS 5 /* inside bracketed address */ #define ENDIT_ALL 6 /* after last address */ if (hdr) { hp = hdr; state = START_HDR; #ifdef TESTMAIN orighdr = hdr; #endif /* TESTMAIN */ tp = address; } for (; *hp; hp++) { #ifdef TESTMAIN if (verbose) { printf("state %d: %s", state, orighdr); printf("%*s^\n", hp - orighdr + 10, " "); } #endif /* TESTMAIN */ if (state == ENDIT_ALL) /* after last address */ return(NULL); else if (HEADER_END(hp)) { state =