2 * This file contains functions which handle the mapping of Internet addresses
3 * to users on the Citadel system.
5 * Copyright (c) 1987-2021 by the citadel.org team
7 * This program is open source software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License version 3.
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
25 #include <sys/types.h>
30 #include <libcitadel.h>
33 #include "sysdep_decls.h"
34 #include "citserver.h"
38 #include "internet_addressing.h"
41 #include "parsedate.h"
43 #include "ctdl_module.h"
47 /* This is the non-define version in case it is needed for debugging */
49 inline void FindNextEnd (char *bptr, char *end)
51 /* Find the next ?Q? */
52 end = strchr(bptr + 2, '?');
53 if (end == NULL) return NULL;
54 if (((*(end + 1) == 'B') || (*(end + 1) == 'Q')) &&
55 (*(end + 2) == '?')) {
56 /* skip on to the end of the cluster, the next ?= */
57 end = strstr(end + 3, "?=");
60 /* sort of half valid encoding, try to find an end. */
61 end = strstr(bptr, "?=");
/*
 * FindNextEnd(bptr, end)
 *
 * bptr points at the "=?" that opens an RFC2047 encoded-word
 * ("=?charset?X?text?=").  On completion, end points at the "?=" that
 * closes that word, or is NULL if no terminator could be found.
 *
 * For a well formed word (encoding letter B or Q in either case, followed
 * by '?') the search starts after the "?X?" delimiter, because Q-encoded
 * text often begins with '=' and "?X?=" would otherwise be mistaken for the
 * terminator.  For anything else we fall back to the first "?=" after bptr.
 *
 * Both arguments are fully parenthesized so that expressions such as
 * (start != NULL) ? start : buf can be passed safely; note that each
 * argument is evaluated more than once, so it must be free of side effects.
 * The body is wrapped in do/while(0) so the macro behaves as one statement.
 */
#define FindNextEnd(bptr, end) do { \
	(end) = strchr((bptr) + 2, '?'); \
	if ((end) != NULL) { \
		if (	((*((end) + 1) == 'B') || (*((end) + 1) == 'b') || \
			 (*((end) + 1) == 'Q') || (*((end) + 1) == 'q')) \
			&& (*((end) + 2) == '?') \
		) { \
			(end) = strstr((end) + 3, "?="); \
		} else { \
			(end) = strstr((bptr), "?="); \
		} \
	} \
} while (0)
75 * Handle subjects with RFC2047 encoding such as:
76 * =?koi8-r?B?78bP0s3Mxc7JxSDXz9rE1dvO2c3JINvB0sHNySDP?=
78 void utf8ify_rfc822_string(char *buf) {
79 char *start, *end, *next, *nextend, *ptr;
84 iconv_t ic = (iconv_t)(-1) ;
85 char *ibuf; // Buffer of characters to be converted
86 char *obuf; // Buffer for converted characters
87 size_t ibuflen; // Length of input buffer
88 size_t obuflen; // Length of output buffer
89 char *isav; // Saved pointer to input buffer
90 char *osav; // Saved pointer to output buffer
93 int illegal_non_rfc2047_encoding = 0;
95 /* Sometimes, badly formed messages contain strings which were simply
96 * written out directly in some foreign character set instead of
97 * using RFC2047 encoding. This is illegal but we will attempt to
98 * handle it anyway by converting from a user-specified default
99 * charset to UTF-8 if we see any nonprintable characters.
102 for (i=0; i<len; ++i) {
103 if ((buf[i] < 32) || (buf[i] > 126)) {
104 illegal_non_rfc2047_encoding = 1;
105 i = len; // take a shortcut, it won't be more than one.
108 if (illegal_non_rfc2047_encoding) {
109 const char *default_header_charset = "iso-8859-1";
110 if ( (strcasecmp(default_header_charset, "UTF-8")) && (strcasecmp(default_header_charset, "us-ascii")) ) {
111 ctdl_iconv_open("UTF-8", default_header_charset, &ic);
112 if (ic != (iconv_t)(-1) ) {
115 safestrncpy(ibuf, buf, 1024);
116 ibuflen = strlen(ibuf);
118 obuf = (char *) malloc(obuflen);
120 iconv(ic, &ibuf, &ibuflen, &obuf, &obuflen);
121 osav[1024-obuflen] = 0;
130 /* pre evaluate the first pair */
131 nextend = end = NULL;
133 start = strstr(buf, "=?");
135 FindNextEnd (start, end);
137 while ((start != NULL) && (end != NULL)) {
138 next = strstr(end, "=?");
140 FindNextEnd(next, nextend);
144 /* did we find two partitions */
145 if ((next != NULL) && ((next - end) > 2)) {
147 while ((ptr < next) &&
153 /* did we find a gap just filled with blanks? */
158 len - (next - start));
160 /* now terminate the gap at the end */
161 delta = (next - end) - 2;
165 /* move next to its new location. */
170 /* our next-pair is our new first pair now. */
175 // Now we handle foreign character sets properly encoded in RFC2047 format.
176 start = strstr(buf, "=?");
177 FindNextEnd((start != NULL)? start : buf, end);
178 while (start != NULL && end != NULL && end > start) {
179 extract_token(charset, start, 1, '?', sizeof charset);
180 extract_token(encoding, start, 2, '?', sizeof encoding);
181 extract_token(istr, start, 3, '?', sizeof istr);
185 if (!strcasecmp(encoding, "B")) { // base64
186 ibuflen = CtdlDecodeBase64(ibuf, istr, strlen(istr));
188 else if (!strcasecmp(encoding, "Q")) { // quoted-printable
195 if (istr[pos] == '_') istr[pos] = ' ';
198 ibuflen = CtdlDecodeQuotedPrintable(ibuf, istr, len);
201 strcpy(ibuf, istr); // unknown encoding
202 ibuflen = strlen(istr);
205 ctdl_iconv_open("UTF-8", charset, &ic);
206 if (ic != (iconv_t)(-1) ) {
208 obuf = (char *) malloc(obuflen);
210 iconv(ic, &ibuf, &ibuflen, &obuf, &obuflen);
211 osav[1024-obuflen] = 0;
216 remove_token(end, 0, '?');
217 remove_token(end, 0, '?');
218 remove_token(end, 0, '?');
219 remove_token(end, 0, '?');
220 strcpy(end, &end[1]);
222 snprintf(newbuf, sizeof newbuf, "%s%s%s", buf, osav, end);
231 remove_token(end, 0, '?');
232 remove_token(end, 0, '?');
233 remove_token(end, 0, '?');
234 remove_token(end, 0, '?');
235 strcpy(end, &end[1]);
237 snprintf(newbuf, sizeof newbuf, "%s(unreadable)%s", buf, end);
244 * Since spammers will go to all sorts of absurd lengths to get their
245 * messages through, there are LOTS of corrupt headers out there.
246 * So, prevent a really badly formed RFC2047 header from throwing
247 * this function into an infinite loop.
250 if (passes > 20) return;
252 start = strstr(buf, "=?");
253 FindNextEnd((start != NULL)? start : buf, end);
/*
 * No-op variant of utf8ify_rfc822_string(): the supplied string is left
 * exactly as it is.
 * NOTE(review): presumably this is the fallback that is compiled when the
 * iconv-based implementation above is unavailable -- confirm against the
 * surrounding preprocessor conditionals.
 *
 * Deliberately not declared "inline": in C99 and later a plain inline
 * definition does not provide an external definition, so any call that the
 * compiler chooses not to inline would fail to link.
 */
void utf8ify_rfc822_string(char *a) {
	(void)a;	// intentionally unused
}
263 char *inetcfg = NULL;
266 * Return nonzero if the supplied name is an alias for this host.
268 int CtdlHostAlias(char *fqdn) {
272 char host[256], type[256];
275 if (fqdn == NULL) return(hostalias_nomatch);
276 if (IsEmptyStr(fqdn)) return(hostalias_nomatch);
277 if (!strcasecmp(fqdn, "localhost")) return(hostalias_localhost);
278 if (!strcasecmp(fqdn, CtdlGetConfigStr("c_fqdn"))) return(hostalias_localhost);
279 if (!strcasecmp(fqdn, CtdlGetConfigStr("c_nodename"))) return(hostalias_localhost);
280 if (inetcfg == NULL) return(hostalias_nomatch);
282 config_lines = num_tokens(inetcfg, '\n');
283 for (i=0; i<config_lines; ++i) {
284 extract_token(buf, inetcfg, i, '\n', sizeof buf);
285 extract_token(host, buf, 0, '|', sizeof host);
286 extract_token(type, buf, 1, '|', sizeof type);
290 /* Process these in a specific order, in case there are multiple matches.
291 * We want localhost to override masq, for example.
294 if ( (!strcasecmp(type, "masqdomain")) && (!strcasecmp(fqdn, host))) {
295 found = hostalias_masq;
298 if ( (!strcasecmp(type, "localhost")) && (!strcasecmp(fqdn, host))) {
299 found = hostalias_localhost;
302 // "directory" used to be a distributed version of "localhost" but they're both the same now
303 if ( (!strcasecmp(type, "directory")) && (!strcasecmp(fqdn, host))) {
304 found = hostalias_localhost;
307 if (found) return(found);
309 return(hostalias_nomatch);
314 * Determine whether a given Internet address belongs to the current user
316 int CtdlIsMe(char *addr, int addr_buf_len) {
317 struct recptypes *recp;
320 recp = validate_recipients(addr, NULL, 0);
321 if (recp == NULL) return(0);
323 if (recp->num_local == 0) {
324 free_recipients(recp);
328 for (i=0; i<recp->num_local; ++i) {
329 extract_token(addr, recp->recp_local, i, '|', addr_buf_len);
330 if (!strcasecmp(addr, CC->user.fullname)) {
331 free_recipients(recp);
336 free_recipients(recp);
/*
 * If the last item in a list of recipients was truncated to a partial
 * address, remove it completely in order to avoid choking library functions.
 *
 * str is edited in place.  Nothing happens unless the list contains at
 * least two comma-separated items and is at least 900 bytes long.  Lists
 * longer than 998 bytes are first cut to 998 bytes.  The final item is then
 * dropped (by terminating the string at the last comma) unless it contains
 * a '<' followed later by a '>'.
 */
void sanitize_truncated_recipient(char *str)
{
	if (str == NULL) return;
	if (num_tokens(str, ',') < 2) return;

	int len = strlen(str);
	if (len < 900) return;
	if (len > 998) {
		str[998] = 0;
	}

	char *last_comma = strrchr(str, ',');
	if (last_comma == NULL) return;

	char *open_bracket = strchr(last_comma, '<');
	char *close_bracket = strchr(last_comma, '>');
	int looks_complete = (open_bracket != NULL) && (close_bracket != NULL) && (close_bracket > open_bracket);

	if (!looks_complete) {
		*last_comma = 0;
	}
}
/*
 * Remove every whitespace character that sits directly to the left or
 * directly to the right of an '@' symbol, so "user @ host" becomes
 * "user@host".  The string is edited in place; a NULL pointer is ignored.
 *
 * The tail of the string is shifted with memmove() because source and
 * destination overlap (strcpy() is undefined for overlapping buffers), and
 * characters are converted to unsigned char before being handed to
 * isspace(), which is undefined for negative values.
 */
void remove_any_whitespace_to_the_left_or_right_of_at_symbol(char *name) {
	char *ptr;

	if (name == NULL) return;

	for (ptr = name; *ptr; ++ptr) {
		// Whitespace immediately before '@': delete it, then step back one
		// character so that a run of whitespace is consumed completely.
		while ( (isspace((unsigned char)*ptr)) && (*(ptr+1) == '@') ) {
			memmove(ptr, ptr+1, strlen(ptr+1) + 1);
			if (ptr > name) --ptr;
		}
		// Whitespace immediately after '@': delete it until none is left.
		while ( (*ptr == '@') && (*(ptr+1) != 0) && (isspace((unsigned char)*(ptr+1))) ) {
			memmove(ptr+1, ptr+2, strlen(ptr+2) + 1);
		}
	}
}
385 // values that can be returned by expand_aliases()
387 EA_ERROR, // Can't send message due to bad address
388 EA_MULTIPLE, // Alias expanded into multiple recipients -- run me again!
389 EA_LOCAL, // Local message, do no network processing
390 EA_INTERNET // Convert msg and send as Internet mail
394 // Process alias and routing info for email addresses
395 int expand_aliases(char *name, char *aliases) {
401 syslog(LOG_DEBUG, "internet_addressing: \x1b[34mexpand_aliases(%s)\x1b[0m", name);
403 int num_aliases = num_tokens(aliases, '\n');
404 for (a=0; a<num_aliases; ++a) {
405 extract_token(aaa, aliases, a, '\n', sizeof aaa);
406 char *bar = strchr(aaa, '|');
412 syslog(LOG_DEBUG, "\x1b[32malias #%d: compare <%s> to <%s>\x1b[0m", a, name, aaa);
413 if (!strcasecmp(name, aaa)) {
414 syslog(LOG_DEBUG, "internet_addressing: global alias <%s> to <%s>", name, bar);
419 if (strchr(name, ',')) {
424 char original_name[256]; // Now go for the regular aliases
425 safestrncpy(original_name, name, sizeof original_name);
427 // should these checks still be here, or maybe move them to split_recps() ?
429 remove_any_whitespace_to_the_left_or_right_of_at_symbol(name);
430 stripallbut(name, '<', '>');
432 /* Hit the email address directory */
433 if (CtdlDirectoryLookup(aaa, name, sizeof aaa) == 0) {
437 if (strcasecmp(original_name, name)) {
438 syslog(LOG_INFO, "internet_addressing: directory alias <%s> to <%s>", original_name, name);
441 /* Change "user @ xxx" to "user" if xxx is an alias for this host */
442 for (a=0; name[a] != '\0'; ++a) {
443 if (name[a] == '@') {
444 if (CtdlHostAlias(&name[a+1]) == hostalias_localhost) {
446 syslog(LOG_DEBUG, "internet_addressing: host is local, recipient is <%s>", name);
452 /* determine local or remote type, see citadel.h */
453 at = haschar(name, '@');
454 if (at == 0) return(EA_LOCAL); /* no @'s - local address */
455 if (at > 1) return(EA_ERROR); /* >1 @'s - invalid address */
456 remove_any_whitespace_to_the_left_or_right_of_at_symbol(name);
458 /* figure out the delivery mode */
459 extract_token(node, name, 1, '@', sizeof node);
461 /* If there are one or more dots in the nodename, we assume that it
462 * is an FQDN and will attempt SMTP delivery to the Internet.
464 if (haschar(node, '.') > 0) {
468 /* If we get to this point it's an invalid node name */
473 // Return a supplied list of email addresses as an array, removing superfluous information and syntax.
474 Array *split_recps(char *addresses) {
476 // Copy the supplied address list into our own memory space, because we are going to mangle it.
477 char *a = malloc(strlen(addresses));
479 syslog(LOG_ERR, "internet_addressing: malloc() failed: %m");
483 // Strip out anything in double quotes
488 for (t=addresses; t[0]; ++t) {
498 // Transform all qualifying delimiters to commas
499 for (t=a; t[0]; ++t) {
500 if ((t[0]==';') || (t[0]=='|')) {
505 // Tokenize the recipients into an array
506 Array *recipients_array = array_new(256); // no single recipient should be bigger than 256 bytes
508 int num_addresses = num_tokens(a, ',');
509 syslog(LOG_DEBUG, "\x1b[35mEXTRACING: %d addresses from <%s>\x1b[0m", num_addresses, a);
510 for (int i=0; i<num_addresses; ++i) {
511 char this_address[256];
512 extract_token(this_address, a, i, ',', sizeof this_address);
513 syslog(LOG_DEBUG, "\x1b[35mEXTRACTED: <%s>\x1b[0m", this_address);
514 striplt(this_address); // strip leading and trailing whitespace
515 stripout(this_address, '(', ')'); // remove any portion in parentheses
516 stripallbut(this_address, '<', '>'); // if angle brackets are present, keep only what is inside them
517 syslog(LOG_DEBUG, "\x1b[35mPROCESSED: <%s>\x1b[0m", this_address);
518 array_append(recipients_array, this_address);
521 free(a); // We don't need this buffer anymore.
522 return(recipients_array); // Return the completed array to the caller.
526 // Validate recipients, count delivery types and errors, and handle aliasing
527 // FIXME check for dupes!!!!!
529 // Returns 0 if all addresses are ok, ret->num_error = -1 if no addresses
530 // were specified, or the number of addresses found invalid.
532 // Caller needs to free the result using free_recipients()
534 struct recptypes *validate_recipients(char *supplied_recipients, const char *RemoteIdentifier, int Flags) {
535 struct recptypes *ret;
536 char *recipients = NULL;
541 struct ctdluser tempUS;
542 struct ctdlroom original_room;
548 syslog(LOG_DEBUG, "internet_addressing: \x1b[32mvalidate_recipients(%s) \x1b[0m", supplied_recipients);
550 ret = (struct recptypes *) malloc(sizeof(struct recptypes)); // Initialize
551 if (ret == NULL) return(NULL);
552 memset(ret, 0, sizeof(struct recptypes)); // set all values to null/zero
554 if (supplied_recipients == NULL) {
555 recipients = strdup("");
558 recipients = strdup(supplied_recipients);
561 len = strlen(recipients) + 1024; // allocate memory
562 ret->errormsg = malloc(len);
563 ret->recp_local = malloc(len);
564 ret->recp_internet = malloc(len);
565 ret->recp_room = malloc(len);
566 ret->display_recp = malloc(len);
567 ret->recp_orgroom = malloc(len);
569 ret->errormsg[0] = 0;
570 ret->recp_local[0] = 0;
571 ret->recp_internet[0] = 0;
572 ret->recp_room[0] = 0;
573 ret->recp_orgroom[0] = 0;
574 ret->display_recp[0] = 0;
575 ret->recptypes_magic = RECPTYPES_MAGIC;
577 //char *aliases = CtdlGetSysConfig(GLOBAL_ALIASES); // First hit the Global Alias Table
578 char *aliases = strdup("root|admin,ajc@citadel.org,artcancro@gmail.com\n abuse|admin\n ajc|ajc@citadel.org\n");
580 Array *recp_array = split_recps(supplied_recipients);
581 int original_array_len = array_len(recp_array);
582 syslog(LOG_DEBUG, "\x1b[32moriginal_array_len=%d\x1b[0m", original_array_len);
583 for (int r=0; r<array_len(recp_array); ++r) {
584 syslog(LOG_DEBUG, "\x1b[32m\x1b[7mrecipient #%d is %s \x1b[0m", r, (char *)array_get_element_at(recp_array, r) );
585 org_recp = (char *)array_get_element_at(recp_array, r);
586 strncpy(this_recp, org_recp, sizeof this_recp);
587 mailtype = expand_aliases(this_recp, aliases);
589 // If an alias expanded to multiple recipients, strip off those recipients and append them
590 // to the end of the array. This loop will hit those again when it gets there.
591 // Note that we don't do this after we get past the *original* array length, to avoid aliasing loops.
592 if (mailtype == EA_MULTIPLE) {
593 if (r < original_array_len) {
595 while ((comma = strrchr(this_recp, ','))) {
597 array_append(recp_array, &comma[1]);
598 strcpy(org_recp, this_recp);
606 mailtype = expand_aliases(this_recp, aliases); // do it ONCE again to handle alias expansions
607 if (mailtype == EA_MULTIPLE) {
608 mailtype = EA_ERROR; // and fail if it wants to expand a second time
614 case EA_LOCAL: // There are several types of "local" recipients.
616 // Old BBS conventions require mail to "sysop" to go somewhere. Send it to the admin room.
617 if (!strcasecmp(this_recp, "sysop")) {
619 strcpy(this_recp, CtdlGetConfigStr("c_aideroom"));
620 if (!IsEmptyStr(ret->recp_room)) {
621 strcat(ret->recp_room, "|");
623 strcat(ret->recp_room, this_recp);
626 // This handles rooms which can receive posts via email.
627 else if (!strncasecmp(this_recp, "room_", 5)) {
628 original_room = CC->room; // Remember where we parked
630 char mail_to_room[ROOMNAMELEN];
632 strncpy(mail_to_room, &this_recp[5], sizeof mail_to_room);
633 for (m = mail_to_room; *m; ++m) {
634 if (m[0] == '_') m[0]=' ';
636 if (!CtdlGetRoom(&CC->room, mail_to_room)) { // Find the room they asked for
638 err = CtdlDoIHavePermissionToPostInThisRoom( // check for write permissions to room
643 0 // 0 means "this is not a reply"
651 if (!IsEmptyStr(ret->recp_room)) {
652 strcat(ret->recp_room, "|");
654 strcat(ret->recp_room, &this_recp[5]);
656 if (!IsEmptyStr(ret->recp_orgroom)) {
657 strcat(ret->recp_orgroom, "|");
659 strcat(ret->recp_orgroom, org_recp);
663 else { // no such room exists
668 // Restore this session's original room location.
669 CC->room = original_room;
673 // This handles the most common case, which is mail to a user's inbox.
674 else if (CtdlGetUser(&tempUS, this_recp) == 0) {
676 strcpy(this_recp, tempUS.fullname);
677 if (!IsEmptyStr(ret->recp_local)) {
678 strcat(ret->recp_local, "|");
680 strcat(ret->recp_local, this_recp);
683 // No match for this recipient
690 // Yes, you're reading this correctly: if the target domain points back to the local system,
691 // the address is invalid. That's because if the address were valid, we would have
692 // already translated it to a local address by now.
693 if (IsDirectory(this_recp, 0)) {
699 if (!IsEmptyStr(ret->recp_internet)) {
700 strcat(ret->recp_internet, "|");
702 strcat(ret->recp_internet, this_recp);
711 if (IsEmptyStr(errmsg)) {
712 snprintf(append, sizeof append, "Invalid recipient: %s", this_recp);
715 snprintf(append, sizeof append, "%s", errmsg);
717 if ( (strlen(ret->errormsg) + strlen(append) + 3) < SIZ) {
718 if (!IsEmptyStr(ret->errormsg)) {
719 strcat(ret->errormsg, "; ");
721 strcat(ret->errormsg, append);
725 if (IsEmptyStr(ret->display_recp)) {
726 strcpy(append, this_recp);
729 snprintf(append, sizeof append, ", %s", this_recp);
731 if ( (strlen(ret->display_recp)+strlen(append)) < SIZ) {
732 strcat(ret->display_recp, append);
737 if (aliases != NULL) { // ok, we're done with the global alias list now
741 if ( (ret->num_local + ret->num_internet + ret->num_room + ret->num_error) == 0) {
742 ret->num_error = (-1);
743 strcpy(ret->errormsg, "No recipients specified.");
746 syslog(LOG_DEBUG, "internet_addressing: validate_recipients() = %d local, %d room, %d SMTP, %d error",
747 ret->num_local, ret->num_room, ret->num_internet, ret->num_error
751 array_free(recp_array);
758 * Destructor for recptypes
760 void free_recipients(struct recptypes *valid) {
766 if (valid->recptypes_magic != RECPTYPES_MAGIC) {
767 syslog(LOG_ERR, "internet_addressing: attempt to call free_recipients() on some other data type!");
771 if (valid->errormsg != NULL) free(valid->errormsg);
772 if (valid->recp_local != NULL) free(valid->recp_local);
773 if (valid->recp_internet != NULL) free(valid->recp_internet);
774 if (valid->recp_room != NULL) free(valid->recp_room);
775 if (valid->recp_orgroom != NULL) free(valid->recp_orgroom);
776 if (valid->display_recp != NULL) free(valid->display_recp);
777 if (valid->bounce_to != NULL) free(valid->bounce_to);
778 if (valid->envelope_from != NULL) free(valid->envelope_from);
779 if (valid->sending_room != NULL) free(valid->sending_room);
784 char *qp_encode_email_addrs(char *source) {
785 char *user, *node, *name;
786 const char headerStr[] = "=?UTF-8?Q?";
790 int need_to_encode = 0;
796 long nAddrPtrMax = 50;
801 if (source == NULL) return source;
802 if (IsEmptyStr(source)) return source;
803 syslog(LOG_DEBUG, "internet_addressing: qp_encode_email_addrs <%s>", source);
805 AddrPtr = malloc (sizeof (long) * nAddrPtrMax);
806 AddrUtf8 = malloc (sizeof (long) * nAddrPtrMax);
807 memset(AddrUtf8, 0, sizeof (long) * nAddrPtrMax);
810 while (!IsEmptyStr (&source[i])) {
811 if (nColons >= nAddrPtrMax){
814 ptr = (long *) malloc(sizeof (long) * nAddrPtrMax * 2);
815 memcpy (ptr, AddrPtr, sizeof (long) * nAddrPtrMax);
816 free (AddrPtr), AddrPtr = ptr;
818 ptr = (long *) malloc(sizeof (long) * nAddrPtrMax * 2);
819 memset(&ptr[nAddrPtrMax], 0, sizeof (long) * nAddrPtrMax);
821 memcpy (ptr, AddrUtf8, sizeof (long) * nAddrPtrMax);
822 free (AddrUtf8), AddrUtf8 = ptr;
825 if (((unsigned char) source[i] < 32) || ((unsigned char) source[i] > 126)) {
827 AddrUtf8[nColons] = 1;
829 if (source[i] == '"') {
830 InQuotes = !InQuotes;
832 if (!InQuotes && source[i] == ',') {
833 AddrPtr[nColons] = i;
838 if (need_to_encode == 0) {
845 EncodedMaxLen = nColons * (sizeof(headerStr) + 3) + SourceLen * 3;
846 Encoded = (char*) malloc (EncodedMaxLen);
848 for (i = 0; i < nColons; i++) {
849 source[AddrPtr[i]++] = '\0';
851 /* TODO: if libidn, this might get larger*/
852 user = malloc(SourceLen + 1);
853 node = malloc(SourceLen + 1);
854 name = malloc(SourceLen + 1);
858 for (i = 0; i < nColons && nPtr != NULL; i++) {
859 nmax = EncodedMaxLen - (nPtr - Encoded);
861 process_rfc822_addr(&source[AddrPtr[i]], user, node, name);
862 /* TODO: libIDN here ! */
863 if (IsEmptyStr(name)) {
864 n = snprintf(nPtr, nmax, (i==0)?"%s@%s" : ",%s@%s", user, node);
867 EncodedName = rfc2047encode(name, strlen(name));
868 n = snprintf(nPtr, nmax, (i==0)?"%s <%s@%s>" : ",%s <%s@%s>", EncodedName, user, node);
873 n = snprintf(nPtr, nmax, (i==0)?"%s" : ",%s", &source[AddrPtr[i]]);
879 ptr = (char*) malloc(EncodedMaxLen * 2);
880 memcpy(ptr, Encoded, EncodedMaxLen);
881 nnPtr = ptr + (nPtr - Encoded), nPtr = nnPtr;
882 free(Encoded), Encoded = ptr;
884 i--; /* do it once more with properly lengthened buffer */
887 for (i = 0; i < nColons; i++)
888 source[--AddrPtr[i]] = ',';
900 * Unfold a multi-line field into a single line, removing multi-whitespaces
902 void unfold_rfc822_field(char **field, char **FieldEnd)
905 char *pField = *field;
907 char *pFieldEnd = *FieldEnd;
909 while (isspace(*pField))
911 /* remove leading/trailing whitespace */
914 while (isspace(*pFieldEnd))
917 *FieldEnd = pFieldEnd;
918 /* convert non-space whitespace to spaces, and remove double blanks */
919 for (sField = *field = pField;
923 if ((*sField=='\r') || (*sField=='\n'))
926 while ( ( (*(sField + offset) == '\r') || (*(sField + offset) == '\n' )) && (sField + offset < pFieldEnd) ) {
933 if (*sField=='\"') quote = 1 - quote;
935 if (isspace(*sField)) {
940 while ((sField < pFieldEnd) &&
945 else *pField = *sField;
947 else *pField = *sField;
951 *FieldEnd = pField - 1;
956 * Split an RFC822-style address into userid, host, and full name
959 void process_rfc822_addr(const char *rfc822, char *user, char *node, char *name) {
963 strcpy(node, CtdlGetConfigStr("c_fqdn"));
966 if (rfc822 == NULL) return;
968 /* extract full name - first, it's From minus <userid> */
969 strcpy(name, rfc822);
970 stripout(name, '<', '>');
972 /* strip anything to the left of a bang */
973 while ((!IsEmptyStr(name)) && (haschar(name, '!') > 0))
974 strcpy(name, &name[1]);
976 /* and anything to the right of a @ or % */
977 for (a = 0; name[a] != '\0'; ++a) {
978 if (name[a] == '@') {
982 if (name[a] == '%') {
988 /* but if there are parentheses, that changes the rules... */
989 if ((haschar(rfc822, '(') == 1) && (haschar(rfc822, ')') == 1)) {
990 strcpy(name, rfc822);
991 stripallbut(name, '(', ')');
994 /* but if there are a set of quotes, that supersedes everything */
995 if (haschar(rfc822, 34) == 2) {
996 strcpy(name, rfc822);
997 while ((!IsEmptyStr(name)) && (name[0] != 34)) {
998 strcpy(&name[0], &name[1]);
1000 strcpy(&name[0], &name[1]);
1001 for (a = 0; name[a] != '\0'; ++a)
1002 if (name[a] == 34) {
1007 /* extract user id */
1008 strcpy(user, rfc822);
1010 /* first get rid of anything in parens */
1011 stripout(user, '(', ')');
1013 /* if there's a set of angle brackets, strip it down to that */
1014 if ((haschar(user, '<') == 1) && (haschar(user, '>') == 1)) {
1015 stripallbut(user, '<', '>');
1018 /* strip anything to the left of a bang */
1019 while ((!IsEmptyStr(user)) && (haschar(user, '!') > 0))
1020 strcpy(user, &user[1]);
1022 /* and anything to the right of a @ or % */
1023 for (a = 0; user[a] != '\0'; ++a) {
1024 if (user[a] == '@') {
1028 if (user[a] == '%') {
1035 /* extract node name */
1036 strcpy(node, rfc822);
1038 /* first get rid of anything in parens */
1039 stripout(node, '(', ')');
1041 /* if there's a set of angle brackets, strip it down to that */
1042 if ((haschar(node, '<') == 1) && (haschar(node, '>') == 1)) {
1043 stripallbut(node, '<', '>');
1046 /* If no node specified, tack ours on instead */
1048 (haschar(node, '@')==0)
1049 && (haschar(node, '%')==0)
1050 && (haschar(node, '!')==0)
1052 strcpy(node, CtdlGetConfigStr("c_nodename"));
1056 /* strip anything to the left of a @ */
1057 while ((!IsEmptyStr(node)) && (haschar(node, '@') > 0))
1058 strcpy(node, &node[1]);
1060 /* strip anything to the left of a % */
1061 while ((!IsEmptyStr(node)) && (haschar(node, '%') > 0))
1062 strcpy(node, &node[1]);
1064 /* reduce multiple system bang paths to node!user */
1065 while ((!IsEmptyStr(node)) && (haschar(node, '!') > 1))
1066 strcpy(node, &node[1]);
1068 /* now get rid of the user portion of a node!user string */
1069 for (a = 0; node[a] != '\0'; ++a)
1070 if (node[a] == '!') {
1076 /* strip leading and trailing spaces in all strings */
1081 /* If we processed a string that had the address in angle brackets
1082 * but no name outside the brackets, we now have an empty name. In
1083 * this case, use the user portion of the address as the name.
1085 if ((IsEmptyStr(name)) && (!IsEmptyStr(user))) {
1092 * convert_field() is a helper function for convert_internet_message().
1093 * Given start/end positions for an rfc822 field, it converts it to a Citadel
1094 * field if it wants to, and unfolds it if necessary.
1096 * Returns 1 if the field was converted and inserted into the Citadel message
1097 * structure, implying that the source field should be removed from the
1100 int convert_field(struct CtdlMessage *msg, const char *beg, const char *end) {
1101 char *key, *value, *valueend;
1105 const char *colonpos = NULL;
1114 for (pos = end; pos >= beg; pos--) {
1115 if (*pos == ':') colonpos = pos;
1118 if (colonpos == NULL) return(0); /* no colon? not a valid header line */
1121 key = malloc(len + 2);
1122 memcpy(key, beg, len + 1);
1124 valueend = key + len;
1125 * ( key + (colonpos - beg) ) = '\0';
1126 value = &key[(colonpos - beg) + 1];
1127 /* printf("Header: [%s]\nValue: [%s]\n", key, value); */
1128 unfold_rfc822_field(&value, &valueend);
1129 valuelen = valueend - value + 1;
1130 /* printf("UnfoldedValue: [%s]\n", value); */
1133 * Here's the big rfc822-to-citadel loop.
1136 /* Date/time is converted into a unix timestamp. If the conversion
1137 * fails, we replace it with the time the message arrived locally.
1139 if (!strcasecmp(key, "Date")) {
1140 parsed_date = parsedate(value);
1141 if (parsed_date < 0L) parsed_date = time(NULL);
1143 if (CM_IsEmpty(msg, eTimestamp))
1144 CM_SetFieldLONG(msg, eTimestamp, parsed_date);
1148 else if (!strcasecmp(key, "From")) {
1149 process_rfc822_addr(value, user, node, name);
1150 syslog(LOG_DEBUG, "internet_addressing: converted to <%s@%s> (%s)", user, node, name);
1151 snprintf(addr, sizeof(addr), "%s@%s", user, node);
1152 if (CM_IsEmpty(msg, eAuthor) && !IsEmptyStr(name)) {
1153 CM_SetField(msg, eAuthor, name, -1);
1155 if (CM_IsEmpty(msg, erFc822Addr) && !IsEmptyStr(addr)) {
1156 CM_SetField(msg, erFc822Addr, addr, -1);
1161 else if (!strcasecmp(key, "Subject")) {
1162 if (CM_IsEmpty(msg, eMsgSubject))
1163 CM_SetField(msg, eMsgSubject, value, valuelen);
1167 else if (!strcasecmp(key, "List-ID")) {
1168 if (CM_IsEmpty(msg, eListID))
1169 CM_SetField(msg, eListID, value, valuelen);
1173 else if (!strcasecmp(key, "To")) {
1174 if (CM_IsEmpty(msg, eRecipient))
1175 CM_SetField(msg, eRecipient, value, valuelen);
1179 else if (!strcasecmp(key, "CC")) {
1180 if (CM_IsEmpty(msg, eCarbonCopY))
1181 CM_SetField(msg, eCarbonCopY, value, valuelen);
1185 else if (!strcasecmp(key, "Message-ID")) {
1186 if (!CM_IsEmpty(msg, emessageId)) {
1187 syslog(LOG_WARNING, "internet_addressing: duplicate message id");
1194 pValueLen = valuelen;
1195 /* Strip angle brackets */
1196 while (haschar(pValue, '<') > 0) {
1201 for (i = 0; i <= pValueLen; ++i)
1202 if (pValue[i] == '>') {
1207 CM_SetField(msg, emessageId, pValue, pValueLen);
1213 else if (!strcasecmp(key, "Return-Path")) {
1214 if (CM_IsEmpty(msg, eMessagePath))
1215 CM_SetField(msg, eMessagePath, value, valuelen);
1219 else if (!strcasecmp(key, "Envelope-To")) {
1220 if (CM_IsEmpty(msg, eenVelopeTo))
1221 CM_SetField(msg, eenVelopeTo, value, valuelen);
1225 else if (!strcasecmp(key, "References")) {
1226 CM_SetField(msg, eWeferences, value, valuelen);
1230 else if (!strcasecmp(key, "Reply-To")) {
1231 CM_SetField(msg, eReplyTo, value, valuelen);
1235 else if (!strcasecmp(key, "In-reply-to")) {
1236 if (CM_IsEmpty(msg, eWeferences)) /* References: supersedes In-reply-to: */
1237 CM_SetField(msg, eWeferences, value, valuelen);
1243 /* Clean up and move on. */
1244 free(key); /* Don't free 'value', it's actually the same buffer */
1250 * Convert RFC822 references format (References) to Citadel references format (Weferences)
1252 void convert_references_to_wefewences(char *str) {
1253 int bracket_nesting = 0;
1255 char *moveptr = NULL;
1262 if (bracket_nesting < 0) bracket_nesting = 0;
1264 if ((ch == '>') && (bracket_nesting == 0) && (*(ptr+1)) && (ptr>str) ) {
1268 else if (bracket_nesting > 0) {
1274 *moveptr = *(moveptr+1);
1278 if (ch == '<') ++bracket_nesting;
1285 * Convert an RFC822 message (headers + body) to a CtdlMessage structure.
1286 * NOTE: the supplied buffer becomes part of the CtdlMessage structure, and
1287 * will be deallocated when CM_Free() is called. Therefore, the
1288 * supplied buffer should be DEREFERENCED. It should not be freed or used
1291 struct CtdlMessage *convert_internet_message(char *rfc822) {
1292 StrBuf *RFCBuf = NewStrBufPlain(rfc822, -1);
1294 return convert_internet_message_buf(&RFCBuf);
1298 struct CtdlMessage *convert_internet_message_buf(StrBuf **rfc822)
1300 struct CtdlMessage *msg;
1301 const char *pos, *beg, *end, *totalend;
1302 int done, alldone = 0;
1304 StrBuf *OtherHeaders;
1306 msg = malloc(sizeof(struct CtdlMessage));
1307 if (msg == NULL) return msg;
1309 memset(msg, 0, sizeof(struct CtdlMessage));
1310 msg->cm_magic = CTDLMESSAGE_MAGIC; /* self check */
1311 msg->cm_anon_type = 0; /* never anonymous */
1312 msg->cm_format_type = FMT_RFC822; /* internet message */
1314 pos = ChrPtr(*rfc822);
1315 totalend = pos + StrLength(*rfc822);
1317 OtherHeaders = NewStrBufPlain(NULL, StrLength(*rfc822));
1321 /* Locate beginning and end of field, keeping in mind that
1322 * some fields might be multiline
1326 while ((end < totalend) &&
1331 if ( (*pos=='\n') && ((*(pos+1))!=0x20) && ((*(pos+1))!=0x09) )
1336 /* done with headers? */
1338 ( (*(pos+1)=='\n') ||
1344 if (pos >= (totalend - 1) )
1354 /* At this point we have a field. Are we interested in it? */
1355 converted = convert_field(msg, beg, end);
1357 /* Strip the field out of the RFC822 header if we used it */
1359 StrBufAppendBufPlain(OtherHeaders, beg, end - beg, 0);
1360 StrBufAppendBufPlain(OtherHeaders, HKEY("\n"), 0);
1363 /* If we've hit the end of the message, bail out */
1364 if (pos >= totalend)
1367 StrBufAppendBufPlain(OtherHeaders, HKEY("\n"), 0);
1369 StrBufAppendBufPlain(OtherHeaders, pos, totalend - pos, 0);
1371 CM_SetAsFieldSB(msg, eMesageText, &OtherHeaders);
1373 /* Follow-up sanity checks... */
1375 /* If there's no timestamp on this message, set it to now. */
1376 if (CM_IsEmpty(msg, eTimestamp)) {
1377 CM_SetFieldLONG(msg, eTimestamp, time(NULL));
1380 /* If a W (references, or rather, Wefewences) field is present, we
1381 * have to convert it from RFC822 format to Citadel format.
1383 if (!CM_IsEmpty(msg, eWeferences)) {
1385 convert_references_to_wefewences(msg->cm_fields[eWeferences]);
1393 * Look for a particular header field in an RFC822 message text. If the
1394 * requested field is found, it is unfolded (if necessary) and returned to
1395 * the caller. The field name is stripped out, leaving only its contents.
1396 * The caller is responsible for freeing the returned buffer. If the requested
1397 * field is not present, or anything else goes wrong, it returns NULL.
1399 char *rfc822_fetch_field(const char *rfc822, const char *fieldname) {
1400 char *fieldbuf = NULL;
1401 const char *end_of_headers;
1402 const char *field_start;
1407 /* Should never happen, but sometimes we get stupid */
1408 if (rfc822 == NULL) return(NULL);
1409 if (fieldname == NULL) return(NULL);
1411 snprintf(fieldhdr, sizeof fieldhdr, "%s:", fieldname);
1413 /* Locate the end of the headers, so we don't run past that point */
1414 end_of_headers = cbmstrcasestr(rfc822, "\n\r\n");
1415 if (end_of_headers == NULL) {
1416 end_of_headers = cbmstrcasestr(rfc822, "\n\n");
1418 if (end_of_headers == NULL) return (NULL);
1420 field_start = cbmstrcasestr(rfc822, fieldhdr);
1421 if (field_start == NULL) return(NULL);
1422 if (field_start > end_of_headers) return(NULL);
1424 fieldbuf = malloc(SIZ);
1425 strcpy(fieldbuf, "");
1428 ptr = cmemreadline(ptr, fieldbuf, SIZ-strlen(fieldbuf) );
1429 while ( (isspace(ptr[0])) && (ptr < end_of_headers) ) {
1430 strcat(fieldbuf, " ");
1431 cont = &fieldbuf[strlen(fieldbuf)];
1432 ptr = cmemreadline(ptr, cont, SIZ-strlen(fieldbuf) );
1436 strcpy(fieldbuf, &fieldbuf[strlen(fieldhdr)]);
1443 /*****************************************************************************
1444 * DIRECTORY MANAGEMENT FUNCTIONS *
1445 *****************************************************************************/
/*
 * Generate the index key for an Internet e-mail address to be looked up
 * in the directory.
 *
 * The key is the address with every whitespace character removed and every
 * remaining character converted to lower case.
 *
 * key		output buffer; receives a NUL-terminated string.  The caller
 *		must provide at least strlen(addr)+1 bytes, because this
 *		interface carries no buffer length.
 * addr		NUL-terminated address to convert (not modified)
 */
void directory_key(char *key, char *addr) {
	int i;
	int keylen = 0;

	for (i = 0; addr[i] != '\0'; ++i) {
		/* <ctype.h> functions require a value representable as unsigned char */
		unsigned char ch = (unsigned char) addr[i];

		if (!isspace(ch)) {
			key[keylen++] = (char) tolower(ch);
		}
	}
	key[keylen] = 0;

	syslog(LOG_DEBUG, "internet_addressing: directory key is <%s>", key);
}
1467 * Return nonzero if the supplied address is in one of "our" domains
1469 int IsDirectory(char *addr, int allow_masq_domains) {
1473 extract_token(domain, addr, 1, '@', sizeof domain);
1476 h = CtdlHostAlias(domain);
1478 if ( (h == hostalias_masq) && allow_masq_domains)
1481 if (h == hostalias_localhost) {
1491 * Add an Internet e-mail address to the directory for a user
1493 int CtdlDirectoryAddUser(char *internet_addr, char *citadel_addr) {
1496 if (IsDirectory(internet_addr, 0) == 0) {
1499 syslog(LOG_DEBUG, "internet_addressing: create directory entry: %s --> %s", internet_addr, citadel_addr);
1500 directory_key(key, internet_addr);
1501 cdb_store(CDB_DIRECTORY, key, strlen(key), citadel_addr, strlen(citadel_addr)+1 );
1507 * Delete an Internet e-mail address from the directory.
1509 * (NOTE: we don't actually use or need the citadel_addr variable; it's merely
1510 * here because the callback API expects to be able to send it.)
1512 int CtdlDirectoryDelUser(char *internet_addr, char *citadel_addr) {
1515 syslog(LOG_DEBUG, "internet_addressing: delete directory entry: %s --> %s", internet_addr, citadel_addr);
1516 directory_key(key, internet_addr);
1517 return cdb_delete(CDB_DIRECTORY, key, strlen(key) ) == 0;
1522 * Look up an Internet e-mail address in the directory.
1523 * On success: returns 0, and Citadel address stored in 'target'
1524 * On failure: returns nonzero
1526 int CtdlDirectoryLookup(char *target, char *internet_addr, size_t targbuflen) {
1527 struct cdbdata *cdbrec;
1530 /* Dump it in there unchanged, just for kicks */
1531 if (target != NULL) {
1532 safestrncpy(target, internet_addr, targbuflen);
1535 /* Only do lookups for addresses with hostnames in them */
1536 if (num_tokens(internet_addr, '@') != 2) return(-1);
1538 /* Only do lookups for domains in the directory */
1539 if (IsDirectory(internet_addr, 0) == 0) return(-1);
1541 directory_key(key, internet_addr);
1542 cdbrec = cdb_fetch(CDB_DIRECTORY, key, strlen(key) );
1543 if (cdbrec != NULL) {
1544 if (target != NULL) {
1545 safestrncpy(target, cdbrec->ptr, targbuflen);
1556 * Harvest any email addresses that someone might want to have in their
1557 * "collected addresses" book.
1559 char *harvest_collected_addresses(struct CtdlMessage *msg) {
1562 char user[256], node[256], name[256];
1565 eMsgField field = 0;
1567 if (msg == NULL) return(NULL);
1571 if (!CM_IsEmpty(msg, eAuthor)) {
1572 strcat(addr, msg->cm_fields[eAuthor]);
1574 if (!CM_IsEmpty(msg, erFc822Addr)) {
1576 strcat(addr, msg->cm_fields[erFc822Addr]);
1578 if (IsDirectory(msg->cm_fields[erFc822Addr], 0)) {
1583 if (is_harvestable) {
1584 coll = strdup(addr);
1590 if (coll == NULL) return(NULL);
1592 /* Scan both the R (To) and Y (CC) fields */
1593 for (i = 0; i < 2; ++i) {
1594 if (i == 0) field = eRecipient;
1595 if (i == 1) field = eCarbonCopY;
1597 if (!CM_IsEmpty(msg, field)) {
1598 for (j=0; j<num_tokens(msg->cm_fields[field], ','); ++j) {
1599 extract_token(addr, msg->cm_fields[field], j, ',', sizeof addr);
1600 if (strstr(addr, "=?") != NULL)
1601 utf8ify_rfc822_string(addr);
1602 process_rfc822_addr(addr, user, node, name);
1603 h = CtdlHostAlias(node);
1604 if (h != hostalias_localhost) {
1605 coll = realloc(coll, strlen(coll) + strlen(addr) + 4);
1606 if (coll == NULL) return(NULL);
1607 if (!IsEmptyStr(coll)) {
1617 if (IsEmptyStr(coll)) {
1626 * Helper function for CtdlRebuildDirectoryIndex()
1628 void CtdlRebuildDirectoryIndex_backend(char *username, void *data) {
1631 struct ctdluser usbuf;
1633 if (CtdlGetUser(&usbuf, username) != 0) {
1637 if ( (!IsEmptyStr(usbuf.fullname)) && (!IsEmptyStr(usbuf.emailaddrs)) ) {
1638 for (j=0; j<num_tokens(usbuf.emailaddrs, '|'); ++j) {
1639 char one_email[512];
1640 extract_token(one_email, usbuf.emailaddrs, j, '|', sizeof one_email);
1641 CtdlDirectoryAddUser(one_email, usbuf.fullname);
1648 * Initialize the directory database (erasing anything already there)
1650 void CtdlRebuildDirectoryIndex(void) {
1651 syslog(LOG_INFO, "internet_addressing: rebuilding email address directory index");
1652 cdb_trunc(CDB_DIRECTORY);
1653 ForEachUser(CtdlRebuildDirectoryIndex_backend, NULL);
1658 * Configure Internet email addresses for a user account, updating the Directory Index in the process
1660 void CtdlSetEmailAddressesForUser(char *requested_user, char *new_emailaddrs)
1662 struct ctdluser usbuf;
1666 if (CtdlGetUserLock(&usbuf, requested_user) != 0) { // We are relying on the fact that the DirectoryIndex functions don't lock.
1667 return; // Silently fail here if we can't acquire a lock on the user record.
1670 syslog(LOG_DEBUG, "internet_addressing: setting email addresses for <%s> to <%s>", usbuf.fullname, new_emailaddrs);
1672 /* Delete all of the existing directory index records for the user (easier this way) */
1673 for (i=0; i<num_tokens(usbuf.emailaddrs, '|'); ++i) {
1674 extract_token(buf, usbuf.emailaddrs, i, '|', sizeof buf);
1675 CtdlDirectoryDelUser(buf, requested_user);
1678 strcpy(usbuf.emailaddrs, new_emailaddrs); // make it official.
1680 /* Index all of the new email addresses (they've already been sanitized) */
1681 for (i=0; i<num_tokens(usbuf.emailaddrs, '|'); ++i) {
1682 extract_token(buf, usbuf.emailaddrs, i, '|', sizeof buf);
1683 CtdlDirectoryAddUser(buf, requested_user);
1686 CtdlPutUserLock(&usbuf);
1691 * Auto-generate an Internet email address for a user account
1693 void AutoGenerateEmailAddressForUser(struct ctdluser *user)
1695 char synthetic_email_addr[1024];
1699 for (i=0; u==0; ++i) {
1701 // first try just converting the user name to lowercase and replacing spaces with underscores
1702 snprintf(synthetic_email_addr, sizeof synthetic_email_addr, "%s@%s", user->fullname, CtdlGetConfigStr("c_fqdn"));
1703 for (j=0; ((synthetic_email_addr[j] != '\0')&&(synthetic_email_addr[j] != '@')); j++) {
1704 synthetic_email_addr[j] = tolower(synthetic_email_addr[j]);
1705 if (!isalnum(synthetic_email_addr[j])) {
1706 synthetic_email_addr[j] = '_';
1711 // then try 'ctdl' followed by the user number
1712 snprintf(synthetic_email_addr, sizeof synthetic_email_addr, "ctdl%08lx@%s", user->usernum, CtdlGetConfigStr("c_fqdn"));
1715 // oof. just keep trying other numbers until we find one
1716 snprintf(synthetic_email_addr, sizeof synthetic_email_addr, "ctdl%08x@%s", i, CtdlGetConfigStr("c_fqdn"));
1718 u = CtdlDirectoryLookup(NULL, synthetic_email_addr, 0);
1719 syslog(LOG_DEBUG, "user_ops: address <%s> lookup returned <%d>", synthetic_email_addr, u);
1722 CtdlSetEmailAddressesForUser(user->fullname, synthetic_email_addr);
1723 strncpy(CC->user.emailaddrs, synthetic_email_addr, sizeof(user->emailaddrs));
1724 syslog(LOG_DEBUG, "user_ops: auto-generated email address <%s> for <%s>", synthetic_email_addr, user->fullname);