removed some debugs
[citadel.git] / citadel / internet_addressing.c
1 // This file contains functions which handle the mapping of Internet addresses
2 // to users on the Citadel system.
3 //
4 // Copyright (c) 1987-2022 by the citadel.org team
5 //
6 // This program is open source software; you can redistribute it and/or modify
7 // it under the terms of the GNU General Public License version 3.
8 //
9 // This program is distributed in the hope that it will be useful,
10 // but WITHOUT ANY WARRANTY; without even the implied warranty of
11 // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12 // GNU General Public License for more details.
13
14 #include "sysdep.h"
15 #include <stdlib.h>
16 #include <unistd.h>
17 #include <stdio.h>
18 #include <fcntl.h>
19 #include <ctype.h>
20 #include <signal.h>
21 #include <pwd.h>
22 #include <errno.h>
23 #include <sys/types.h>
24 #include <time.h>
25 #include <sys/wait.h>
26 #include <string.h>
27 #include <limits.h>
28 #include <libcitadel.h>
29 #include "citadel.h"
30 #include "server.h"
31 #include "sysdep_decls.h"
32 #include "citserver.h"
33 #include "support.h"
34 #include "config.h"
35 #include "msgbase.h"
36 #include "internet_addressing.h"
37 #include "user_ops.h"
38 #include "room_ops.h"
39 #include "parsedate.h"
40 #include "database.h"
41 #include "ctdl_module.h"
42 #ifdef HAVE_ICONV
43 #include <iconv.h>
44
// Reference (non-macro) implementation of FindNextEnd(), kept disabled for debugging.
// Returns a pointer to the "?=" which terminates the RFC2047 encoded-word starting
// at bptr (which must point at its leading "=?"), or NULL if no terminator exists.
#if 0
static inline char *FindNextEndDebug(char *bptr)
{
	/* Find the '?' which separates the charset from the encoding letter */
	char *end = strchr(bptr + 2, '?');
	if (end == NULL) return NULL;
	if (((*(end + 1) == 'B') || (*(end + 1) == 'b') || (*(end + 1) == 'Q') || (*(end + 1) == 'q'))
	    && (*(end + 2) == '?')) {
		/* skip on to the end of the cluster, the next ?= */
		return strstr(end + 3, "?=");
	}
	/* sort of half valid encoding, try to find an end. */
	return strstr(bptr, "?=");
}
#endif

// FindNextEnd(bptr, end)
//
// bptr must point at the "=?" which opens an RFC2047 encoded-word.  On completion, end
// (which must be an assignable char pointer) points at the "?=" which closes that word,
// or is NULL if none was found.  The search for the terminator starts after the
// "?B?" / "?Q?" marker, so that encoded text which itself begins with '=' (as in
// "=?utf-8?Q?=41?=") is not mistaken for the terminator.  The encoding letter is
// accepted in either case.
//
// Every argument is parenthesized so that expressions (for example a ?: expression)
// may be passed safely.  Note that bptr is evaluated more than once, so it must not
// have side effects.  The do/while(0) wrapper makes the macro behave as one statement.
#define FindNextEnd(bptr, end) do { \
	(end) = strchr((bptr) + 2, '?'); \
	if ((end) != NULL) { \
		if ( ((*((end) + 1) == 'B') || (*((end) + 1) == 'b') || \
		      (*((end) + 1) == 'Q') || (*((end) + 1) == 'q')) \
		     && (*((end) + 2) == '?') ) { \
			(end) = strstr((end) + 3, "?="); \
		} \
		else { \
			(end) = strstr((bptr), "?="); \
		} \
	} \
} while (0)
71
// Convert an RFC822 header value to UTF-8, in place.  Handles subjects with RFC2047
// encoding such as:
// =?koi8-r?B?78bP0s3Mxc7JxSDXz9rE1dvO2c3JINvB0sHNySDP?=
//
// The work is done in three stages:
//  1. If the string contains any byte outside printable ASCII, it is assumed to have
//     been written directly in the default header charset and is converted to UTF-8.
//  2. Whitespace which separates two adjacent encoded-words is removed.
//  3. Each encoded-word is decoded (base64 or quoted-printable), converted from its
//     declared charset to UTF-8, and substituted into the string.  A word whose charset
//     cannot be converted is replaced with "(unreadable)".
//
// NOTE(review): the result is written back into buf with no knowledge of its capacity,
// and converted text can be longer than the encoded form.  Callers presumably supply a
// buffer with ample headroom -- confirm against the call sites.
void utf8ify_rfc822_string(char *buf) {
	enum { RFC2047_BUF = 1024 };	// size of every scratch buffer used below

	char *start, *end, *next, *nextend, *ptr;
	char newbuf[RFC2047_BUF];
	char charset[128];
	char encoding[16];
	char istr[RFC2047_BUF];
	iconv_t ic = (iconv_t)(-1);
	char *ibuf;			// Buffer of characters to be converted
	char *obuf;			// Buffer for converted characters
	size_t ibuflen;			// Length of input buffer
	size_t obuflen;			// Length of output buffer
	char *isav;			// Saved pointer to input buffer
	char *osav;			// Saved pointer to output buffer
	int passes = 0;
	int i, len, delta;
	int illegal_non_rfc2047_encoding = 0;

	// Sometimes, badly formed messages contain strings which were simply
	// written out directly in some foreign character set instead of
	// using RFC2047 encoding.  This is illegal but we will attempt to
	// handle it anyway by converting from a default charset to UTF-8
	// if we see any nonprintable characters.
	len = strlen(buf);
	for (i=0; i<len; ++i) {
		if ((buf[i] < 32) || (buf[i] > 126)) {
			illegal_non_rfc2047_encoding = 1;
			break;			// one is enough
		}
	}
	if (illegal_non_rfc2047_encoding) {
		const char *default_header_charset = "iso-8859-1";
		if ( (strcasecmp(default_header_charset, "UTF-8")) && (strcasecmp(default_header_charset, "us-ascii")) ) {
			ctdl_iconv_open("UTF-8", default_header_charset, &ic);
			if (ic != (iconv_t)(-1) ) {
				isav = malloc(RFC2047_BUF);
				osav = malloc(RFC2047_BUF);
				if ((isav != NULL) && (osav != NULL)) {
					ibuf = isav;
					safestrncpy(ibuf, buf, RFC2047_BUF);
					ibuflen = strlen(ibuf);
					obuf = osav;
					obuflen = RFC2047_BUF - 1;	// keep one byte back for the terminator
					iconv(ic, &ibuf, &ibuflen, &obuf, &obuflen);
					osav[(RFC2047_BUF - 1) - obuflen] = 0;
					strcpy(buf, osav);
				}
				free(osav);
				free(isav);
				iconv_close(ic);
			}
		}
	}

	// Remove whitespace-only gaps between consecutive encoded-words.
	// Pre evaluate the first pair.
	nextend = end = NULL;
	len = strlen(buf);
	start = strstr(buf, "=?");
	if (start != NULL) {
		FindNextEnd(start, end);
	}

	while ((start != NULL) && (end != NULL)) {
		nextend = NULL;
		next = strstr(end, "=?");
		if (next != NULL) {
			FindNextEnd(next, nextend);
		}
		if (nextend == NULL) {
			next = NULL;
		}

		// did we find two partitions
		if ((next != NULL) && ((next - end) > 2)) {
			ptr = end + 2;
			while ((ptr < next) && isspace((unsigned char)*ptr)) {
				ptr++;
			}
			// did we find a gap just filled with blanks?
			if (ptr == next) {
				delta = (next - end) - 2;

				// Close the gap.  Everything from "next" through the terminating
				// null (which lives at buf + len) slides down by delta bytes.
				memmove(end + 2, next, (size_t)((buf + len) - next) + 1);
				len -= delta;

				// move next to its new location.
				next -= delta;
				nextend -= delta;
			}
		}
		// our next-pair is our new first pair now.
		start = next;
		end = nextend;
	}

	// Now we handle foreign character sets properly encoded in RFC2047 format.
	// FindNextEnd() is only invoked when an opening "=?" exists, because it looks
	// two bytes beyond the pointer it is given.
	start = strstr(buf, "=?");
	end = NULL;
	if (start != NULL) {
		FindNextEnd(start, end);
	}
	while ((start != NULL) && (end != NULL) && (end > start)) {
		extract_token(charset, start, 1, '?', sizeof charset);
		extract_token(encoding, start, 2, '?', sizeof encoding);
		extract_token(istr, start, 3, '?', sizeof istr);

		isav = malloc(RFC2047_BUF);
		if (isav == NULL) {
			return;					// out of memory; leave the rest untouched
		}
		ibuf = isav;
		if (!strcasecmp(encoding, "B")) {		// base64
			ibuflen = CtdlDecodeBase64(ibuf, istr, strlen(istr));
		}
		else if (!strcasecmp(encoding, "Q")) {		// quoted-printable
			size_t qlen = strlen(istr);
			size_t pos;

			for (pos = 0; pos < qlen; ++pos) {	// in a header, '_' stands for a space
				if (istr[pos] == '_') {
					istr[pos] = ' ';
				}
			}
			ibuflen = CtdlDecodeQuotedPrintable(ibuf, istr, qlen);
		}
		else {
			strcpy(ibuf, istr);			// unknown encoding
			ibuflen = strlen(istr);
		}

		// Convert the decoded bytes to UTF-8.  osav stays NULL if the charset is unusable.
		osav = NULL;
		ctdl_iconv_open("UTF-8", charset, &ic);
		if (ic != (iconv_t)(-1) ) {
			osav = malloc(RFC2047_BUF);
			if (osav == NULL) {
				iconv_close(ic);
				free(isav);
				return;				// out of memory; leave the rest untouched
			}
			obuf = osav;
			obuflen = RFC2047_BUF - 1;		// keep one byte back for the terminator
			iconv(ic, &ibuf, &ibuflen, &obuf, &obuflen);
			osav[(RFC2047_BUF - 1) - obuflen] = 0;
			iconv_close(ic);
		}

		// Split the string at the encoded-word: buf now ends where the word began,
		// and "end" is whittled down to whatever followed the closing "?=".
		*start = '\0';
		end = start + 1;
		remove_token(end, 0, '?');
		remove_token(end, 0, '?');
		remove_token(end, 0, '?');
		remove_token(end, 0, '?');
		if (*end != '\0') {				// drop the '=' of the closing "?="
			memmove(end, end + 1, strlen(end + 1) + 1);
		}

		snprintf(newbuf, sizeof newbuf, "%s%s%s", buf, ((osav != NULL) ? osav : "(unreadable)"), end);
		strcpy(buf, newbuf);

		free(osav);
		free(isav);

		// Since spammers will go to all sorts of absurd lengths to get their
		// messages through, there are LOTS of corrupt headers out there.
		// So, prevent a really badly formed RFC2047 header from throwing
		// this function into an infinite loop.
		++passes;
		if (passes > 20) return;

		start = strstr(buf, "=?");
		end = NULL;
		if (start != NULL) {
			FindNextEnd(start, end);
		}
	}

}
247 #else
// Built without iconv: no character set conversion is available, so the string is left as it is.
// This is an ordinary external definition (not a bare "inline" one) so that callers in
// other translation units always have something to link against.
void utf8ify_rfc822_string(char *a) {
	(void)a;
}
249
250 #endif
251
252
253 char *inetcfg = NULL;
254
255 // Return nonzero if the supplied name is an alias for this host.
256 int CtdlHostAlias(char *fqdn) {
257         int config_lines;
258         int i;
259         char buf[256];
260         char host[256], type[256];
261         int found = 0;
262
263         if (fqdn == NULL)                                       return(hostalias_nomatch);
264         if (IsEmptyStr(fqdn))                                   return(hostalias_nomatch);
265         if (!strcasecmp(fqdn, "localhost"))                     return(hostalias_localhost);
266         if (!strcasecmp(fqdn, CtdlGetConfigStr("c_fqdn")))      return(hostalias_localhost);
267         if (!strcasecmp(fqdn, CtdlGetConfigStr("c_nodename")))  return(hostalias_localhost);
268         if (inetcfg == NULL)                                    return(hostalias_nomatch);
269
270         config_lines = num_tokens(inetcfg, '\n');
271         for (i=0; i<config_lines; ++i) {
272                 extract_token(buf, inetcfg, i, '\n', sizeof buf);
273                 extract_token(host, buf, 0, '|', sizeof host);
274                 extract_token(type, buf, 1, '|', sizeof type);
275
276                 found = 0;
277
278                 // Process these in a specific order, in case there are multiple matches.
279                 // We want localhost to override masq, for example.
280
281                 if ( (!strcasecmp(type, "masqdomain")) && (!strcasecmp(fqdn, host))) {
282                         found = hostalias_masq;
283                 }
284
285                 if ( (!strcasecmp(type, "localhost")) && (!strcasecmp(fqdn, host))) {
286                         found = hostalias_localhost;
287                 }
288
289                 // "directory" used to be a distributed version of "localhost" but they're both the same now
290                 if ( (!strcasecmp(type, "directory")) && (!strcasecmp(fqdn, host))) {
291                         found = hostalias_localhost;
292                 }
293
294                 if (found) return(found);
295         }
296         return(hostalias_nomatch);
297 }
298
299
300 // Determine whether a given Internet address belongs to the current user
301 int CtdlIsMe(char *addr, int addr_buf_len) {
302         struct recptypes *recp;
303         int i;
304
305         recp = validate_recipients(addr, NULL, 0);
306         if (recp == NULL) return(0);
307
308         if (recp->num_local == 0) {
309                 free_recipients(recp);
310                 return(0);
311         }
312
313         for (i=0; i<recp->num_local; ++i) {
314                 extract_token(addr, recp->recp_local, i, '|', addr_buf_len);
315                 if (!strcasecmp(addr, CC->user.fullname)) {
316                         free_recipients(recp);
317                         return(1);
318                 }
319         }
320
321         free_recipients(recp);
322         return(0);
323 }
324
325
// A long, comma-separated recipient list may have been chopped in the middle of its
// final address.  Library functions choke on such a fragment, so drop it entirely.
//
// Nothing is changed unless the list contains a comma and is at least 900 bytes long.
// A list longer than 998 bytes is first cut to 998 bytes.  The final item is then kept
// only if it contains a '<' followed later by a '>'; otherwise the string is ended at
// the last comma.
void sanitize_truncated_recipient(char *str) {
	if (str == NULL) {
		return;
	}
	if (strchr(str, ',') == NULL) {			// a single recipient is left alone
		return;
	}

	int length = strlen(str);
	if (length < 900) {
		return;
	}
	if (length > 998) {
		str[998] = '\0';
	}

	char *last_comma = strrchr(str, ',');
	if (last_comma == NULL) {			// the only comma was beyond the cut
		return;
	}

	char *opening = strchr(last_comma, '<');
	char *closing = strchr(last_comma, '>');
	int looks_complete = ((opening != NULL) && (closing != NULL) && (closing > opening));

	if (!looks_complete) {
		*last_comma = '\0';
	}
}
346
347
// This function is self explanatory.
// (What can I say, I'm in a weird mood today...)
//
// For the record: every run of whitespace which touches an '@' on either side is
// deleted from name, in place, so that "user @ host" becomes "user@host".  Whitespace
// elsewhere in the string is left alone.  A NULL pointer is ignored.
void remove_any_whitespace_to_the_left_or_right_of_at_symbol(char *name) {
	char *ptr;
	if (!name) return;

	for (ptr=name; *ptr; ++ptr) {
		// Whitespace directly before an '@': delete it, then step back one character
		// so that a longer run of whitespace is consumed from right to left.
		// The regions overlap, so memmove() is required rather than strcpy().
		while ( (isspace((unsigned char)*ptr)) && (*(ptr+1)=='@') ) {
			memmove(ptr, ptr+1, strlen(ptr+1) + 1);
			if (ptr > name) --ptr;
		}
		// Whitespace directly after an '@': delete it until something else follows.
		while ( (*ptr=='@') && (*(ptr+1)!=0) && (isspace((unsigned char)*(ptr+1))) ) {
			memmove(ptr+1, ptr+2, strlen(ptr+2) + 1);
		}
	}
}
364
365
// Result codes of expand_aliases(), telling the caller how one recipient is to be handled
enum {
	EA_ERROR	= 0,	// Bad address; the message cannot be sent to it
	EA_MULTIPLE	= 1,	// The alias expanded into several recipients -- run me again!
	EA_LOCAL	= 2,	// Local recipient; no network processing is needed
	EA_INTERNET	= 3,	// Convert the message and send it as Internet mail
	EA_SKIP		= 4	// This recipient has been invalidated -- skip it!
};
374
375
376 // Process alias and routing info for email addresses
377 int expand_aliases(char *name, char *aliases) {
378         int a;
379         char aaa[SIZ];
380         int at = 0;
381
382         if (aliases) {
383                 int num_aliases = num_tokens(aliases, '\n');
384                 for (a=0; a<num_aliases; ++a) {
385                         extract_token(aaa, aliases, a, '\n', sizeof aaa);
386                         char *bar = strchr(aaa, '|');
387                         if (bar) {
388                                 bar[0] = 0;
389                                 ++bar;
390                                 striplt(aaa);
391                                 striplt(bar);
392                                 if ( (!IsEmptyStr(aaa)) && (!strcasecmp(name, aaa)) ) {
393                                         syslog(LOG_DEBUG, "internet_addressing: global alias <%s> to <%s>", name, bar);
394                                         strcpy(name, bar);
395                                 }
396                         }
397                 }
398                 if (strchr(name, ',')) {
399                         return(EA_MULTIPLE);
400                 }
401         }
402
403         char original_name[256];                                // Now go for the regular aliases
404         safestrncpy(original_name, name, sizeof original_name);
405
406         // should these checks still be here, or maybe move them to split_recps() ?
407         striplt(name);
408         remove_any_whitespace_to_the_left_or_right_of_at_symbol(name);
409         stripallbut(name, '<', '>');
410
411         // Hit the email address directory
412         if (CtdlDirectoryLookup(aaa, name, sizeof aaa) == 0) {
413                 strcpy(name, aaa);
414         }
415
416         if (strcasecmp(original_name, name)) {
417                 syslog(LOG_INFO, "internet_addressing: directory alias <%s> to <%s>", original_name, name);
418         }
419
420         // Change "user @ xxx" to "user" if xxx is an alias for this host
421         for (a=0; name[a] != '\0'; ++a) {
422                 if (name[a] == '@') {
423                         if (CtdlHostAlias(&name[a+1]) == hostalias_localhost) {
424                                 name[a] = 0;
425                                 syslog(LOG_DEBUG, "internet_addressing: host is local, recipient is <%s>", name);
426                                 break;
427                         }
428                 }
429         }
430
431         // Is this a local or remote recipient?
432         at = haschar(name, '@');
433         if (at == 0) {
434                 return(EA_LOCAL);                       // no @'s = local address
435         }
436         else if (at == 1) {
437                 return(EA_INTERNET);                    // one @ = internet address
438         }
439         else {
440                 return(EA_ERROR);                       // more than one @ = badly formed address
441         }
442 }
443
444
445 // Return a supplied list of email addresses as an array, removing superfluous information and syntax.
446 // If an existing Array is supplied as "append_to" it will do so; otherwise a new Array is allocated.
447 Array *split_recps(char *addresses, Array *append_to) {
448
449         if (IsEmptyStr(addresses)) {            // nothing supplied, nothing returned
450                 return(NULL);
451         }
452
453         // Copy the supplied address list into our own memory space, because we are going to modify it.
454         char *a = strdup(addresses);
455         if (a == NULL) {
456                 syslog(LOG_ERR, "internet_addressing: malloc() failed: %m");
457                 return(NULL);
458         }
459
460         // Strip out anything in double quotes
461         char *l = NULL;
462         char *r = NULL;
463         do {
464                 l = strchr(a, '\"');
465                 r = strrchr(a, '\"');
466                 if (r > l) {
467                         strcpy(l, r+1);
468                 }
469         } while (r > l);
470
471         // Transform all qualifying delimiters to commas
472         char *t;
473         for (t=a; t[0]; ++t) {
474                 if ((t[0]==';') || (t[0]=='|')) {
475                         t[0]=',';
476                 }
477         }
478
479         // Tokenize the recipients into an array.  No single recipient should be larger than 256 bytes.
480         Array *recipients_array = NULL;
481         if (append_to) {
482                 recipients_array = append_to;                   // Append to an existing array of recipients
483         }
484         else {
485                 recipients_array = array_new(256);              // This is a new array of recipients
486         }
487
488         int num_addresses = num_tokens(a, ',');
489         int i;
490         for (i=0; i<num_addresses; ++i) {
491                 char this_address[256];
492                 extract_token(this_address, a, i, ',', sizeof this_address);
493                 striplt(this_address);                          // strip leading and trailing whitespace
494                 stripout(this_address, '(', ')');               // remove any portion in parentheses
495                 stripallbut(this_address, '<', '>');            // if angle brackets are present, keep only what is inside them
496                 if (!IsEmptyStr(this_address)) {
497                         array_append(recipients_array, this_address);
498                 }
499         }
500
501         free(a);                                                // We don't need this buffer anymore.
502         return(recipients_array);                               // Return the completed array to the caller.
503 }
504
505
506 // Validate recipients, count delivery types and errors, and handle aliasing
507 //
508 // Returns 0 if all addresses are ok, ret->num_error = -1 if no addresses 
509 // were specified, or the number of addresses found invalid.
510 //
511 // Caller needs to free the result using free_recipients()
512 //
513 struct recptypes *validate_recipients(char *supplied_recipients, const char *RemoteIdentifier, int Flags) {
514         struct recptypes *ret;
515         char *recipients = NULL;
516         char append[SIZ];
517         long len;
518         int mailtype;
519         int invalid;
520         struct ctdluser tempUS;
521         struct ctdlroom original_room;
522         int err = 0;
523         char errmsg[SIZ];
524         char *org_recp;
525         char this_recp[256];
526
527         ret = (struct recptypes *) malloc(sizeof(struct recptypes));                    // Initialize
528         if (ret == NULL) return(NULL);
529         memset(ret, 0, sizeof(struct recptypes));                                       // set all values to null/zero
530
531         if (supplied_recipients == NULL) {
532                 recipients = strdup("");
533         }
534         else {
535                 recipients = strdup(supplied_recipients);
536         }
537
538         len = strlen(recipients) + 1024;                                                // allocate memory
539         ret->errormsg = malloc(len);
540         ret->recp_local = malloc(len);
541         ret->recp_internet = malloc(len);
542         ret->recp_room = malloc(len);
543         ret->display_recp = malloc(len);
544         ret->recp_orgroom = malloc(len);
545
546         ret->errormsg[0] = 0;
547         ret->recp_local[0] = 0;
548         ret->recp_internet[0] = 0;
549         ret->recp_room[0] = 0;
550         ret->recp_orgroom[0] = 0;
551         ret->display_recp[0] = 0;
552         ret->recptypes_magic = RECPTYPES_MAGIC;
553
554         Array *recp_array = split_recps(supplied_recipients, NULL);
555
556         char *aliases = CtdlGetSysConfig(GLOBAL_ALIASES);                               // First hit the Global Alias Table
557
558         int r;
559         for (r=0; (recp_array && r<array_len(recp_array)); ++r) {
560                 org_recp = (char *)array_get_element_at(recp_array, r);
561                 strncpy(this_recp, org_recp, sizeof this_recp);
562
563                 int i;
564                 for (i=0; i<3; ++i) {                                           // pass three times through the aliaser
565                         mailtype = expand_aliases(this_recp, aliases);
566         
567                         // If an alias expanded to multiple recipients, strip off those recipients and append them
568                         // to the end of the array.  This loop will hit those again when it gets there.
569                         if (mailtype == EA_MULTIPLE) {
570                                 recp_array = split_recps(this_recp, recp_array);
571                         }
572                 }
573
574                 // This loop searches for duplicate recipients in the final list and marks them to be skipped.
575                 int j;
576                 for (j=0; j<r; ++j) {
577                         if (!strcasecmp(this_recp, (char *)array_get_element_at(recp_array, j) )) {
578                                 mailtype = EA_SKIP;
579                         }
580                 }
581
582                 syslog(LOG_DEBUG, "Recipient #%d of type %d is <%s>", r, mailtype, this_recp);
583                 invalid = 0;
584                 errmsg[0] = 0;
585                 switch(mailtype) {
586                 case EA_LOCAL:                                  // There are several types of "local" recipients.
587
588                         // Old BBS conventions require mail to "sysop" to go somewhere.  Send it to the admin room.
589                         if (!strcasecmp(this_recp, "sysop")) {
590                                 ++ret->num_room;
591                                 strcpy(this_recp, CtdlGetConfigStr("c_aideroom"));
592                                 if (!IsEmptyStr(ret->recp_room)) {
593                                         strcat(ret->recp_room, "|");
594                                 }
595                                 strcat(ret->recp_room, this_recp);
596                         }
597
598                         // This handles rooms which can receive posts via email.
599                         else if (!strncasecmp(this_recp, "room_", 5)) {
600                                 original_room = CC->room;                               // Remember where we parked
601
602                                 char mail_to_room[ROOMNAMELEN];
603                                 char *m;
604                                 strncpy(mail_to_room, &this_recp[5], sizeof mail_to_room);
605                                 for (m = mail_to_room; *m; ++m) {
606                                         if (m[0] == '_') m[0]=' ';
607                                 }
608                                 if (!CtdlGetRoom(&CC->room, mail_to_room)) {            // Find the room they asked for
609
610                                         err = CtdlDoIHavePermissionToPostInThisRoom(    // check for write permissions to room
611                                                 errmsg, 
612                                                 sizeof errmsg, 
613                                                 RemoteIdentifier,
614                                                 Flags,
615                                                 0                                       // 0 means "this is not a reply"
616                                         );
617                                         if (err) {
618                                                 ++ret->num_error;
619                                                 invalid = 1;
620                                         } 
621                                         else {
622                                                 ++ret->num_room;
623                                                 if (!IsEmptyStr(ret->recp_room)) {
624                                                         strcat(ret->recp_room, "|");
625                                                 }
626                                                 strcat(ret->recp_room, CC->room.QRname);
627         
628                                                 if (!IsEmptyStr(ret->recp_orgroom)) {
629                                                         strcat(ret->recp_orgroom, "|");
630                                                 }
631                                                 strcat(ret->recp_orgroom, this_recp);
632         
633                                         }
634                                 }
635                                 else {                                                  // no such room exists
636                                         ++ret->num_error;
637                                         invalid = 1;
638                                 }
639                                                 
640                                 // Restore this session's original room location.
641                                 CC->room = original_room;
642
643                         }
644
645                         // This handles the most common case, which is mail to a user's inbox.
646                         else if (CtdlGetUser(&tempUS, this_recp) == 0) {
647                                 ++ret->num_local;
648                                 strcpy(this_recp, tempUS.fullname);
649                                 if (!IsEmptyStr(ret->recp_local)) {
650                                         strcat(ret->recp_local, "|");
651                                 }
652                                 strcat(ret->recp_local, this_recp);
653                         }
654
655                         // No match for this recipient
656                         else {
657                                 ++ret->num_error;
658                                 invalid = 1;
659                         }
660                         break;
661                 case EA_INTERNET:
662                         // Yes, you're reading this correctly: if the target domain points back to the local system,
663                         // the address is invalid.  That's because if the address were valid, we would have
664                         // already translated it to a local address by now.
665                         if (IsDirectory(this_recp, 0)) {
666                                 ++ret->num_error;
667                                 invalid = 1;
668                         }
669                         else {
670                                 ++ret->num_internet;
671                                 if (!IsEmptyStr(ret->recp_internet)) {
672                                         strcat(ret->recp_internet, "|");
673                                 }
674                                 strcat(ret->recp_internet, this_recp);
675                         }
676                         break;
677                 case EA_MULTIPLE:
678                 case EA_SKIP:
679                         // no action required, anything in this slot has already been processed elsewhere
680                         break;
681                 case EA_ERROR:
682                         ++ret->num_error;
683                         invalid = 1;
684                         break;
685                 }
686                 if (invalid) {
687                         if (IsEmptyStr(errmsg)) {
688                                 snprintf(append, sizeof append, "Invalid recipient: %s", this_recp);
689                         }
690                         else {
691                                 snprintf(append, sizeof append, "%s", errmsg);
692                         }
693                         if ( (strlen(ret->errormsg) + strlen(append) + 3) < SIZ) {
694                                 if (!IsEmptyStr(ret->errormsg)) {
695                                         strcat(ret->errormsg, "; ");
696                                 }
697                                 strcat(ret->errormsg, append);
698                         }
699                 }
700                 else {
701                         if (IsEmptyStr(ret->display_recp)) {
702                                 strcpy(append, this_recp);
703                         }
704                         else {
705                                 snprintf(append, sizeof append, ", %s", this_recp);
706                         }
707                         if ( (strlen(ret->display_recp)+strlen(append)) < SIZ) {
708                                 strcat(ret->display_recp, append);
709                         }
710                 }
711         }
712
713         if (aliases != NULL) {          // ok, we're done with the global alias list now
714                 free(aliases);
715         }
716
717         if ( (ret->num_local + ret->num_internet + ret->num_room + ret->num_error) == 0) {
718                 ret->num_error = (-1);
719                 strcpy(ret->errormsg, "No recipients specified.");
720         }
721
722         syslog(LOG_DEBUG, "internet_addressing: validate_recipients() = %d local, %d room, %d SMTP, %d error",
723                 ret->num_local, ret->num_room, ret->num_internet, ret->num_error
724         );
725
726         free(recipients);
727         if (recp_array) {
728                 array_free(recp_array);
729         }
730
731         return(ret);
732 }
733
734
735 // Destructor for recptypes
736 void free_recipients(struct recptypes *valid) {
737
738         if (valid == NULL) {
739                 return;
740         }
741
742         if (valid->recptypes_magic != RECPTYPES_MAGIC) {
743                 syslog(LOG_ERR, "internet_addressing: attempt to call free_recipients() on some other data type!");
744                 abort();
745         }
746
747         if (valid->errormsg != NULL)            free(valid->errormsg);
748         if (valid->recp_local != NULL)          free(valid->recp_local);
749         if (valid->recp_internet != NULL)       free(valid->recp_internet);
750         if (valid->recp_room != NULL)           free(valid->recp_room);
751         if (valid->recp_orgroom != NULL)        free(valid->recp_orgroom);
752         if (valid->display_recp != NULL)        free(valid->display_recp);
753         if (valid->bounce_to != NULL)           free(valid->bounce_to);
754         if (valid->envelope_from != NULL)       free(valid->envelope_from);
755         if (valid->sending_room != NULL)        free(valid->sending_room);
756         free(valid);
757 }
758
759
760 char *qp_encode_email_addrs(char *source) {
761         char *user, *node, *name;
762         const char headerStr[] = "=?UTF-8?Q?";
763         char *Encoded;
764         char *EncodedName;
765         char *nPtr;
766         int need_to_encode = 0;
767         long SourceLen;
768         long EncodedMaxLen;
769         long nColons = 0;
770         long *AddrPtr;
771         long *AddrUtf8;
772         long nAddrPtrMax = 50;
773         long nmax;
774         int InQuotes = 0;
775         int i, n;
776
777         if (source == NULL) return source;
778         if (IsEmptyStr(source)) return source;
779         syslog(LOG_DEBUG, "internet_addressing: qp_encode_email_addrs <%s>", source);
780
781         AddrPtr = malloc (sizeof (long) * nAddrPtrMax);
782         AddrUtf8 = malloc (sizeof (long) * nAddrPtrMax);
783         memset(AddrUtf8, 0, sizeof (long) * nAddrPtrMax);
784         *AddrPtr = 0;
785         i = 0;
786         while (!IsEmptyStr (&source[i])) {
787                 if (nColons >= nAddrPtrMax){
788                         long *ptr;
789
790                         ptr = (long *) malloc(sizeof (long) * nAddrPtrMax * 2);
791                         memcpy (ptr, AddrPtr, sizeof (long) * nAddrPtrMax);
792                         free (AddrPtr), AddrPtr = ptr;
793
794                         ptr = (long *) malloc(sizeof (long) * nAddrPtrMax * 2);
795                         memset(&ptr[nAddrPtrMax], 0, sizeof (long) * nAddrPtrMax);
796
797                         memcpy (ptr, AddrUtf8, sizeof (long) * nAddrPtrMax);
798                         free (AddrUtf8), AddrUtf8 = ptr;
799                         nAddrPtrMax *= 2;                               
800                 }
801                 if (((unsigned char) source[i] < 32) || ((unsigned char) source[i] > 126)) {
802                         need_to_encode = 1;
803                         AddrUtf8[nColons] = 1;
804                 }
805                 if (source[i] == '"') {
806                         InQuotes = !InQuotes;
807                 }
808                 if (!InQuotes && source[i] == ',') {
809                         AddrPtr[nColons] = i;
810                         nColons++;
811                 }
812                 i++;
813         }
814         if (need_to_encode == 0) {
815                 free(AddrPtr);
816                 free(AddrUtf8);
817                 return source;
818         }
819
820         SourceLen = i;
821         EncodedMaxLen = nColons * (sizeof(headerStr) + 3) + SourceLen * 3;
822         Encoded = (char*) malloc (EncodedMaxLen);
823
824         for (i = 0; i < nColons; i++) {
825                 source[AddrPtr[i]++] = '\0';
826         }
827         // TODO: if libidn, this might get larger
828         user = malloc(SourceLen + 1);
829         node = malloc(SourceLen + 1);
830         name = malloc(SourceLen + 1);
831
832         nPtr = Encoded;
833         *nPtr = '\0';
834         for (i = 0; i < nColons && nPtr != NULL; i++) {
835                 nmax = EncodedMaxLen - (nPtr - Encoded);
836                 if (AddrUtf8[i]) {
837                         process_rfc822_addr(&source[AddrPtr[i]], user, node, name);
838                         // TODO: libIDN here !
839                         if (IsEmptyStr(name)) {
840                                 n = snprintf(nPtr, nmax, (i==0)?"%s@%s" : ",%s@%s", user, node);
841                         }
842                         else {
843                                 EncodedName = rfc2047encode(name, strlen(name));                        
844                                 n = snprintf(nPtr, nmax, (i==0)?"%s <%s@%s>" : ",%s <%s@%s>", EncodedName, user, node);
845                                 free(EncodedName);
846                         }
847                 }
848                 else { 
849                         n = snprintf(nPtr, nmax, (i==0)?"%s" : ",%s", &source[AddrPtr[i]]);
850                 }
851                 if (n > 0 )
852                         nPtr += n;
853                 else { 
854                         char *ptr, *nnPtr;
855                         ptr = (char*) malloc(EncodedMaxLen * 2);
856                         memcpy(ptr, Encoded, EncodedMaxLen);
857                         nnPtr = ptr + (nPtr - Encoded), nPtr = nnPtr;
858                         free(Encoded), Encoded = ptr;
859                         EncodedMaxLen *= 2;
860                         i--; // do it once more with properly lengthened buffer
861                 }
862         }
863         for (i = 0; i < nColons; i++)
864                 source[--AddrPtr[i]] = ',';
865
866         free(user);
867         free(node);
868         free(name);
869         free(AddrUtf8);
870         free(AddrPtr);
871         return Encoded;
872 }
873
874
// Unfold a multi-line field into a single line, removing multi-whitespaces
//
// The text is rewritten in place.  On entry *field points at the first byte of
// the text and *FieldEnd just past its last byte: the byte at *FieldEnd is not
// part of the text, and the leading-whitespace scan stops only at a
// non-whitespace byte such as a NUL terminator.  On return *field points at
// the first non-whitespace byte, the result is NUL terminated, and *FieldEnd
// points at the last byte of the result (one before *field if it is empty).
//
// A run of CR/LF characters is dropped and the byte following it is copied
// unchanged.  Outside double quotes any other whitespace character becomes a
// blank, and a run of whitespace collapses into a single blank.
void unfold_rfc822_field(char **field, char **FieldEnd) 
{
        int quote = 0;
        char *pField = *field;
        char *sField;
        char *pFieldEnd = *FieldEnd;

        // remove leading whitespace
        // (the casts matter: <ctype.h> functions are undefined for negative char values)
        while (isspace((unsigned char) *pField)) {
                pField++;
        }

        // remove trailing whitespace, but never back up past the start of the text
        while ((pFieldEnd > pField) && isspace((unsigned char) *pFieldEnd)) {
                pFieldEnd--;
        }

        *FieldEnd = pFieldEnd;
        // convert non-space whitespace to spaces, and remove double blanks
        // (sField reads, pField writes; pField never gets ahead of sField)
        for (sField = *field = pField; 
             sField < pFieldEnd; 
             pField++, sField++)
        {
                if ((*sField=='\r') || (*sField=='\n'))
                {
                        int offset = 1;
                        while ( (sField + offset < pFieldEnd) && ( (*(sField + offset) == '\r') || (*(sField + offset) == '\n' )) ) {
                                offset ++;
                        }
                        sField += offset;
                        *pField = *sField;
                }
                else {
                        if (*sField=='\"') quote = 1 - quote;
                        if (!quote) {
                                if (isspace((unsigned char) *sField)) {
                                        *pField = ' ';
                                        pField++;
                                        sField++;

                                        while ((sField < pFieldEnd) && 
                                               isspace((unsigned char) *sField))
                                                sField++;
                                        *pField = *sField;
                                }
                                else *pField = *sField;
                        }
                        else *pField = *sField;
                }
        }
        *pField = '\0';
        *FieldEnd = pField - 1;
}
927
928
// Remove leading characters from s until it contains no more than `keep`
// occurrences of ch.  memmove() is used because source and destination overlap.
static void rfc822_drop_leading(char *s, char ch, int keep) {
        int surplus = -keep;
        char *p;

        for (p = s; *p != '\0'; ++p) {
                if (*p == ch) {
                        ++surplus;
                }
        }
        if (surplus <= 0) {
                return;
        }

        // stop on the last occurrence that has to go
        for (p = s; ; ++p) {
                if ((*p == ch) && (--surplus == 0)) {
                        break;
                }
        }
        memmove(s, p + 1, strlen(p + 1) + 1);
}


// Split an RFC822-style address into userid, host, and full name
//
// rfc822 is the address to split; user, node and name receive the results.
// Nothing bounds the copies: each output buffer must be able to hold the
// whole of rfc822, and node must also be able to hold the configured
// "c_fqdn" / "c_nodename" strings.  If rfc822 is NULL, user and name are set
// to empty strings and node to the configured "c_fqdn".
//
// Note: This still handles obsolete address syntaxes such as user%node@node and ...node!user
//       We should probably remove that.
void process_rfc822_addr(const char *rfc822, char *user, char *node, char *name) {
        char *quote;

        strcpy(user, "");
        strcpy(node, CtdlGetConfigStr("c_fqdn"));
        strcpy(name, "");

        if (rfc822 == NULL) return;

        // extract full name - first, it's From minus <userid>
        strcpy(name, rfc822);
        stripout(name, '<', '>');

        // strip anything to the left of a bang
        rfc822_drop_leading(name, '!', 0);

        // and anything to the right of a @ or %
        name[strcspn(name, "@%")] = '\0';

        // but if there are parentheses, that changes the rules...
        if ((haschar(rfc822, '(') == 1) && (haschar(rfc822, ')') == 1)) {
                strcpy(name, rfc822);
                stripallbut(name, '(', ')');
        }

        // but if there are a set of quotes, that supersedes everything:
        // the name is whatever sits between the two quotes
        if (haschar(rfc822, 34) == 2) {
                strcpy(name, rfc822);
                quote = strchr(name, 34);
                if (quote != NULL) {
                        memmove(name, quote + 1, strlen(quote + 1) + 1);
                }
                else {
                        name[0] = '\0';
                }
                name[strcspn(name, "\"")] = '\0';
        }

        // extract user id
        strcpy(user, rfc822);

        // first get rid of anything in parens
        stripout(user, '(', ')');

        // if there's a set of angle brackets, strip it down to that
        if ((haschar(user, '<') == 1) && (haschar(user, '>') == 1)) {
                stripallbut(user, '<', '>');
        }

        // strip anything to the left of a bang
        rfc822_drop_leading(user, '!', 0);

        // and anything to the right of a @ or %
        user[strcspn(user, "@%")] = '\0';

        // extract node name
        strcpy(node, rfc822);

        // first get rid of anything in parens
        stripout(node, '(', ')');

        // if there's a set of angle brackets, strip it down to that
        if ((haschar(node, '<') == 1) && (haschar(node, '>') == 1)) {
                stripallbut(node, '<', '>');
        }

        // If no node specified, tack ours on instead
        if (
                (haschar(node, '@')==0)
                && (haschar(node, '%')==0)
                && (haschar(node, '!')==0)
        ) {
                strcpy(node, CtdlGetConfigStr("c_nodename"));
        }
        else {
                // strip anything to the left of a @
                rfc822_drop_leading(node, '@', 0);

                // strip anything to the left of a %
                rfc822_drop_leading(node, '%', 0);

                // reduce multiple system bang paths to node!user
                rfc822_drop_leading(node, '!', 1);

                // now get rid of the user portion of a node!user string
                node[strcspn(node, "!")] = '\0';
        }

        // strip leading and trailing spaces in all strings
        striplt(user);
        striplt(node);
        striplt(name);

        // If we processed a string that had the address in angle brackets
        // but no name outside the brackets, we now have an empty name.  In
        // this case, use the user portion of the address as the name.
        if ((IsEmptyStr(name)) && (!IsEmptyStr(user))) {
                strcpy(name, user);
        }
}
1062
1063
1064 // convert_field() is a helper function for convert_internet_message().
1065 // Given start/end positions for an rfc822 field, it converts it to a Citadel
1066 // field if it wants to, and unfolds it if necessary.
1067 //
1068 // Returns 1 if the field was converted and inserted into the Citadel message
1069 // structure, implying that the source field should be removed from the
1070 // message text.
1071 int convert_field(struct CtdlMessage *msg, const char *beg, const char *end) {
1072         char *key, *value, *valueend;
1073         long len;
1074         const char *pos;
1075         int i;
1076         const char *colonpos = NULL;
1077         int processed = 0;
1078         char user[1024];
1079         char node[1024];
1080         char name[1024];
1081         char addr[1024];
1082         time_t parsed_date;
1083         long valuelen;
1084
1085         for (pos = end; pos >= beg; pos--) {
1086                 if (*pos == ':') colonpos = pos;
1087         }
1088
1089         if (colonpos == NULL) return(0);        /* no colon? not a valid header line */
1090
1091         len = end - beg;
1092         key = malloc(len + 2);
1093         memcpy(key, beg, len + 1);
1094         key[len] = '\0';
1095         valueend = key + len;
1096         * ( key + (colonpos - beg) ) = '\0';
1097         value = &key[(colonpos - beg) + 1];
1098         // printf("Header: [%s]\nValue: [%s]\n", key, value);
1099         unfold_rfc822_field(&value, &valueend);
1100         valuelen = valueend - value + 1;
1101         // printf("UnfoldedValue: [%s]\n", value);
1102
1103         // Here's the big rfc822-to-citadel loop.
1104
1105         // Date/time is converted into a unix timestamp.  If the conversion
1106         // fails, we replace it with the time the message arrived locally.
1107         if (!strcasecmp(key, "Date")) {
1108                 parsed_date = parsedate(value);
1109                 if (parsed_date < 0L) parsed_date = time(NULL);
1110
1111                 if (CM_IsEmpty(msg, eTimestamp))
1112                         CM_SetFieldLONG(msg, eTimestamp, parsed_date);
1113                 processed = 1;
1114         }
1115
1116         else if (!strcasecmp(key, "From")) {
1117                 process_rfc822_addr(value, user, node, name);
1118                 syslog(LOG_DEBUG, "internet_addressing: converted to <%s@%s> (%s)", user, node, name);
1119                 snprintf(addr, sizeof(addr), "%s@%s", user, node);
1120                 if (CM_IsEmpty(msg, eAuthor) && !IsEmptyStr(name)) {
1121                         CM_SetField(msg, eAuthor, name, -1);
1122                 }
1123                 if (CM_IsEmpty(msg, erFc822Addr) && !IsEmptyStr(addr)) {
1124                         CM_SetField(msg, erFc822Addr, addr, -1);
1125                 }
1126                 processed = 1;
1127         }
1128
1129         else if (!strcasecmp(key, "Subject")) {
1130                 if (CM_IsEmpty(msg, eMsgSubject))
1131                         CM_SetField(msg, eMsgSubject, value, valuelen);
1132                 processed = 1;
1133         }
1134
1135         else if (!strcasecmp(key, "List-ID")) {
1136                 if (CM_IsEmpty(msg, eListID))
1137                         CM_SetField(msg, eListID, value, valuelen);
1138                 processed = 1;
1139         }
1140
1141         else if (!strcasecmp(key, "To")) {
1142                 if (CM_IsEmpty(msg, eRecipient))
1143                         CM_SetField(msg, eRecipient, value, valuelen);
1144                 processed = 1;
1145         }
1146
1147         else if (!strcasecmp(key, "CC")) {
1148                 if (CM_IsEmpty(msg, eCarbonCopY))
1149                         CM_SetField(msg, eCarbonCopY, value, valuelen);
1150                 processed = 1;
1151         }
1152
1153         else if (!strcasecmp(key, "Message-ID")) {
1154                 if (!CM_IsEmpty(msg, emessageId)) {
1155                         syslog(LOG_WARNING, "internet_addressing: duplicate message id");
1156                 }
1157                 else {
1158                         char *pValue;
1159                         long pValueLen;
1160
1161                         pValue = value;
1162                         pValueLen = valuelen;
1163                         // Strip angle brackets
1164                         while (haschar(pValue, '<') > 0) {
1165                                 pValue ++;
1166                                 pValueLen --;
1167                         }
1168
1169                         for (i = 0; i <= pValueLen; ++i)
1170                                 if (pValue[i] == '>') {
1171                                         pValueLen = i;
1172                                         break;
1173                                 }
1174
1175                         CM_SetField(msg, emessageId, pValue, pValueLen);
1176                 }
1177
1178                 processed = 1;
1179         }
1180
1181         else if (!strcasecmp(key, "Return-Path")) {
1182                 if (CM_IsEmpty(msg, eMessagePath))
1183                         CM_SetField(msg, eMessagePath, value, valuelen);
1184                 processed = 1;
1185         }
1186
1187         else if (!strcasecmp(key, "Envelope-To")) {
1188                 if (CM_IsEmpty(msg, eenVelopeTo))
1189                         CM_SetField(msg, eenVelopeTo, value, valuelen);
1190                 processed = 1;
1191         }
1192
1193         else if (!strcasecmp(key, "References")) {
1194                 CM_SetField(msg, eWeferences, value, valuelen);
1195                 processed = 1;
1196         }
1197
1198         else if (!strcasecmp(key, "Reply-To")) {
1199                 CM_SetField(msg, eReplyTo, value, valuelen);
1200                 processed = 1;
1201         }
1202
1203         else if (!strcasecmp(key, "In-reply-to")) {
1204                 if (CM_IsEmpty(msg, eWeferences)) // References: supersedes In-reply-to:
1205                         CM_SetField(msg, eWeferences, value, valuelen);
1206                 processed = 1;
1207         }
1208
1209
1210
1211         // Clean up and move on.
1212         free(key);      // Don't free 'value', it's actually the same buffer
1213         return processed;
1214 }
1215
1216
// Convert RFC822 references format (References) to Citadel references format (Weferences)
//
// The string is rewritten in place in a single pass.  Only the text found
// inside angle brackets is kept; the outermost brackets and everything
// between bracketed items are removed.  The '>' that closes an item becomes a
// '|' separator, unless it is the last character of the input or nothing has
// been kept yet.  Example: "<a@x> <b@y>" becomes "a@x|b@y".
void convert_references_to_wefewences(char *str) {
        int bracket_nesting = 0;
        const char *rd = str;   // next character to examine
        char *wr = str;         // where the next kept character goes (never ahead of rd)
        char ch;

        while (*rd) {
                ch = *rd;
                if ((ch == '>') && (bracket_nesting > 0)) {
                        --bracket_nesting;
                }

                if ((ch == '>') && (bracket_nesting == 0) && (rd[1] != '\0') && (wr > str)) {
                        *wr++ = '|';
                }
                else if (bracket_nesting > 0) {
                        *wr++ = ch;
                }
                // anything else is outside of all brackets and is dropped

                if (ch == '<') {
                        ++bracket_nesting;
                }
                ++rd;
        }
        *wr = '\0';
}
1248
1249
1250 // Convert an RFC822 message (headers + body) to a CtdlMessage structure.
1251 // NOTE: the supplied buffer becomes part of the CtdlMessage structure, and
1252 // will be deallocated when CM_Free() is called.  Therefore, the
1253 // supplied buffer should be DEREFERENCED.  It should not be freed or used
1254 // again.
1255 struct CtdlMessage *convert_internet_message(char *rfc822) {
1256         StrBuf *RFCBuf = NewStrBufPlain(rfc822, -1);
1257         free (rfc822);
1258         return convert_internet_message_buf(&RFCBuf);
1259 }
1260
1261
1262 struct CtdlMessage *convert_internet_message_buf(StrBuf **rfc822)
1263 {
1264         struct CtdlMessage *msg;
1265         const char *pos, *beg, *end, *totalend;
1266         int done, alldone = 0;
1267         int converted;
1268         StrBuf *OtherHeaders;
1269
1270         msg = malloc(sizeof(struct CtdlMessage));
1271         if (msg == NULL) return msg;
1272
1273         memset(msg, 0, sizeof(struct CtdlMessage));
1274         msg->cm_magic = CTDLMESSAGE_MAGIC;      // self check
1275         msg->cm_anon_type = 0;                  // never anonymous
1276         msg->cm_format_type = FMT_RFC822;       // internet message
1277
1278         pos = ChrPtr(*rfc822);
1279         totalend = pos + StrLength(*rfc822);
1280         done = 0;
1281         OtherHeaders = NewStrBufPlain(NULL, StrLength(*rfc822));
1282
1283         while (!alldone) {
1284
1285                 /* Locate beginning and end of field, keeping in mind that
1286                  * some fields might be multiline
1287                  */
1288                 end = beg = pos;
1289
1290                 while ((end < totalend) && 
1291                        (end == beg) && 
1292                        (done == 0) ) 
1293                 {
1294
1295                         if ( (*pos=='\n') && ((*(pos+1))!=0x20) && ((*(pos+1))!=0x09) )
1296                         {
1297                                 end = pos;
1298                         }
1299
1300                         /* done with headers? */
1301                         if ((*pos=='\n') &&
1302                             ( (*(pos+1)=='\n') ||
1303                               (*(pos+1)=='\r')) ) 
1304                         {
1305                                 alldone = 1;
1306                         }
1307
1308                         if (pos >= (totalend - 1) )
1309                         {
1310                                 end = pos;
1311                                 done = 1;
1312                         }
1313
1314                         ++pos;
1315
1316                 }
1317
1318                 /* At this point we have a field.  Are we interested in it? */
1319                 converted = convert_field(msg, beg, end);
1320
1321                 /* Strip the field out of the RFC822 header if we used it */
1322                 if (!converted) {
1323                         StrBufAppendBufPlain(OtherHeaders, beg, end - beg, 0);
1324                         StrBufAppendBufPlain(OtherHeaders, HKEY("\n"), 0);
1325                 }
1326
1327                 /* If we've hit the end of the message, bail out */
1328                 if (pos >= totalend)
1329                         alldone = 1;
1330         }
1331         StrBufAppendBufPlain(OtherHeaders, HKEY("\n"), 0);
1332         if (pos < totalend)
1333                 StrBufAppendBufPlain(OtherHeaders, pos, totalend - pos, 0);
1334         FreeStrBuf(rfc822);
1335         CM_SetAsFieldSB(msg, eMesageText, &OtherHeaders);
1336
1337         /* Follow-up sanity checks... */
1338
1339         /* If there's no timestamp on this message, set it to now. */
1340         if (CM_IsEmpty(msg, eTimestamp)) {
1341                 CM_SetFieldLONG(msg, eTimestamp, time(NULL));
1342         }
1343
1344         /* If a W (references, or rather, Wefewences) field is present, we
1345          * have to convert it from RFC822 format to Citadel format.
1346          */
1347         if (!CM_IsEmpty(msg, eWeferences)) {
1348                 /// todo: API!
1349                 convert_references_to_wefewences(msg->cm_fields[eWeferences]);
1350         }
1351
1352         return msg;
1353 }
1354
1355
1356 /*
1357  * Look for a particular header field in an RFC822 message text.  If the
1358  * requested field is found, it is unfolded (if necessary) and returned to
1359  * the caller.  The field name is stripped out, leaving only its contents.
1360  * The caller is responsible for freeing the returned buffer.  If the requested
1361  * field is not present, or anything else goes wrong, it returns NULL.
1362  */
1363 char *rfc822_fetch_field(const char *rfc822, const char *fieldname) {
1364         char *fieldbuf = NULL;
1365         const char *end_of_headers;
1366         const char *field_start;
1367         const char *ptr;
1368         char *cont;
1369         char fieldhdr[SIZ];
1370
1371         /* Should never happen, but sometimes we get stupid */
1372         if (rfc822 == NULL) return(NULL);
1373         if (fieldname == NULL) return(NULL);
1374
1375         snprintf(fieldhdr, sizeof fieldhdr, "%s:", fieldname);
1376
1377         /* Locate the end of the headers, so we don't run past that point */
1378         end_of_headers = cbmstrcasestr(rfc822, "\n\r\n");
1379         if (end_of_headers == NULL) {
1380                 end_of_headers = cbmstrcasestr(rfc822, "\n\n");
1381         }
1382         if (end_of_headers == NULL) return (NULL);
1383
1384         field_start = cbmstrcasestr(rfc822, fieldhdr);
1385         if (field_start == NULL) return(NULL);
1386         if (field_start > end_of_headers) return(NULL);
1387
1388         fieldbuf = malloc(SIZ);
1389         strcpy(fieldbuf, "");
1390
1391         ptr = field_start;
1392         ptr = cmemreadline(ptr, fieldbuf, SIZ-strlen(fieldbuf) );
1393         while ( (isspace(ptr[0])) && (ptr < end_of_headers) ) {
1394                 strcat(fieldbuf, " ");
1395                 cont = &fieldbuf[strlen(fieldbuf)];
1396                 ptr = cmemreadline(ptr, cont, SIZ-strlen(fieldbuf) );
1397                 striplt(cont);
1398         }
1399
1400         strcpy(fieldbuf, &fieldbuf[strlen(fieldhdr)]);
1401         striplt(fieldbuf);
1402
1403         return(fieldbuf);
1404 }
1405
1406
1407 /*****************************************************************************
1408  *                      DIRECTORY MANAGEMENT FUNCTIONS                       *
1409  *****************************************************************************/
1410
/*
 * Generate the index key for an Internet e-mail address to be looked up
 * in the database.
 *
 * The key is the address with every whitespace character removed and all
 * remaining characters converted to lower case.  'key' must have room for
 * strlen(addr) + 1 bytes; no bound is checked here.
 */
void directory_key(char *key, char *addr) {
        const char *src;
        int keylen = 0;

        for (src = addr; *src != '\0'; ++src) {
                /* <ctype.h> functions are only defined for unsigned char values (and EOF) */
                unsigned char ch = (unsigned char) *src;

                if (!isspace(ch)) {
                        key[keylen++] = (char) tolower(ch);
                }
        }
        key[keylen] = 0;

        syslog(LOG_DEBUG, "internet_addressing: directory key is <%s>", key);
}
1428
1429
1430 /*
1431  * Return nonzero if the supplied address is in one of "our" domains
1432  */
1433 int IsDirectory(char *addr, int allow_masq_domains) {
1434         char domain[256];
1435         int h;
1436
1437         extract_token(domain, addr, 1, '@', sizeof domain);
1438         striplt(domain);
1439
1440         h = CtdlHostAlias(domain);
1441
1442         if ( (h == hostalias_masq) && allow_masq_domains)
1443                 return(1);
1444         
1445         if (h == hostalias_localhost) {
1446                 return(1);
1447         }
1448         else {
1449                 return(0);
1450         }
1451 }
1452
1453
1454 /*
1455  * Add an Internet e-mail address to the directory for a user
1456  */
1457 int CtdlDirectoryAddUser(char *internet_addr, char *citadel_addr) {
1458         char key[SIZ];
1459
1460         if (IsDirectory(internet_addr, 0) == 0) {
1461                 return 0;
1462         }
1463         syslog(LOG_DEBUG, "internet_addressing: create directory entry: %s --> %s", internet_addr, citadel_addr);
1464         directory_key(key, internet_addr);
1465         cdb_store(CDB_DIRECTORY, key, strlen(key), citadel_addr, strlen(citadel_addr)+1 );
1466         return 1;
1467 }
1468
1469
1470 /*
1471  * Delete an Internet e-mail address from the directory.
1472  *
1473  * (NOTE: we don't actually use or need the citadel_addr variable; it's merely
1474  * here because the callback API expects to be able to send it.)
1475  */
1476 int CtdlDirectoryDelUser(char *internet_addr, char *citadel_addr) {
1477         char key[SIZ];
1478         
1479         syslog(LOG_DEBUG, "internet_addressing: delete directory entry: %s --> %s", internet_addr, citadel_addr);
1480         directory_key(key, internet_addr);
1481         return cdb_delete(CDB_DIRECTORY, key, strlen(key) ) == 0;
1482 }
1483
1484
1485 /*
1486  * Look up an Internet e-mail address in the directory.
1487  * On success: returns 0, and Citadel address stored in 'target'
1488  * On failure: returns nonzero
1489  */
1490 int CtdlDirectoryLookup(char *target, char *internet_addr, size_t targbuflen) {
1491         struct cdbdata *cdbrec;
1492         char key[SIZ];
1493
1494         /* Dump it in there unchanged, just for kicks */
1495         if (target != NULL) {
1496                 safestrncpy(target, internet_addr, targbuflen);
1497         }
1498
1499         /* Only do lookups for addresses with hostnames in them */
1500         if (num_tokens(internet_addr, '@') != 2) return(-1);
1501
1502         /* Only do lookups for domains in the directory */
1503         if (IsDirectory(internet_addr, 0) == 0) return(-1);
1504
1505         directory_key(key, internet_addr);
1506         cdbrec = cdb_fetch(CDB_DIRECTORY, key, strlen(key) );
1507         if (cdbrec != NULL) {
1508                 if (target != NULL) {
1509                         safestrncpy(target, cdbrec->ptr, targbuflen);
1510                 }
1511                 cdb_free(cdbrec);
1512                 return(0);
1513         }
1514
1515         return(-1);
1516 }
1517
1518
1519 /*
1520  * Harvest any email addresses that someone might want to have in their
1521  * "collected addresses" book.
1522  */
1523 char *harvest_collected_addresses(struct CtdlMessage *msg) {
1524         char *coll = NULL;
1525         char addr[256];
1526         char user[256], node[256], name[256];
1527         int is_harvestable;
1528         int i, j, h;
1529         eMsgField field = 0;
1530
1531         if (msg == NULL) return(NULL);
1532
1533         is_harvestable = 1;
1534         strcpy(addr, "");       
1535         if (!CM_IsEmpty(msg, eAuthor)) {
1536                 strcat(addr, msg->cm_fields[eAuthor]);
1537         }
1538         if (!CM_IsEmpty(msg, erFc822Addr)) {
1539                 strcat(addr, " <");
1540                 strcat(addr, msg->cm_fields[erFc822Addr]);
1541                 strcat(addr, ">");
1542                 if (IsDirectory(msg->cm_fields[erFc822Addr], 0)) {
1543                         is_harvestable = 0;
1544                 }
1545         }
1546
1547         if (is_harvestable) {
1548                 coll = strdup(addr);
1549         }
1550         else {
1551                 coll = strdup("");
1552         }
1553
1554         if (coll == NULL) return(NULL);
1555
1556         /* Scan both the R (To) and Y (CC) fields */
1557         for (i = 0; i < 2; ++i) {
1558                 if (i == 0) field = eRecipient;
1559                 if (i == 1) field = eCarbonCopY;
1560
1561                 if (!CM_IsEmpty(msg, field)) {
1562                         for (j=0; j<num_tokens(msg->cm_fields[field], ','); ++j) {
1563                                 extract_token(addr, msg->cm_fields[field], j, ',', sizeof addr);
1564                                 if (strstr(addr, "=?") != NULL)
1565                                         utf8ify_rfc822_string(addr);
1566                                 process_rfc822_addr(addr, user, node, name);
1567                                 h = CtdlHostAlias(node);
1568                                 if (h != hostalias_localhost) {
1569                                         coll = realloc(coll, strlen(coll) + strlen(addr) + 4);
1570                                         if (coll == NULL) return(NULL);
1571                                         if (!IsEmptyStr(coll)) {
1572                                                 strcat(coll, ",");
1573                                         }
1574                                         striplt(addr);
1575                                         strcat(coll, addr);
1576                                 }
1577                         }
1578                 }
1579         }
1580
1581         if (IsEmptyStr(coll)) {
1582                 free(coll);
1583                 return(NULL);
1584         }
1585         return(coll);
1586 }
1587
1588
1589 /*
1590  * Helper function for CtdlRebuildDirectoryIndex()
1591  */
1592 void CtdlRebuildDirectoryIndex_backend(char *username, void *data) {
1593
1594         int j = 0;
1595         struct ctdluser usbuf;
1596
1597         if (CtdlGetUser(&usbuf, username) != 0) {
1598                 return;
1599         }
1600
1601         if ( (!IsEmptyStr(usbuf.fullname)) && (!IsEmptyStr(usbuf.emailaddrs)) ) {
1602                 for (j=0; j<num_tokens(usbuf.emailaddrs, '|'); ++j) {
1603                         char one_email[512];
1604                         extract_token(one_email, usbuf.emailaddrs, j, '|', sizeof one_email);
1605                         CtdlDirectoryAddUser(one_email, usbuf.fullname);
1606                 }
1607         }
1608 }
1609
1610
1611 /*
1612  * Initialize the directory database (erasing anything already there)
1613  */
1614 void CtdlRebuildDirectoryIndex(void) {
1615         syslog(LOG_INFO, "internet_addressing: rebuilding email address directory index");
1616         cdb_trunc(CDB_DIRECTORY);
1617         ForEachUser(CtdlRebuildDirectoryIndex_backend, NULL);
1618 }
1619
1620
1621 // Configure Internet email addresses for a user account, updating the Directory Index in the process
1622 void CtdlSetEmailAddressesForUser(char *requested_user, char *new_emailaddrs) {
1623         struct ctdluser usbuf;
1624         int i;
1625         char buf[SIZ];
1626
1627         if (CtdlGetUserLock(&usbuf, requested_user) != 0) {     // We can lock because the DirectoryIndex functions don't lock.
1628                 return;                                         // Silently fail here if the specified user does not exist.
1629         }
1630
1631         syslog(LOG_DEBUG, "internet_addressing: setting email addresses for <%s> to <%s>", usbuf.fullname, new_emailaddrs);
1632
1633         // Delete all of the existing directory index records for the user (easier this way)
1634         for (i=0; i<num_tokens(usbuf.emailaddrs, '|'); ++i) {
1635                 extract_token(buf, usbuf.emailaddrs, i, '|', sizeof buf);
1636                 CtdlDirectoryDelUser(buf, requested_user);
1637         }
1638
1639         strcpy(usbuf.emailaddrs, new_emailaddrs);               // make it official.
1640
1641         // Index all of the new email addresses (they've already been sanitized)
1642         for (i=0; i<num_tokens(usbuf.emailaddrs, '|'); ++i) {
1643                 extract_token(buf, usbuf.emailaddrs, i, '|', sizeof buf);
1644                 CtdlDirectoryAddUser(buf, requested_user);
1645         }
1646
1647         CtdlPutUserLock(&usbuf);
1648 }
1649
1650
1651 /*
1652  * Auto-generate an Internet email address for a user account
1653  */
1654 void AutoGenerateEmailAddressForUser(struct ctdluser *user) {
1655         char synthetic_email_addr[1024];
1656         int i, j;
1657         int u = 0;
1658
1659         for (i=0; u==0; ++i) {
1660                 if (i == 0) {
1661                         // first try just converting the user name to lowercase and replacing spaces with underscores
1662                         snprintf(synthetic_email_addr, sizeof synthetic_email_addr, "%s@%s", user->fullname, CtdlGetConfigStr("c_fqdn"));
1663                         for (j=0; ((synthetic_email_addr[j] != '\0')&&(synthetic_email_addr[j] != '@')); j++) {
1664                                 synthetic_email_addr[j] = tolower(synthetic_email_addr[j]);
1665                                 if (!isalnum(synthetic_email_addr[j])) {
1666                                         synthetic_email_addr[j] = '_';
1667                                 }
1668                         }
1669                 }
1670                 else if (i == 1) {
1671                         // then try 'ctdl' followed by the user number
1672                         snprintf(synthetic_email_addr, sizeof synthetic_email_addr, "ctdl%08lx@%s", user->usernum, CtdlGetConfigStr("c_fqdn"));
1673                 }
1674                 else if (i > 1) {
1675                         // oof.  just keep trying other numbers until we find one
1676                         snprintf(synthetic_email_addr, sizeof synthetic_email_addr, "ctdl%08x@%s", i, CtdlGetConfigStr("c_fqdn"));
1677                 }
1678                 u = CtdlDirectoryLookup(NULL, synthetic_email_addr, 0);
1679                 syslog(LOG_DEBUG, "user_ops: address <%s> lookup returned <%d>", synthetic_email_addr, u);
1680         }
1681
1682         CtdlSetEmailAddressesForUser(user->fullname, synthetic_email_addr);
1683         strncpy(CC->user.emailaddrs, synthetic_email_addr, sizeof(user->emailaddrs));
1684         syslog(LOG_DEBUG, "user_ops: auto-generated email address <%s> for <%s>", synthetic_email_addr, user->fullname);
1685 }
1686
1687
1688 // Determine whether the supplied email address is subscribed to the supplied room's mailing list service.
1689 int is_email_subscribed_to_list(char *email, char *room_name) {
1690         struct ctdlroom room;
1691         long roomnum;
1692         char *roomnetconfig;
1693         int found_it = 0;
1694
1695         if (CtdlGetRoom(&room, room_name)) {
1696                 return(0);                                      // room not found, so definitely not subscribed
1697         }
1698
1699         // If this room has the QR2_SMTP_PUBLIC flag set, anyone may email a post to this room, even non-subscribers.
1700         if (room.QRflags2 & QR2_SMTP_PUBLIC) {
1701                 return(1);
1702         }
1703
1704         roomnum = room.QRnumber;
1705         roomnetconfig = LoadRoomNetConfigFile(roomnum);
1706         if (roomnetconfig == NULL) {
1707                 return(0);
1708         }
1709
1710         // We're going to do a very sloppy match here and simply search for the specified email address
1711         // anywhere in the room's netconfig.  If you don't like this, fix it yourself.
1712         if (bmstrcasestr(roomnetconfig, email)) {
1713                 found_it = 1;
1714         }
1715         else {
1716                 found_it = 0;
1717         }
1718
1719         free(roomnetconfig);
1720         return(found_it);
1721 }