#include <stdarg.h>
#include <pthread.h>
#include <signal.h>
+
+#ifdef HAVE_ICONV
+#include <iconv.h>
+#endif
+
#include "webcit.h"
#include "vcard.h"
#include "webserver.h"
/*
+ * Sanitize and enhance an HTML message for display.
+ * Also convert weird character sets to UTF-8 if necessary.
*/
/*
 * NOTE(review): this text is a diff fragment, not plain C.  Lines starting
 * with '+' are additions and lines starting with '-' are removals.  Some
 * unchanged context appears to be elided, so parts of the function body
 * (for example the code that appends each line to msg) are not visible.
 *
 * What the added lines show:
 *   - charset is compared case-insensitively with "us-ascii" and "UTF-8";
 *     for anything else it is handed to iconv_open() as the source
 *     encoding, with "UTF-8" as the destination (HAVE_ICONV builds only).
 *   - The message text in msg is then copied into converted_msg while
 *     rewriting mailto: anchors, adding a TARGET to other anchors, and
 *     wrapping bare http:// URLs in anchors.
 *   - The result is sent with client_write(), followed by a wprintf() of
 *     two line breaks; nothing is returned.
 *
 * NOTE(review): charset is passed to strcasecmp() without a NULL check;
 * presumably callers always supply a string -- confirm.
 */
-void output_html(void) {
+void output_html(char *charset) {
char buf[SIZ];
char *msg;
char *ptr;
char *msgstart;
char *msgend;
+ char *converted_msg;
int buffer_length = 1;
int line_length = 0;
int content_length = 0;
+ int output_length = 0;
+ char new_window[SIZ];
+ int brak = 0;
+ int alevel = 0;
+ int i;
+ int linklen;
+#ifdef HAVE_ICONV
+ iconv_t ic = (iconv_t)(-1) ;
+ char *ibuf; /* Buffer of characters to be converted */
+ char *obuf; /* Buffer for converted characters */
+ size_t ibuflen; /* Length of input buffer */
+ size_t obuflen; /* Length of output buffer */
+ char *osav; /* Saved pointer to output buffer */
+#endif
msg = strdup("");
/*
 * new_window is the replacement opening for anchors; it embeds TARGET.
 * NOTE(review): this sprintf() is unbounded; it assumes TARGET fits in
 * SIZ bytes together with the fixed text -- confirm.
 */
+ sprintf(new_window, "<A TARGET=\"%s\" HREF=", TARGET);
/*
 * Read lines until one compares equal to "000".  For every line, msg is
 * resized to the current content length plus the line length plus 2.
 */
- while (serv_gets(buf), strcmp(buf, "000")) {
+ while (serv_getln(buf, sizeof buf), strcmp(buf, "000")) {
line_length = strlen(buf);
buffer_length = content_length + line_length + 2;
/*
 * NOTE(review): assigning realloc()'s result straight back to msg loses
 * the old buffer when it fails.  The error text below also reports
 * buffer_length + 1 although buffer_length bytes were requested.
 */
msg = realloc(msg, buffer_length);
if (msg == NULL) {
wprintf("<B>realloc() error! "
- "couldn't get %d bytes: %s</B><BR><BR>\n",
+ "couldn't get %d bytes: %s</B><br /><br />\n",
buffer_length + 1,
strerror(errno));
return;
/*
 * NOTE(review): the two lines below cannot directly follow the return
 * above in the real file; context between them appears to be elided.
 */
content_length += 1;
}
+#ifdef HAVE_ICONV
/* Open a converter only when charset is neither us-ascii nor UTF-8. */
+ if ( (strcasecmp(charset, "us-ascii"))
+ && (strcasecmp(charset, "UTF-8")) ) {
+ ic = iconv_open("UTF-8", charset);
+ if (ic == (iconv_t)(-1) ) {
+ lprintf(5, "iconv_open() failed: %s\n", strerror(errno));
+ }
+ }
/*
 * Convert msg into a new buffer sized at 1.5 times the input, then swap
 * the converted buffer in for msg and recompute content_length from the
 * space iconv() left unused.
 *
 * NOTE(review): malloc() and iconv() results are not checked, so a failed
 * allocation is dereferenced and an incomplete conversion goes unnoticed.
 * If iconv() uses the whole output buffer (obuflen ends at 0), the
 * terminator written through osav[content_length] lands one byte past
 * the allocation.
 */
+ if (ic != (iconv_t)(-1) ) {
+ ibuf = msg;
+ ibuflen = content_length;
+ obuflen = content_length + (content_length / 2) ;
+ obuf = (char *) malloc(obuflen);
+ osav = obuf;
+ iconv(ic, &ibuf, &ibuflen, &obuf, &obuflen);
+ content_length = content_length + (content_length / 2) - obuflen;
+ osav[content_length] = 0;
+ free(msg);
+ msg = osav;
+ iconv_close(ic);
+ }
+#endif
+
/* msgstart/msgend delimit the text that the rewrite loop below walks. */
ptr = msg;
msgstart = msg;
msgend = &msg[content_length];
/*
 * NOTE(review): the increment and closing brace below look like the tail
 * of a loop whose head is not part of this fragment.
 */
++ptr;
}
- write(WC->http_sock, msgstart, strlen(msgstart));
/*
 * Start the output buffer as an empty string of capacity content_length.
 *
 * NOTE(review): malloc() is not checked, and when content_length is 0 the
 * strcpy() still writes one terminator byte.  The plain-copy branch of the
 * loop never grows the buffer, yet it writes a terminator after every
 * character; for a message without links the final terminator is stored
 * at index content_length, one past this allocation.
 */
+ converted_msg = malloc(content_length);
+ strcpy(converted_msg, "");
+ ptr = msgstart;
+ while (ptr < msgend) {
+ /* Change mailto: links to WebCit mail, by replacing the
+ * link with one that points back to our mail room. Due to
+ * the way we parse URL's, it'll even handle mailto: links
+ * that have "?subject=" in them.
+ */
/*
 * 16 is the length of the matched prefix and 47 the length of the
 * replacement text; the buffer is grown by 64 bytes to make room.
 * NOTE(review): realloc() is unchecked here and in the branches below.
 */
+ if (!strncasecmp(ptr, "<A HREF=\"mailto:", 16)) {
+ content_length += 64;
+ converted_msg = realloc(converted_msg, content_length);
+ sprintf(&converted_msg[output_length],
+ "<A HREF=\"/display_enter"
+ "?force_room=_MAIL_&recp=");
+ output_length += 47;
+ ptr = &ptr[16];
+ ++alevel;
+ }
+ /* Make links open in a separate window */
/*
 * The 8 matched characters are replaced by new_window.
 * NOTE(review): new_window is used as the sprintf() format string, so a
 * '%' inside TARGET would be interpreted as a conversion -- confirm
 * TARGET never contains one, or pass it through "%s".
 */
+ else if (!strncasecmp(ptr, "<A HREF=", 8)) {
+ content_length += 64;
+ converted_msg = realloc(converted_msg, content_length);
+ sprintf(&converted_msg[output_length], new_window);
+ output_length += strlen(new_window);
+ ptr = &ptr[8];
+ ++alevel;
+ }
+ /* Turn anything that looks like a URL into a real link, as long
+ * as it's not inside a tag already
+ */
+ else if ( (brak == 0) && (alevel == 0)
+ && (!strncasecmp(ptr, "http://", 7))) {
+ linklen = 0;
+ /* Find the end of the link */
/*
 * The scan stops at the first terminator character, including the
 * string's own NUL, so linklen ends up greater than zero whenever this
 * branch is entered.
 * NOTE(review): strlen(ptr) is re-evaluated on every iteration, and
 * isspace() receives a plain char, which is undefined for negative
 * values.
 */
+ for (i=0; i<=strlen(ptr); ++i) {
+ if ((ptr[i]==0)
+ ||(isspace(ptr[i]))
+ ||(ptr[i]==10)
+ ||(ptr[i]==13)
+ ||(ptr[i]=='(')
+ ||(ptr[i]==')')
+ ||(ptr[i]=='<')
+ ||(ptr[i]=='>')
+ ||(ptr[i]=='[')
+ ||(ptr[i]==']')
+ ) linklen = i;
+ if (linklen > 0) break;
+ }
/*
 * Emit: new_window, a quote, the URL, a quote and '>', the URL again as
 * the link text, then the closing tag.  Only the second copy advances
 * ptr.
 * NOTE(review): the buffer grows by 32 + linklen, while the bytes added
 * beyond the original text are strlen(new_window) + 7 + linklen; whether
 * that fits depends on the length of TARGET, which is not visible here.
 */
+ if (linklen > 0) {
+ content_length += (32 + linklen);
+ converted_msg = realloc(converted_msg, content_length);
+ sprintf(&converted_msg[output_length], new_window);
+ output_length += strlen(new_window);
+ converted_msg[output_length] = '\"';
+ converted_msg[++output_length] = 0;
+ for (i=0; i<linklen; ++i) {
+ converted_msg[output_length] = ptr[i];
+ converted_msg[++output_length] = 0;
+ }
+ sprintf(&converted_msg[output_length], "\">");
+ output_length += 2;
+ for (i=0; i<linklen; ++i) {
+ converted_msg[output_length] = *ptr++;
+ converted_msg[++output_length] = 0;
+ }
+ sprintf(&converted_msg[output_length], "</A>");
+ output_length += 4;
+ }
+ }
+ else {
+ /*
+ * We need to know when we're inside a tag,
+ * so we don't turn things that look like URL's into
+ * links, when they're already links - or image sources.
+ */
/*
 * brak counts '<' minus '>' seen in this branch; alevel drops when the
 * next three characters match "</A" (the '>' is not compared).
 * NOTE(review): the two anchor branches above skip the opening '<'
 * without incrementing brak, but the tag's closing '>' still decrements
 * it here.  After a rewritten anchor brak is negative, so the
 * (brak == 0) test for bare URLs no longer succeeds.
 */
+ if (*ptr == '<') ++brak;
+ if (*ptr == '>') --brak;
+ if (!strncasecmp(ptr, "</A>", 3)) --alevel;
+ converted_msg[output_length] = *ptr++;
+ converted_msg[++output_length] = 0;
+ }
+ }
+
+ /* Output our big pile of markup */
+ client_write(converted_msg, output_length);
/* A little trailing vertical whitespace... */
- wprintf("<BR><BR>\n");
+ wprintf("<br /><br />\n");
/* Now give back the memory */
+ free(converted_msg);
free(msg);
-
}