X-Git-Url: https://code.citadel.org/?a=blobdiff_plain;f=webcit%2Fcontext_loop.c;h=3b1f30ae3969d7cb80d1a7fc654b7d5e9e6bf2d0;hb=f7b538d716fc80c12ab49d3ca8c4eb48a5c51eb2;hp=208521386eb318cefe76e92a27da39b1a5a6462c;hpb=27e6a22f021cffe2cee1a41accbf9d2f78b20dab;p=citadel.git diff --git a/webcit/context_loop.c b/webcit/context_loop.c index 208521386..3b1f30ae3 100644 --- a/webcit/context_loop.c +++ b/webcit/context_loop.c @@ -1,11 +1,24 @@ /* - * $Id$ - * * This is the other half of the webserver. It handles the task of hooking * up HTTP requests with the sessions they belong to, using HTTP cookies to * keep track of things. If the HTTP request doesn't belong to any currently * active session, a new session is started. * + * Copyright (c) 1996-2011 by the citadel.org team + * + * This program is open source software. You can redistribute it and/or + * modify it under the terms of the GNU General Public License as + * published by the Free Software Foundation; either version 3 of the + * License, or (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program; if not, write to the Free Software + * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */ #include "webcit.h" @@ -15,31 +28,27 @@ /* Only one thread may manipulate SessionList at a time... */ pthread_mutex_t SessionListMutex; -wcsession *SessionList = NULL; /**< our sessions ????*/ +wcsession *SessionList = NULL; /* Linked list of all webcit sessions */ -pthread_key_t MyConKey; /**< TSD key for MySession() */ +pthread_key_t MyConKey; /* TSD key for MySession() */ +HashList *HttpReqTypes = NULL; +HashList *HttpHeaderHandler = NULL; +extern HashList *HandlerHash; +/* the following two values start at 1 because the initial parent thread counts as one. */ +int num_threads_existing = 1; /* Number of worker threads which exist. */ +int num_threads_executing = 1; /* Number of worker threads currently executing. */ +extern void session_loop(void); +void spawn_another_worker_thread(void); -void DestroySession(wcsession **sessions_to_kill) -{ - close((*sessions_to_kill)->serv_sock); - close((*sessions_to_kill)->chat_sock); -/* -// if ((*sessions_to_kill)->preferences != NULL) { -// free((*sessions_to_kill)->preferences); -// } -*/ - if ((*sessions_to_kill)->cache_fold != NULL) { - free((*sessions_to_kill)->cache_fold); - } - DeleteServInfo(&((*sessions_to_kill)->serv_info)); - free_march_list((*sessions_to_kill)); - - session_destroy_modules(*sessions_to_kill); - free((*sessions_to_kill)); - (*sessions_to_kill) = NULL; +void DestroyHttpHeaderHandler(void *V) +{ + OneHttpHeader *pHdr; + pHdr = (OneHttpHeader*) V; + FreeStrBuf(&pHdr->Val); + free(pHdr); } void shutdown_sessions(void) @@ -55,28 +64,24 @@ void do_housekeeping(void) { wcsession *sptr, *ss; wcsession *sessions_to_kill = NULL; - int num_sessions = 0; - static int num_threads = MIN_WORKER_THREADS; - /** + /* * Lock the session list, moving any candidates for euthanasia into * a separate list. */ - pthread_mutex_lock(&SessionListMutex); - num_sessions = 0; + CtdlLogResult(pthread_mutex_lock(&SessionListMutex)); for (sptr = SessionList; sptr != NULL; sptr = sptr->next) { - ++num_sessions; - /** Kill idle sessions */ - if ((time(NULL) - (sptr->lastreq)) > - (time_t) WEBCIT_TIMEOUT) { + /* Kill idle sessions */ + if ((time(NULL) - (sptr->lastreq)) > (time_t) WEBCIT_TIMEOUT) { + syslog(3, "Timeout session %d\n", sptr->wc_session); sptr->killthis = 1; } - /** Remove sessions flagged for kill */ + /* Remove sessions flagged for kill */ if (sptr->killthis) { - /** remove session from linked list */ + /* remove session from linked list */ if (sptr == SessionList) { SessionList = SessionList->next; } @@ -90,33 +95,38 @@ void do_housekeeping(void) sessions_to_kill = sptr; } } - pthread_mutex_unlock(&SessionListMutex); + CtdlLogResult(pthread_mutex_unlock(&SessionListMutex)); - /** + /* * Now free up and destroy the culled sessions. */ while (sessions_to_kill != NULL) { - lprintf(3, "Destroying session %d\n", sessions_to_kill->wc_session); - pthread_mutex_lock(&sessions_to_kill->SessionMutex); - pthread_mutex_unlock(&sessions_to_kill->SessionMutex); + syslog(3, "Destroying session %d\n", sessions_to_kill->wc_session); sptr = sessions_to_kill->next; - - DestroySession(&sessions_to_kill); + session_destroy_modules(&sessions_to_kill); sessions_to_kill = sptr; - --num_sessions; } +} - /** - * If there are more sessions than threads, then we should spawn - * more threads ... up to a predefined maximum. - */ - while ( (num_sessions > num_threads) - && (num_threads <= MAX_WORKER_THREADS) ) { +/* + * Check the size of our thread pool. If all threads are executing, spawn another. + */ +void check_thread_pool_size(void) +{ + if (time_to_die) return; /* don't expand the thread pool during shutdown */ + + begin_critical_section(S_SPAWNER); /* only one of these should run at a time */ + if ( + (num_threads_executing >= num_threads_existing) + && (num_threads_existing < MAX_WORKER_THREADS) + ) { + syslog(3, "%d of %d threads are executing. Adding another worker thread.\n", + num_threads_executing, + num_threads_existing + ); spawn_another_worker_thread(); - ++num_threads; - lprintf(3, "There are %d sessions and %d threads active.\n", - num_sessions, num_threads); } + end_critical_section(S_SPAWNER); } @@ -148,141 +158,257 @@ int GenerateSessionID(void) return ++seq; } - -/* - * lingering_close() a`la Apache. see - * http://www.apache.org/docs/misc/fin_wait_2.html for rationale - */ -int lingering_close(int fd) +wcsession *FindSession(wcsession **wclist, ParsedHttpHdrs *Hdr, pthread_mutex_t *ListMutex) { - char buf[SIZ]; - int i; - fd_set set; - struct timeval tv, start; + wcsession *sptr = NULL; + wcsession *TheSession = NULL; + + if (Hdr->HR.got_auth == AUTH_BASIC) { + GetAuthBasic(Hdr); + } - gettimeofday(&start, NULL); - shutdown(fd, 1); - do { - do { - gettimeofday(&tv, NULL); - tv.tv_sec = SLEEPING - (tv.tv_sec - start.tv_sec); - tv.tv_usec = start.tv_usec - tv.tv_usec; - if (tv.tv_usec < 0) { - tv.tv_sec--; - tv.tv_usec += 1000000; + CtdlLogResult(pthread_mutex_lock(ListMutex)); + for (sptr = *wclist; ((sptr != NULL) && (TheSession == NULL)); sptr = sptr->next) { + + /* If HTTP-AUTH, look for a session with matching credentials */ + switch (Hdr->HR.got_auth) + { + case AUTH_BASIC: + if ( (Hdr->HR.SessionKey != sptr->SessionKey)) + continue; + if ((!strcasecmp(ChrPtr(Hdr->c_username), ChrPtr(sptr->wc_username))) && + (!strcasecmp(ChrPtr(Hdr->c_password), ChrPtr(sptr->wc_password))) ) { + syslog(LOG_DEBUG, "-- matched a session with the same http-auth"); + TheSession = sptr; + } + if (TheSession == NULL) + syslog(1, "found sessionkey [%d], but credentials for [%s|%s] didn't match", + Hdr->HR.SessionKey, + ChrPtr(Hdr->c_username), + ChrPtr(sptr->wc_username) + ); + break; + case AUTH_COOKIE: + /* If cookie-session, look for a session with matching session ID */ + if ( (Hdr->HR.desired_session != 0) && + (sptr->wc_session == Hdr->HR.desired_session)) + { + syslog(LOG_DEBUG, "-- matched a session with the same cookie"); + TheSession = sptr; + } + break; + case NO_AUTH: + /* Any unbound session is a candidate */ + if ( (sptr->wc_session == 0) && (sptr->inuse == 0) ) { + syslog(LOG_DEBUG, "-- reusing an unbound session"); + TheSession = sptr; } - FD_ZERO(&set); - FD_SET(fd, &set); - i = select(fd + 1, &set, NULL, NULL, &tv); - } while (i == -1 && errno == EINTR); - - if (i <= 0) break; + } + } + CtdlLogResult(pthread_mutex_unlock(ListMutex)); + if (TheSession == NULL) { + syslog(1, "didn't find sessionkey [%d] for user [%s]", + Hdr->HR.SessionKey, ChrPtr(Hdr->c_username) + ); + } + return TheSession; +} - i = read(fd, buf, sizeof buf); - } while (i != 0 && (i != -1 || errno == EINTR)); +wcsession *CreateSession(int Lockable, int Static, wcsession **wclist, ParsedHttpHdrs *Hdr, pthread_mutex_t *ListMutex) +{ + wcsession *TheSession; + TheSession = (wcsession *) malloc(sizeof(wcsession)); + memset(TheSession, 0, sizeof(wcsession)); + TheSession->Hdr = Hdr; + TheSession->SessionKey = Hdr->HR.SessionKey; + TheSession->serv_sock = (-1); - return close(fd); -} + pthread_setspecific(MyConKey, (void *)TheSession); + + /* If we're recreating a session that expired, it's best to give it the same + * session number that it had before. The client browser ought to pick up + * the new session number and start using it, but in some rare situations it + * doesn't, and that's a Bad Thing because it causes lots of spurious sessions + * to get created. + */ + if (Hdr->HR.desired_session == 0) { + TheSession->wc_session = GenerateSessionID(); + syslog(3, "Created new session %d", TheSession->wc_session); + } + else { + TheSession->wc_session = Hdr->HR.desired_session; + syslog(3, "Re-created session %d", TheSession->wc_session); + } + Hdr->HR.Static = Static; + session_new_modules(TheSession); + if (Lockable) { + pthread_mutex_init(&TheSession->SessionMutex, NULL); + if (ListMutex != NULL) + CtdlLogResult(pthread_mutex_lock(ListMutex)); -/* - * Look for commonly-found probes of malware such as worms, viruses, trojans, and Microsoft Office. - * Short-circuit these requests so we don't have to send them through the full processing loop. - */ -int is_bogus(StrBuf *http_cmd) { - const char *url; - int i, max; - const char *bogus_prefixes[] = { - "/scripts/root.exe", /* Worms and trojans and viruses, oh my! */ - "/c/winnt", - "/MSADC/", - "/_vti", /* Broken Microsoft DAV implementation */ - "/MSOffice", /* Stoopid MSOffice thinks everyone is IIS */ - "/nonexistenshit" /* Exploit found in the wild January 2009 */ - }; - - url = ChrPtr(http_cmd); - if (IsEmptyStr(url)) return(1); - ++url; - - max = sizeof(bogus_prefixes) / sizeof(char *); - - for (i=0; inonce = rand(); + TheSession->next = *wclist; + *wclist = TheSession; } + if (ListMutex != NULL) + CtdlLogResult(pthread_mutex_unlock(ListMutex)); + } + return TheSession; +} + + +/* If it's a "force 404" situation then display the error and bail. */ +void do_404(void) +{ + hprintf("HTTP/1.1 404 Not found\r\n"); + hprintf("Content-Type: text/plain\r\n"); + wc_printf("Not found\r\n"); + end_burst(); +} + +int ReadHttpSubject(ParsedHttpHdrs *Hdr, StrBuf *Line, StrBuf *Buf) +{ + const char *Args; + void *vLine, *vHandler; + const char *Pos = NULL; + + + Hdr->HR.ReqLine = Line; + /* The requesttype... GET, POST... */ + StrBufExtract_token(Buf, Hdr->HR.ReqLine, 0, ' '); + if (GetHash(HttpReqTypes, SKEY(Buf), &vLine) && + (vLine != NULL)) + { + Hdr->HR.eReqType = *(long*)vLine; + } + else { + Hdr->HR.eReqType = eGET; + return 1; + } + StrBufCutLeft(Hdr->HR.ReqLine, StrLength(Buf) + 1); + + /* the HTTP Version... */ + StrBufExtract_token(Buf, Hdr->HR.ReqLine, 1, ' '); + StrBufCutRight(Hdr->HR.ReqLine, StrLength(Buf) + 1); + + if (StrLength(Buf) == 0) { + Hdr->HR.eReqType = eGET; + return 1; + } + + StrBufAppendBuf(Hdr->this_page, Hdr->HR.ReqLine, 0); + + /* chop Filename / query arguments */ + Args = strchr(ChrPtr(Hdr->HR.ReqLine), '?'); + if (Args == NULL) /* whe're not that picky about params... TODO: this will spoil '&' in filenames.*/ + Args = strchr(ChrPtr(Hdr->HR.ReqLine), '&'); + if (Args != NULL) { + Args ++; /* skip the ? */ + StrBufPlain(Hdr->PlainArgs, + Args, + StrLength(Hdr->HR.ReqLine) - + (Args - ChrPtr(Hdr->HR.ReqLine))); + StrBufCutAt(Hdr->HR.ReqLine, 0, Args - 1); + } /* don't parse them yet, maybe we don't even care... */ + + /* now lookup what we are going to do with this... */ + /* skip first slash */ + StrBufExtract_NextToken(Buf, Hdr->HR.ReqLine, &Pos, '/'); + do { + StrBufExtract_NextToken(Buf, Hdr->HR.ReqLine, &Pos, '/'); + + GetHash(HandlerHash, SKEY(Buf), &vHandler), + Hdr->HR.Handler = (WebcitHandler*) vHandler; + if (Hdr->HR.Handler == NULL) + break; + /* + * If the request is prefixed by "/webcit" then chop that off. This + * allows a front end web server to forward all /webcit requests to us + * while still using the same web server port for other things. + */ + if ((Hdr->HR.Handler->Flags & URLNAMESPACE) != 0) + continue; + break; + } while (1); + /* remove the handlername from the URL */ + if ((Pos != NULL) && (Pos != StrBufNOTNULL)){ + StrBufCutLeft(Hdr->HR.ReqLine, + Pos - ChrPtr(Hdr->HR.ReqLine)); } - return(0); /* probably ok */ + if (Hdr->HR.Handler != NULL) { + if ((Hdr->HR.Handler->Flags & BOGUS) != 0) + return 1; + Hdr->HR.DontNeedAuth = ( + ((Hdr->HR.Handler->Flags & ISSTATIC) != 0) || + ((Hdr->HR.Handler->Flags & ANONYMOUS) != 0) + ); + } + else { + Hdr->HR.DontNeedAuth = 1; /* Flat request? show him the login screen... */ + } + + return 0; } +int AnalyseHeaders(ParsedHttpHdrs *Hdr) +{ + OneHttpHeader *pHdr; + void *vHdr; + long HKLen; + const char *HashKey; + HashPos *at = GetNewHashPos(Hdr->HTTPHeaders, 0); + + while (GetNextHashPos(Hdr->HTTPHeaders, at, &HKLen, &HashKey, &vHdr) && + (vHdr != NULL)) { + pHdr = (OneHttpHeader *)vHdr; + if (pHdr->HaveEvaluator) + pHdr->H(pHdr->Val, Hdr); + + } + DeleteHashPos(&at); + return 0; +} /*const char *nix(void *vptr) {return ChrPtr( (StrBuf*)vptr);}*/ /* - * handle one request - * - * This loop gets called once for every HTTP connection made to WebCit. At - * this entry point we have an HTTP socket with a browser allegedly on the - * other end, but we have not yet bound to a WebCit session. - * - * The job of this function is to locate the correct session and bind to it, - * or create a session if necessary and bind to it, then run the WebCit - * transaction loop. Afterwards, we unbind from the session. When this - * function returns, the worker thread is then free to handle another - * transaction. + * Read in the request */ -void context_loop(int *sock) +int ReadHTTPRequest (ParsedHttpHdrs *Hdr) { - const char *Pos = NULL; - const char *buf; - int desired_session = 0; - int got_cookie = 0; - int gzip_ok = 0; - wcsession *TheSession, *sptr; - char httpauth_string[1024]; - char httpauth_user[1024]; - char httpauth_pass[1024]; - int session_is_new = 0; - int nLine = 0; - int LineLen; - void *vLine; - StrBuf *Buf, *Line, *LastLine, *HeaderName, *ReqLine, *ReqType, *HTTPVersion; const char *pch, *pchs, *pche; - HashList *HTTPHeaders; - - strcpy(httpauth_string, ""); - strcpy(httpauth_user, DEFAULT_HTTPAUTH_USER); - strcpy(httpauth_pass, DEFAULT_HTTPAUTH_PASS); + OneHttpHeader *pHdr; + StrBuf *Line, *LastLine, *HeaderName; + int nLine = 0; + void *vF; + int isbogus = 0; - /* - * Find out what it is that the web browser is asking for - */ HeaderName = NewStrBuf(); - Buf = NewStrBuf(); LastLine = NULL; - HTTPHeaders = NewHash(1, NULL); - - /* - * Read in the request - */ do { nLine ++; - Line = NewStrBuf(); - + Line = NewStrBufPlain(NULL, SIZ / 4); - if (ClientGetLine(sock, Line, Buf, &Pos) < 0) return; + if (ClientGetLine(Hdr, Line) < 0) return 1; - LineLen = StrLength(Line); - - if (nLine == 1) { - ReqLine = Line; + if (StrLength(Line) == 0) { + FreeStrBuf(&Line); continue; } - if (LineLen == 0) { - FreeStrBuf(&Line); + if (nLine == 1) { + Hdr->HTTPHeaders = NewHash(1, NULL); + pHdr = (OneHttpHeader*) malloc(sizeof(OneHttpHeader)); + memset(pHdr, 0, sizeof(OneHttpHeader)); + pHdr->Val = Line; + Put(Hdr->HTTPHeaders, HKEY("GET /"), pHdr, DestroyHttpHeaderHandler); + syslog(9, "%s\n", ChrPtr(Line)); + isbogus = ReadHttpSubject(Hdr, Line, HeaderName); + if (isbogus) break; continue; } @@ -295,6 +421,7 @@ void context_loop(int *sock) pch ++; StrBufCutLeft(Line, pch - pchs); StrBufAppendBuf(LastLine, Line, 0); + FreeStrBuf(&Line); continue; } @@ -303,206 +430,158 @@ void context_loop(int *sock) StrBufExtract_token(HeaderName, Line, 0, ':'); pchs = ChrPtr(Line); + pche = pchs + StrLength(Line); pch = pchs + StrLength(HeaderName) + 1; pche = pchs + StrLength(Line); - while (isspace(*pch) && (pch < pche)) + while ((pch < pche) && isspace(*pch)) pch ++; StrBufCutLeft(Line, pch - pchs); StrBufUpCase(HeaderName); - Put(HTTPHeaders, SKEY(HeaderName), Line, HFreeStrBuf); + + pHdr = (OneHttpHeader*) malloc(sizeof(OneHttpHeader)); + memset(pHdr, 0, sizeof(OneHttpHeader)); + pHdr->Val = Line; + + if (GetHash(HttpHeaderHandler, SKEY(HeaderName), &vF) && + (vF != NULL)) + { + OneHttpHeader *FHdr = (OneHttpHeader*) vF; + pHdr->H = FHdr->H; + pHdr->HaveEvaluator = 1; + } + Put(Hdr->HTTPHeaders, SKEY(HeaderName), pHdr, DestroyHttpHeaderHandler); LastLine = Line; - } while (LineLen > 0); + } while (Line != NULL); + FreeStrBuf(&HeaderName); -/* dbg_PrintHash(HTTPHeaders, nix, NULL); */ + return isbogus; +} +void OverrideRequest(ParsedHttpHdrs *Hdr, const char *Line, long len) +{ + StrBuf *Buf = NewStrBuf(); - /* - * Can we compress? - */ - if (GetHash(HTTPHeaders, HKEY("ACCEPT-ENCODING"), &vLine) && - (vLine != NULL)) { - buf = ChrPtr((StrBuf*)vLine); - if (strstr(&buf[16], "gzip")) { - gzip_ok = 1; - } + if (Hdr->HR.ReqLine != NULL) { + FlushStrBuf(Hdr->HR.ReqLine); + StrBufPlain(Hdr->HR.ReqLine, Line, len); } - - /* - * Browser-based sessions use cookies for session authentication - */ - if (GetHash(HTTPHeaders, HKEY("COOKIE"), &vLine) && - (vLine != NULL)) { - cookie_to_stuff(vLine, &desired_session, - NULL, NULL, NULL); - got_cookie = 1; + else { + Hdr->HR.ReqLine = NewStrBufPlain(Line, len); } + ReadHttpSubject(Hdr, Hdr->HR.ReqLine, Buf); + + FreeStrBuf(&Buf); +} + +/* + * handle one request + * + * This loop gets called once for every HTTP connection made to WebCit. At + * this entry point we have an HTTP socket with a browser allegedly on the + * other end, but we have not yet bound to a WebCit session. + * + * The job of this function is to locate the correct session and bind to it, + * or create a session if necessary and bind to it, then run the WebCit + * transaction loop. Afterwards, we unbind from the session. When this + * function returns, the worker thread is then free to handle another + * transaction. + */ +void context_loop(ParsedHttpHdrs *Hdr) +{ + int isbogus = 0; + wcsession *TheSession; + struct timeval tx_start; + struct timeval tx_finish; + int session_may_be_reused = 1; + + gettimeofday(&tx_start, NULL); /* start a stopwatch for performance timing */ /* - * GroupDAV-based sessions use HTTP authentication + * Find out what it is that the web browser is asking for */ - if (GetHash(HTTPHeaders, HKEY("AUTHORIZATION"), &vLine) && - (vLine != NULL)) { - Line = (StrBuf*)vLine; - if (strncasecmp(ChrPtr(Line), "Basic", 5) == 0) { - StrBufCutLeft(Line, 6); - CtdlDecodeBase64(httpauth_string, ChrPtr(Line), StrLength(Line)); - extract_token(httpauth_user, httpauth_string, 0, ':', sizeof httpauth_user); - extract_token(httpauth_pass, httpauth_string, 1, ':', sizeof httpauth_pass); - } - else - lprintf(1, "Authentication scheme not supported! [%s]\n", ChrPtr(Line)); + isbogus = ReadHTTPRequest(Hdr); + + Hdr->HR.dav_depth = 32767; /* TODO: find a general way to have non-0 defaults */ + + if (!isbogus) { + isbogus = AnalyseHeaders(Hdr); } - if (GetHash(HTTPHeaders, HKEY("IF-MODIFIED-SINCE"), &vLine) && - (vLine != NULL)) { - if_modified_since = httpdate_to_timestamp((StrBuf*)vLine); + if ( (isbogus) + || ((Hdr->HR.Handler != NULL) + && ((Hdr->HR.Handler->Flags & BOGUS) != 0)) + ) { + wcsession *Bogus; + Bogus = CreateSession(0, 1, NULL, Hdr, NULL); + do_404(); + syslog(9, "HTTP: 404 [%ld.%06ld] %s %s \n", + ((tx_finish.tv_sec*1000000 + tx_finish.tv_usec) - (tx_start.tv_sec*1000000 + tx_start.tv_usec)) / 1000000, + ((tx_finish.tv_sec*1000000 + tx_finish.tv_usec) - (tx_start.tv_sec*1000000 + tx_start.tv_usec)) % 1000000, + ReqStrs[Hdr->HR.eReqType], + ChrPtr(Hdr->this_page) + ); + session_detach_modules(Bogus); + session_destroy_modules(&Bogus); + return; } + if ((Hdr->HR.Handler != NULL) && ((Hdr->HR.Handler->Flags & ISSTATIC) != 0)) + { + wcsession *Static; + Static = CreateSession(0, 1, NULL, Hdr, NULL); + + Hdr->HR.Handler->F(); + /* How long did this transaction take? */ + gettimeofday(&tx_finish, NULL); + + syslog(9, "HTTP: 200 [%ld.%06ld] %s %s \n", + ((tx_finish.tv_sec*1000000 + tx_finish.tv_usec) - (tx_start.tv_sec*1000000 + tx_start.tv_usec)) / 1000000, + ((tx_finish.tv_sec*1000000 + tx_finish.tv_usec) - (tx_start.tv_sec*1000000 + tx_start.tv_usec)) % 1000000, + ReqStrs[Hdr->HR.eReqType], + ChrPtr(Hdr->this_page) + ); + session_detach_modules(Static); + session_destroy_modules(&Static); + return; + } + + if (Hdr->HR.got_auth == AUTH_BASIC) { + CheckAuthBasic(Hdr); + } - ReqType = NewStrBuf(); - HTTPVersion = NewStrBuf(); - StrBufExtract_token(HTTPVersion, ReqLine, 2, ' '); - StrBufExtract_token(ReqType, ReqLine, 0, ' '); - StrBufCutLeft(ReqLine, StrLength(ReqType) + 1); - StrBufCutRight(ReqLine, StrLength(HTTPVersion) + 1); + if (Hdr->HR.got_auth) { + session_may_be_reused = 0; + } /* - * If the request is prefixed by "/webcit" then chop that off. This - * allows a front end web server to forward all /webcit requests to us - * while still using the same web server port for other things. - */ - if ( (StrLength(ReqLine) >= 8) && (strstr(ChrPtr(ReqLine), "/webcit/")) ) { - StrBufCutLeft(ReqLine, 7); - } - - /* Begin parsing the request. */ -#ifdef TECH_PREVIEW - if ((strncmp(ChrPtr(ReqLine), "/sslg", 5) != 0) && - (strncmp(ChrPtr(ReqLine), "/static/", 8) != 0) && - (strncmp(ChrPtr(ReqLine), "/tiny_mce/", 10) != 0) && - (strncmp(ChrPtr(ReqLine), "/wholist_section", 16) != 0) && - (strstr(ChrPtr(ReqLine), "wholist_section") == NULL)) { -#endif - lprintf(5, "HTTP: %s %s %s\n", ChrPtr(ReqType), ChrPtr(ReqLine), ChrPtr(HTTPVersion)); -#ifdef TECH_PREVIEW - } -#endif - - /** Check for bogus requests */ - if ((StrLength(HTTPVersion) == 0) || - (StrLength(ReqType) == 0) || - is_bogus(ReqLine)) { - StrBufPlain(ReqLine, HKEY("/404 HTTP/1.1")); - StrBufPlain(ReqType, HKEY("GET")); - } - FreeStrBuf(&HTTPVersion); - - /** - * While we're at it, gracefully handle requests for the - * robots.txt and favicon.ico files. - */ - if (!strncasecmp(ChrPtr(ReqLine), "/robots.txt", 11)) { - StrBufPlain(ReqLine, - HKEY("/static/robots.txt" - "?force_close_session=yes HTTP/1.1")); - StrBufPlain(ReqType, HKEY("GET")); - } - else if (!strncasecmp(ChrPtr(ReqLine), "/favicon.ico", 12)) { - StrBufPlain(ReqLine, HKEY("/static/favicon.ico")); - StrBufPlain(ReqType, HKEY("GET")); - } - - /** - * These are the URL's which may be executed without a - * session cookie already set. If it's not one of these, - * force the session to close because cookies are - * probably disabled on the client browser. - */ - else if ( (StrLength(ReqLine) > 1 ) - && (strncasecmp(ChrPtr(ReqLine), "/listsub", 8)) - && (strncasecmp(ChrPtr(ReqLine), "/freebusy", 9)) - && (strncasecmp(ChrPtr(ReqLine), "/do_logout", 10)) - && (strncasecmp(ChrPtr(ReqLine), "/groupdav", 9)) - && (strncasecmp(ChrPtr(ReqLine), "/static", 7)) - && (strncasecmp(ChrPtr(ReqLine), "/rss", 4)) - && (strncasecmp(ChrPtr(ReqLine), "/404", 4)) - && (got_cookie == 0)) { - StrBufPlain(ReqLine, - HKEY("/static/nocookies.html" - "?force_close_session=yes")); - } - - /** * See if there's an existing session open with the desired ID or user/pass */ - TheSession = NULL; + TheSession = FindSession(&SessionList, Hdr, &SessionListMutex); - if (TheSession == NULL) { - pthread_mutex_lock(&SessionListMutex); - for (sptr = SessionList; - ((sptr != NULL) && (TheSession == NULL)); - sptr = sptr->next) { - - /** If HTTP-AUTH, look for a session with matching credentials */ - if ( (!IsEmptyStr(httpauth_user)) - &&(!strcasecmp(ChrPtr(sptr->httpauth_user), httpauth_user)) - &&(!strcasecmp(ChrPtr(sptr->httpauth_pass), httpauth_pass)) ) { - TheSession = sptr; - } - - /** If cookie-session, look for a session with matching session ID */ - if ( (desired_session != 0) && (sptr->wc_session == desired_session)) { - TheSession = sptr; - } - - } - pthread_mutex_unlock(&SessionListMutex); - } - - /** + /* * Create a new session if we have to */ if (TheSession == NULL) { - lprintf(3, "Creating a new session\n"); - TheSession = (wcsession *) - malloc(sizeof(wcsession)); - memset(TheSession, 0, sizeof(wcsession)); - TheSession->headers = HTTPHeaders; - TheSession->serv_sock = (-1); - TheSession->chat_sock = (-1); - - /* If we're recreating a session that expired, it's best to give it the same - * session number that it had before. The client browser ought to pick up - * the new session number and start using it, but in some rare situations it - * doesn't, and that's a Bad Thing because it causes lots of spurious sessions - * to get created. - */ - if (desired_session == 0) { - TheSession->wc_session = GenerateSessionID(); + TheSession = CreateSession(1, 0, &SessionList, Hdr, &SessionListMutex); + + if ( (StrLength(Hdr->c_username) == 0) + && (!Hdr->HR.DontNeedAuth) + && (Hdr->HR.Handler != NULL) + && ((XHTTP_COMMANDS & Hdr->HR.Handler->Flags) == XHTTP_COMMANDS) + ) { + OverrideRequest(Hdr, HKEY("GET /401 HTTP/1.0")); + Hdr->HR.prohibit_caching = 1; } - else { - TheSession->wc_session = desired_session; + + if (StrLength(Hdr->c_language) > 0) { + syslog(9, "Session cookie requests language '%s'\n", ChrPtr(Hdr->c_language)); + set_selected_language(ChrPtr(Hdr->c_language)); + go_selected_language(); } - - TheSession->httpauth_user = NewStrBufPlain(httpauth_user, -1); - TheSession->httpauth_pass = NewStrBufPlain(httpauth_user, -1); - - pthread_setspecific(MyConKey, (void *)TheSession); - session_new_modules(TheSession); - - pthread_mutex_init(&TheSession->SessionMutex, NULL); - pthread_mutex_lock(&SessionListMutex); - TheSession->nonce = rand(); - TheSession->next = SessionList; - TheSession->is_mobile = -1; - SessionList = TheSession; - pthread_mutex_unlock(&SessionListMutex); - session_is_new = 1; } - TheSession->headers = HTTPHeaders; /* * A future improvement might be to check the session integrity @@ -512,26 +591,42 @@ void context_loop(int *sock) /* * Bind to the session and perform the transaction */ - pthread_mutex_lock(&TheSession->SessionMutex); /* bind */ + CtdlLogResult(pthread_mutex_lock(&TheSession->SessionMutex)); pthread_setspecific(MyConKey, (void *)TheSession); + TheSession->inuse = 1; /* mark the session as bound */ TheSession->lastreq = time(NULL); /* log */ - TheSession->http_sock = *sock; - TheSession->gzip_ok = gzip_ok; + TheSession->Hdr = Hdr; session_attach_modules(TheSession); + session_loop(); /* do transaction */ + + /* How long did this transaction take? */ + gettimeofday(&tx_finish, NULL); + + syslog(9, "HTTP: 200 [%ld.%06ld] %s %s \n", + ((tx_finish.tv_sec*1000000 + tx_finish.tv_usec) - (tx_start.tv_sec*1000000 + tx_start.tv_usec)) / 1000000, + ((tx_finish.tv_sec*1000000 + tx_finish.tv_usec) - (tx_start.tv_sec*1000000 + tx_start.tv_usec)) % 1000000, + ReqStrs[Hdr->HR.eReqType], + ChrPtr(Hdr->this_page) + ); - session_loop(ReqLine, ReqType, Buf, &Pos); /* do transaction */ session_detach_modules(TheSession); - TheSession->headers = NULL; - pthread_mutex_unlock(&TheSession->SessionMutex); /* unbind */ + /* If *this* very transaction did not explicitly specify a session cookie, + * and it did not log in, we want to flag the session as a candidate for + * re-use by the next unbound client that comes along. This keeps our session + * table from getting bombarded with new sessions when, for example, a web + * spider crawls the site without using cookies. + */ + if ((session_may_be_reused) && (!WC->logged_in)) { + WC->wc_session = 0; /* flag as available for re-use */ + TheSession->selected_language = 0; /* clear any non-default language setting */ + } - /* Free the request buffer */ - DeleteHash(&HTTPHeaders); - FreeStrBuf(&ReqLine); - FreeStrBuf(&ReqType); - FreeStrBuf(&Buf); + TheSession->Hdr = NULL; + TheSession->inuse = 0; /* mark the session as unbound */ + CtdlLogResult(pthread_mutex_unlock(&TheSession->SessionMutex)); } void tmplput_nonce(StrBuf *Target, WCTemplputParams *TP) @@ -546,18 +641,199 @@ void tmplput_current_user(StrBuf *Target, WCTemplputParams *TP) StrBufAppendTemplate(Target, TP, WC->wc_fullname, 0); } -void tmplput_current_room(StrBuf *Target, WCTemplputParams *TP) +void Header_HandleContentLength(StrBuf *Line, ParsedHttpHdrs *hdr) { - StrBufAppendTemplate(Target, TP, WC->wc_roomname, 0); + hdr->HR.ContentLength = StrToi(Line); +} + +void Header_HandleContentType(StrBuf *Line, ParsedHttpHdrs *hdr) +{ + hdr->HR.ContentType = Line; } +void Header_HandleHost(StrBuf *Line, ParsedHttpHdrs *hdr) +{ + if (hdr->HostHeader != NULL) { + FreeStrBuf(&hdr->HostHeader); + } + hdr->HostHeader = NewStrBuf(); + StrBufAppendPrintf(hdr->HostHeader, "%s://", (is_https ? "https" : "http") ); + StrBufAppendBuf(hdr->HostHeader, Line, 0); +} + +void Header_HandleXFFHost(StrBuf *Line, ParsedHttpHdrs *hdr) +{ + if (!follow_xff) return; + + if (hdr->HostHeader != NULL) { + FreeStrBuf(&hdr->HostHeader); + } + + hdr->HostHeader = NewStrBuf(); + StrBufAppendPrintf(hdr->HostHeader, "http://"); /* this is naive; do something about it */ + StrBufAppendBuf(hdr->HostHeader, Line, 0); +} + + +void Header_HandleXFF(StrBuf *Line, ParsedHttpHdrs *hdr) +{ + hdr->HR.browser_host = Line; + + while (StrBufNum_tokens(hdr->HR.browser_host, ',') > 1) { + StrBufRemove_token(hdr->HR.browser_host, 0, ','); + } + StrBufTrim(hdr->HR.browser_host); +} + +void Header_HandleIfModSince(StrBuf *Line, ParsedHttpHdrs *hdr) +{ + hdr->HR.if_modified_since = httpdate_to_timestamp(Line); +} + +void Header_HandleAcceptEncoding(StrBuf *Line, ParsedHttpHdrs *hdr) +{ + /* + * Can we compress? + */ + if (strstr(&ChrPtr(Line)[16], "gzip")) { + hdr->HR.gzip_ok = 1; + } +} +const char *ReqStrs[eNONE] = { + "GET", + "POST", + "OPTIONS", + "PROPFIND", + "PUT", + "DELETE", + "HEAD", + "MOVE", + "COPY" +}; + +void +ServerStartModule_CONTEXT +(void) +{ + long *v; + HttpReqTypes = NewHash(1, NULL); + HttpHeaderHandler = NewHash(1, NULL); + + v = malloc(sizeof(long)); + *v = eGET; + Put(HttpReqTypes, HKEY("GET"), v, NULL); + + v = malloc(sizeof(long)); + *v = ePOST; + Put(HttpReqTypes, HKEY("POST"), v, NULL); + + v = malloc(sizeof(long)); + *v = eOPTIONS; + Put(HttpReqTypes, HKEY("OPTIONS"), v, NULL); + + v = malloc(sizeof(long)); + *v = ePROPFIND; + Put(HttpReqTypes, HKEY("PROPFIND"), v, NULL); + + v = malloc(sizeof(long)); + *v = ePUT; + Put(HttpReqTypes, HKEY("PUT"), v, NULL); + + v = malloc(sizeof(long)); + *v = eDELETE; + Put(HttpReqTypes, HKEY("DELETE"), v, NULL); + + v = malloc(sizeof(long)); + *v = eHEAD; + Put(HttpReqTypes, HKEY("HEAD"), v, NULL); + + v = malloc(sizeof(long)); + *v = eMOVE; + Put(HttpReqTypes, HKEY("MOVE"), v, NULL); + + v = malloc(sizeof(long)); + *v = eCOPY; + Put(HttpReqTypes, HKEY("COPY"), v, NULL); +} + +void +ServerShutdownModule_CONTEXT +(void) +{ + DeleteHash(&HttpReqTypes); + DeleteHash(&HttpHeaderHandler); +} + +void RegisterHeaderHandler(const char *Name, long Len, Header_Evaluator F) +{ + OneHttpHeader *pHdr; + pHdr = (OneHttpHeader*) malloc(sizeof(OneHttpHeader)); + memset(pHdr, 0, sizeof(OneHttpHeader)); + pHdr->H = F; + Put(HttpHeaderHandler, Name, Len, pHdr, DestroyHttpHeaderHandler); +} + void InitModule_CONTEXT (void) { - RegisterNamespace("CURRENT_USER", 0, 1, tmplput_current_user, CTX_NONE); - RegisterNamespace("CURRENT_ROOM", 0, 1, tmplput_current_room, CTX_NONE); - RegisterNamespace("NONCE", 0, 0, tmplput_nonce, 0); + RegisterHeaderHandler(HKEY("CONTENT-LENGTH"), Header_HandleContentLength); + RegisterHeaderHandler(HKEY("CONTENT-TYPE"), Header_HandleContentType); + RegisterHeaderHandler(HKEY("X-FORWARDED-HOST"), Header_HandleXFFHost); /* Apache way... */ + RegisterHeaderHandler(HKEY("X-REAL-IP"), Header_HandleXFFHost); /* NGinX way... */ + RegisterHeaderHandler(HKEY("HOST"), Header_HandleHost); + RegisterHeaderHandler(HKEY("X-FORWARDED-FOR"), Header_HandleXFF); + RegisterHeaderHandler(HKEY("ACCEPT-ENCODING"), Header_HandleAcceptEncoding); + RegisterHeaderHandler(HKEY("IF-MODIFIED-SINCE"), Header_HandleIfModSince); + + RegisterNamespace("CURRENT_USER", 0, 1, tmplput_current_user, NULL, CTX_NONE); + RegisterNamespace("NONCE", 0, 0, tmplput_nonce, NULL, 0); + + WebcitAddUrlHandler(HKEY("404"), "", 0, do_404, ANONYMOUS|COOKIEUNNEEDED); +/* + * Look for commonly-found probes of malware such as worms, viruses, trojans, and Microsoft Office. + * Short-circuit these requests so we don't have to send them through the full processing loop. + */ + WebcitAddUrlHandler(HKEY("scripts"), "", 0, do_404, ANONYMOUS|BOGUS); /* /root.exe - Worms and trojans and viruses, oh my! */ + WebcitAddUrlHandler(HKEY("c"), "", 0, do_404, ANONYMOUS|BOGUS); /* /winnt */ + WebcitAddUrlHandler(HKEY("MSADC"), "", 0, do_404, ANONYMOUS|BOGUS); + WebcitAddUrlHandler(HKEY("_vti"), "", 0, do_404, ANONYMOUS|BOGUS); /* Broken Microsoft DAV implementation */ + WebcitAddUrlHandler(HKEY("MSOffice"), "", 0, do_404, ANONYMOUS|BOGUS); /* Stoopid MSOffice thinks everyone is IIS */ + WebcitAddUrlHandler(HKEY("nonexistenshit"), "", 0, do_404, ANONYMOUS|BOGUS); /* Exploit found in the wild January 2009 */ +} + + +void +HttpNewModule_CONTEXT +(ParsedHttpHdrs *httpreq) +{ + httpreq->PlainArgs = NewStrBufPlain(NULL, SIZ); + httpreq->this_page = NewStrBufPlain(NULL, SIZ); +} + +void +HttpDetachModule_CONTEXT +(ParsedHttpHdrs *httpreq) +{ + FlushStrBuf(httpreq->PlainArgs); + FlushStrBuf(httpreq->HostHeader); + FlushStrBuf(httpreq->this_page); + FlushStrBuf(httpreq->PlainArgs); + DeleteHash(&httpreq->HTTPHeaders); + memset(&httpreq->HR, 0, sizeof(HdrRefs)); +} + +void +HttpDestroyModule_CONTEXT +(ParsedHttpHdrs *httpreq) +{ + FreeStrBuf(&httpreq->this_page); + FreeStrBuf(&httpreq->PlainArgs); + FreeStrBuf(&httpreq->this_page); + FreeStrBuf(&httpreq->PlainArgs); + FreeStrBuf(&httpreq->HostHeader); + DeleteHash(&httpreq->HTTPHeaders); + }