4 * This is the other half of the webserver. It handles the task of hooking
5 * up HTTP requests with the sessions they belong to, using HTTP cookies to
6 * keep track of things. If the HTTP request doesn't belong to any currently
7 * active session, a new session is started.
12 #include "webserver.h"
13 #include "modules_init.h"
15 /* Only one thread may manipulate SessionList at a time... */
16 pthread_mutex_t SessionListMutex;
18 wcsession *SessionList = NULL; /**< head of the session list; entries are chained through their next pointers */
20 pthread_key_t MyConKey; /**< TSD key for MySession() */
/* Maps an HTTP method name (GET, POST, ...) to a heap-allocated long that is read back as the request type. */
21 HashList *HttpReqTypes = NULL;
/* Maps an upper-cased HTTP header name to the OneHttpHeader registered for it. */
22 HashList *HttpHeaderHandler = NULL;
/* Handler table defined elsewhere; queried with a URL path component while the request line is parsed. */
23 extern HashList *HandlerHash;
/*
 * Cleanup callback for OneHttpHeader entries. It is passed as the last
 * argument of Put() for both the per-request header hash and the
 * registered-handler hash (presumably the per-item destructor).
 * V is cast to OneHttpHeader and its Val buffer is released with FreeStrBuf().
 * NOTE(review): the remainder of the body is not visible in this excerpt, so
 * whether the struct itself is freed here needs to be confirmed.
 */
25 void DestroyHttpHeaderHandler(void *V)
28 pHdr = (OneHttpHeader*) V;
29 FreeStrBuf(&pHdr->Val);
/*
 * Walks every entry of SessionList from the head, following the next pointers.
 * NOTE(review): the loop body is not visible in this excerpt, so what is done
 * to each session, and whether SessionListMutex is held during the walk,
 * cannot be determined here.
 */
33 void shutdown_sessions(void)
37 for (sptr = SessionList; sptr != NULL; sptr = sptr->next) {
/*
 * One housekeeping pass over the session list.
 *
 * Visible steps: with SessionListMutex held, walk SessionList, compare the
 * time since each session's lastreq against WEBCIT_TIMEOUT, unlink the
 * sessions selected for removal and push them onto the local
 * sessions_to_kill list. After the mutex is released, each culled session
 * is logged and handed to session_destroy_modules(). Finally, worker
 * threads are spawned while num_sessions exceeds num_threads, and both
 * counts are logged.
 *
 * NOTE(review): several lines (declarations, the code that flags a session
 * for removal, the counter updates) are not visible in this excerpt.
 * NOTE(review): the spawn loop bound is inclusive (<=); if num_threads is
 * incremented once per spawn it can end at MAX_WORKER_THREADS + 1.
 */
42 void do_housekeeping(void)
45 wcsession *sessions_to_kill = NULL;
/* Function-static, so the value persists across calls. */
47 static int num_threads = MIN_WORKER_THREADS;
50 * Lock the session list, moving any candidates for euthanasia into
53 pthread_mutex_lock(&SessionListMutex);
55 for (sptr = SessionList; sptr != NULL; sptr = sptr->next) {
58 /** Kill idle sessions */
59 if ((time(NULL) - (sptr->lastreq)) >
60 (time_t) WEBCIT_TIMEOUT) {
64 /** Remove sessions flagged for kill */
67 /** remove session from linked list */
68 if (sptr == SessionList) {
69 SessionList = SessionList->next;
71 else for (ss=SessionList;ss!=NULL;ss=ss->next) {
72 if (ss->next == sptr) {
73 ss->next = ss->next->next;
/*
 * Push the unlinked session onto the kill list.
 * NOTE(review): this overwrites sptr->next; if the enclosing for loop then
 * advances with sptr = sptr->next, the walk would continue along the kill
 * list instead of the remaining sessions. Confirm against the full source.
 */
77 sptr->next = sessions_to_kill;
78 sessions_to_kill = sptr;
81 pthread_mutex_unlock(&SessionListMutex);
84 * Now free up and destroy the culled sessions.
86 while (sessions_to_kill != NULL) {
87 lprintf(3, "Destroying session %d\n", sessions_to_kill->wc_session);
/*
 * Lock and immediately unlock the session mutex; presumably this waits for
 * any worker still bound to the session to finish (TODO confirm).
 */
88 pthread_mutex_lock(&sessions_to_kill->SessionMutex);
89 pthread_mutex_unlock(&sessions_to_kill->SessionMutex);
/* Remember the successor before the current entry is destroyed. */
90 sptr = sessions_to_kill->next;
92 session_destroy_modules(&sessions_to_kill);
93 sessions_to_kill = sptr;
98 * If there are more sessions than threads, then we should spawn
99 * more threads ... up to a predefined maximum.
101 while ( (num_sessions > num_threads)
102 && (num_threads <= MAX_WORKER_THREADS) ) {
103 spawn_another_worker_thread();
105 lprintf(3, "There are %d sessions and %d threads active.\n",
106 num_sessions, num_threads);
112 * Wake up occasionally and clean house
/*
 * Housekeeping driver; the visible line passes HOUSEKEEPING to
 * sleeeeeeeeeep().
 * NOTE(review): the surrounding loop and the call that performs the actual
 * cleanup are not visible in this excerpt.
 */
114 void housekeeping_loop(void)
117 sleeeeeeeeeep(HOUSEKEEPING);
124 * Create a Session id
125 * Generate a unique WebCit session ID (which is not the same thing as the
126 * Citadel session ID).
/*
 * Produces a WebCit session ID as an int.
 * A function-static counter, seq, starts at -1 and is assigned from
 * time(NULL) truncated to int.
 * NOTE(review): the condition guarding that assignment and the returned
 * expression are not visible in this excerpt.
 * NOTE(review): seq is static and no locking is visible in these lines;
 * confirm whether callers serialize access.
 */
128 int GenerateSessionID(void)
130 static int seq = (-1);
133 seq = (int) time(NULL);
141 * lingering_close() a la Apache. See
142 * http://www.apache.org/docs/misc/fin_wait_2.html for rationale
/*
 * Drains pending input on fd.
 *
 * Visible steps: record a start time; wait with select() for fd to become
 * readable, using a timeout of SLEEPING seconds minus the time elapsed
 * since start and retrying when select() fails with EINTR; then read()
 * into buf repeatedly until read() returns 0 or fails with an error other
 * than EINTR.
 *
 * NOTE(review): the outer loop structure, any shutdown or close call, and
 * the return value are not visible in this excerpt.
 */
144 int lingering_close(int fd)
149 struct timeval tv, start;
151 gettimeofday(&start, NULL);
155 gettimeofday(&tv, NULL);
/* Remaining wait: SLEEPING seconds minus the time elapsed since start. */
156 tv.tv_sec = SLEEPING - (tv.tv_sec - start.tv_sec);
157 tv.tv_usec = start.tv_usec - tv.tv_usec;
/* Negative microseconds are normalised by adding one second's worth; the matching tv_sec adjustment is presumably on a line not shown. */
158 if (tv.tv_usec < 0) {
160 tv.tv_usec += 1000000;
164 i = select(fd + 1, &set, NULL, NULL, &tv);
165 } while (i == -1 && errno == EINTR);
170 i = read(fd, buf, sizeof buf);
171 } while (i != 0 && (i != -1 || errno == EINTR));
180 * \brief Detects a 'mobile' user agent
/*
 * Checks user_agent for substrings that identify mobile browsers: iPhone OS,
 * Windows CE, SymbianOS, Opera Mobi, and one specific spoofed Opera 9.51
 * beta string. Matching uses strstr(), so it is case-sensitive and
 * user_agent must not be NULL.
 * NOTE(review): the return statements are not visible in this excerpt;
 * presumably nonzero means mobile.
 */
182 int is_mobile_ua(char *user_agent) {
183 if (strstr(user_agent,"iPhone OS") != NULL) {
185 } else if (strstr(user_agent,"Windows CE") != NULL) {
187 } else if (strstr(user_agent,"SymbianOS") != NULL) {
189 } else if (strstr(user_agent, "Opera Mobi") != NULL) {
191 } else if (strstr(user_agent, "Firefox/2.0.0 Opera 9.51 Beta") != NULL) {
192 /* For some reason a new install of Opera 9.51beta decided to spoof. */
201 * Look for commonly-found probes of malware such as worms, viruses, trojans, and Microsoft Office.
202 * Short-circuit these requests so we don't have to send them through the full processing loop.
/*
 * Classifies a request URL as bogus or acceptable.
 *
 * Returns 1 when the URL is empty and 0 when no entry of bogus_prefixes
 * matches. Each prefix is compared case-insensitively against the start of
 * the URL with strncasecmp().
 * NOTE(review): the statement executed on a prefix match is not visible in
 * this excerpt; presumably it returns nonzero.
 */
204 int is_bogus(StrBuf *http_cmd) {////TODO!
207 const char *bogus_prefixes[] = {
208 "/scripts/root.exe", /* Worms and trojans and viruses, oh my! */
211 "/_vti", /* Broken Microsoft DAV implementation */
212 "/MSOffice", /* Stoopid MSOffice thinks everyone is IIS */
213 "/nonexistenshit" /* Exploit found in the wild January 2009 */
216 url = ChrPtr(http_cmd);
217 if (IsEmptyStr(url)) return(1);
/* Element count of the prefix table. */
220 max = sizeof(bogus_prefixes) / sizeof(char *);
222 for (i=0; i<max; ++i) {
223 if (!strncasecmp(url, bogus_prefixes[i], strlen(bogus_prefixes[i]))) {
228 return(0); /* probably ok */
/*
 * Parse the HTTP request line held in Hdr->ReqLine.
 *
 * Visible steps:
 *  - take the first space-separated token as the method, look it up in
 *    HttpReqTypes to set Hdr->eReqType (eGET is also assigned on a path
 *    whose condition is not fully visible), and cut the method off the front;
 *  - take the HTTP version token, cut it off the end, and run is_bogus()
 *    on what remains; an empty version or a bogus URL sets eReqType to eGET;
 *  - keep a copy of the URL in Hdr->this_page;
 *  - split the query string at the first ? (or, failing that, the first &)
 *    into Hdr->PlainArgs and truncate ReqLine there;
 *  - extract path components separated by / and look one up in HandlerHash
 *    to select Hdr->Handler, then cut the handler name off the URL;
 *  - derive Hdr->DontNeedAuth from the ISSTATIC handler flag and create the
 *    empty Hdr->HTTPHeaders hash.
 *
 * Buf is scratch space that every token extraction overwrites.
 * Line is not referenced in the visible lines.
 * NOTE(review): the return statements are not visible in this excerpt; the
 * caller stores the result in a variable named isbogus.
 */
232 int ReadHttpSubject(ParsedHttpHdrs *Hdr, StrBuf *Line, StrBuf *Buf)
235 void *vLine, *vHandler;
236 const char *Pos = NULL;
240 /* The requesttype... GET, POST... */
241 StrBufExtract_token(Buf, Hdr->ReqLine, 0, ' ');
242 if (GetHash(HttpReqTypes, SKEY(Buf), &vLine) &&
245 Hdr->eReqType = *(long*)vLine;
248 Hdr->eReqType = eGET;
/* Drop the method and the separating space. */
251 StrBufCutLeft(Hdr->ReqLine, StrLength(Buf) + 1);
253 /* the HTTP Version... */
254 StrBufExtract_token(Buf, Hdr->ReqLine, 1, ' ');
255 StrBufCutRight(Hdr->ReqLine, StrLength(Buf) + 1);
256 if ((StrLength(Buf) == 0) ||
257 is_bogus(Hdr->ReqLine)) {
258 Hdr->eReqType = eGET;
262 Hdr->this_page = NewStrBufDup(Hdr->ReqLine);
263 /* chop Filename / query arguments */
264 Args = strchr(ChrPtr(Hdr->ReqLine), '?');
265 if (Args == NULL) /* whe're not that picky about params... TODO: this will spoil '&' in filenames.*/
266 Args = strchr(ChrPtr(Hdr->ReqLine), '&');
268 Args ++; /* skip the ? */
269 Hdr->PlainArgs = NewStrBufPlain(
271 StrLength(Hdr->ReqLine) -
272 (Args - ChrPtr(Hdr->ReqLine)));
273 StrBufCutAt(Hdr->ReqLine, 0, Args - 1);
274 } /* don't parse them yet, maybe we don't even care... */
276 /* now lookup what we are going to do with this... */
277 /* skip first slash */
278 StrBufExtract_NextToken(Buf, Hdr->ReqLine, &Pos, '/');
280 StrBufExtract_NextToken(Buf, Hdr->ReqLine, &Pos, '/');
/*
 * NOTE(review): the GetHash() call below ends with a comma, so it is joined
 * to the following assignment by the comma operator. vHandler is declared
 * without an initializer; unless a line not shown resets it or GetHash()
 * clears it on a miss, Handler could receive an indeterminate pointer.
 */
282 GetHash(HandlerHash, SKEY(Buf), &vHandler),
283 Hdr->Handler = (WebcitHandler*) vHandler;
284 if (Hdr->Handler == NULL)
287 * If the request is prefixed by "/webcit" then chop that off. This
288 * allows a front end web server to forward all /webcit requests to us
289 * while still using the same web server port for other things.
291 if ((Hdr->Handler->Flags & URLNAMESPACE) == 0)
294 /* remove the handlername from the URL */
296 StrBufCutLeft(Hdr->ReqLine,
297 Pos - ChrPtr(Hdr->ReqLine));
300 if (Hdr->Handler != NULL) {
301 if ((Hdr->Handler->Flags & BOGUS) != 0)
303 Hdr->DontNeedAuth = (Hdr->Handler->Flags & ISSTATIC) != 0;
306 Hdr->HTTPHeaders = NewHash(1, NULL);
/*
 * Runs the evaluator of every parsed header that has one.
 *
 * Iterates over Hdr->HTTPHeaders; for each OneHttpHeader whose
 * HaveEvaluator flag is set, calls its H callback with the header value
 * and Hdr.
 * NOTE(review): the second half of the loop condition, the release of the
 * hash position obtained from GetNewHashPos(), and the return value are
 * not visible in this excerpt.
 */
310 int AnalyseHeaders(ParsedHttpHdrs *Hdr)
316 HashPos *at = GetNewHashPos(Hdr->HTTPHeaders, 0);
318 while (GetNextHashPos(Hdr->HTTPHeaders, at, &HKLen, &HashKey, &vHdr) &&
320 pHdr = (OneHttpHeader *)vHdr;
321 if (pHdr->HaveEvaluator)
322 pHdr->H(pHdr->Val, Hdr);
329 /*const char *nix(void *vptr) {return ChrPtr( (StrBuf*)vptr);}*/
332 * Read in the request
/*
 * Read the request line and headers from Hdr->http_sock.
 * (The misspelled name is the one callers use, so it is kept.)
 *
 * Visible steps: lines are fetched with ClientGetLine() into Line, using
 * Hdr->ReadBuf and Hdr->Pos as read state; a negative result makes the
 * function return 1. ReadHttpSubject() is called with HeaderName as its
 * scratch buffer; the condition that selects the request line is not
 * visible here. A line that starts with whitespace while LastLine is set
 * is treated as a folded continuation: its leading whitespace is cut and
 * the rest is appended to LastLine. Any other line is sanitized, split at
 * the first colon into an upper-cased header name and a value with leading
 * whitespace removed, wrapped in a newly allocated and zeroed
 * OneHttpHeader, and stored in Hdr->HTTPHeaders under the header name.
 * When the name is found in HttpHeaderHandler, the entry is marked
 * HaveEvaluator.
 *
 * NOTE(review): the early return after ClientGetLine() happens after
 * HeaderName has been allocated and before the FreeStrBuf() at the end, so
 * that path appears to leak it; confirm against the full source.
 * NOTE(review): the malloc() result is passed to memset() with no visible
 * NULL check.
 * NOTE(review): both whitespace loops evaluate isspace(*pch) before the
 * pch < pche bound test.
 */
334 int ReadHTTPRequset (ParsedHttpHdrs *Hdr)
336 const char *pch, *pchs, *pche;
338 StrBuf *Line, *LastLine, *HeaderName;
343 HeaderName = NewStrBuf();
344 Hdr->ReadBuf = NewStrBuf();
350 if (ClientGetLine(&Hdr->http_sock, Line, Hdr->ReadBuf, &Hdr->Pos) < 0) return 1;
352 if (StrLength(Line) == 0) {
357 isbogus = ReadHttpSubject(Hdr, Line, HeaderName);
362 /* Do we need to Unfold? */
363 if ((LastLine != NULL) &&
364 (isspace(*ChrPtr(Line)))) {
365 pch = pchs = ChrPtr(Line);
366 pche = pchs + StrLength(Line);
367 while (isspace(*pch) && (pch < pche))
369 StrBufCutLeft(Line, pch - pchs);
370 StrBufAppendBuf(LastLine, Line, 0);
376 StrBufSanitizeAscii(Line, '§');
377 StrBufExtract_token(HeaderName, Line, 0, ':');
/* Start just past the header name and the colon. */
380 pch = pchs + StrLength(HeaderName) + 1;
381 pche = pchs + StrLength(Line);
382 while (isspace(*pch) && (pch < pche))
384 StrBufCutLeft(Line, pch - pchs);
/* Registered handler names are upper case, so normalise before the lookup. */
386 StrBufUpCase(HeaderName);
388 pHdr = (OneHttpHeader*) malloc(sizeof(OneHttpHeader));
389 memset(pHdr, 0, sizeof(OneHttpHeader));
392 if (GetHash(HttpHeaderHandler, SKEY(HeaderName), &vF) &&
395 OneHttpHeader *FHdr = (OneHttpHeader*) vF;
397 pHdr->HaveEvaluator = 1;
399 Put(Hdr->HTTPHeaders, SKEY(HeaderName), pHdr, DestroyHttpHeaderHandler);
401 } while (Line != NULL);
403 FreeStrBuf(&HeaderName);
413 * This loop gets called once for every HTTP connection made to WebCit. At
414 * this entry point we have an HTTP socket with a browser allegedly on the
415 * other end, but we have not yet bound to a WebCit session.
417 * The job of this function is to locate the correct session and bind to it,
418 * or create a session if necessary and bind to it, then run the WebCit
419 * transaction loop. Afterwards, we unbind from the session. When this
420 * function returns, the worker thread is then free to handle another
/*
 * Serve one HTTP connection on the socket that sock points to.
 *
 * Visible steps:
 *  1. Zero a ParsedHttpHdrs, read the request with ReadHTTPRequset(), run
 *     the header evaluators with AnalyseHeaders(), and call
 *     CheckAuthBasic() when got_auth is AUTH_BASIC.
 *  2. With SessionListMutex held, search SessionList for a session to
 *     reuse: by SessionKey, user name and password for HTTP auth, or by
 *     session ID when Hdr.desired_session is nonzero.
 *  3. If none matched, allocate and zero a new wcsession, give it
 *     Hdr.desired_session or a fresh GenerateSessionID() value, run
 *     session_new_modules(), initialise its mutex and link it at the head
 *     of SessionList under SessionListMutex.
 *  4. Bind: lock the session mutex, publish the session through MyConKey,
 *     stamp lastreq, attach modules and run session_loop().
 *  5. Log the elapsed time, detach modules, clear the session Hdr pointer,
 *     unlock the session mutex and release the parsed request with
 *     http_destroy_modules().
 *
 * NOTE(review): the comment that starts with "Begin parsing the request."
 * ends with an asterisk, a space and a slash, which does not terminate a C
 * comment; it therefore extends to the end of the next complete comment.
 * Confirm which lines are meant to be disabled.
 * NOTE(review): the line beginning with TODO HKEY and the bare ReqLine
 * references look like leftovers from a refactor to Hdr fields; confirm.
 * NOTE(review): isbogus is assigned from ReadHTTPRequset() and again from
 * AnalyseHeaders(); whether the second call is conditional is not visible.
 * NOTE(review): user name and password are compared with strcasecmp(),
 * that is, case-insensitively; this is likely unintended for passwords.
 * NOTE(review): the malloc() result is passed to memset() with no visible
 * NULL check, and the nonce comes from rand().
 * NOTE(review): the elapsed-time arithmetic multiplies tv_sec by 1000000
 * and prints with %ld; check for overflow where long is 32 bits.
 */
423 void context_loop(int *sock)
427 wcsession *TheSession, *sptr;
428 struct timeval tx_start;
429 struct timeval tx_finish;
431 gettimeofday(&tx_start, NULL); /* start a stopwatch for performance timing */
433 memset(&Hdr, 0, sizeof(ParsedHttpHdrs));
435 Hdr.http_sock = *sock;
437 * Find out what it is that the web browser is asking for
439 isbogus = ReadHTTPRequset(&Hdr);
442 isbogus = AnalyseHeaders(&Hdr);
444 if (Hdr.got_auth == AUTH_BASIC)
445 CheckAuthBasic(&Hdr);
449 StrBufPlain(ReqLine, HKEY("/404"));
450 TODO HKEY("/static/nocookies.html?force_close_session=yes"));
453 /* dbg_PrintHash(HTTPHeaders, nix, NULL); */
456 /* Begin parsing the request. * /
458 if ((strncmp(ChrPtr(ReqLine), "/sslg", 5) != 0) &&
459 (strncmp(ChrPtr(ReqLine), "/static/", 8) != 0) &&
460 (strncmp(ChrPtr(ReqLine), "/tiny_mce/", 10) != 0) &&
461 (strncmp(ChrPtr(ReqLine), "/wholist_section", 16) != 0) &&
462 (strstr(ChrPtr(ReqLine), "wholist_section") == NULL)) {
464 lprintf(5, "HTTP: %s %s\n", ReqStrs[Hdr.eReqType], ChrPtr(ReqLine));
472 * See if there's an existing session open with the desired ID or user/pass
476 if (TheSession == NULL) {
477 pthread_mutex_lock(&SessionListMutex);
478 for (sptr = SessionList;
479 ((sptr != NULL) && (TheSession == NULL));
482 /** If HTTP-AUTH, look for a session with matching credentials */
483 switch (Hdr.got_auth)
486 if ( (Hdr.SessionKey != sptr->SessionKey))
489 if ((!strcasecmp(ChrPtr(Hdr.c_username), ChrPtr(sptr->wc_username))) &&
490 (!strcasecmp(ChrPtr(Hdr.c_password), ChrPtr(sptr->wc_password))) )
494 /** If cookie-session, look for a session with matching session ID */
495 if ( (Hdr.desired_session != 0) &&
496 (sptr->wc_session == Hdr.desired_session))
503 pthread_mutex_unlock(&SessionListMutex);
507 * Create a new session if we have to
509 if (TheSession == NULL) {
510 lprintf(3, "Creating a new session\n");
511 TheSession = (wcsession *)
512 malloc(sizeof(wcsession));
513 memset(TheSession, 0, sizeof(wcsession));
514 TheSession->Hdr = &Hdr;
515 TheSession->SessionKey = Hdr.SessionKey;
516 TheSession->serv_sock = (-1);
517 TheSession->chat_sock = (-1);
519 /* If we're recreating a session that expired, it's best to give it the same
520 * session number that it had before. The client browser ought to pick up
521 * the new session number and start using it, but in some rare situations it
522 * doesn't, and that's a Bad Thing because it causes lots of spurious sessions
525 if (Hdr.desired_session == 0) {
526 TheSession->wc_session = GenerateSessionID();
529 TheSession->wc_session = Hdr.desired_session;
532 pthread_setspecific(MyConKey, (void *)TheSession);
533 session_new_modules(TheSession);
535 pthread_mutex_init(&TheSession->SessionMutex, NULL);
536 pthread_mutex_lock(&SessionListMutex);
537 TheSession->nonce = rand();
538 TheSession->next = SessionList;
539 TheSession->is_mobile = -1;
540 SessionList = TheSession;
541 pthread_mutex_unlock(&SessionListMutex);
545 * A future improvement might be to check the session integrity
546 * at this point before continuing.
550 * Bind to the session and perform the transaction
552 pthread_mutex_lock(&TheSession->SessionMutex); /* bind */
553 pthread_setspecific(MyConKey, (void *)TheSession);
555 TheSession->lastreq = time(NULL); /* log */
556 TheSession->Hdr = &Hdr;
558 session_attach_modules(TheSession);
559 session_loop(); /* do transaction */
562 /* How long did this transaction take? */
563 gettimeofday(&tx_finish, NULL);
565 lprintf(9, "Transaction [%s] completed in %ld.%06ld seconds.\n",
566 ChrPtr(Hdr.this_page),
567 ((tx_finish.tv_sec*1000000 + tx_finish.tv_usec) - (tx_start.tv_sec*1000000 + tx_start.tv_usec)) / 1000000,
568 ((tx_finish.tv_sec*1000000 + tx_finish.tv_usec) - (tx_start.tv_sec*1000000 + tx_start.tv_usec)) % 1000000
571 session_detach_modules(TheSession);
573 TheSession->Hdr = NULL;
574 pthread_mutex_unlock(&TheSession->SessionMutex); /* unbind */
576 http_destroy_modules(&Hdr);
/*
 * Template callback: appends the nonce of WCC to Target, formatted with
 * %ld, or 0 when WCC is NULL. TP is not referenced in the visible lines.
 * NOTE(review): the declaration of WCC is not visible here. The nonce is
 * assigned from rand(), which returns int, so the %ld conversion should be
 * checked against the type of the nonce field.
 */
579 void tmplput_nonce(StrBuf *Target, WCTemplputParams *TP)
582 StrBufAppendPrintf(Target, "%ld",
583 (WCC != NULL)? WCC->nonce:0);
/*
 * Template callback: appends WC->wc_fullname to Target through
 * StrBufAppendTemplate(), passing TP and 0 as the final argument.
 */
586 void tmplput_current_user(StrBuf *Target, WCTemplputParams *TP)
588 StrBufAppendTemplate(Target, TP, WC->wc_fullname, 0);
/*
 * Template callback: appends WC->wc_roomname to Target through
 * StrBufAppendTemplate(), passing TP and 0 as the final argument.
 */
591 void tmplput_current_room(StrBuf *Target, WCTemplputParams *TP)
593 StrBufAppendTemplate(Target, TP, WC->wc_roomname, 0);
/*
 * Header evaluator for CONTENT-LENGTH: converts the header value with
 * StrToi() and stores the result in hdr->ContentLength.
 * NOTE(review): no validation of the converted value is visible here.
 */
596 void Header_HandleContentLength(StrBuf *Line, ParsedHttpHdrs *hdr)
598 hdr->ContentLength = StrToi(Line);
/*
 * Header evaluator for CONTENT-TYPE: points hdr->ContentType at Line.
 * The pointer is stored without copying, so it is valid only while the
 * buffer behind Line exists (presumably the Val of the parsed header,
 * which DestroyHttpHeaderHandler() frees; TODO confirm).
 */
601 void Header_HandleContentType(StrBuf *Line, ParsedHttpHdrs *hdr)
603 hdr->ContentType = Line;
/*
 * Header evaluator for USER-AGENT: points hdr->user_agent at Line without
 * copying it. The mobile-browser detection that follows is inside a
 * comment marked TODO and is therefore disabled.
 */
606 void Header_HandleUserAgent(StrBuf *Line, ParsedHttpHdrs *hdr)
608 hdr->user_agent = Line;
610 /* TODO: do this later on session creating
611 if ((WCC->is_mobile < 0) && is_mobile_ua(&buf[12])) {
/*
 * Header evaluator for HOST: points hdr->http_host at Line without copying.
 * When follow_xff is set and http_host is already populated, a branch whose
 * body is not visible in this excerpt is taken (presumably an early return
 * so that a forwarded host is not overwritten; TODO confirm).
 */
622 void Header_HandleHost(StrBuf *Line, ParsedHttpHdrs *hdr)
624 if ((follow_xff) && (hdr->http_host != NULL))
627 hdr->http_host = Line;
/*
 * Header evaluator for X-FORWARDED-HOST: points hdr->http_host at Line
 * without copying.
 * NOTE(review): any condition guarding the assignment (for example a
 * follow_xff check) is not visible in this excerpt.
 */
630 void Header_HandleXFFHost(StrBuf *Line, ParsedHttpHdrs *hdr)
633 hdr->http_host = Line;
/*
 * Header evaluator for X-FORWARDED-FOR: points hdr->browser_host at Line,
 * then removes the first comma-separated token repeatedly until a single
 * token is left and trims it. Only the last entry of the list survives.
 * The edits happen in place, because browser_host refers to the same
 * buffer as Line.
 * NOTE(review): any condition guarding this logic is not visible here.
 */
637 void Header_HandleXFF(StrBuf *Line, ParsedHttpHdrs *hdr)
639 hdr->browser_host = Line;
641 while (StrBufNum_tokens(hdr->browser_host, ',') > 1) {
642 StrBufRemove_token(hdr->browser_host, 0, ',');
644 StrBufTrim(hdr->browser_host);
/*
 * Header evaluator for IF-MODIFIED-SINCE: converts the header value with
 * httpdate_to_timestamp() and stores the result in hdr->if_modified_since.
 */
647 void Header_HandleIfModSince(StrBuf *Line, ParsedHttpHdrs *hdr)
649 hdr->if_modified_since = httpdate_to_timestamp(Line);
/*
 * Header evaluator for ACCEPT-ENCODING: searches for the substring gzip,
 * starting 16 bytes into the buffer of Line.
 * NOTE(review): 16 is the length of the header name plus its colon.
 * ReadHTTPRequset() cuts the name, the colon and leading whitespace off
 * the line before storing the header (assuming the stored value is that
 * trimmed line; TODO confirm). If so, this offset skips real data and can
 * point past the end of a short value.
 * NOTE(review): the action taken on a match is not visible in this excerpt.
 */
652 void Header_HandleAcceptEncoding(StrBuf *Line, ParsedHttpHdrs *hdr)
657 if (strstr(&ChrPtr(Line)[16], "gzip")) {
/*
 * Table of request type names with eNONE entries. A logging statement in
 * context_loop indexes it with Hdr.eReqType.
 * NOTE(review): the initializers are not visible in this excerpt.
 */
661 const char *ReqStrs[eNONE] = {
/*
 * Server start hook for this module: creates the HttpReqTypes and
 * HttpHeaderHandler hashes, then for each of nine HTTP method names
 * allocates a long and stores it in HttpReqTypes with NULL as the last
 * argument of Put().
 * NOTE(review): the lines that assign a value to each allocated long are
 * not visible in this excerpt, and no NULL check on malloc() is visible.
 */
674 ServerStartModule_CONTEXT
678 HttpReqTypes = NewHash(1, NULL);
679 HttpHeaderHandler = NewHash(1, NULL);
681 v = malloc(sizeof(long));
683 Put(HttpReqTypes, HKEY("GET"), v, NULL);
685 v = malloc(sizeof(long));
687 Put(HttpReqTypes, HKEY("POST"), v, NULL);
689 v = malloc(sizeof(long));
691 Put(HttpReqTypes, HKEY("OPTIONS"), v, NULL);
693 v = malloc(sizeof(long));
695 Put(HttpReqTypes, HKEY("PROPFIND"), v, NULL);
697 v = malloc(sizeof(long));
699 Put(HttpReqTypes, HKEY("PUT"), v, NULL);
701 v = malloc(sizeof(long));
703 Put(HttpReqTypes, HKEY("DELETE"), v, NULL);
705 v = malloc(sizeof(long));
707 Put(HttpReqTypes, HKEY("HEAD"), v, NULL);
709 v = malloc(sizeof(long));
711 Put(HttpReqTypes, HKEY("MOVE"), v, NULL);
713 v = malloc(sizeof(long));
715 Put(HttpReqTypes, HKEY("COPY"), v, NULL);
/*
 * Server shutdown hook for this module: releases the HttpReqTypes and
 * HttpHeaderHandler hashes with DeleteHash().
 */
719 ServerShutdownModule_CONTEXT
722 DeleteHash(&HttpReqTypes);
723 DeleteHash(&HttpHeaderHandler);
/*
 * Registers a header evaluator under the header name Name of length Len.
 * A zeroed OneHttpHeader is allocated and stored in HttpHeaderHandler with
 * DestroyHttpHeaderHandler as the last argument of Put().
 * NOTE(review): the line that stores F in the new entry is not visible in
 * this excerpt, and no NULL check on malloc() is visible.
 * Lookups upper-case the incoming header name first, so Name is expected
 * to be upper case, as in the visible registrations.
 */
726 void RegisterHeaderHandler(const char *Name, long Len, Header_Evaluator F)
729 pHdr = (OneHttpHeader*) malloc(sizeof(OneHttpHeader));
730 memset(pHdr, 0, sizeof(OneHttpHeader));
732 Put(HttpHeaderHandler, Name, Len, pHdr, DestroyHttpHeaderHandler);
/*
 * Module registrations: header evaluators, template namespaces and URL
 * handlers.
 * NOTE(review): the signature of the enclosing function is not visible in
 * this excerpt; presumably this is the module init hook.
 */
734 extern void blank_page(void); ///TODO: remove me
/* Header names are registered in upper case. */
739 RegisterHeaderHandler(HKEY("CONTENT-LENGTH"), Header_HandleContentLength);
740 RegisterHeaderHandler(HKEY("CONTENT-TYPE"), Header_HandleContentType);
741 RegisterHeaderHandler(HKEY("USER-AGENT"), Header_HandleUserAgent);
742 RegisterHeaderHandler(HKEY("X-FORWARDED-HOST"), Header_HandleXFFHost);
743 RegisterHeaderHandler(HKEY("HOST"), Header_HandleHost);
744 RegisterHeaderHandler(HKEY("X-FORWARDED-FOR"), Header_HandleXFF);
745 RegisterHeaderHandler(HKEY("ACCEPT-ENCODING"), Header_HandleAcceptEncoding);
746 RegisterHeaderHandler(HKEY("IF-MODIFIED-SINCE"), Header_HandleIfModSince);
/* NOTE(review): the NONCE entry passes 0 where the other two pass CTX_NONE; confirm they are equivalent. */
748 RegisterNamespace("CURRENT_USER", 0, 1, tmplput_current_user, CTX_NONE);
749 RegisterNamespace("CURRENT_ROOM", 0, 1, tmplput_current_room, CTX_NONE);
750 RegisterNamespace("NONCE", 0, 0, tmplput_nonce, 0);
/* Both URL handlers point at blank_page; the request-line parser reads the BOGUS and URLNAMESPACE flags. */
754 WebcitAddUrlHandler(HKEY("blank"), blank_page, ANONYMOUS|BOGUS);
756 WebcitAddUrlHandler(HKEY("webcit"), blank_page, URLNAMESPACE);
/*
 * Per-request cleanup hook for this module: frees the ReqLine, ReadBuf,
 * PlainArgs and this_page buffers of httpreq and deletes its HTTPHeaders
 * hash.
 * Header evaluators store borrowed pointers such as ContentType and
 * user_agent; those presumably point into the header hash and become
 * invalid here (TODO confirm).
 */
762 HttpDestroyModule_CONTEXT
763 (ParsedHttpHdrs *httpreq)
765 FreeStrBuf(&httpreq->ReqLine);
766 FreeStrBuf(&httpreq->ReadBuf);
767 FreeStrBuf(&httpreq->PlainArgs);
768 FreeStrBuf(&httpreq->this_page);
769 DeleteHash(&httpreq->HTTPHeaders);