]> code.citadel.org Git - citadel.git/blobdiff - citadel/sysdep.c
Changed the way we create additional threads. One for every connection is
[citadel.git] / citadel / sysdep.c
index 5358fb3d403c4e93ffb515211d8819c984af74e6..6be3f2cca11739d35cabfda447d548cdc57bbcb3 100644 (file)
@@ -1357,7 +1357,7 @@ int CtdlThreadCheckStop(struct CtdlThreadNode *this_thread)
                pthread_mutex_unlock(&this_thread->ThreadMutex);
                return -1;
        }
-       else if(this_thread->state < CTDL_THREAD_STOP_REQ)
+       else if((this_thread->state < CTDL_THREAD_STOP_REQ) && (this_thread->state > CTDL_THREAD_CREATE))
        {
                pthread_mutex_unlock(&this_thread->ThreadMutex);
                return -1;
@@ -1442,7 +1442,9 @@ static void ctdl_internal_thread_cleanup(void *arg)
        #ifdef HAVE_BACKTRACE
        eCrash_UnregisterThread();
        #endif
+       pthread_mutex_lock(&this_thread->ThreadMutex);
        this_thread->state = CTDL_THREAD_EXITED;        // needs to be last thing else house keeping will unlink us too early
+       pthread_mutex_unlock(&this_thread->ThreadMutex);
        end_critical_section(S_THREAD_LIST);
 //     CtdlThreadGC();
 }
@@ -1456,7 +1458,6 @@ void ctdl_thread_internal_calc_loadavg(void)
        double load_avg, worker_avg;
        int workers = 0;
 
-       begin_critical_section(S_THREAD_LIST);
        that_thread = CtdlThreadList;
        load_avg = 0;
        worker_avg = 0;
@@ -1492,9 +1493,8 @@ void ctdl_thread_internal_calc_loadavg(void)
        CtdlThreadLoadAvg = load_avg/num_threads;
        CtdlThreadWorkerAvg = worker_avg/workers;
 #ifdef WITH_THREADLOG
-       CtdlLogPrintf(CTDL_INFO, "System load average %f, workers averag %f\n", CtdlThreadLoadAvg, CtdlThreadWorkerAvg);
+       CtdlLogPrintf(CTDL_INFO, "System load average %f, workers averag %f, threads %d, workers %d, sessions %d\n", CtdlThreadLoadAvg, CtdlThreadWorkerAvg, num_threads, num_workers, num_sessions);
 #endif
-       end_critical_section(S_THREAD_LIST);
 }
 
 
@@ -1517,7 +1517,6 @@ void ctdl_internal_thread_gc (void)
        /*
         * Woke up to do garbage collection
         */
-       begin_critical_section(S_THREAD_LIST);
        this_thread = CtdlThreadList;
        while(this_thread)
        {
@@ -1534,17 +1533,15 @@ void ctdl_internal_thread_gc (void)
                
                if (pthread_equal(that_thread->tid, pthread_self()) && that_thread->thread_func)
                {       /* Sanity check */
-                       end_critical_section(S_THREAD_LIST);
                        CtdlLogPrintf(CTDL_EMERG, "Thread system PANIC, a thread is trying to clean up after itself.\n");
-                       CtdlThreadStopAll();
+                       abort();
                        return;
                }
                
                if (num_threads <= 0)
                {       /* Sanity check */
-                       end_critical_section (S_THREAD_LIST);
                        CtdlLogPrintf(CTDL_EMERG, "Thread system PANIC, num_threads <= 0 and trying to do Garbage Collection.\n");
-                       CtdlThreadStopAll();
+                       abort();
                        return;
                }
 
@@ -1582,11 +1579,12 @@ void ctdl_internal_thread_gc (void)
        /* Sanity check number of worker threads */
        if (workers != num_workers)
        {
-               end_critical_section(S_THREAD_LIST);
-               CtdlLogPrintf(CTDL_EMERG, "Thread system PANIC, discrepancy in number of worker threads. Counted %d, should be %d.\n", workers, num_workers);
-               return;
+               CtdlLogPrintf(CTDL_EMERG,
+                       "Thread system PANIC, discrepancy in number of worker threads. Counted %d, should be %d.\n",
+                       workers, num_workers
+                       );
+               abort();
        }
-       end_critical_section(S_THREAD_LIST);
 }
 
 
@@ -1607,9 +1605,17 @@ static void *ctdl_internal_thread_func (void *arg)
         * can continue its execution.
         */
        begin_critical_section(S_THREAD_LIST);
+       // Register the cleanup function to take care of when we exit.
+       pthread_cleanup_push(ctdl_internal_thread_cleanup, NULL);
        // Get our thread data structure
        this_thread = (struct CtdlThreadNode *) arg;
-       this_thread->state = CTDL_THREAD_RUNNING;
+       /* Only change to the running state if we weren't asked to stop during the create cycle.
+        * Otherwise there is a window that allows this thread's creation to run to completion and
+        * thereby prevent a shutdown of the server.
+        */
+       if (!CtdlThreadCheckStop(this_thread))
+               this_thread->state = CTDL_THREAD_RUNNING;
+       
        this_thread->pid = getpid();
        gettimeofday(&this_thread->start_time, NULL);           /* Time this thread started */
        memcpy(&this_thread->last_state_change, &this_thread->start_time, sizeof (struct timeval));     /* Changed state so mark it. */
@@ -1618,14 +1624,13 @@ static void *ctdl_internal_thread_func (void *arg)
        // Tell the world we are here
        CtdlLogPrintf(CTDL_NOTICE, "Created a new thread \"%s\" (%ld). \n", this_thread->name, this_thread->tid);
 
-       // Register the cleanup function to take care of when we exit.
-       pthread_cleanup_push(ctdl_internal_thread_cleanup, NULL);
        
        
        /*
-        * run the thread to do the work
+        * run the thread to do the work but only if we haven't been asked to stop
         */
-       ret = (this_thread->thread_func)(this_thread->user_args);
+       if (!CtdlThreadCheckStop(this_thread))
+               ret = (this_thread->thread_func)(this_thread->user_args);
        
        /*
         * Our thread is exiting either because it wanted to end or because the server is stopping
@@ -1704,6 +1709,11 @@ struct CtdlThreadNode *ctdl_internal_create_thread(char *name, long flags, void
        this_thread->flags = flags;
        this_thread->thread_func = thread_func;
        this_thread->user_args = args;
+       /* Set this new thread with an avg_blocked of 2. We do this so that its creation affects the
+        * load average for the system. If we don't do this then we create a mass of threads at the same time 
+        * because the creation didn't affect the load average.
+        */
+       this_thread->avg_blocked = 2;
        pthread_mutex_init (&(this_thread->ThreadMutex), NULL);
        pthread_cond_init (&(this_thread->ThreadCond), NULL);
        
@@ -1757,6 +1767,7 @@ struct CtdlThreadNode *ctdl_internal_create_thread(char *name, long flags, void
        #ifdef HAVE_BACKTRACE
        eCrash_RegisterThread(this_thread->name, 0);
        #endif
+       ctdl_thread_internal_calc_loadavg();
        return this_thread;
 }
 
@@ -1781,12 +1792,10 @@ struct CtdlThreadNode *CtdlThreadCreate(char *name, long flags, void *(*thread_f
 /*
  * A wrapper function for select so we can show a thread as blocked
  */
-int CtdlThreadSelect(int n, fd_set *readfds, fd_set *writefds, fd_set *exceptfds, const struct timeval *timeout)
+int CtdlThreadSelect(int n, fd_set *readfds, fd_set *writefds, fd_set *exceptfds, const struct timeval *timeout, struct CtdlThreadNode *self)
 {
-       struct CtdlThreadNode *self;
        int ret;
        
-       self = CtdlThreadSelf();
        ctdl_thread_internal_change_state(self, CTDL_THREAD_BLOCKED);
        ret = select(n, readfds, writefds, exceptfds, timeout);
        ctdl_thread_internal_change_state(self, CTDL_THREAD_RUNNING);
@@ -1808,17 +1817,16 @@ void dead_session_purge(int force) {
        struct CitContext *ptr, *ptr2;          /* general-purpose utility pointer */
        struct CitContext *rem = NULL;  /* list of sessions to be destroyed */
        
-       CtdlThreadPushName("dead_session_purge");
-       
        if (force == 0) {
                if ( (time(NULL) - last_purge) < 5 ) {
-                       CtdlThreadPopName();
                        return; /* Too soon, go away */
                }
        }
        time(&last_purge);
 
-       begin_critical_section(S_SESSION_TABLE);
+       if (try_critical_section(S_SESSION_TABLE))
+               return;
+               
        ptr = ContextList;
        while (ptr) {
                ptr2 = ptr;
@@ -1837,11 +1845,9 @@ void dead_session_purge(int force) {
                        }
 
                        --num_sessions;
-
                        /* And put it on our to-be-destroyed list */
                        ptr2->next = rem;
                        rem = ptr2;
-
                }
        }
        end_critical_section(S_SESSION_TABLE);
@@ -1857,18 +1863,6 @@ void dead_session_purge(int force) {
                rem = rem->next;
                free(ptr);
        }
-
-       /* Raise the size of the worker thread pool if necessary. */
-       begin_critical_section(S_THREAD_LIST);
-       if ( (num_sessions > num_workers)
-          && (num_workers < config.c_max_workers) ) {
-               ctdl_internal_create_thread("Worker Thread", CTDLTHREAD_BIGSTACK + CTDLTHREAD_WORKER, worker_thread, NULL);
-       }
-       end_critical_section(S_THREAD_LIST);
-       // FIXME: reduce the number of worker threads too
-       
-       CtdlThreadPopName();
-       
 }
 
 
@@ -1969,8 +1963,7 @@ do_select:        force_purge = 0;
                if (!CtdlThreadCheckStop(CT)) {
                        tv.tv_sec = 1;          /* wake up every second if no input */
                        tv.tv_usec = 0;
-                       retval = CtdlThreadSelect(highest + 1, &readfds, NULL, NULL, &tv);
-//                     retval = select(highest + 1, &readfds, NULL, NULL, &tv);
+                       retval = CtdlThreadSelect(highest + 1, &readfds, NULL, NULL, &tv, CT);
                }
 
                if (CtdlThreadCheckStop(CT)) return(NULL);
@@ -1992,9 +1985,9 @@ do_select:        force_purge = 0;
                                goto do_select;
                        }
                }
-               else if(retval == 0) {
-                       goto SKIP_SELECT;
-               }
+//             else if(retval == 0) {
+//                     goto SKIP_SELECT;
+//             }
                /* Next, check to see if it's a new client connecting
                 * on a master socket.
                 */
@@ -2100,7 +2093,6 @@ SKIP_SELECT:
 
                dead_session_purge(force_purge);
                do_housekeeping();
-               check_sched_shutdown();
        }
        /* If control reaches this point, the server is shutting down */        
        return(NULL);