mmlr+anevilyak:
* Keep track of the currently running threads.
* Make use of that info to decide whether a thread that becomes ready should preempt the running thread.
* If we should preempt, we send the target CPU a reschedule message.
* This preemption strategy makes keeping track of idle CPUs by means of a bitmap superfluous, so that bitmap is removed.
* Right now only other CPUs are preempted though, not the current one.
* Add missing initialization of the quantum tracking code.
* Do not extend the quantum of the idle thread based on quantum tracking, as we want it to not run longer than necessary. Once preemption works completely, the quantum timer for the idle thread will become unnecessary anyway.
* Fix the thread stealing code: it missed the last thread in the run queue.
* When stealing, try to steal the highest priority thread that is currently waiting by taking priorities into account when finding the target run queue.
* Simplify the stealing code a bit as well.
* Minor cleanups.

git-svn-id: file:///srv/svn/repos/haiku/haiku/trunk@32503 a95241bf-73f2-0310-859d-f6bbb57e9c96
parent 29c4d5a983
commit 152132f08a
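The heart of the change is the replacement of the idle-CPU bitmap with a per-CPU record of the running thread: when a thread becomes ready, its priority is compared against the thread currently running on the target CPU, and a reschedule ICI is only sent if the new thread's priority is higher (and only for other CPUs; preempting the current CPU is still a TODO). Below is a minimal, standalone C sketch of that decision. It uses simplified stand-in names and types (toy_thread, running_threads, send_reschedule_ici, maybe_preempt) rather than the kernel's thread/smp structures, so it only illustrates the logic, not the actual implementation.

#include <stdbool.h>
#include <stdio.h>

#define MAX_CPUS 8

/* Simplified stand-in for the kernel's thread structure. */
struct toy_thread {
	int id;
	int priority;
};

/* Mirrors the idea behind sRunningThreads[]: what each CPU runs right now. */
static struct toy_thread *running_threads[MAX_CPUS];

/* Stand-in for sending an SMP_MSG_RESCHEDULE ICI to another CPU. */
static void send_reschedule_ici(int target_cpu)
{
	printf("ICI: reschedule CPU %d\n", target_cpu);
}

/* Decide whether enqueueing `thread` on `target_cpu` should preempt the
   thread currently running there. Only other CPUs get an ICI; if the
   target is the current CPU, the caller would have to reschedule itself
   (still a TODO in the commit). */
static void maybe_preempt(struct toy_thread *thread, int target_cpu,
	int current_cpu)
{
	struct toy_thread *running = running_threads[target_cpu];
	if (running == NULL || thread->priority <= running->priority)
		return;

	if (target_cpu != current_cpu)
		send_reschedule_ici(target_cpu);
}

int main(void)
{
	struct toy_thread idle = { 1, 0 };		/* idle-like priority */
	struct toy_thread worker = { 2, 10 };	/* normal-like priority */

	running_threads[0] = &worker;
	running_threads[1] = &idle;

	struct toy_thread urgent = { 3, 20 };
	maybe_preempt(&urgent, 1, 0);	/* beats the idle thread -> ICI sent */
	maybe_preempt(&urgent, 0, 0);	/* same CPU -> no ICI, caller's job */
	return 0;
}

The actual kernel-side version of this check appears in affine_enqueue_in_run_queue() in the diff below.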
@@ -22,6 +22,7 @@ enum {
 	SMP_MSG_GLOBAL_INVALIDATE_PAGES,
 	SMP_MSG_CPU_HALT,
 	SMP_MSG_CALL_FUNCTION,
+	SMP_MSG_RESCHEDULE,
 	SMP_MSG_RESCHEDULE_IF_IDLE
 };
@@ -40,10 +40,10 @@
 // TODO: consolidate this such that HT/SMT entities on the same physical core
 // share a queue, once we have the necessary API for retrieving the topology
 // information
+static struct thread* sRunningThreads[B_MAX_CPU_COUNT];
 static struct thread* sRunQueue[B_MAX_CPU_COUNT];
 static int32 sRunQueueSize[B_MAX_CPU_COUNT];
 static struct thread* sIdleThreads;
-static cpu_mask_t sIdleCPUs = 0;
 
 const int32 kMaxTrackingQuantums = 5;
 const bigtime_t kMinThreadQuantum = 3000;
@@ -61,6 +61,7 @@ struct scheduler_thread_data {
 		fQuantumAverage = 0;
 		fLastQuantumSlot = 0;
 		fLastQueue = -1;
+		memset(fLastThreadQuantums, 0, sizeof(fLastThreadQuantums));
 	}
 
 	inline void SetQuantum(int32 quantum)
@@ -141,19 +142,6 @@ affine_get_most_idle_cpu()
 }
 
 
-static inline int32
-affine_get_next_idle_cpu(void)
-{
-	for (int32 i = 0; i < smp_get_num_cpus(); i++) {
-		if (gCPU[i].disabled)
-			continue;
-		if (sIdleCPUs & (1 << i))
-			return i;
-	}
-
-	return -1;
-}
-
 /*!	Enqueues the thread into the run queue.
 	Note: thread lock must be held when entering this function
 */
@@ -191,28 +179,27 @@ affine_enqueue_in_run_queue(struct thread *thread)
 			prev->queue_next = thread;
 		else
 			sRunQueue[targetCPU] = thread;
 
 		thread->scheduler_data->fLastQueue = targetCPU;
 	}
 
 	thread->next_priority = thread->priority;
 
-	if (thread->priority != B_IDLE_PRIORITY && targetCPU != smp_get_current_cpu()) {
-		int32 idleCPU = targetCPU;
-		if ((sIdleCPUs & (1 << targetCPU)) == 0) {
-			idleCPU = affine_get_next_idle_cpu();
-			// no idle CPUs are available
-			// to try and grab this task
-			if (idleCPU < 0)
-				return;
-		}
-		sIdleCPUs &= ~(1 << idleCPU);
-		smp_send_ici(idleCPU, SMP_MSG_RESCHEDULE_IF_IDLE, 0, 0,
-			0, NULL, SMP_MSG_FLAG_ASYNC);
-	}
-
 	// notify listeners
 	NotifySchedulerListeners(&SchedulerListener::ThreadEnqueuedInRunQueue,
 		thread);
+
+	if (sRunningThreads[targetCPU] != NULL
+		&& thread->priority > sRunningThreads[targetCPU]->priority) {
+		int32 currentCPU = smp_get_current_cpu();
+		if (targetCPU == currentCPU) {
+			// TODO: we want to inform the caller somehow that it should
+			// trigger a reschedule
+		} else {
+			smp_send_ici(targetCPU, SMP_MSG_RESCHEDULE, 0, 0, 0, NULL,
+				SMP_MSG_FLAG_ASYNC);
+		}
+	}
 }
 
 
 static inline struct thread *
@@ -235,12 +222,9 @@ dequeue_from_run_queue(struct thread *prevThread, int32 currentCPU)
 /*!	Looks for a possible thread to grab/run from another CPU.
 	Note: thread lock must be held when entering this function
 */
-static struct thread *steal_thread_from_other_cpus(int32 currentCPU)
+static struct thread *
+steal_thread_from_other_cpus(int32 currentCPU)
 {
-	int32 targetCPU = -1;
-	struct thread* nextThread = NULL;
-	struct thread* prevThread = NULL;
-
 	// look through the active CPUs - find the one
 	// that has a) threads available to steal, and
 	// b) out of those, the one that's the most CPU-bound
@@ -248,43 +232,40 @@ static struct thread *steal_thread_from_other_cpus(int32 currentCPU)
 	// - we need to try and maintain a reasonable balance
 	// in run queue sizes across CPUs, and also try to maintain
 	// an even distribution of cpu bound / interactive threads
+	int32 targetCPU = -1;
 	for (int32 i = 0; i < smp_get_num_cpus(); i++) {
 		// skip CPUs that have either no or only one thread
-		if (sRunQueueSize[i] < 2)
-			continue;
-
-		if (i == currentCPU)
+		if (i == currentCPU || sRunQueueSize[i] < 2)
 			continue;
 
 		// out of the CPUs with threads available to steal,
 		// pick whichever one is generally the most CPU bound.
-		if (targetCPU < 0)
-			targetCPU = i;
-		else if (sRunQueueSize[i] > sRunQueueSize[targetCPU])
+		if (targetCPU < 0
+			|| sRunQueue[i]->priority > sRunQueue[targetCPU]->priority
+			|| (sRunQueue[i]->priority == sRunQueue[targetCPU]->priority
+				&& sRunQueueSize[i] > sRunQueueSize[targetCPU]))
 			targetCPU = i;
 	}
 
-	if (targetCPU >= 0) {
-		nextThread = sRunQueue[targetCPU];
-		do {
-			// grab the highest priority non-pinned thread
-			// out of this CPU's queue, if any.
-			if (nextThread->pinned_to_cpu > 0) {
-				prevThread = nextThread;
-				nextThread = prevThread->queue_next;
-			} else
-				break;
-		} while (nextThread->queue_next != NULL);
-
-		// we reached the end of the queue without finding an
-		// eligible thread.
-		if (nextThread->pinned_to_cpu > 0)
-			nextThread = NULL;
-
-		// dequeue the thread we're going to steal
-		if (nextThread != NULL)
-			dequeue_from_run_queue(prevThread, targetCPU);
+	if (targetCPU < 0)
+		return NULL;
+
+	struct thread* nextThread = sRunQueue[targetCPU];
+	struct thread* prevThread = NULL;
+
+	while (nextThread != NULL) {
+		// grab the highest priority non-pinned thread
+		// out of this CPU's queue, dequeue and return it
+		if (nextThread->pinned_to_cpu <= 0) {
+			dequeue_from_run_queue(prevThread, targetCPU);
+			return nextThread;
+		}
+
+		prevThread = nextThread;
+		nextThread = nextThread->queue_next;
 	}
 
-	return nextThread;
+	return NULL;
 }
@@ -319,10 +300,10 @@ affine_set_thread_priority(struct thread *thread, int32 priority)
 
 	for (item = sRunQueue[targetCPU], prev = NULL; item && item != thread;
 			item = item->queue_next) {
 		if (prev)
 			prev = prev->queue_next;
 		else
 			prev = item;
 	}
 
 	ASSERT(item == thread);
@@ -405,7 +386,7 @@ affine_reschedule(void)
 	prevThread = NULL;
 
 	if (sRunQueue[currentCPU] != NULL) {
-		TRACE(("Dequeueing next thread from CPU %ld\n", currentCPU));
+		TRACE(("dequeueing next thread from cpu %ld\n", currentCPU));
 		// select next thread from the run queue
 		while (nextThread->queue_next) {
 			// always extract real time threads
@@ -424,6 +405,9 @@ affine_reschedule(void)
 		} while (nextThread->queue_next != NULL
 			&& priority == nextThread->queue_next->priority);
 		}
+
+		TRACE(("dequeuing thread %ld from cpu %ld\n", nextThread->id,
+			currentCPU));
 		// extract selected thread from the run queue
 		dequeue_from_run_queue(prevThread, currentCPU);
 	} else {
@@ -432,6 +416,7 @@ affine_reschedule(void)
 			nextThread = steal_thread_from_other_cpus(currentCPU);
 		} else
 			nextThread = NULL;
+
 		if (nextThread == NULL) {
 			TRACE(("No threads to steal, grabbing from idle pool\n"));
 			// no other CPU had anything for us to take,
@@ -476,30 +461,31 @@ affine_reschedule(void)
 	}
 
 	if (nextThread != oldThread || oldThread->cpu->preempted) {
+		timer *quantumTimer = &oldThread->cpu->quantum_timer;
+		if (!oldThread->cpu->preempted)
+			cancel_timer(quantumTimer);
+		oldThread->cpu->preempted = 0;
+
+		// we do not adjust the quantum for the idle thread as it is going to be
+		// preempted most of the time and would likely get the longer quantum
+		// over time, indeed we use a smaller quantum to avoid running idle too
+		// long
 		bigtime_t quantum = kMinThreadQuantum;
 		// give CPU-bound background threads a larger quantum size
 		// to minimize unnecessary context switches if the system is idle
-		if (nextThread->scheduler_data->GetAverageQuantumUsage()
+		if (nextThread->priority != B_IDLE_PRIORITY
+			&& nextThread->scheduler_data->GetAverageQuantumUsage()
 			> (kMinThreadQuantum >> 1)
 			&& nextThread->priority < B_NORMAL_PRIORITY)
 			quantum = kMaxThreadQuantum;
-		timer *quantumTimer = &oldThread->cpu->quantum_timer;
-
-		if (!oldThread->cpu->preempted)
-			cancel_timer(quantumTimer);
-
-		oldThread->cpu->preempted = 0;
+
 		add_timer(quantumTimer, &reschedule_event, quantum,
 			B_ONE_SHOT_RELATIVE_TIMER | B_TIMER_ACQUIRE_THREAD_LOCK);
 
-		// update the idle bit for this CPU in the CPU mask
-		if (nextThread->priority == B_IDLE_PRIORITY)
-			sIdleCPUs = SET_BIT(sIdleCPUs, currentCPU);
-		else
-			sIdleCPUs = CLEAR_BIT(sIdleCPUs, currentCPU);
-
-		if (nextThread != oldThread)
+		if (nextThread != oldThread) {
+			sRunningThreads[currentCPU] = nextThread;
 			context_switch(oldThread, nextThread);
+		}
 	}
 }
@@ -631,6 +631,9 @@ process_pending_ici(int32 currentCPU)
 			func(msg->data, currentCPU, msg->data2, msg->data3);
 			break;
 		}
+		case SMP_MSG_RESCHEDULE:
+			thread_get_current_thread()->cpu->invoke_scheduler = true;
+			break;
 		case SMP_MSG_RESCHEDULE_IF_IDLE:
 		{
 			// TODO: We must not dereference the thread when entering the kernel