kernel: Rewrite B_DEBUG_SPINLOCK_CONTENTION.

* Replace count_low/count_high with bigtime_t fields plus an int32. sizeof(spinlock) is now 32 bytes with the debug option enabled. * Adjust and clean up all spinlock code to use the new fields. * Fold DEBUG_SPINLOCK_LATENCIES into the new code. Remove the bootloader option and other flags for it (these were not compiled in by default.) The new code should be much easier to understand and also more powerful. However, the information transmitted to userland isn't as useful now; the KDL command output will have the interesting information. (Things could be reworked to transmit more interesting information to userland again if desired, but as this code clearly hadn't been compiled for many years, as it referred to global spinlocks that have been gone for a very long time.) Change-Id: I2cb34078bfdc7604f288a297b6cd1aa7ff9cc512 Reviewed-on: https://review.haiku-os.org/c/haiku/+/6943 Reviewed-by: waddlesplash <waddlesplash@gmail.com> Tested-by: Commit checker robot <no-reply+buildbot@haiku-os.org>
2023-09-23 01:08:50 -04:00 · 2023-09-23 01:08:50 -04:00 · 76681bd900
commit 76681bd900
parent ef9e2f627b
7 changed files with 112 additions and 158 deletions
--- a/build/config_headers/kernel_debug_config.h
+++ b/build/config_headers/kernel_debug_config.h
@ -82,8 +82,6 @@
 // available.
 #define DEBUG_SPINLOCKS					KDEBUG_LEVEL_2

-#define DEBUG_SPINLOCK_LATENCIES		0
-

 // VM

--- a/headers/os/drivers/KernelExport.h
+++ b/headers/os/drivers/KernelExport.h
@ -21,15 +21,19 @@ typedef ulong cpu_status;
 #if B_DEBUG_SPINLOCK_CONTENTION
 	typedef struct {
 		int32	lock;
-		int32	count_low;
-		int32	count_high;
+		int32		failed_try_acquire;
+		bigtime_t	total_wait;
+		bigtime_t	total_held;
+		bigtime_t	last_acquired;
 	} spinlock;

-#	define B_SPINLOCK_INITIALIZER { 0, 0, 0 }
+#	define B_SPINLOCK_INITIALIZER { 0, 0, 0, 0, 0 }
 #	define B_INITIALIZE_SPINLOCK(spinlock)	do {	\
 			(spinlock)->lock = 0;					\
-			(spinlock)->count_low = 0;				\
-			(spinlock)->count_high = 0;				\
+			(spinlock)->failed_try_acquire = 0;		\
+			(spinlock)->total_wait = 0;				\
+			(spinlock)->total_held = 0;				\
+			(spinlock)->last_acquired = 0;			\
 		} while (false)
 #else
 	typedef struct {
--- a/headers/private/system/safemode_defs.h
+++ b/headers/private/system/safemode_defs.h
@ -20,8 +20,5 @@
 #define B_SAFEMODE_4_GB_MEMORY_LIMIT		"4gb_memory_limit"
 #define B_SAFEMODE_256_TB_MEMORY_LIMIT		"256tb_memory_limit"

-#if DEBUG_SPINLOCK_LATENCIES
-#	define B_SAFEMODE_DISABLE_LATENCY_CHECK	"disable_latency_check"
-#endif

 #endif	/* _SYSTEM_SAFEMODE_DEFS_H */
--- a/headers/private/system/spinlock_contention.h
+++ b/headers/private/system/spinlock_contention.h
@ -13,8 +13,7 @@


 typedef struct spinlock_contention_info {
-	uint64	thread_spinlock_counter;
-	uint64	team_spinlock_counter;
+	bigtime_t	thread_creation_spinlock;
 } spinlock_contention_info;


--- a/src/system/boot/loader/menu.cpp
+++ b/src/system/boot/loader/menu.cpp
@ -1428,16 +1428,6 @@ add_debug_menu()
 	Menu* menu = new(std::nothrow) Menu(STANDARD_MENU, "Debug Options");
 	MenuItem* item;

-#if DEBUG_SPINLOCK_LATENCIES
-	item = new(std::nothrow) MenuItem("Disable latency checks");
-	if (item != NULL) {
-		item->SetType(MENU_ITEM_MARKABLE);
-		item->SetData(B_SAFEMODE_DISABLE_LATENCY_CHECK);
-		item->SetHelpText("Disables latency check panics.");
-		menu->AddItem(item);
-	}
-#endif
-
 	menu->AddItem(item
 		= new(nothrow) MenuItem("Enable serial debug output"));
 	item->SetData("serial_debug_output");
--- a/src/system/kernel/smp.cpp
+++ b/src/system/kernel/smp.cpp
@ -29,9 +29,6 @@
 #include <spinlock_contention.h>
 #include <thread.h>
 #include <util/atomic.h>
-#if DEBUG_SPINLOCK_LATENCIES
-#	include <safemode.h>
-#endif

 #include "kernel_debug_config.h"

@ -172,6 +169,13 @@ dump_spinlock(int argc, char** argv)
 	} else
 		kprintf("  not locked\n");

+#if B_DEBUG_SPINLOCK_CONTENTION
+	kprintf("  failed try_acquire():		%d\n", lock->failed_try_acquire);
+	kprintf("  total wait time:		%" B_PRIdBIGTIME "\n", lock->total_wait);
+	kprintf("  total held time:		%" B_PRIdBIGTIME "\n", lock->total_held);
+	kprintf("  last acquired at:		%" B_PRIdBIGTIME "\n", lock->last_acquired);
+#endif
+
 	return 0;
 }

@ -179,59 +183,35 @@ dump_spinlock(int argc, char** argv)
 #endif	// DEBUG_SPINLOCKS


+#if B_DEBUG_SPINLOCK_CONTENTION
+
+
+static inline void
+update_lock_contention(spinlock* lock, bigtime_t start)
+{
+	const bigtime_t now = system_time();
+	lock->last_acquired = now;
+	lock->total_wait += (now - start);
+}
+
+
+static inline void
+update_lock_held(spinlock* lock)
+{
+	const bigtime_t held = (system_time() - lock->last_acquired);
+	lock->total_held += held;
+
+//#define DEBUG_SPINLOCK_LATENCIES 2000
 #if DEBUG_SPINLOCK_LATENCIES
-
-
-#define NUM_LATENCY_LOCKS	4
-#define DEBUG_LATENCY		200
-
-
-static struct {
-	spinlock	*lock;
-	bigtime_t	timestamp;
-} sLatency[SMP_MAX_CPUS][NUM_LATENCY_LOCKS];
-
-static int32 sLatencyIndex[SMP_MAX_CPUS];
-static bool sEnableLatencyCheck;
-
-
-static void
-push_latency(spinlock* lock)
-{
-	if (!sEnableLatencyCheck)
-		return;
-
-	int32 cpu = smp_get_current_cpu();
-	int32 index = (++sLatencyIndex[cpu]) % NUM_LATENCY_LOCKS;
-
-	sLatency[cpu][index].lock = lock;
-	sLatency[cpu][index].timestamp = system_time();
-}
-
-
-static void
-test_latency(spinlock* lock)
-{
-	if (!sEnableLatencyCheck)
-		return;
-
-	int32 cpu = smp_get_current_cpu();
-
-	for (int32 i = 0; i < NUM_LATENCY_LOCKS; i++) {
-		if (sLatency[cpu][i].lock == lock) {
-			bigtime_t diff = system_time() - sLatency[cpu][i].timestamp;
-			if (diff > DEBUG_LATENCY && diff < 500000) {
-				panic("spinlock %p was held for %lld usecs (%d allowed)\n",
-					lock, diff, DEBUG_LATENCY);
-			}
-
-			sLatency[cpu][i].lock = NULL;
-		}
+	if (held > DEBUG_SPINLOCK_LATENCIES) {
+		panic("spinlock %p was held for %" B_PRIdBIGTIME " usecs (%d allowed)\n",
+			lock, held, DEBUG_SPINLOCK_LATENCIES);
 	}
+#endif // DEBUG_SPINLOCK_LATENCIES
 }


-#endif	// DEBUG_SPINLOCK_LATENCIES
+#endif // B_DEBUG_SPINLOCK_CONTENTION


 int
@ -326,16 +306,19 @@ try_acquire_spinlock(spinlock* lock)
 	}
 #endif

+	if (atomic_get_and_set(&lock->lock, 1) != 0) {
 #if B_DEBUG_SPINLOCK_CONTENTION
-	if (atomic_add(&lock->lock, 1) != 0)
-		return false;
-#else
-	if (atomic_get_and_set(&lock->lock, 1) != 0)
+		atomic_add(&lock->failed_try_acquire, 1);
+#endif
 		return false;
+	}

-#	if DEBUG_SPINLOCKS
+#if B_DEBUG_SPINLOCK_CONTENTION
+	update_lock_contention(lock, system_time());
+#endif
+
+#if DEBUG_SPINLOCKS
 	push_lock_caller(arch_debug_get_caller(), lock);
-#	endif
 #endif

 	return true;
@ -353,24 +336,23 @@ acquire_spinlock(spinlock* lock)
 #endif

 	if (sNumCPUs > 1) {
-		int currentCPU = smp_get_current_cpu();
 #if B_DEBUG_SPINLOCK_CONTENTION
-		while (atomic_add(&lock->lock, 1) != 0)
-			process_all_pending_ici(currentCPU);
-#else
+		const bigtime_t start = system_time();
+#endif
+		int currentCPU = smp_get_current_cpu();
 		while (1) {
 			uint32 count = 0;
 			while (lock->lock != 0) {
 				if (++count == SPINLOCK_DEADLOCK_COUNT) {
-#	if DEBUG_SPINLOCKS
+#if DEBUG_SPINLOCKS
 					panic("acquire_spinlock(): Failed to acquire spinlock %p "
 						"for a long time (last caller: %p, value: %" B_PRIx32
 						")", lock, find_lock_caller(lock), lock->lock);
-#	else
+#else
 					panic("acquire_spinlock(): Failed to acquire spinlock %p "
 						"for a long time (value: %" B_PRIx32 ")", lock,
 						lock->lock);
-#	endif
+#endif
 					count = 0;
 				}

@ -381,11 +363,17 @@ acquire_spinlock(spinlock* lock)
 				break;
 		}

-#	if DEBUG_SPINLOCKS
+#if B_DEBUG_SPINLOCK_CONTENTION
+		update_lock_contention(lock, start);
+#endif
+
+#if DEBUG_SPINLOCKS
 		push_lock_caller(arch_debug_get_caller(), lock);
-#	endif
 #endif
 	} else {
+#if B_DEBUG_SPINLOCK_CONTENTION
+		lock->last_acquired = system_time();
+#endif
 #if DEBUG_SPINLOCKS
 		int32 oldValue = atomic_get_and_set(&lock->lock, 1);
 		if (oldValue != 0) {
@ -397,9 +385,6 @@ acquire_spinlock(spinlock* lock)
 		push_lock_caller(arch_debug_get_caller(), lock);
 #endif
 	}
-#if DEBUG_SPINLOCK_LATENCIES
-	push_latency(lock);
-#endif
 }


@ -415,22 +400,21 @@ acquire_spinlock_nocheck(spinlock *lock)

 	if (sNumCPUs > 1) {
 #if B_DEBUG_SPINLOCK_CONTENTION
-		while (atomic_add(&lock->lock, 1) != 0) {
-		}
-#else
+		const bigtime_t start = system_time();
+#endif
 		while (1) {
 			uint32 count = 0;
 			while (lock->lock != 0) {
 				if (++count == SPINLOCK_DEADLOCK_COUNT_NO_CHECK) {
-#	if DEBUG_SPINLOCKS
+#if DEBUG_SPINLOCKS
 					panic("acquire_spinlock_nocheck(): Failed to acquire "
 						"spinlock %p for a long time (last caller: %p, value: %"
 						B_PRIx32 ")", lock, find_lock_caller(lock), lock->lock);
-#	else
+#else
 					panic("acquire_spinlock_nocheck(): Failed to acquire "
 						"spinlock %p for a long time (value: %" B_PRIx32 ")",
 						lock, lock->lock);
-#	endif
+#endif
 					count = 0;
 				}

@ -441,11 +425,17 @@ acquire_spinlock_nocheck(spinlock *lock)
 				break;
 		}

-#	if DEBUG_SPINLOCKS
+#if B_DEBUG_SPINLOCK_CONTENTION
+		update_lock_contention(lock, start);
+#endif
+
+#if DEBUG_SPINLOCKS
 		push_lock_caller(arch_debug_get_caller(), lock);
-#	endif
 #endif
 	} else {
+#if B_DEBUG_SPINLOCK_CONTENTION
+		lock->last_acquired = system_time();
+#endif
 #if DEBUG_SPINLOCKS
 		int32 oldValue = atomic_get_and_set(&lock->lock, 1);
 		if (oldValue != 0) {
@ -473,22 +463,21 @@ acquire_spinlock_cpu(int32 currentCPU, spinlock *lock)

 	if (sNumCPUs > 1) {
 #if B_DEBUG_SPINLOCK_CONTENTION
-		while (atomic_add(&lock->lock, 1) != 0)
-			process_all_pending_ici(currentCPU);
-#else
+		const bigtime_t start = system_time();
+#endif
 		while (1) {
 			uint32 count = 0;
 			while (lock->lock != 0) {
 				if (++count == SPINLOCK_DEADLOCK_COUNT) {
-#	if DEBUG_SPINLOCKS
+#if DEBUG_SPINLOCKS
 					panic("acquire_spinlock_cpu(): Failed to acquire spinlock "
 						"%p for a long time (last caller: %p, value: %" B_PRIx32
 						")", lock, find_lock_caller(lock), lock->lock);
-#	else
+#else
 					panic("acquire_spinlock_cpu(): Failed to acquire spinlock "
 						"%p for a long time (value: %" B_PRIx32 ")", lock,
 						lock->lock);
-#	endif
+#endif
 					count = 0;
 				}

@ -499,11 +488,17 @@ acquire_spinlock_cpu(int32 currentCPU, spinlock *lock)
 				break;
 		}

-#	if DEBUG_SPINLOCKS
+#if B_DEBUG_SPINLOCK_CONTENTION
+		update_lock_contention(lock, start);
+#endif
+
+#if DEBUG_SPINLOCKS
 		push_lock_caller(arch_debug_get_caller(), lock);
-#	endif
 #endif
 	} else {
+#if B_DEBUG_SPINLOCK_CONTENTION
+		lock->last_acquired = system_time();
+#endif
 #if DEBUG_SPINLOCKS
 		int32 oldValue = atomic_get_and_set(&lock->lock, 1);
 		if (oldValue != 0) {
@ -521,28 +516,17 @@ acquire_spinlock_cpu(int32 currentCPU, spinlock *lock)
 void
 release_spinlock(spinlock *lock)
 {
-#if DEBUG_SPINLOCK_LATENCIES
-	test_latency(lock);
+#if B_DEBUG_SPINLOCK_CONTENTION
+	update_lock_held(lock);
 #endif

 	if (sNumCPUs > 1) {
-		if (are_interrupts_enabled())
+		if (are_interrupts_enabled()) {
 			panic("release_spinlock: attempt to release lock %p with "
 				"interrupts enabled\n", lock);
-#if B_DEBUG_SPINLOCK_CONTENTION
-		{
-			int32 count = atomic_and(&lock->lock, 0) - 1;
-			if (count < 0) {
-				panic("release_spinlock: lock %p was already released\n", lock);
-			} else {
-				// add to the total count -- deal with carry manually
-				if ((uint32)atomic_add(&lock->count_low, count) + count
-						< (uint32)count) {
-					atomic_add(&lock->count_high, 1);
-				}
-			}
 		}
-#elif DEBUG_SPINLOCKS
+
+#if DEBUG_SPINLOCKS
 		if (atomic_get_and_set(&lock->lock, 0) != 1)
 			panic("release_spinlock: lock %p was already released\n", lock);
 #else
@ -556,9 +540,6 @@ release_spinlock(spinlock *lock)
 		}
 		if (atomic_get_and_set(&lock->lock, 0) != 1)
 			panic("release_spinlock: lock %p was already released\n", lock);
-#endif
-#if DEBUG_SPINLOCK_LATENCIES
-		test_latency(lock);
 #endif
 	}
 }
@ -695,7 +676,8 @@ release_read_spinlock(rw_spinlock* lock)


 bool
-try_acquire_write_seqlock(seqlock* lock) {
+try_acquire_write_seqlock(seqlock* lock)
+{
 	bool succeed = try_acquire_spinlock(&lock->lock);
 	if (succeed)
 		atomic_add((int32*)&lock->count, 1);
@ -704,27 +686,31 @@ try_acquire_write_seqlock(seqlock* lock) {


 void
-acquire_write_seqlock(seqlock* lock) {
+acquire_write_seqlock(seqlock* lock)
+{
 	acquire_spinlock(&lock->lock);
 	atomic_add((int32*)&lock->count, 1);
 }


 void
-release_write_seqlock(seqlock* lock) {
+release_write_seqlock(seqlock* lock)
+{
 	atomic_add((int32*)&lock->count, 1);
 	release_spinlock(&lock->lock);
 }


 uint32
-acquire_read_seqlock(seqlock* lock) {
+acquire_read_seqlock(seqlock* lock)
+{
 	return atomic_get((int32*)&lock->count);
 }


 bool
-release_read_seqlock(seqlock* lock, uint32 count) {
+release_read_seqlock(seqlock* lock, uint32 count)
+{
 	memory_read_barrier();

 	uint32 current = *(volatile int32*)&lock->count;
@ -982,34 +968,20 @@ process_pending_ici(int32 currentCPU)
 #if B_DEBUG_SPINLOCK_CONTENTION


-static uint64
-get_spinlock_counter(spinlock* lock)
-{
-	uint32 high;
-	uint32 low;
-	do {
-		high = (uint32)atomic_get(&lock->count_high);
-		low = (uint32)atomic_get(&lock->count_low);
-	} while (high != atomic_get(&lock->count_high));
-
-	return ((uint64)high << 32) | low;
-}
-
-
 static status_t
 spinlock_contention_syscall(const char* subsystem, uint32 function,
 	void* buffer, size_t bufferSize)
 {
-	spinlock_contention_info info;
-
 	if (function != GET_SPINLOCK_CONTENTION_INFO)
 		return B_BAD_VALUE;

 	if (bufferSize < sizeof(spinlock_contention_info))
 		return B_BAD_VALUE;

-	info.thread_spinlock_counter = get_spinlock_counter(&gThreadSpinlock);
-	info.team_spinlock_counter = get_spinlock_counter(&gTeamSpinlock);
+	// TODO: This isn't very useful at the moment...
+
+	spinlock_contention_info info;
+	info.thread_creation_spinlock = gThreadCreationLock.total_wait;

 	if (!IS_USER_ADDRESS(buffer)
 		|| user_memcpy(buffer, &info, sizeof(info)) != B_OK) {
@ -1406,11 +1378,6 @@ smp_init(kernel_args* args)
 {
 	TRACE("smp_init: entry\n");

-#if DEBUG_SPINLOCK_LATENCIES
-	sEnableLatencyCheck
-		= !get_safemode_boolean(B_SAFEMODE_DISABLE_LATENCY_CHECK, false);
-#endif
-
 #if DEBUG_SPINLOCKS
 	add_debugger_command_etc("spinlock", &dump_spinlock,
 		"Dump info on a spinlock",
--- a/src/tests/system/kernel/spinlock_contention.cpp
+++ b/src/tests/system/kernel/spinlock_contention.cpp
@ -249,10 +249,9 @@ main(int argc, char** argv)
 		time_string(tickTime, buffer));

 	// print results
-	static const char* const kLockNames[] = { "thread", "team", NULL };
-	uint64 lockCounts[] = {
-		endInfo.thread_spinlock_counter - startInfo.thread_spinlock_counter,
-		endInfo.team_spinlock_counter - startInfo.team_spinlock_counter
+	static const char* const kLockNames[] = { "thread creation", NULL };
+	bigtime_t lockCounts[] = {
+		endInfo.thread_creation_spinlock - startInfo.thread_creation_spinlock,
 	};

 	printf("\nlock             counter            time   wasted %% CPU\n");