barrier: More efficient impl, maybe

This commit is contained in:
plutooo 2018-10-23 23:02:23 +02:00 committed by fincs
parent 0a230bae65
commit e8f3964475
2 changed files with 19 additions and 26 deletions

View File

@ -5,15 +5,15 @@
* @copyright libnx Authors * @copyright libnx Authors
*/ */
#pragma once #pragma once
#include "semaphore.h" #include "mutex.h"
#include "condvar.h"
/// Barrier structure. /// Barrier structure.
typedef struct Barrier { typedef struct Barrier {
u64 count; ///< Number of threads to reach the barrier. u64 count; ///< Number of threads to reach the barrier.
u64 thread_total; ///< Number of threads to wait on. u64 total; ///< Number of threads to wait on.
Semaphore throttle; ///< Semaphore to make sure threads release to scheduler one at a time. Mutex mutex;
Semaphore lock; ///< Semaphore to lock barrier to prevent multiple operations by threads at once. CondVar condvar;
Semaphore thread_wait; ///< Semaphore to force a thread to wait if count < thread_total.
} Barrier; } Barrier;
/** /**

View File

@ -1,29 +1,22 @@
#include "kernel/barrier.h" #include "kernel/barrier.h"
void barrierInit(Barrier *b, u64 thread_count) { void barrierInit(Barrier *b, u64 total) {
b->count = 0; b->count = 0;
b->thread_total = thread_count; b->total = total - 1;
semaphoreInit(&b->throttle, 0); mutexInit(&b->mutex);
semaphoreInit(&b->lock, 1); condvarInit(&b->condvar);
semaphoreInit(&b->thread_wait, 0);
} }
void barrierWait(Barrier *b) { void barrierWait(Barrier *b) {
semaphoreWait(&b->lock); mutexLock(&b->mutex);
if(b->count < b->thread_total) {
b->count++; if (b->count++ == b->total) {
}
if(b->count < b->thread_total) {
semaphoreSignal(&b->lock);
semaphoreWait(&b->thread_wait);
semaphoreSignal(&b->throttle);
}
else if(b->count == b->thread_total) {
for(int i = 0; i < b->thread_total-1; i++) {
semaphoreSignal(&b->thread_wait);
semaphoreWait(&b->throttle);
}
b->count = 0; b->count = 0;
semaphoreSignal(&b->lock); condvarWake(&b->condvar, b->total);
} }
else {
condvarWait(&b->condvar, &b->mutex);
}
mutexUnlock(&b->mutex);
} }