1
0
mirror of https://github.com/RIOT-OS/RIOT.git synced 2024-12-29 04:50:03 +01:00

sched: Reverse runqueue order when CLZ is available

This commit reverses the runqueue_cache bit order when the architecture
has a CLZ (count leading zeros) instruction. When the architecture
supports CLZ, it is faster to determine the most significant set bit of
a word than to determine the least significant bit set. Unfortunately
when the instruction is not available, it is more efficient to determine
the least significant bit set.

Reversing the bit order shaves off another 4 cycles on the same54-xpro.
From 147 to 143 ticks when testing with tests/bench_sched_nop.
Architectures where no CLZ instruction is available are not affected.
This commit is contained in:
Koen Zandberg 2020-08-06 20:17:20 +02:00
parent 01e6b62667
commit ab1d0b6f98
No known key found for this signature in database
GPG Key ID: 0895A893E6D2985B

View File

@ -79,6 +79,40 @@ static void (*sched_cb) (kernel_pid_t active_thread,
kernel_pid_t next_thread) = NULL; kernel_pid_t next_thread) = NULL;
#endif #endif
/* Depending on whether the CLZ instruction is available, the order of the
* runqueue_bitcache is reversed. When the instruction is available, it is
* faster to determine the MSBit set. When it is not available it is faster to
* determine the LSBit set. These functions abstract the runqueue modifications
* and readout away, switching between the two orders depending on the CLZ
* instruction availability
*/
/*
 * Mark the runqueue of the given thread's priority as non-empty in
 * runqueue_bitcache.
 *
 * With BITARITHM_HAS_CLZ the bit order is reversed: priority 0 maps to BIT31
 * and every following priority to the next lower bit. Without it, priority n
 * maps to bit n.
 *
 * @param process   thread whose `priority` field selects the bit to set
 *
 * NOTE(review): assumes process->priority is below 32; this is not checked
 * here.
 */
static inline void _set_runqueue_bit(thread_t *process)
{
#if defined(BITARITHM_HAS_CLZ)
    runqueue_bitcache |= BIT31 >> process->priority;
#else
    /* Shift an unsigned long rather than an int: unsigned long is at least
     * 32 bits wide, so the shift stays well defined even when it reaches the
     * top bit and on targets where int is only 16 bits wide. */
    runqueue_bitcache |= 1UL << process->priority;
#endif
}
/*
 * Mark the runqueue of the given thread's priority as empty in
 * runqueue_bitcache.
 *
 * With BITARITHM_HAS_CLZ the bit order is reversed: priority 0 maps to BIT31
 * and every following priority to the next lower bit. Without it, priority n
 * maps to bit n.
 *
 * @param process   thread whose `priority` field selects the bit to clear
 *
 * NOTE(review): assumes process->priority is below 32; this is not checked
 * here.
 */
static inline void _clear_runqueue_bit(thread_t *process)
{
#if defined(BITARITHM_HAS_CLZ)
    runqueue_bitcache &= ~(BIT31 >> process->priority);
#else
    /* Build the mask from an unsigned long rather than an int: unsigned long
     * is at least 32 bits wide, so the shift stays well defined even when it
     * reaches the top bit and on targets where int is only 16 bits wide. */
    runqueue_bitcache &= ~(1UL << process->priority);
#endif
}
/*
 * Translate runqueue_bitcache into a priority number.
 *
 * With BITARITHM_HAS_CLZ the cache is stored in reversed bit order, so the
 * most significant set bit is looked up and mirrored back (31 - index).
 * Without it, the index of the least significant set bit is used directly.
 * In both layouts the result is the numerically lowest priority value whose
 * bit is currently set.
 *
 * @return  priority number derived from runqueue_bitcache
 *
 * NOTE(review): the result for an all-zero runqueue_bitcache depends on the
 * bitarithm helpers; presumably callers ensure at least one bit is set.
 */
static inline unsigned _get_prio_queue_from_runqueue(void)
{
#ifdef BITARITHM_HAS_CLZ
    const unsigned top_bit = bitarithm_msb(runqueue_bitcache);

    return 31 - top_bit;
#else
    const unsigned low_bit = bitarithm_lsb(runqueue_bitcache);

    return low_bit;
#endif
}
static void _unschedule(thread_t *active_thread) static void _unschedule(thread_t *active_thread)
{ {
if (active_thread->status == STATUS_RUNNING) { if (active_thread->status == STATUS_RUNNING) {
@ -119,7 +153,7 @@ int __attribute__((used)) sched_run(void)
sched_context_switch_request = 0; sched_context_switch_request = 0;
int nextrq = bitarithm_lsb(runqueue_bitcache); unsigned nextrq = _get_prio_queue_from_runqueue();
thread_t *next_thread = container_of(sched_runqueues[nextrq].next->next, thread_t *next_thread = container_of(sched_runqueues[nextrq].next->next,
thread_t, rq_entry); thread_t, rq_entry);
@ -173,7 +207,7 @@ void sched_set_status(thread_t *process, thread_status_t status)
process->pid, process->priority); process->pid, process->priority);
clist_rpush(&sched_runqueues[process->priority], clist_rpush(&sched_runqueues[process->priority],
&(process->rq_entry)); &(process->rq_entry));
runqueue_bitcache |= 1 << process->priority; _set_runqueue_bit(process);
} }
} }
else { else {
@ -184,7 +218,7 @@ void sched_set_status(thread_t *process, thread_status_t status)
clist_lpop(&sched_runqueues[process->priority]); clist_lpop(&sched_runqueues[process->priority]);
if (!sched_runqueues[process->priority].next) { if (!sched_runqueues[process->priority].next) {
runqueue_bitcache &= ~(1 << process->priority); _clear_runqueue_bit(process);
} }
} }
} }