aboutsummaryrefslogtreecommitdiff
path: root/kern/processor.h
diff options
context:
space:
mode:
author Damien Zammit <damien@zamaudio.com> 2023-09-24 10:35:10 +0000
committer Samuel Thibault <samuel.thibault@ens-lyon.org> 2023-09-24 14:38:03 +0200
commit b11e10e2c81c2b608176021364a36d84173358e3 (patch)
tree 8bde3f47151865143341e864040af3bde68385a5 /kern/processor.h
parent 31d45d0d8ee1d8eee96fc2a283a388b6b6aca669 (diff)
downloadgnumach-b11e10e2c81c2b608176021364a36d84173358e3.tar.gz
gnumach-b11e10e2c81c2b608176021364a36d84173358e3.tar.bz2
gnumach-b11e10e2c81c2b608176021364a36d84173358e3.zip
percpu area using gs segment
This speeds up SMP again by storing the struct processor in a percpu area, which avoids an expensive cpu_number() on every call of current_processor(). The cpu_number itself is also obtained from an offset into the percpu area.

Untested on 64-bit, and work remains to make use of other percpu arrays.

TESTED: (NCPUS=8) -smp 1 boots to login shell, ~2x slower than uniprocessor
TESTED: (NCPUS=8) -smp 2 boots to INIT but hangs there
TESTED: (NCPUS=8) -smp 4 gets stuck, seemingly within rumpdisk, and hangs
TESTED: (NCPUS=1) uniprocessor is a bit faster than normal

Message-Id: <20230924103428.455966-3-damien@zamaudio.com>
Diffstat (limited to 'kern/processor.h')
-rw-r--r-- kern/processor.h 17
1 files changed, 5 insertions, 12 deletions
diff --git a/kern/processor.h b/kern/processor.h
index 79386627..fc204ffa 100644
--- a/kern/processor.h
+++ b/kern/processor.h
@@ -112,6 +112,7 @@ typedef struct processor Processor;
extern struct processor processor_array[NCPUS];
#include <kern/cpu_number.h>
+#include <machine/percpu.h>
/*
* Chain of all processor sets.
@@ -196,23 +197,15 @@ extern processor_t master_processor;
#define PROCESSOR_ASSIGN 4 /* Assignment is changing */
#define PROCESSOR_SHUTDOWN 5 /* Being shutdown */
-/*
- * Use processor ptr array to find current processor's data structure.
- * This replaces a multiplication (index into processor_array) with
- * an array lookup and a memory reference. It also allows us to save
- * space if processor numbering gets too sparse.
- */
-
-extern processor_t processor_ptr[NCPUS];
-
-#define cpu_to_processor(i) (processor_ptr[i])
+#define processor_ptr(i) (&percpu_array[i].processor)
+#define cpu_to_processor processor_ptr
-#define current_processor() (processor_ptr[cpu_number()])
+#define current_processor() (percpu_ptr(struct processor, processor))
#define current_processor_set() (current_processor()->processor_set)
/* Compatibility -- will go away */
-#define cpu_state(slot_num) (processor_ptr[slot_num]->state)
+#define cpu_state(slot_num) (processor_ptr(slot_num)->state)
#define cpu_idle(slot_num) (cpu_state(slot_num) == PROCESSOR_IDLE)
/* Useful lock macros */