forked from Imagelibrary/rtems
sparc: Add _CPU_Get_current_per_CPU_control()
Use register g6 for the per-CPU control of the current processor. The register g6 is reserved for the operating system by the SPARC ABI. On Linux register g6 is used for a similar purpose with the same method since 1996. The register g6 must be initialized during system startup and then must remain unchanged. Since the per-CPU control is used in all critical sections of the operating system, this is a performance optimization for the operating system core procedures. An additional benefit is that the low-level context switch and interrupt processing code is now identical on non-SMP and SMP configurations.
This commit is contained in:
@@ -23,23 +23,6 @@
|
||||
#include <rtems/score/percpu.h>
|
||||
#include <bspopts.h>
|
||||
|
||||
.macro GET_SELF_CPU_CONTROL REG, TMP
|
||||
sethi %hi(_Per_CPU_Information), \REG
|
||||
add \REG, %lo(_Per_CPU_Information), \REG
|
||||
|
||||
#if defined( RTEMS_SMP )
|
||||
#if BSP_LEON3_SMP
|
||||
/* LEON3 SMP support */
|
||||
rd %asr17, \TMP
|
||||
srl \TMP, LEON3_ASR17_PROCESSOR_INDEX_SHIFT, \TMP
|
||||
#else
|
||||
mov 0, \TMP
|
||||
#endif
|
||||
sll \TMP, PER_CPU_CONTROL_SIZE_LOG2, \TMP
|
||||
add \REG, \TMP, \REG
|
||||
#endif /* defined( RTEMS_SMP ) */
|
||||
.endm
|
||||
|
||||
/*
|
||||
* void _CPU_Context_switch(
|
||||
* Context_Control *run,
|
||||
@@ -53,7 +36,7 @@
|
||||
PUBLIC(_CPU_Context_switch)
|
||||
SYM(_CPU_Context_switch):
|
||||
st %g5, [%o0 + G5_OFFSET] ! save the global registers
|
||||
std %g6, [%o0 + G6_OFFSET]
|
||||
st %g7, [%o0 + G7_OFFSET]
|
||||
|
||||
std %l0, [%o0 + L0_OFFSET] ! save the local registers
|
||||
std %l2, [%o0 + L2_OFFSET]
|
||||
@@ -67,11 +50,8 @@ SYM(_CPU_Context_switch):
|
||||
|
||||
std %o6, [%o0 + O6_SP_OFFSET] ! save the output registers
|
||||
|
||||
! o3 = self per-CPU control
|
||||
GET_SELF_CPU_CONTROL %o3, %o4
|
||||
|
||||
! load the ISR stack nesting prevention flag
|
||||
ld [%o3 + SPARC_PER_CPU_ISR_DISPATCH_DISABLE], %o4
|
||||
ld [%g6 + SPARC_PER_CPU_ISR_DISPATCH_DISABLE], %o4
|
||||
! save it a bit later so we do not waste a couple of cycles
|
||||
|
||||
rd %psr, %o2
|
||||
@@ -84,7 +64,6 @@ SYM(_CPU_Context_switch):
|
||||
* This is entered from _CPU_Context_restore with:
|
||||
* o1 = context to restore
|
||||
* o2 = psr
|
||||
* o3 = self per-CPU control
|
||||
*/
|
||||
|
||||
PUBLIC(_CPU_Context_restore_heir)
|
||||
@@ -185,7 +164,7 @@ done_flushing:
|
||||
nop
|
||||
|
||||
ld [%o1 + G5_OFFSET], %g5 ! restore the global registers
|
||||
ldd [%o1 + G6_OFFSET], %g6
|
||||
ld [%o1 + G7_OFFSET], %g7
|
||||
|
||||
! Load thread specific ISR dispatch prevention flag
|
||||
ld [%o1 + ISR_DISPATCH_DISABLE_STACK_OFFSET], %o2
|
||||
@@ -197,7 +176,7 @@ done_flushing:
|
||||
ldd [%o1 + L6_OFFSET], %l6
|
||||
|
||||
! Now restore thread specific ISR dispatch prevention flag
|
||||
st %o2, [%o3 + SPARC_PER_CPU_ISR_DISPATCH_DISABLE]
|
||||
st %o2, [%g6 + SPARC_PER_CPU_ISR_DISPATCH_DISABLE]
|
||||
|
||||
ldd [%o1 + I0_OFFSET], %i0 ! restore the input registers
|
||||
ldd [%o1 + I2_OFFSET], %i2
|
||||
@@ -223,7 +202,6 @@ done_flushing:
|
||||
SYM(_CPU_Context_restore):
|
||||
save %sp, -CPU_MINIMUM_STACK_FRAME_SIZE, %sp
|
||||
rd %psr, %o2
|
||||
GET_SELF_CPU_CONTROL %o3, %o4
|
||||
ba SYM(_CPU_Context_restore_heir)
|
||||
mov %i0, %o1 ! in the delay slot
|
||||
|
||||
@@ -352,7 +330,7 @@ save_isf:
|
||||
st %g1, [%sp + ISF_G1_OFFSET] ! save g1
|
||||
std %g2, [%sp + ISF_G2_OFFSET] ! save g2, g3
|
||||
std %l4, [%sp + ISF_G4_OFFSET] ! save g4, g5 -- see above
|
||||
std %g6, [%sp + ISF_G6_OFFSET] ! save g6, g7
|
||||
st %g7, [%sp + ISF_G7_OFFSET] ! save g7
|
||||
|
||||
std %i0, [%sp + ISF_I0_OFFSET] ! save i0, i1
|
||||
std %i2, [%sp + ISF_I2_OFFSET] ! save i2, i3
|
||||
@@ -370,24 +348,21 @@ save_isf:
|
||||
*
|
||||
* Register usage for this section:
|
||||
*
|
||||
* l5 = per cpu info pointer
|
||||
* l6 = _Thread_Dispatch_disable_level value
|
||||
* l7 = _ISR_Nest_level value
|
||||
*
|
||||
* NOTE: It is assumed that l5 - l7 will be preserved until the ISR
|
||||
* NOTE: It is assumed that l6 - l7 will be preserved until the ISR
|
||||
* nest and thread dispatch disable levels are unnested.
|
||||
*/
|
||||
|
||||
GET_SELF_CPU_CONTROL %l5, %l7
|
||||
|
||||
ld [%l5 + PER_CPU_ISR_NEST_LEVEL], %l7
|
||||
ld [%l5 + PER_CPU_THREAD_DISPATCH_DISABLE_LEVEL], %l6
|
||||
ld [%g6 + PER_CPU_ISR_NEST_LEVEL], %l7
|
||||
ld [%g6 + PER_CPU_THREAD_DISPATCH_DISABLE_LEVEL], %l6
|
||||
|
||||
add %l7, 1, %l7
|
||||
st %l7, [%l5 + PER_CPU_ISR_NEST_LEVEL]
|
||||
st %l7, [%g6 + PER_CPU_ISR_NEST_LEVEL]
|
||||
|
||||
add %l6, 1, %l6
|
||||
st %l6, [%l5 + PER_CPU_THREAD_DISPATCH_DISABLE_LEVEL]
|
||||
st %l6, [%g6 + PER_CPU_THREAD_DISPATCH_DISABLE_LEVEL]
|
||||
|
||||
/*
|
||||
* If ISR nest level was zero (now 1), then switch stack.
|
||||
@@ -405,7 +380,7 @@ save_isf:
|
||||
nop
|
||||
#endif
|
||||
|
||||
ld [%l5 + PER_CPU_INTERRUPT_STACK_HIGH], %sp
|
||||
ld [%g6 + PER_CPU_INTERRUPT_STACK_HIGH], %sp
|
||||
|
||||
dont_switch_stacks:
|
||||
/*
|
||||
@@ -468,7 +443,7 @@ dont_fix_pil2:
|
||||
ld [%l4], %o2 ! o2 = 3rd arg = interrupt exit instant
|
||||
mov %l3, %o1 ! o1 = 2nd arg = interrupt entry instant
|
||||
call SYM(_Profiling_Outer_most_interrupt_entry_and_exit), 0
|
||||
mov %l5, %o0 ! o0 = 1st arg = per-CPU control
|
||||
mov %g6, %o0 ! o0 = 1st arg = per-CPU control
|
||||
profiling_not_outer_most_exit:
|
||||
#else
|
||||
nop ! delay slot
|
||||
@@ -489,15 +464,14 @@ profiling_not_outer_most_exit:
|
||||
*
|
||||
* Register usage for this section:
|
||||
*
|
||||
* l5 = per cpu info pointer
|
||||
* l6 = _Thread_Dispatch_disable_level value
|
||||
* l7 = _ISR_Nest_level value
|
||||
*/
|
||||
|
||||
st %l7, [%l5 + PER_CPU_ISR_NEST_LEVEL]
|
||||
st %l7, [%g6 + PER_CPU_ISR_NEST_LEVEL]
|
||||
|
||||
sub %l6, 1, %l6
|
||||
st %l6, [%l5 + PER_CPU_THREAD_DISPATCH_DISABLE_LEVEL]
|
||||
st %l6, [%g6 + PER_CPU_THREAD_DISPATCH_DISABLE_LEVEL]
|
||||
|
||||
/*
|
||||
* If dispatching is disabled (includes nested interrupt case),
|
||||
@@ -509,7 +483,7 @@ profiling_not_outer_most_exit:
|
||||
nop
|
||||
|
||||
! Are we dispatching from a previous ISR in the interrupted thread?
|
||||
ld [%l5 + SPARC_PER_CPU_ISR_DISPATCH_DISABLE], %l7
|
||||
ld [%g6 + SPARC_PER_CPU_ISR_DISPATCH_DISABLE], %l7
|
||||
orcc %l7, %g0, %g0 ! Is this thread already doing an ISR?
|
||||
bnz simple_return ! Yes, then do a "simple" exit
|
||||
nop
|
||||
@@ -520,7 +494,7 @@ profiling_not_outer_most_exit:
|
||||
* return to the interrupt dispatcher.
|
||||
*/
|
||||
|
||||
ldub [%l5 + PER_CPU_DISPATCH_NEEDED], %l6
|
||||
ldub [%g6 + PER_CPU_DISPATCH_NEEDED], %l6
|
||||
|
||||
orcc %l6, %g0, %g0 ! Is thread switch necessary?
|
||||
bz simple_return ! no, then do a simple return
|
||||
@@ -532,7 +506,7 @@ profiling_not_outer_most_exit:
|
||||
|
||||
! Set ISR dispatch nesting prevention flag
|
||||
mov 1,%l6
|
||||
st %l6, [%l5 + SPARC_PER_CPU_ISR_DISPATCH_DISABLE]
|
||||
st %l6, [%g6 + SPARC_PER_CPU_ISR_DISPATCH_DISABLE]
|
||||
|
||||
/*
|
||||
* The following subtract should get us back on the interrupted
|
||||
@@ -569,9 +543,7 @@ isr_dispatch:
|
||||
* _Thread_Dispatch before leaving this ISR Dispatch context.
|
||||
*/
|
||||
|
||||
GET_SELF_CPU_CONTROL %l5, %l7
|
||||
|
||||
ldub [%l5 + PER_CPU_DISPATCH_NEEDED], %l7
|
||||
ldub [%g6 + PER_CPU_DISPATCH_NEEDED], %l7
|
||||
|
||||
orcc %l7, %g0, %g0 ! Is thread switch necesary?
|
||||
bz allow_nest_again ! No, then clear out and return
|
||||
@@ -587,7 +559,7 @@ dispatchAgain:
|
||||
allow_nest_again:
|
||||
|
||||
! Zero out ISR stack nesting prevention flag
|
||||
st %g0, [%l5 + SPARC_PER_CPU_ISR_DISPATCH_DISABLE]
|
||||
st %g0, [%g6 + SPARC_PER_CPU_ISR_DISPATCH_DISABLE]
|
||||
|
||||
/*
|
||||
* The CWP in place at this point may be different from
|
||||
@@ -619,7 +591,7 @@ simple_return:
|
||||
! g1 is restored later
|
||||
ldd [%fp + ISF_G2_OFFSET], %g2 ! restore g2, g3
|
||||
ldd [%fp + ISF_G4_OFFSET], %g4 ! restore g4, g5
|
||||
ldd [%fp + ISF_G6_OFFSET], %g6 ! restore g6, g7
|
||||
ld [%fp + ISF_G7_OFFSET], %g7 ! restore g7
|
||||
|
||||
ldd [%fp + ISF_I0_OFFSET], %i0 ! restore i0, i1
|
||||
ldd [%fp + ISF_I2_OFFSET], %i2 ! restore i2, i3
|
||||
|
||||
@@ -222,6 +222,9 @@ SYM(hard_reset):
|
||||
nop
|
||||
nop
|
||||
|
||||
sethi %hi(_Per_CPU_Information), %g6 ! get per-CPU control
|
||||
add %g6, %lo(_Per_CPU_Information), %g6
|
||||
|
||||
#if defined(START_LEON3_ENABLE_SMP)
|
||||
rd %asr17, %o0 ! get CPU identifier
|
||||
srl %o0, LEON3_ASR17_PROCESSOR_INDEX_SHIFT, %o0
|
||||
@@ -230,12 +233,10 @@ SYM(hard_reset):
|
||||
beq cpu0
|
||||
nop
|
||||
|
||||
sethi %hi(_Per_CPU_Information), %o1 ! get per-CPU control
|
||||
add %o1, %lo(_Per_CPU_Information), %o1
|
||||
sll %o0, PER_CPU_CONTROL_SIZE_LOG2, %o2
|
||||
add %o1, %o2, %o1
|
||||
sll %o0, PER_CPU_CONTROL_SIZE_LOG2, %l0
|
||||
add %g6, %l0, %g6
|
||||
|
||||
ld [%o1 + PER_CPU_INTERRUPT_STACK_HIGH], %sp ! set stack pointer
|
||||
ld [%g6 + PER_CPU_INTERRUPT_STACK_HIGH], %sp ! set stack pointer
|
||||
sub %sp, 4, %sp ! stack starts at end of area - 4
|
||||
andn %sp, 0x0f, %sp ! align stack on 16-byte boundary
|
||||
mov %sp, %fp ! set frame pointer
|
||||
@@ -247,8 +248,8 @@ SYM(hard_reset):
|
||||
cpu0:
|
||||
#endif
|
||||
|
||||
set (SYM(rdb_start)), %g6 ! End of RAM
|
||||
st %sp, [%g6]
|
||||
set (SYM(rdb_start)), %g5 ! End of RAM
|
||||
st %sp, [%g5]
|
||||
sub %sp, 4, %sp ! stack starts at end of RAM - 4
|
||||
andn %sp, 0x0f, %sp ! align stack on 16-byte boundary
|
||||
mov %sp, %fp ! Set frame pointer
|
||||
@@ -300,12 +301,12 @@ cpu0:
|
||||
set SYM(RAM_START), %l1 ! Cannot use RAM_END due to bug in linker
|
||||
set SYM(RAM_SIZE), %l2
|
||||
add %l1, %l2, %sp
|
||||
st %sp, [%g6]
|
||||
st %sp, [%g5]
|
||||
|
||||
|
||||
set SYM(CLOCK_SPEED), %g6 ! Use 14 MHz in simulator
|
||||
set SYM(CLOCK_SPEED), %g5 ! Use 14 MHz in simulator
|
||||
set 14, %g1
|
||||
st %g1, [%g6]
|
||||
st %g1, [%g5]
|
||||
|
||||
2:
|
||||
#endif
|
||||
@@ -332,8 +333,8 @@ cpu0:
|
||||
nop
|
||||
|
||||
copy_data:
|
||||
ldd [ %g2 ], %g6
|
||||
std %g6 , [ %g3 ] ! copy this double word
|
||||
ldd [ %g2 ], %g5
|
||||
std %g5 , [ %g3 ] ! copy this double word
|
||||
add %g3, 8, %g3 ! bump the destination pointer
|
||||
add %g2, 8, %g2 ! bump the source pointer
|
||||
cmp %g3, %g4 ! Is the pointer past the end of dest?
|
||||
|
||||
@@ -36,7 +36,6 @@ RTEMS_STATIC_ASSERT(
|
||||
)
|
||||
|
||||
SPARC_ASSERT_OFFSET(g5, G5);
|
||||
SPARC_ASSERT_OFFSET(g6, G6);
|
||||
SPARC_ASSERT_OFFSET(g7, G7);
|
||||
|
||||
RTEMS_STATIC_ASSERT(
|
||||
|
||||
@@ -408,14 +408,14 @@ typedef struct {
|
||||
* The registers g2 through g4 are reserved for applications. GCC uses them as
|
||||
* volatile registers by default. So they are treated like volatile registers
|
||||
* in RTEMS as well.
|
||||
*
|
||||
* The register g6 contains the per-CPU control of the current processor. It
|
||||
* is an invariant of the processor context. This register must not be saved
|
||||
* and restored during context switches or interrupt services.
|
||||
*/
|
||||
typedef struct {
|
||||
/** This will contain reserved space for alignment. */
|
||||
uint32_t reserved_for_alignment;
|
||||
/** This will contain the contents of the g5 register. */
|
||||
uint32_t g5;
|
||||
/** This will contain the contents of the g6 register. */
|
||||
uint32_t g6;
|
||||
/** This will contain the contents of the g7 register. */
|
||||
uint32_t g7;
|
||||
|
||||
@@ -490,55 +490,53 @@ typedef struct {
|
||||
*/
|
||||
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define G5_OFFSET 0x04
|
||||
#define G5_OFFSET 0x00
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define G6_OFFSET 0x08
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define G7_OFFSET 0x0C
|
||||
#define G7_OFFSET 0x04
|
||||
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define L0_OFFSET 0x10
|
||||
#define L0_OFFSET 0x08
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define L1_OFFSET 0x14
|
||||
#define L1_OFFSET 0x0C
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define L2_OFFSET 0x18
|
||||
#define L2_OFFSET 0x10
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define L3_OFFSET 0x1C
|
||||
#define L3_OFFSET 0x14
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define L4_OFFSET 0x20
|
||||
#define L4_OFFSET 0x18
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define L5_OFFSET 0x24
|
||||
#define L5_OFFSET 0x1C
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define L6_OFFSET 0x28
|
||||
#define L6_OFFSET 0x20
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define L7_OFFSET 0x2C
|
||||
#define L7_OFFSET 0x24
|
||||
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define I0_OFFSET 0x30
|
||||
#define I0_OFFSET 0x28
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define I1_OFFSET 0x34
|
||||
#define I1_OFFSET 0x2C
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define I2_OFFSET 0x38
|
||||
#define I2_OFFSET 0x30
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define I3_OFFSET 0x3C
|
||||
#define I3_OFFSET 0x34
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define I4_OFFSET 0x40
|
||||
#define I4_OFFSET 0x38
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define I5_OFFSET 0x44
|
||||
#define I5_OFFSET 0x3C
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define I6_FP_OFFSET 0x48
|
||||
#define I6_FP_OFFSET 0x40
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define I7_OFFSET 0x4C
|
||||
#define I7_OFFSET 0x44
|
||||
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define O6_SP_OFFSET 0x50
|
||||
#define O6_SP_OFFSET 0x48
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define O7_OFFSET 0x54
|
||||
#define O7_OFFSET 0x4C
|
||||
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define PSR_OFFSET 0x58
|
||||
#define PSR_OFFSET 0x50
|
||||
/** This macro defines an offset into the context for use in assembly. */
|
||||
#define ISR_DISPATCH_DISABLE_STACK_OFFSET 0x5C
|
||||
#define ISR_DISPATCH_DISABLE_STACK_OFFSET 0x54
|
||||
|
||||
/** This defines the size of the context area for use in assembly. */
|
||||
#define CONTEXT_CONTROL_SIZE 0x68
|
||||
@@ -661,8 +659,8 @@ typedef struct {
|
||||
uint32_t g4;
|
||||
/** This is the offset of the g5 register on an ISF. */
|
||||
uint32_t g5;
|
||||
/** This is the offset of the g6 register on an ISF. */
|
||||
uint32_t g6;
|
||||
/** This is the offset is reserved for alignment on an ISF. */
|
||||
uint32_t reserved_for_alignment;
|
||||
/** This is the offset of the g7 register on an ISF. */
|
||||
uint32_t g7;
|
||||
/** This is the offset of the i0 register on an ISF. */
|
||||
@@ -712,8 +710,6 @@ typedef struct {
|
||||
/** This macro defines an offset into the ISF for use in assembly. */
|
||||
#define ISF_G5_OFFSET CPU_MINIMUM_STACK_FRAME_SIZE + 0x1c
|
||||
/** This macro defines an offset into the ISF for use in assembly. */
|
||||
#define ISF_G6_OFFSET CPU_MINIMUM_STACK_FRAME_SIZE + 0x20
|
||||
/** This macro defines an offset into the ISF for use in assembly. */
|
||||
#define ISF_G7_OFFSET CPU_MINIMUM_STACK_FRAME_SIZE + 0x24
|
||||
/** This macro defines an offset into the ISF for use in assembly. */
|
||||
#define ISF_I0_OFFSET CPU_MINIMUM_STACK_FRAME_SIZE + 0x28
|
||||
@@ -1156,6 +1152,14 @@ void _CPU_Context_restore(
|
||||
Context_Control *new_context
|
||||
) RTEMS_COMPILER_NO_RETURN_ATTRIBUTE;
|
||||
|
||||
/**
|
||||
* @brief The pointer to the current per-CPU control is available via register
|
||||
* g6.
|
||||
*/
|
||||
register struct Per_CPU_Control *_SPARC_Per_CPU_current asm( "g6" );
|
||||
|
||||
#define _CPU_Get_current_per_CPU_control() ( _SPARC_Per_CPU_current )
|
||||
|
||||
#if defined(RTEMS_SMP)
|
||||
uint32_t _CPU_SMP_Initialize( void );
|
||||
|
||||
|
||||
@@ -401,6 +401,11 @@ The registers g2 through g4 are reserved for applications. GCC uses them as
|
||||
volatile registers by default. So they are treated like volatile registers in
|
||||
RTEMS as well.
|
||||
|
||||
The register g6 is reserved for the operating system and contains the address
|
||||
of the per-CPU control block of the current processor. This register is
|
||||
initialized during system start and then remains unchanged. It is not
|
||||
saved/restored by the context switch or interrupt processing code.
|
||||
|
||||
The register g7 is reserved for the operating system and contains the thread
|
||||
pointer used for thread-local storage (TLS) as mandated by the SPARC ABI.
|
||||
|
||||
|
||||
Reference in New Issue
Block a user