Commit ad9cdf41 authored by Jeffrey Lee's avatar Jeffrey Lee
Browse files

Add support for Cortex cache type. Extend ARM_Analyse to, where appropriate,...

Add support for Cortex cache type. Extend ARM_Analyse to, where appropriate, use CPU feature registers to identify CPU capabilities.

  s/ARMops - Support for Cortex multi-level cache (CT_ctype_WB_CR7_Lx). New ARM_Analyse_Fancy to identify CPU capabilities using feature registers.
  s/HAL - Modify pre-ARMop cache code to handle Cortex-syle caches.
  s/MemInfo - Replace ARM_flush_TLB macro call with appropriate ARMop to provide Cortex compatability
  hdr/ARMops - Update list of ARM architectures
  hdr/CoPro15ops - Deprecate ARM_flush_* macros for HAL kernels, as they are no longer capable of flushing all cache types. ARMops should be used instead.
  hdr/KernelWS - Add storage space for multi-level cache properties required for new cache cleaning code.
  Tested under qemu-omap3. Still unable to verify on real hardware due to lack of appropriate MMU code. However new OMAP3 HAL code that uses similar cache management functions appears to work fine on real hardware.

Version 5.35, Tagged as 'Kernel-5_35-4_79_2_98_2_2'
parent e2262380
......@@ -13,11 +13,11 @@
GBLS Module_ComponentPath
Module_MajorVersion SETS "5.35"
Module_Version SETA 535
Module_MinorVersion SETS ""
Module_Date SETS "01 Feb 2009"
Module_ApplicationDate SETS "01-Feb-09"
Module_MinorVersion SETS ""
Module_Date SETS "21 Feb 2009"
Module_ApplicationDate SETS "21-Feb-09"
Module_ComponentName SETS "Kernel"
Module_ComponentPath SETS "castle/RiscOS/Sources/Kernel"
Module_FullVersion SETS "5.35 ("
Module_HelpVersion SETS "5.35 (01 Feb 2009)"
Module_FullVersion SETS "5.35 ("
Module_HelpVersion SETS "5.35 (21 Feb 2009)"
......@@ -5,19 +5,19 @@
#define Module_MajorVersion_CMHG 5.35
#define Module_MinorVersion_CMHG
#define Module_Date_CMHG 01 Feb 2009
#define Module_MinorVersion_CMHG
#define Module_Date_CMHG 21 Feb 2009
#define Module_MajorVersion "5.35"
#define Module_Version 535
#define Module_MinorVersion ""
#define Module_Date "01 Feb 2009"
#define Module_MinorVersion ""
#define Module_Date "21 Feb 2009"
#define Module_ApplicationDate "01-Feb-09"
#define Module_ApplicationDate "21-Feb-09"
#define Module_ComponentName "Kernel"
#define Module_ComponentPath "castle/RiscOS/Sources/Kernel"
#define Module_FullVersion "5.35 ("
#define Module_HelpVersion "5.35 (01 Feb 2009)"
#define Module_FullVersion "5.35 ("
#define Module_HelpVersion "5.35 (21 Feb 2009)"
#define Module_LibraryVersionInfo "5:35"
......@@ -13,13 +13,15 @@
; limitations under the License.
ARMv3 * 0
ARMv4 * 1
ARMv4T * 2
ARMv5 * 3
ARMv5T * 4
ARMv5TE * 5
ARMvF * &F ; 'Fancy' ARM that describes its features in the feature registers
ARMv3 * 0
ARMv4 * 1
ARMv4T * 2
ARMv5 * 3
ARMv5T * 4
ARMv5TE * 5
ARMv5TEJ * 6
ARMv6 * 7
ARMvF * &F ; 'Fancy' ARM that describes its features in the feature registers (Cortex/ARMv7 and above?)
^ 0
ARM600 # 1
......@@ -22,6 +22,9 @@
; 07-10-96 MJS Updated for proper ARM 810 support (not needed for RO 3.70)
; 10-03-97 MJS A few additions for chocolate flavour screen handling (possible
; Domain and FSR register use) in Phoebe OS
; 05-02-09 JL Disable ARM_flush_* when compiling OS for HAL. OS now supports
; too many ARM versions for cache/TLB flushing to be implemented in
; simple macros.
ARM_config_cp CP 15 ;coprocessor number for configuration control
......@@ -51,7 +54,7 @@ ARM8_CTC_reg CN 15 ;Clock and test configuration
ARMA_TCI_reg CN 15 ;Test,Clock and Idle control
;so that AASM will accept the general value for MCR CRm field
;so that bleedin' AASM will accept the general value for MCR CRm field
C0 CN 0
C1 CN 1
C2 CN 2
......@@ -161,6 +164,7 @@ C15 CN 15
TEQ$cond $tmp,#1
;flush whole TLB (both data and instruction for StrongARM)
;trashes $temp
......@@ -200,6 +204,7 @@ C15 CN 15
MCREQ ARM_config_cp,0,R0,ARM8A_cache_reg,C7,0
MCREQ ARM_config_cp,0,R0,ARM8A_TLB_reg,C7,0
; -------------- ARM 6,7 only --------------------------------------------
......@@ -1297,6 +1297,9 @@ MMUControlSoftCopy # 4 ; Soft copy of ARM control register
DeviceCount # 4 ; size of our table of devices in the system heap
DeviceTable # 4 ; pointer to table
Cache_Lx_Info # 4 ; Cache level ID register
Cache_Lx_DTable # 4*8 ; Data/unified cache layout for all 8 levels
Cache_Lx_ITable # 4*8 ; Instruction cache layout for all 8 levels
AplWorkSize * AppSpaceDANode + DANode_Size
This diff is collapsed.
......@@ -35,39 +35,43 @@ RISCOS_InitARM
MOV a4, lr
; Check if we're architecture 3. If so, don't read the control register.
BL Init_ARMarch
MOVEQ a1, #0
ARM_read_control a1, NE
MOVEQ a3, #0
ARM_read_control a3, NE
; Late abort (ARM6 only), 32-bit Data and Program space. No Write buffer (ARM920T
; spec says W bit should be set, but I reckon they're bluffing).
; The F bit's tricky. (1 => CPCLK=FCLK, 0=>CPCLK=FCLK/2). The only chip using it was the
; ARM700, it never really reached the customer, and it's always been programmed with
; CPCLK=FCLK. Therefore we'll keep it that way, and ignore the layering violation.
; All of these bits should be off already, but just in case...
; Off we go.
ARM_write_control a1
ARM_write_control a3
; In case it wasn't a hard reset
MOV a2, #0
MCR ARM_config_cp,0,a2,ARMv4_cache_reg,C7 ; invalidate I+D caches
CMP a1, #ARMvF
; Assume that all ARMvF ARMs have multi-level caches and thus no single MCR op for invalidating all the caches
MCRNE ARM_config_cp,0,a2,ARMv4_cache_reg,C7 ; invalidate I+D caches
BLEQ HAL_InvalidateCache_ARMvF
CMP a1, #ARMv3
MCREQ ARM_config_cp,0,a2,ARMv3_TLBflush_reg,C0 ; flush TLBs
MCRNE ARM_config_cp,0,a2,ARMv4_TLB_reg,C7 ; flush TLBs
; We assume that ARMs with an I cache can have it enabled while the MMU is off.
[ :LNOT:CacheOff
ORRNE a1, a1, #MMUC_I
ARM_write_control a1, NE ; whoosh
ORRNE a3, a3, #MMUC_I
ARM_write_control a3, NE ; whoosh
; Check if we are in a 26-bit mode.
; Keep a soft copy of the CR in a banked register (R13_und)
MSR CPSR_c, #F32_bit+I32_bit+UND32_mode
MOV sp, a1
MOV sp, a3
; Switch into SVC32 mode (we may have been in SVC26 before).
MSR CPSR_c, #F32_bit+I32_bit+SVC32_mode
......@@ -623,6 +627,7 @@ MMU_activation_zone
MOV a4, a1
BL Init_ARMarch ; corrupts a1 and ip
MOV ip, a1 ; Remember architecture for later
MOV a1, a4
MSREQ CPSR_c, #F32_bit+I32_bit+UND32_mode ; Recover the soft copy of the CR
......@@ -637,20 +642,23 @@ MMU_activation_zone
ARM_MMU_transbase v3 ; Always useful to tell it where L1PT is...
MOV ip, #0
MCREQ p15, 0, ip, c5, c0 ; MMU may already be on (but flat mapped)
MCRNE p15, 0, ip, c8, c7 ; if HAL needed it (eg XScale with ECC)
MOV lr, #0
MCREQ p15, 0, lr, c5, c0 ; MMU may already be on (but flat mapped)
MCRNE p15, 0, lr, c8, c7 ; if HAL needed it (eg XScale with ECC)
; so flush TLBs now
ARM_write_control v5
MOVEQ sp, v5
MSREQ CPSR_c, #F32_bit+I32_bit+SVC32_mode
MOV ip, #0 ; junk MMU-off contents of I-cache
MCR ARM_config_cp,0,ip,ARMv4_cache_reg,C7 ; (works on ARMv3)
CMP ip, #ARMvF
MOV lr, #0 ; junk MMU-off contents of I-cache
MCRNE ARM_config_cp,0,lr,ARMv4_cache_reg,C7 ; (works on ARMv3)
BLEQ HAL_InvalidateCache_ARMvF
MOV ip, #4_0000000000000001 ; domain 0 client only
ARM_MMU_domain ip
; HACK HACK HACK - all domains remain in manager mode
; MOV ip, #4_0000000000000001 ; domain 0 client only
; ARM_MMU_domain ip
; MMU now on. Need to jump to logical copy of ourselves. Complication arises if our
; physical address overlaps our logical address - in that case we need to map
......@@ -774,6 +782,12 @@ MMUon_nol1ptoverlap
CallHAL HAL_Init
[ DebugHALTX
BL DebugHALPrint
= "HAL initialised",0
MOV a1, #ZeroPage
LDR v1, [a1, #InitUsedBlock]
LDR v2, [a1, #InitUsedEnd]
......@@ -963,6 +977,53 @@ MMUon_nol1ptoverlap
; Cache invalidation for ARMs with multiple cache levels, used before ARMop initialisation
; This function gets called before we have a stack set up, so we've got to preserve as many registers as possible
; The only register we can safely change is ip, but we can switch into FIQ mode with interrupts disabled and use the banked registers there
MSR CPSR_c, #F32_bit+I32_bit+FIQ32_mode
MRC p15, 1, r8, c0, c0, 1 ; Cache level ID register
BIC r8, r8, #&FF000000 ; Discard unification/coherency bits
MOV r9, #0 ; Current cache level
TST r8, #7 ; Get flags
BEQ %FT10 ; Cache clean complete
MCR p15, 2, r9, c0, c0, 0 ; Program cache size selection register
MRC p15, 1, r10, c0, c0, 0 ; Get size info
AND r11, r10, #&7 ; log2(Line size)-2
BIC r10, r10, #&F0000007 ; Clear flags & line size
MOV r12, r10, LSL #19 ; Number of ways-1 in upper 10 bits
MOV r10, r10, LSR #13 ; Number of sets-1 in upper 15 bits
; Way number needs to be packed right up at the high end of the data word; shift it up
CLZ r14, r12
MOV r12, r12, LSL r14
; Set number needs to start at log2(Line size)
MOV r10, r10, LSR #15 ; Start at bit 2
MOV r10, r10, LSL r11 ; Start at log2(Line size)
; Now calculate the offset numbers we will use to increment sets & ways
BIC r12, r12, r12, LSL #1 ; Way increment
BIC r11, r10, r10, LSL #1 ; Set increment
; Now we can finally clean this cache!
ORR r14, r9, r10 ; Current way (0), set (max), and level
MCR p15, 0, r14, c7, c6, 2 ; Invalidate
ADDS r14, r14, r12 ; Increment way
BCC %BT30 ; Overflow will occur once ways are enumerated
TST r14, r10 ; Are set bits all zero?
SUBNE r14, r14, r11 ; No, so decrement set and loop around again
; This cache is now clean. Move on to the next level.
ADD r9, r9, #2
MOVS r8, r8, LSR #3
; All caches clean; switch back to SVC, then recover the stored PSR from ip (although we can be fairly certain we started in SVC anyway)
MSR CPSR_c, #F32_bit+I32_bit+SVC32_mode
MSR CPSR_cxsf, ip
MOV pc, lr
CountPageTablePages ROUT
MOV a1, #ZeroPage
LDR a2, =CAM
......@@ -1504,7 +1565,9 @@ Init_PageTablesChanged
MOV ip, #0
MCREQ ARM_config_cp,0,ip,ARMv3_TLBflush_reg,C0
MCRNE ARM_config_cp,0,ip,ARMv4_TLB_reg,C7
MCR ARM_config_cp,0,ip,ARMv4_cache_reg,C7 ; works on ARMv3
CMP a1, #ARMvF
MCRNE ARM_config_cp,0,ip,ARMv4_cache_reg,C7 ; works on ARMv3
BLEQ HAL_InvalidateCache_ARMvF
MOV pc, a3
......@@ -872,7 +872,14 @@ MemoryFreePoolLock ROUT
;flush TLB(s) for resume - needed for Wimp resume, precaution for other - no cache flush
;since Free Pool is uncached
Push "r0"
MOV r0,#ZeroPage
ARMop TLB_InvalidateAll,,,r0
Pull "r0"
ARM_flush_TLB r2
TST r0,#&100 ;is it Wimp?
MOVEQ r2,#VRRc_suspend
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment