mirror of
https://source.denx.de/u-boot/u-boot.git
synced 2025-10-24 05:51:33 +02:00
Newer Intel SoCs have different ways of setting up cache-as-ram (CAR). Add support for these along with suitable configuration options. To make the code cleaner, adjust a few definitions in processor.h so that they can be used from assembler. Signed-off-by: Simon Glass <sjg@chromium.org> Reviewed-by: Bin Meng <bmeng.cn@gmail.com>
449 lines
9.9 KiB
ArmAsm
449 lines
9.9 KiB
ArmAsm
/* SPDX-License-Identifier: GPL-2.0 */
|
|
/*
|
|
* This file was modified from the coreboot version.
|
|
*
|
|
* Copyright (C) 2015-2016 Intel Corp.
|
|
*/
|
|
|
|
#include <config.h>
|
|
#include <asm/msr-index.h>
|
|
#include <asm/mtrr.h>
|
|
#include <asm/post.h>
|
|
#include <asm/processor.h>
|
|
#include <asm/processor-flags.h>
|
|
|
|
#define KiB 1024

/*
 * Evaluates to non-zero when x has exactly one bit set.
 *
 * Zero is rejected explicitly: without the (x) != 0 term the expression
 * is true for 0, which would let a zero CONFIG_DCACHE_RAM_SIZE pass the
 * power-of-two check below instead of hitting the #error. The expression
 * only uses operators that are valid in a preprocessor #if.
 */
#define IS_POWER_OF_2(x) ((x) != 0 && !((x) & ((x) - 1)))
|
|
|
|
/*
 * car_init - program the MTRRs for cache-as-RAM (CAR) and hand off to the
 * CAR mechanism selected at build time.
 *
 * Steps, in order:
 *   1. Warm-reset through IO_PORT_RESET if the MTRR default-type MSR still
 *      has one of its enable bits set.
 *   2. Zero every fixed-range MTRR named in fixed_mtrr_list and every
 *      variable-range MTRR pair counted by MTRR_CAP_MSR.
 *   3. Set the default memory type to uncacheable with the MTRRs disabled.
 *   4. Describe CONFIG_DCACHE_RAM_SIZE bytes at CONFIG_DCACHE_RAM_BASE as
 *      write-back, using variable MTRR 0 (plus MTRR 1 for the 768 KiB
 *      layout).
 *   5. Enable the variable MTRRs, clear CR0.CD and CR0.NW, then jump to
 *      car_nem, car_cqos or car_nem_enhanced.
 *
 * Control leaves by a jump, never by ret. The instructions written out
 * here make no stack access (the post_code() macro is defined elsewhere
 * and is not covered by this statement).
 *
 * Registers written here: eax, ebx, ecx, edx, esi and the flags.
 */
.global car_init
car_init:
	post_code(POST_CAR_START)

	/*
	 * Use the MTRR default type MSR as a proxy for detecting INIT#.
	 * Reset the system if any known bits are set in that MSR. That is
	 * an indication of the CPU not being properly reset.
	 */
check_for_clean_reset:
	mov	$MTRR_DEF_TYPE_MSR, %ecx
	rdmsr
	and	$(MTRR_DEF_TYPE_EN | MTRR_DEF_TYPE_FIX_EN), %eax
	cmp	$0, %eax
	jz	no_reset
	/* Perform warm reset */
	movw	$IO_PORT_RESET, %dx
	movb	$(SYS_RST | RST_CPU), %al
	outb	%al, %dx

no_reset:
	post_code(POST_CAR_SIPI)

	/*
	 * Clear/disable fixed MTRRs. ebx is a byte offset that walks
	 * fixed_mtrr_list from its end towards its start, one 16-bit MSR
	 * number at a time; eax and edx stay zero as the value written.
	 */
	mov	$fixed_mtrr_list_size, %ebx
	xor	%eax, %eax
	xor	%edx, %edx

clear_fixed_mtrr:
	add	$-2, %ebx
	movzwl	fixed_mtrr_list(%ebx), %ecx
	wrmsr
	/*
	 * This tests the ZF produced by the add above: movzwl and wrmsr do
	 * not modify the flags. Do not insert flag-changing instructions
	 * between the add and this branch.
	 */
	jnz	clear_fixed_mtrr

	post_code(POST_CAR_MTRR)

	/* Figure out how many MTRRs we have, and clear them out */
	mov	$MTRR_CAP_MSR, %ecx
	rdmsr
	movzb	%al, %ebx	/* Number of variable MTRRs */
	mov	$MTRR_PHYS_BASE_MSR(0), %ecx
	xor	%eax, %eax
	xor	%edx, %edx

	/* Two consecutive MSRs are zeroed per iteration, ebx counts pairs */
clear_var_mtrr:
	wrmsr
	inc	%ecx
	wrmsr
	inc	%ecx
	dec	%ebx
	jnz	clear_var_mtrr

	post_code(POST_CAR_UNCACHEABLE)

	/* Configure default memory type to uncacheable (UC) */
	mov	$MTRR_DEF_TYPE_MSR, %ecx
	rdmsr
	/* Clear enable bits and set default type to UC */
	and	$~(MTRR_DEF_TYPE_MASK | MTRR_DEF_TYPE_EN | \
		 MTRR_DEF_TYPE_FIX_EN), %eax
	wrmsr

	/*
	 * Configure MTRR_PHYS_MASK_HIGH for proper addressing above 4GB
	 * based on the physical address size supported for this processor
	 * This is based on read from CPUID EAX = 080000008h, EAX bits [7:0]
	 *
	 * Examples:
	 *  MTRR_PHYS_MASK_HIGH = 00000000Fh  For 36 bit addressing
	 *  MTRR_PHYS_MASK_HIGH = 0000000FFh  For 40 bit addressing
	 */

	movl	$0x80000008, %eax	/* Address sizes leaf */
	cpuid
	sub	$32, %al		/* address bits above bit 31 */
	movzx	%al, %eax
	xorl	%esi, %esi
	bts	%eax, %esi		/* esi = 1 << (address bits - 32) */
	dec	%esi			/* esi <- MTRR_PHYS_MASK_HIGH */

	post_code(POST_CAR_BASE_ADDRESS)

#if IS_POWER_OF_2(CONFIG_DCACHE_RAM_SIZE)
	/* Configure CAR region as write-back (WB) */
	mov	$MTRR_PHYS_BASE_MSR(0), %ecx
	mov	$CONFIG_DCACHE_RAM_BASE, %eax
	or	$MTRR_TYPE_WRBACK, %eax
	xor	%edx,%edx
	wrmsr

	/*
	 * Configure the MTRR mask for the size region. The register is named
	 * with MTRR_PHYS_MASK_MSR(), the same macro the 768 KiB branch below
	 * uses for its mask registers.
	 */
	mov	$MTRR_PHYS_MASK_MSR(0), %ecx
	mov	$CONFIG_DCACHE_RAM_SIZE, %eax	/* size mask */
	dec	%eax
	not	%eax
	or	$MTRR_PHYS_MASK_VALID, %eax
	movl	%esi, %edx	/* edx <- MTRR_PHYS_MASK_HIGH */
	wrmsr
#elif (CONFIG_DCACHE_RAM_SIZE == 768 * KiB) /* 768 KiB */
	/*
	 * 768 KiB is not a power of two, so it is covered by two ranges:
	 * 512 KiB in variable MTRR 0 followed by 256 KiB in variable MTRR 1.
	 */
	/* Configure CAR region as write-back (WB) */
	mov	$MTRR_PHYS_BASE_MSR(0), %ecx
	mov	$CONFIG_DCACHE_RAM_BASE, %eax
	or	$MTRR_TYPE_WRBACK, %eax
	xor	%edx,%edx
	wrmsr

	mov	$MTRR_PHYS_MASK_MSR(0), %ecx
	mov	$(512 * KiB), %eax	/* size mask */
	dec	%eax
	not	%eax
	or	$MTRR_PHYS_MASK_VALID, %eax
	movl	%esi, %edx	/* edx <- MTRR_PHYS_MASK_HIGH */
	wrmsr

	mov	$MTRR_PHYS_BASE_MSR(1), %ecx
	mov	$(CONFIG_DCACHE_RAM_BASE + 512 * KiB), %eax
	or	$MTRR_TYPE_WRBACK, %eax
	xor	%edx,%edx
	wrmsr

	mov	$MTRR_PHYS_MASK_MSR(1), %ecx
	mov	$(256 * KiB), %eax	/* size mask */
	dec	%eax
	not	%eax
	or	$MTRR_PHYS_MASK_VALID, %eax
	movl	%esi, %edx	/* edx <- MTRR_PHYS_MASK_HIGH */
	wrmsr
#else
#error "DCACHE_RAM_SIZE is not a power of 2 and setup code is missing"
#endif
	post_code(POST_CAR_FILL)

	/* Enable variable MTRRs */
	mov	$MTRR_DEF_TYPE_MSR, %ecx
	rdmsr
	or	$MTRR_DEF_TYPE_EN, %eax
	wrmsr

	/* Enable caching */
	mov	%cr0, %eax
	and	$~(X86_CR0_CD | X86_CR0_NW), %eax
	invd
	mov	%eax, %cr0

#if IS_ENABLED(CONFIG_INTEL_CAR_NEM)
	jmp	car_nem
#elif IS_ENABLED(CONFIG_INTEL_CAR_CQOS)
	jmp	car_cqos
#elif IS_ENABLED(CONFIG_INTEL_CAR_NEM_ENHANCED)
	jmp	car_nem_enhanced
#else
#error "No CAR mechanism selected"
#endif
	/* Not reached: every branch above either jumps away or stops the build */
	jmp	car_init_ret
|
|
|
|
/*
 * MSR numbers of the fixed-range MTRRs, one 16-bit entry each. car_init
 * indexes this table by byte offset, starting from fixed_mtrr_list_size
 * and stepping down by two.
 */
fixed_mtrr_list:
	/* 64K and 16K ranges */
	.word	MTRR_FIX_64K_00000_MSR
	.word	MTRR_FIX_16K_80000_MSR, MTRR_FIX_16K_A0000_MSR
	/* 4K ranges */
	.word	MTRR_FIX_4K_C0000_MSR, MTRR_FIX_4K_C8000_MSR
	.word	MTRR_FIX_4K_D0000_MSR, MTRR_FIX_4K_D8000_MSR
	.word	MTRR_FIX_4K_E0000_MSR, MTRR_FIX_4K_E8000_MSR
	.word	MTRR_FIX_4K_F0000_MSR, MTRR_FIX_4K_F8000_MSR
	/* Table length in bytes */
	.set	fixed_mtrr_list_size, . - fixed_mtrr_list
|
|
|
|
#if IS_ENABLED(CONFIG_INTEL_CAR_NEM)
|
|
/*
 * car_nem - bring up CAR through MSR_EVICT_CTL.
 *
 * Sets bit 0 of MSR_EVICT_CTL, zero-fills the CAR region (which also
 * pulls it into the cache), sets bit 1 of MSR_EVICT_CTL and jumps to
 * car_init_ret. Registers written here: eax, ecx, edx, edi, flags.
 */
	.globl	car_nem
car_nem:
	/* Setup stage: set bit 0 of the eviction control MSR */
	movl	$MSR_EVICT_CTL, %ecx
	rdmsr
	orl	$0x1, %eax
	wrmsr

	post_code(0x26)

	/*
	 * Zero CONFIG_DCACHE_RAM_SIZE bytes from CONFIG_DCACHE_RAM_BASE, one
	 * 32-bit store at a time. The stores also fill the cache.
	 */
	cld					/* store upwards */
	xorl	%eax, %eax			/* fill value */
	movl	$CONFIG_DCACHE_RAM_BASE, %edi
	movl	$CONFIG_DCACHE_RAM_SIZE, %ecx
	shrl	$0x02, %ecx			/* bytes -> dwords */
	rep	stosl

	post_code(0x27)

	/* Run stage: set bit 1 of the eviction control MSR */
	movl	$MSR_EVICT_CTL, %ecx
	rdmsr
	orl	$0x2, %eax
	wrmsr

	post_code(0x28)

	jmp	car_init_ret
|
|
|
|
#elif IS_ENABLED(CONFIG_INTEL_CAR_CQOS)
|
|
/*
 * car_cqos - bring up CAR using the L2 cache QoS masks.
 *
 * QoS mask 0 is programmed with the bits that will hold CAR and is
 * selected while the region is zero-filled. Mask 1 holds the remaining
 * bits (limited to CBM_LEN_MASK) and is selected afterwards so that the
 * filled lines are not evicted. Ends with a jump to car_init_ret.
 *
 * Registers written here: eax, ebx, ecx, edx, edi, mm3, flags.
 */
	.globl	car_cqos
car_cqos:
	/*
	 * Build CBM_LEN_MASK from CBM_LEN, read from
	 * CPUID.(EAX=10H, ECX=2H):EAX.CBM_LEN[bits 4:0]:
	 *   CBM_LEN_MASK = (1 << (CBM_LEN + 1)) - 1
	 */
	movl	$0x2, %ecx
	movl	$0x10, %eax
	cpuid
	andl	$0x1f, %eax
	incb	%al

	movb	%al, %cl
	movl	$1, %ebx
	shll	%cl, %ebx
	decl	%ebx

	/* Park CBM_LEN_MASK in mm3; ebx is reused before it is needed */
	movd	%ebx, %mm3

	/*
	 * Turn off both the L1 and the L2 prefetcher. For a reason that is not
	 * yet understood, prefetchers slow down filling the cache with
	 * rep stos in CQOS mode.
	 */
	movl	$MSR_PREFETCH_CTL, %ecx
	rdmsr
	orl	$(PREFETCH_L1_DISABLE | PREFETCH_L2_DISABLE), %eax
	wrmsr

#if (CONFIG_DCACHE_RAM_SIZE == CONFIG_L2_CACHE_SIZE)
/*
 * With CAR covering the whole L2 the mask works out as all-zeros, which
 * the CPU/uCode does not support.
 */
#error "CQOS CAR may not use whole L2 cache area"
#endif

	/* Number of mask bits for CAR = CAR size / size covered per bit */
	movl	$CONFIG_CACHE_QOS_SIZE_PER_BIT, %ecx	/* divisor */
	movl	$CONFIG_DCACHE_RAM_SIZE, %eax		/* dividend, low half */
	xorl	%edx, %edx				/* dividend, high half */
	divl	%ecx			/* quotient lands in eax */
	movl	%eax, %ecx		/* shift count for the mask */
	movl	$1, %ebx
	shll	%cl, %ebx
	decl	%ebx			/* resulting mask is in ebx */

	/* Program that mask as QoS mask 0, used for the initial cache fill */
	movl	$MSR_L2_QOS_MASK(0), %ecx
	rdmsr
	movl	%ebx, %eax
	wrmsr

	/* Set the CLOS selector to 0, i.e. select mask 0 */
	movl	$MSR_IA32_PQR_ASSOC, %ecx
	rdmsr
	andl	$~MSR_IA32_PQR_ASSOC_MASK, %edx
	wrmsr

	/* QoS mask 1 is what will block the CAR region from evicts */
	movl	$MSR_L2_QOS_MASK(1), %ecx
	rdmsr
	/* Take the complement of the bits that are used for the cache ... */
	movl	%ebx, %eax
	notl	%eax

	/*
	 * ... and keep only the bits allowed by the Capacity Bit Mask Length,
	 * using CBM_LEN_MASK saved in mm3 earlier.
	 */
	movd	%mm3, %ebx
	andl	%ebx, %eax
	wrmsr

	post_code(0x26)

	/*
	 * Zero CONFIG_DCACHE_RAM_SIZE bytes from CONFIG_DCACHE_RAM_BASE, one
	 * 32-bit store at a time. The stores also fill the cache.
	 */
	cld					/* store upwards */
	xorl	%eax, %eax			/* fill value */
	movl	$CONFIG_DCACHE_RAM_BASE, %edi
	movl	$CONFIG_DCACHE_RAM_SIZE, %ecx
	shrl	$0x02, %ecx			/* bytes -> dwords */
	rep	stosl

	post_code(0x27)

	/* The cache is populated: switch to mask 1, which blocks evicts */
	movl	$MSR_IA32_PQR_ASSOC, %ecx
	rdmsr
	andl	$~MSR_IA32_PQR_ASSOC_MASK, %edx	/* clear index bits first */
	orl	$1, %edx			/* select mask 1 */
	wrmsr

	/* Turn the prefetchers back on */
	movl	$MSR_PREFETCH_CTL, %ecx
	rdmsr
	andl	$~(PREFETCH_L1_DISABLE | PREFETCH_L2_DISABLE), %eax
	wrmsr

	post_code(0x28)

	jmp	car_init_ret
|
|
|
|
#elif IS_ENABLED(CONFIG_INTEL_CAR_NEM_ENHANCED)
|
|
/*
 * car_nem_enhanced - bring up CAR with MSR_EVICT_CTL plus LLC way masks.
 *
 * Finds the last-level cache through CPUID leaf 4, programs
 * MSR_IA32_L3_MASK_1 and MSR_IA32_L3_MASK_2 from its way count, zero-fills
 * the CAR region while way mask 2 is selected, switches to way mask 1 and
 * then sets bit 1 of MSR_EVICT_CTL. Ends with a jump to car_init_ret.
 *
 * Registers written here: eax, ebx, ecx, edx, edi, flags.
 */
	.globl	car_nem_enhanced
car_nem_enhanced:
	/* Setup stage: set bit 0 of the eviction control MSR */
	movl	$MSR_EVICT_CTL, %ecx
	rdmsr
	orl	$0x1, %eax
	wrmsr
	post_code(0x26)

	/*
	 * Create n-way set associativity of cache: walk the CPUID leaf 4
	 * subleaves, with edi as the subleaf index, until the LLC is found.
	 */
	xorl	%edi, %edi
find_llc_subleaf:
	movl	%edi, %ecx
	incl	%edi			/* next subleaf, if this is not it */
	movl	$0x04, %eax
	cpuid
	andb	$0xe0, %al		/* EAX[7:5] = Cache Level */
	cmpb	$0x60, %al		/* Level 3 is treated as the LLC */
	jnz	find_llc_subleaf

	/*
	 * Set MSR 0xC91 IA32_L3_MASK_1 = 0xE/0xFE/0xFFE/0xFFFE
	 * for 4/8/12/16 ways of LLC
	 */
	shrl	$22, %ebx
	incl	%ebx
	/* cl = n-way associativity of the LLC, used as shift count below */
	movb	%bl, %cl

	/*
	 * Maximise RO cacheability while locking the CAR into a single way,
	 * since that particular way will not be a victim candidate for
	 * evictions.
	 * This is done after programming the LLC_WAY_MASK_1 MSR with the
	 * desired LLC ways as described below.
	 *
	 * Hence create Code and Data Size as per request
	 * Code Size (RO) : Up to 16M
	 * Data Size (RW) : Up to 256K
	 */
	movl	$0x01, %eax
	/*
	 * LLC Ways -> LLC_WAY_MASK_1:
	 *  4: 0x000E
	 *  8: 0x00FE
	 * 12: 0x0FFE
	 * 16: 0xFFFE
	 *
	 * These MSRs contain one bit per way of the LLC
	 * - bit is '0': the way is protected from eviction
	 * - bit is '1': the way is not protected from eviction
	 */
	shll	%cl, %eax
	subl	$0x02, %eax		/* (1 << ways) - 2: all ways but way 0 */
	xorl	%edx, %edx
	movl	$MSR_IA32_L3_MASK_1, %ecx
	wrmsr
	/*
	 * Set MSR 0xC92 IA32_L3_MASK_2 = 0x1
	 *
	 * For SKL SOC the data size stays at 256K, hence a 1-way
	 * associative cache is created for data.
	 */
	movl	$MSR_IA32_L3_MASK_2, %ecx
	xorl	%edx, %edx
	movl	$0x01, %eax
	wrmsr
	/*
	 * Set MSR_IA32_PQR_ASSOC = 0x02
	 *
	 * Possible values:
	 * 0: Default value, no way mask should be applied
	 * 1: Apply way mask 1 to LLC
	 * 2: Apply way mask 2 to LLC
	 * 3: Shouldn't be used in NEM Mode
	 */
	movl	$MSR_IA32_PQR_ASSOC, %ecx
	xorl	%edx, %edx
	movl	$0x02, %eax
	wrmsr

	/*
	 * Zero CONFIG_DCACHE_RAM_SIZE bytes from CONFIG_DCACHE_RAM_BASE, one
	 * 32-bit store at a time.
	 */
	cld					/* store upwards */
	xorl	%eax, %eax			/* fill value */
	movl	$CONFIG_DCACHE_RAM_BASE, %edi
	movl	$CONFIG_DCACHE_RAM_SIZE, %ecx
	shrl	$0x02, %ecx			/* bytes -> dwords */
	rep	stosl
	/*
	 * Set MSR_IA32_PQR_ASSOC = 0x01
	 * From here on LLC_WAY_MASK_1 is applied to the cache,
	 * i.e. way 0 is protected from eviction.
	 */
	movl	$MSR_IA32_PQR_ASSOC, %ecx
	xorl	%edx, %edx
	movl	$0x01, %eax
	wrmsr

	post_code(0x27)
	/*
	 * Enter the No-Eviction Mode run state by setting
	 * NO_EVICT_MODE MSR 2E0h bit [1] = '1'.
	 */

	movl	$MSR_EVICT_CTL, %ecx
	rdmsr
	orl	$0x02, %eax
	wrmsr

	post_code(0x28)

	jmp	car_init_ret
|
|
#endif
|
|
|
|
#if CONFIG_IS_ENABLED(X86_16BIT_INIT)
/*
 * Four consecutive 32-bit words: microcode base, microcode size, code
 * region base and code region size. The first two are emitted as zero
 * here and are filled in by binman.
 */
	.global	ucode_base
	.global	ucode_size
_dt_ucode_base_size:
ucode_base:	/* Declared in microcode.h */
	.long	0			/* microcode base */
ucode_size:	/* Declared in microcode.h */
	.long	0			/* microcode size */
	.long	CONFIG_SYS_MONITOR_BASE	/* code region base */
	.long	CONFIG_SYS_MONITOR_LEN	/* code region size */
#endif
|