cpu/x86/mp_init: Use clflush to write SIPI data back to RAM

Improve boot time performances by replacing the wbinvd instruction
with multiple clflush to ensure that the SIPI data is written back to
RAM.

According to some experimental measurements, the wbinvd execution
takes between 1.6 up and 6 milliseconds to complete. In the case of
the SIPI data, wbinvd unnecessarily flushes and invalidates the entire
cache. Indeed, the SIPI module is quite small (about 400 bytes) and
cflush'ing the associated cache lines is almost instantaneous,
typically less than 100 microseconds.

BUG=b/260455826
TEST=Successful boot on Skolas and Rex board

Change-Id: I0e00db8eaa6a3cb41bec3422572c8f2a9bec4057
Signed-off-by: Jeremy Compostella <jeremy.compostella@intel.com>
Suggested-by: Erin Park <erin.park@intel.com>
Reviewed-on: https://review.coreboot.org/c/coreboot/+/75391
Reviewed-by: Kyösti Mälkki <kyosti.malkki@gmail.com>
Tested-by: build bot (Jenkins) <no-reply@coreboot.org>
Reviewed-by: Arthur Heymans <arthur@aheymans.xyz>
This commit is contained in:
Jeremy Compostella 2023-05-22 17:38:10 -07:00 committed by Martin L Roth
parent f167df4d3f
commit 4a2ce029fb
3 changed files with 14 additions and 11 deletions

View file

@ -12,16 +12,11 @@ bool clflush_supported(void)
return (cpuid_edx(1) >> CPUID_FEATURE_CLFLUSH_BIT) & 1;
}
static void clflush_region(const uintptr_t start, const size_t size)
void clflush_region(const uintptr_t start, const size_t size)
{
uintptr_t addr;
const size_t cl_size = ((cpuid_ebx(1) >> 8) & 0xff) * 8;
if (!clflush_supported()) {
printk(BIOS_DEBUG, "Not flushing cache to RAM, CLFLUSH not supported\n");
return;
}
printk(BIOS_SPEW, "CLFLUSH [0x%lx, 0x%lx]\n", start, start + size);
for (addr = ALIGN_DOWN(start, cl_size); addr < start + size; addr += cl_size)
@ -54,5 +49,8 @@ void arch_segment_loaded(uintptr_t start, size_t size, int flags)
if (!cbmem_online())
return;
clflush_region(start, size);
if (clflush_supported())
clflush_region(start, size);
else
printk(BIOS_DEBUG, "Not flushing cache to RAM, CLFLUSH not supported\n");
}

View file

@ -364,6 +364,13 @@ static atomic_t *load_sipi_vector(struct mp_params *mp_params)
ap_count = &sp->ap_count;
atomic_set(ap_count, 0);
/* Make sure SIPI data hits RAM so the APs that come up will see the
startup code even if the caches are disabled. */
if (clflush_supported())
clflush_region((uintptr_t)mod_loc, module_size);
else
wbinvd();
return ap_count;
}
@ -626,10 +633,6 @@ static enum cb_err mp_init(struct bus *cpu_bus, struct mp_params *p)
if (ap_count == NULL)
return CB_ERR;
/* Make sure SIPI data hits RAM so the APs that come up will see
* the startup code even if the caches are disabled. */
wbinvd();
/* Start the APs providing number of APs and the cpus_entered field. */
global_num_aps = p->num_cpus - 1;
if (start_aps(cpu_bus, global_num_aps, ap_count) != CB_SUCCESS) {

View file

@ -13,6 +13,7 @@
#if !defined(__ASSEMBLER__)
#include <stdbool.h>
#include <stddef.h>
static inline void wbinvd(void)
{
@ -30,6 +31,7 @@ static inline void clflush(void *addr)
}
bool clflush_supported(void);
void clflush_region(const uintptr_t start, const size_t size);
/* The following functions require the __always_inline due to AMD
* function STOP_CAR_AND_CPU that disables cache as