cpu/x86/smm: allow SSE instructions in SMM modules

If SSE instructions are enabled in the build assume the SMM
modules are compiled with SSE instructions. As such enable
the SSE instructions in SMM mode by setting up the cr4 register.
In addition, provide a place to save and restore the SSE state
in both the relocation handler and permanent handler.

Change-Id: Ifa16876b57544919fde88fba5b8f18e4ca286841
Signed-off-by: Aaron Durbin <adurbin@chromium.org>
Reviewed-on: https://review.coreboot.org/20244
Reviewed-by: Furquan Shaikh <furquan@google.com>
Tested-by: build bot (Jenkins) <no-reply@coreboot.org>
This commit is contained in:
Aaron Durbin 2017-06-16 15:16:13 -05:00 committed by Martin Roth
parent 604f69868f
commit 8ade68a270
3 changed files with 81 additions and 4 deletions

View file

@ -185,6 +185,13 @@ load_msr:
and $~(CR0_CLEAR_FLAGS_CACHE_ENABLE), %eax and $~(CR0_CLEAR_FLAGS_CACHE_ENABLE), %eax
mov %eax, %cr0 mov %eax, %cr0
#if IS_ENABLED(CONFIG_SSE)
/* Enable sse instructions. */
mov %cr4, %eax
orl $(CR4_OSFXSR | CR4_OSXMMEXCPT), %eax
mov %eax, %cr4
#endif
/* c_handler(cpu_num) */ /* c_handler(cpu_num) */
push %esi /* cpu_num */ push %esi /* cpu_num */
mov c_handler, %eax mov c_handler, %eax

View file

@ -19,6 +19,14 @@
#include <cpu/x86/cache.h> #include <cpu/x86/cache.h>
#include <console/console.h> #include <console/console.h>
#define FXSAVE_SIZE 512
/* FXSAVE area during relocation. While it may not be strictly needed the
SMM stub code relies on the FXSAVE area being non-zero to enable SSE
instructions within SMM mode. */
static uint8_t fxsave_area_relocation[CONFIG_MAX_CPUS][FXSAVE_SIZE]
__attribute__((aligned(16)));
/* /*
* Components that make up the SMRAM: * Components that make up the SMRAM:
* 1. Save state - the total save state memory used * 1. Save state - the total save state memory used
@ -36,6 +44,8 @@ struct smm_stub_params {
u32 stack_top; u32 stack_top;
u32 c_handler; u32 c_handler;
u32 c_handler_arg; u32 c_handler_arg;
u32 fxsave_area;
u32 fxsave_area_size;
struct smm_runtime runtime; struct smm_runtime runtime;
} __attribute__ ((packed)); } __attribute__ ((packed));
@ -164,7 +174,8 @@ static void smm_stub_place_staggered_entry_points(char *base,
* concurrent areas requested. The save state always lives at the top of SMRAM * concurrent areas requested. The save state always lives at the top of SMRAM
* space, and the entry point is at offset 0x8000. * space, and the entry point is at offset 0x8000.
*/ */
static int smm_module_setup_stub(void *smbase, struct smm_loader_params *params) static int smm_module_setup_stub(void *smbase, struct smm_loader_params *params,
void *fxsave_area)
{ {
size_t total_save_state_size; size_t total_save_state_size;
size_t smm_stub_size; size_t smm_stub_size;
@ -253,6 +264,8 @@ static int smm_module_setup_stub(void *smbase, struct smm_loader_params *params)
stub_params->stack_size = params->per_cpu_stack_size; stub_params->stack_size = params->per_cpu_stack_size;
stub_params->c_handler = (uintptr_t)params->handler; stub_params->c_handler = (uintptr_t)params->handler;
stub_params->c_handler_arg = (uintptr_t)params->handler_arg; stub_params->c_handler_arg = (uintptr_t)params->handler_arg;
stub_params->fxsave_area = (uintptr_t)fxsave_area;
stub_params->fxsave_area_size = FXSAVE_SIZE;
stub_params->runtime.smbase = (uintptr_t)smbase; stub_params->runtime.smbase = (uintptr_t)smbase;
stub_params->runtime.save_state_size = params->per_cpu_save_state_size; stub_params->runtime.save_state_size = params->per_cpu_save_state_size;
@ -293,7 +306,7 @@ int smm_setup_relocation_handler(struct smm_loader_params *params)
if (params->num_concurrent_stacks == 0) if (params->num_concurrent_stacks == 0)
params->num_concurrent_stacks = CONFIG_MAX_CPUS; params->num_concurrent_stacks = CONFIG_MAX_CPUS;
return smm_module_setup_stub(smram, params); return smm_module_setup_stub(smram, params, fxsave_area_relocation);
} }
/* The SMM module is placed within the provided region in the following /* The SMM module is placed within the provided region in the following
@ -320,6 +333,9 @@ int smm_load_module(void *smram, size_t size, struct smm_loader_params *params)
size_t handler_size; size_t handler_size;
size_t module_alignment; size_t module_alignment;
size_t alignment_size; size_t alignment_size;
size_t fxsave_size;
void *fxsave_area;
size_t total_size;
char *base; char *base;
if (size <= SMM_DEFAULT_SIZE) if (size <= SMM_DEFAULT_SIZE)
@ -350,8 +366,19 @@ int smm_load_module(void *smram, size_t size, struct smm_loader_params *params)
base += alignment_size; base += alignment_size;
} }
fxsave_size = 0;
fxsave_area = NULL;
if (IS_ENABLED(CONFIG_SSE)) {
fxsave_size = FXSAVE_SIZE * params->num_concurrent_stacks;
/* FXSAVE area below all the stacks stack. */
fxsave_area = params->stack_top;
fxsave_area -= total_stack_size + fxsave_size;
}
/* Does the required amount of memory exceed the SMRAM region size? */ /* Does the required amount of memory exceed the SMRAM region size? */
if ((total_stack_size + handler_size + SMM_DEFAULT_SIZE) > size) total_size = total_stack_size + handler_size;
total_size += fxsave_size + SMM_DEFAULT_SIZE;
if (total_size > size)
return -1; return -1;
if (rmodule_load(base, &smm_mod)) if (rmodule_load(base, &smm_mod))
@ -360,5 +387,5 @@ int smm_load_module(void *smram, size_t size, struct smm_loader_params *params)
params->handler = rmodule_entry(&smm_mod); params->handler = rmodule_entry(&smm_mod);
params->handler_arg = rmodule_parameters(&smm_mod); params->handler_arg = rmodule_parameters(&smm_mod);
return smm_module_setup_stub(smram, params); return smm_module_setup_stub(smram, params, fxsave_area);
} }

View file

@ -36,6 +36,10 @@ c_handler:
.long 0 .long 0
c_handler_arg: c_handler_arg:
.long 0 .long 0
fxsave_area:
.long 0
fxsave_area_size:
.long 0
/* struct smm_runtime begins here. */ /* struct smm_runtime begins here. */
smm_runtime: smm_runtime:
smbase: smbase:
@ -122,6 +126,8 @@ smm_trampoline32:
* not be assigned. Use the fallback stack and check this condition in * not be assigned. Use the fallback stack and check this condition in
* C handler. */ * C handler. */
movl $(fallback_stack_top), %esp movl $(fallback_stack_top), %esp
/* Clear fxsave location as there will be no saving/restoring. */
xor %edi, %edi
jmp 2f jmp 2f
1: 1:
movl stack_size, %eax movl stack_size, %eax
@ -130,7 +136,33 @@ smm_trampoline32:
subl %eax, %edx subl %eax, %edx
mov %edx, %esp mov %edx, %esp
/* calculate fxsave location */
mov fxsave_area, %edi
test %edi, %edi
jz 2f
movl fxsave_area_size, %eax
mul %ecx
add %eax, %edi
2: 2:
/* Save location of fxsave area. */
push %edi
mov %esp, %ebp
test %edi, %edi
jz 1f
/* Enable sse instructions. */
mov %cr4, %eax
orl $(CR4_OSFXSR | CR4_OSXMMEXCPT), %eax
mov %eax, %cr4
/* Save FP state. */
fxsave (%edi)
1:
/* Align stack to 16 bytes. Another 16 bytes are pushed below. */
andl $0xfffffff0, %esp
/* Call into the c-based SMM relocation function with the platform /* Call into the c-based SMM relocation function with the platform
* parameters. Equivalent to: * parameters. Equivalent to:
* struct arg = { c_handler_params, cpu_num, smm_runtime {; * struct arg = { c_handler_params, cpu_num, smm_runtime {;
@ -143,5 +175,16 @@ smm_trampoline32:
mov c_handler, %eax mov c_handler, %eax
call *%eax call *%eax
/* Restore stack from call frame */
mov %ebp, %esp
/* Retrieve fxsave location. */
pop %edi
test %edi, %edi
jz 1f
/* Restore FP state. */
fxrstor (%edi)
1:
/* Exit from SM mode. */ /* Exit from SM mode. */
rsm rsm