x86/boot: Add early boot support when running with SEV active
Early in the boot process, add checks to determine if the kernel is running with Secure Encrypted Virtualization (SEV) active. Checking for SEV requires checking that the kernel is running under a hypervisor (CPUID 0x00000001, bit 31), that the SEV feature is available (CPUID 0x8000001f, bit 1) and then checking a non-interceptable SEV MSR (0xc0010131, bit 0). This check is required so that during early compressed kernel booting the pagetables (both the boot pagetables and KASLR pagetables (if enabled) are updated to include the encryption mask so that when the kernel is decompressed into encrypted memory, it can boot properly. After the kernel is decompressed and continues booting the same logic is used to check if SEV is active and set a flag indicating so. This allows to distinguish between SME and SEV, each of which have unique differences in how certain things are handled: e.g. DMA (always bounce buffered with SEV) or EFI tables (always access decrypted with SME). Signed-off-by: Tom Lendacky <thomas.lendacky@amd.com> Signed-off-by: Brijesh Singh <brijesh.singh@amd.com> Signed-off-by: Thomas Gleixner <tglx@linutronix.de> Reviewed-by: Borislav Petkov <bp@suse.de> Tested-by: Borislav Petkov <bp@suse.de> Cc: Laura Abbott <labbott@redhat.com> Cc: Kees Cook <keescook@chromium.org> Cc: kvm@vger.kernel.org Cc: Konrad Rzeszutek Wilk <konrad.wilk@oracle.com> Cc: Radim Krčmář <rkrcmar@redhat.com> Cc: Borislav Petkov <bp@alien8.de> Cc: Andy Lutomirski <luto@kernel.org> Cc: Paolo Bonzini <pbonzini@redhat.com> Cc: "Kirill A. Shutemov" <kirill.shutemov@linux.intel.com> Link: https://lkml.kernel.org/r/20171020143059.3291-13-brijesh.singh@amd.com
This commit is contained in:
parent
d7b417fa08
commit
1958b5fc40
@ -78,6 +78,7 @@ vmlinux-objs-$(CONFIG_EARLY_PRINTK) += $(obj)/early_serial_console.o
|
|||||||
vmlinux-objs-$(CONFIG_RANDOMIZE_BASE) += $(obj)/kaslr.o
|
vmlinux-objs-$(CONFIG_RANDOMIZE_BASE) += $(obj)/kaslr.o
|
||||||
ifdef CONFIG_X86_64
|
ifdef CONFIG_X86_64
|
||||||
vmlinux-objs-$(CONFIG_RANDOMIZE_BASE) += $(obj)/pagetable.o
|
vmlinux-objs-$(CONFIG_RANDOMIZE_BASE) += $(obj)/pagetable.o
|
||||||
|
vmlinux-objs-y += $(obj)/mem_encrypt.o
|
||||||
endif
|
endif
|
||||||
|
|
||||||
$(obj)/eboot.o: KBUILD_CFLAGS += -fshort-wchar -mno-red-zone
|
$(obj)/eboot.o: KBUILD_CFLAGS += -fshort-wchar -mno-red-zone
|
||||||
|
@ -131,6 +131,19 @@ ENTRY(startup_32)
|
|||||||
/*
|
/*
|
||||||
* Build early 4G boot pagetable
|
* Build early 4G boot pagetable
|
||||||
*/
|
*/
|
||||||
|
/*
|
||||||
|
* If SEV is active then set the encryption mask in the page tables.
|
||||||
|
* This will insure that when the kernel is copied and decompressed
|
||||||
|
* it will be done so encrypted.
|
||||||
|
*/
|
||||||
|
call get_sev_encryption_bit
|
||||||
|
xorl %edx, %edx
|
||||||
|
testl %eax, %eax
|
||||||
|
jz 1f
|
||||||
|
subl $32, %eax /* Encryption bit is always above bit 31 */
|
||||||
|
bts %eax, %edx /* Set encryption mask for page tables */
|
||||||
|
1:
|
||||||
|
|
||||||
/* Initialize Page tables to 0 */
|
/* Initialize Page tables to 0 */
|
||||||
leal pgtable(%ebx), %edi
|
leal pgtable(%ebx), %edi
|
||||||
xorl %eax, %eax
|
xorl %eax, %eax
|
||||||
@ -141,12 +154,14 @@ ENTRY(startup_32)
|
|||||||
leal pgtable + 0(%ebx), %edi
|
leal pgtable + 0(%ebx), %edi
|
||||||
leal 0x1007 (%edi), %eax
|
leal 0x1007 (%edi), %eax
|
||||||
movl %eax, 0(%edi)
|
movl %eax, 0(%edi)
|
||||||
|
addl %edx, 4(%edi)
|
||||||
|
|
||||||
/* Build Level 3 */
|
/* Build Level 3 */
|
||||||
leal pgtable + 0x1000(%ebx), %edi
|
leal pgtable + 0x1000(%ebx), %edi
|
||||||
leal 0x1007(%edi), %eax
|
leal 0x1007(%edi), %eax
|
||||||
movl $4, %ecx
|
movl $4, %ecx
|
||||||
1: movl %eax, 0x00(%edi)
|
1: movl %eax, 0x00(%edi)
|
||||||
|
addl %edx, 0x04(%edi)
|
||||||
addl $0x00001000, %eax
|
addl $0x00001000, %eax
|
||||||
addl $8, %edi
|
addl $8, %edi
|
||||||
decl %ecx
|
decl %ecx
|
||||||
@ -157,6 +172,7 @@ ENTRY(startup_32)
|
|||||||
movl $0x00000183, %eax
|
movl $0x00000183, %eax
|
||||||
movl $2048, %ecx
|
movl $2048, %ecx
|
||||||
1: movl %eax, 0(%edi)
|
1: movl %eax, 0(%edi)
|
||||||
|
addl %edx, 4(%edi)
|
||||||
addl $0x00200000, %eax
|
addl $0x00200000, %eax
|
||||||
addl $8, %edi
|
addl $8, %edi
|
||||||
decl %ecx
|
decl %ecx
|
||||||
|
120
arch/x86/boot/compressed/mem_encrypt.S
Normal file
120
arch/x86/boot/compressed/mem_encrypt.S
Normal file
@ -0,0 +1,120 @@
|
|||||||
|
/*
|
||||||
|
* AMD Memory Encryption Support
|
||||||
|
*
|
||||||
|
* Copyright (C) 2017 Advanced Micro Devices, Inc.
|
||||||
|
*
|
||||||
|
* Author: Tom Lendacky <thomas.lendacky@amd.com>
|
||||||
|
*
|
||||||
|
* This program is free software; you can redistribute it and/or modify
|
||||||
|
* it under the terms of the GNU General Public License version 2 as
|
||||||
|
* published by the Free Software Foundation.
|
||||||
|
*/
|
||||||
|
|
||||||
|
#include <linux/linkage.h>
|
||||||
|
|
||||||
|
#include <asm/processor-flags.h>
|
||||||
|
#include <asm/msr.h>
|
||||||
|
#include <asm/asm-offsets.h>
|
||||||
|
|
||||||
|
.text
|
||||||
|
.code32
|
||||||
|
ENTRY(get_sev_encryption_bit)
|
||||||
|
xor %eax, %eax
|
||||||
|
|
||||||
|
#ifdef CONFIG_AMD_MEM_ENCRYPT
|
||||||
|
push %ebx
|
||||||
|
push %ecx
|
||||||
|
push %edx
|
||||||
|
push %edi
|
||||||
|
|
||||||
|
/*
|
||||||
|
* RIP-relative addressing is needed to access the encryption bit
|
||||||
|
* variable. Since we are running in 32-bit mode we need this call/pop
|
||||||
|
* sequence to get the proper relative addressing.
|
||||||
|
*/
|
||||||
|
call 1f
|
||||||
|
1: popl %edi
|
||||||
|
subl $1b, %edi
|
||||||
|
|
||||||
|
movl enc_bit(%edi), %eax
|
||||||
|
cmpl $0, %eax
|
||||||
|
jge .Lsev_exit
|
||||||
|
|
||||||
|
/* Check if running under a hypervisor */
|
||||||
|
movl $1, %eax
|
||||||
|
cpuid
|
||||||
|
bt $31, %ecx /* Check the hypervisor bit */
|
||||||
|
jnc .Lno_sev
|
||||||
|
|
||||||
|
movl $0x80000000, %eax /* CPUID to check the highest leaf */
|
||||||
|
cpuid
|
||||||
|
cmpl $0x8000001f, %eax /* See if 0x8000001f is available */
|
||||||
|
jb .Lno_sev
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Check for the SEV feature:
|
||||||
|
* CPUID Fn8000_001F[EAX] - Bit 1
|
||||||
|
* CPUID Fn8000_001F[EBX] - Bits 5:0
|
||||||
|
* Pagetable bit position used to indicate encryption
|
||||||
|
*/
|
||||||
|
movl $0x8000001f, %eax
|
||||||
|
cpuid
|
||||||
|
bt $1, %eax /* Check if SEV is available */
|
||||||
|
jnc .Lno_sev
|
||||||
|
|
||||||
|
movl $MSR_AMD64_SEV, %ecx /* Read the SEV MSR */
|
||||||
|
rdmsr
|
||||||
|
bt $MSR_AMD64_SEV_ENABLED_BIT, %eax /* Check if SEV is active */
|
||||||
|
jnc .Lno_sev
|
||||||
|
|
||||||
|
movl %ebx, %eax
|
||||||
|
andl $0x3f, %eax /* Return the encryption bit location */
|
||||||
|
movl %eax, enc_bit(%edi)
|
||||||
|
jmp .Lsev_exit
|
||||||
|
|
||||||
|
.Lno_sev:
|
||||||
|
xor %eax, %eax
|
||||||
|
movl %eax, enc_bit(%edi)
|
||||||
|
|
||||||
|
.Lsev_exit:
|
||||||
|
pop %edi
|
||||||
|
pop %edx
|
||||||
|
pop %ecx
|
||||||
|
pop %ebx
|
||||||
|
|
||||||
|
#endif /* CONFIG_AMD_MEM_ENCRYPT */
|
||||||
|
|
||||||
|
ret
|
||||||
|
ENDPROC(get_sev_encryption_bit)
|
||||||
|
|
||||||
|
.code64
|
||||||
|
ENTRY(get_sev_encryption_mask)
|
||||||
|
xor %rax, %rax
|
||||||
|
|
||||||
|
#ifdef CONFIG_AMD_MEM_ENCRYPT
|
||||||
|
push %rbp
|
||||||
|
push %rdx
|
||||||
|
|
||||||
|
movq %rsp, %rbp /* Save current stack pointer */
|
||||||
|
|
||||||
|
call get_sev_encryption_bit /* Get the encryption bit position */
|
||||||
|
testl %eax, %eax
|
||||||
|
jz .Lno_sev_mask
|
||||||
|
|
||||||
|
xor %rdx, %rdx
|
||||||
|
bts %rax, %rdx /* Create the encryption mask */
|
||||||
|
mov %rdx, %rax /* ... and return it */
|
||||||
|
|
||||||
|
.Lno_sev_mask:
|
||||||
|
movq %rbp, %rsp /* Restore original stack pointer */
|
||||||
|
|
||||||
|
pop %rdx
|
||||||
|
pop %rbp
|
||||||
|
#endif
|
||||||
|
|
||||||
|
ret
|
||||||
|
ENDPROC(get_sev_encryption_mask)
|
||||||
|
|
||||||
|
.data
|
||||||
|
enc_bit:
|
||||||
|
.int 0xffffffff
|
@ -109,4 +109,6 @@ static inline void console_init(void)
|
|||||||
{ }
|
{ }
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
unsigned long get_sev_encryption_mask(void);
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
@ -77,16 +77,18 @@ static unsigned long top_level_pgt;
|
|||||||
* Mapping information structure passed to kernel_ident_mapping_init().
|
* Mapping information structure passed to kernel_ident_mapping_init().
|
||||||
* Due to relocation, pointers must be assigned at run time not build time.
|
* Due to relocation, pointers must be assigned at run time not build time.
|
||||||
*/
|
*/
|
||||||
static struct x86_mapping_info mapping_info = {
|
static struct x86_mapping_info mapping_info;
|
||||||
.page_flag = __PAGE_KERNEL_LARGE_EXEC,
|
|
||||||
};
|
|
||||||
|
|
||||||
/* Locates and clears a region for a new top level page table. */
|
/* Locates and clears a region for a new top level page table. */
|
||||||
void initialize_identity_maps(void)
|
void initialize_identity_maps(void)
|
||||||
{
|
{
|
||||||
|
unsigned long sev_me_mask = get_sev_encryption_mask();
|
||||||
|
|
||||||
/* Init mapping_info with run-time function/buffer pointers. */
|
/* Init mapping_info with run-time function/buffer pointers. */
|
||||||
mapping_info.alloc_pgt_page = alloc_pgt_page;
|
mapping_info.alloc_pgt_page = alloc_pgt_page;
|
||||||
mapping_info.context = &pgt_data;
|
mapping_info.context = &pgt_data;
|
||||||
|
mapping_info.page_flag = __PAGE_KERNEL_LARGE_EXEC | sev_me_mask;
|
||||||
|
mapping_info.kernpg_flag = _KERNPG_TABLE | sev_me_mask;
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* It should be impossible for this not to already be true,
|
* It should be impossible for this not to already be true,
|
||||||
|
@ -324,6 +324,9 @@
|
|||||||
#define MSR_AMD64_IBSBRTARGET 0xc001103b
|
#define MSR_AMD64_IBSBRTARGET 0xc001103b
|
||||||
#define MSR_AMD64_IBSOPDATA4 0xc001103d
|
#define MSR_AMD64_IBSOPDATA4 0xc001103d
|
||||||
#define MSR_AMD64_IBS_REG_COUNT_MAX 8 /* includes MSR_AMD64_IBSBRTARGET */
|
#define MSR_AMD64_IBS_REG_COUNT_MAX 8 /* includes MSR_AMD64_IBSBRTARGET */
|
||||||
|
#define MSR_AMD64_SEV 0xc0010131
|
||||||
|
#define MSR_AMD64_SEV_ENABLED_BIT 0
|
||||||
|
#define MSR_AMD64_SEV_ENABLED BIT_ULL(MSR_AMD64_SEV_ENABLED_BIT)
|
||||||
|
|
||||||
/* Fam 17h MSRs */
|
/* Fam 17h MSRs */
|
||||||
#define MSR_F17H_IRPERF 0xc00000e9
|
#define MSR_F17H_IRPERF 0xc00000e9
|
||||||
|
@ -110,5 +110,4 @@ struct kvm_vcpu_pv_apf_data {
|
|||||||
#define KVM_PV_EOI_ENABLED KVM_PV_EOI_MASK
|
#define KVM_PV_EOI_ENABLED KVM_PV_EOI_MASK
|
||||||
#define KVM_PV_EOI_DISABLED 0x0
|
#define KVM_PV_EOI_DISABLED 0x0
|
||||||
|
|
||||||
|
|
||||||
#endif /* _UAPI_ASM_X86_KVM_PARA_H */
|
#endif /* _UAPI_ASM_X86_KVM_PARA_H */
|
||||||
|
@ -313,7 +313,9 @@ void __init mem_encrypt_init(void)
|
|||||||
if (sev_active())
|
if (sev_active())
|
||||||
dma_ops = &sev_dma_ops;
|
dma_ops = &sev_dma_ops;
|
||||||
|
|
||||||
pr_info("AMD Secure Memory Encryption (SME) active\n");
|
pr_info("AMD %s active\n",
|
||||||
|
sev_active() ? "Secure Encrypted Virtualization (SEV)"
|
||||||
|
: "Secure Memory Encryption (SME)");
|
||||||
}
|
}
|
||||||
|
|
||||||
void swiotlb_set_mem_attributes(void *vaddr, unsigned long size)
|
void swiotlb_set_mem_attributes(void *vaddr, unsigned long size)
|
||||||
@ -641,37 +643,63 @@ void __init __nostackprotector sme_enable(struct boot_params *bp)
|
|||||||
{
|
{
|
||||||
const char *cmdline_ptr, *cmdline_arg, *cmdline_on, *cmdline_off;
|
const char *cmdline_ptr, *cmdline_arg, *cmdline_on, *cmdline_off;
|
||||||
unsigned int eax, ebx, ecx, edx;
|
unsigned int eax, ebx, ecx, edx;
|
||||||
|
unsigned long feature_mask;
|
||||||
bool active_by_default;
|
bool active_by_default;
|
||||||
unsigned long me_mask;
|
unsigned long me_mask;
|
||||||
char buffer[16];
|
char buffer[16];
|
||||||
u64 msr;
|
u64 msr;
|
||||||
|
|
||||||
/* Check for the SME support leaf */
|
/* Check for the SME/SEV support leaf */
|
||||||
eax = 0x80000000;
|
eax = 0x80000000;
|
||||||
ecx = 0;
|
ecx = 0;
|
||||||
native_cpuid(&eax, &ebx, &ecx, &edx);
|
native_cpuid(&eax, &ebx, &ecx, &edx);
|
||||||
if (eax < 0x8000001f)
|
if (eax < 0x8000001f)
|
||||||
return;
|
return;
|
||||||
|
|
||||||
|
#define AMD_SME_BIT BIT(0)
|
||||||
|
#define AMD_SEV_BIT BIT(1)
|
||||||
/*
|
/*
|
||||||
* Check for the SME feature:
|
* Set the feature mask (SME or SEV) based on whether we are
|
||||||
* CPUID Fn8000_001F[EAX] - Bit 0
|
* running under a hypervisor.
|
||||||
* Secure Memory Encryption support
|
*/
|
||||||
* CPUID Fn8000_001F[EBX] - Bits 5:0
|
eax = 1;
|
||||||
* Pagetable bit position used to indicate encryption
|
ecx = 0;
|
||||||
|
native_cpuid(&eax, &ebx, &ecx, &edx);
|
||||||
|
feature_mask = (ecx & BIT(31)) ? AMD_SEV_BIT : AMD_SME_BIT;
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Check for the SME/SEV feature:
|
||||||
|
* CPUID Fn8000_001F[EAX]
|
||||||
|
* - Bit 0 - Secure Memory Encryption support
|
||||||
|
* - Bit 1 - Secure Encrypted Virtualization support
|
||||||
|
* CPUID Fn8000_001F[EBX]
|
||||||
|
* - Bits 5:0 - Pagetable bit position used to indicate encryption
|
||||||
*/
|
*/
|
||||||
eax = 0x8000001f;
|
eax = 0x8000001f;
|
||||||
ecx = 0;
|
ecx = 0;
|
||||||
native_cpuid(&eax, &ebx, &ecx, &edx);
|
native_cpuid(&eax, &ebx, &ecx, &edx);
|
||||||
if (!(eax & 1))
|
if (!(eax & feature_mask))
|
||||||
return;
|
return;
|
||||||
|
|
||||||
me_mask = 1UL << (ebx & 0x3f);
|
me_mask = 1UL << (ebx & 0x3f);
|
||||||
|
|
||||||
/* Check if SME is enabled */
|
/* Check if memory encryption is enabled */
|
||||||
msr = __rdmsr(MSR_K8_SYSCFG);
|
if (feature_mask == AMD_SME_BIT) {
|
||||||
if (!(msr & MSR_K8_SYSCFG_MEM_ENCRYPT))
|
/* For SME, check the SYSCFG MSR */
|
||||||
|
msr = __rdmsr(MSR_K8_SYSCFG);
|
||||||
|
if (!(msr & MSR_K8_SYSCFG_MEM_ENCRYPT))
|
||||||
|
return;
|
||||||
|
} else {
|
||||||
|
/* For SEV, check the SEV MSR */
|
||||||
|
msr = __rdmsr(MSR_AMD64_SEV);
|
||||||
|
if (!(msr & MSR_AMD64_SEV_ENABLED))
|
||||||
|
return;
|
||||||
|
|
||||||
|
/* SEV state cannot be controlled by a command line option */
|
||||||
|
sme_me_mask = me_mask;
|
||||||
|
sev_enabled = true;
|
||||||
return;
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Fixups have not been applied to phys_base yet and we're running
|
* Fixups have not been applied to phys_base yet and we're running
|
||||||
|
Loading…
Reference in New Issue
Block a user