1756e12e7SXiaoyao Li /* 2756e12e7SXiaoyao Li * QEMU TDX support 3756e12e7SXiaoyao Li * 4756e12e7SXiaoyao Li * Copyright (c) 2025 Intel Corporation 5756e12e7SXiaoyao Li * 6756e12e7SXiaoyao Li * Author: 7756e12e7SXiaoyao Li * Xiaoyao Li <xiaoyao.li@intel.com> 8756e12e7SXiaoyao Li * 9756e12e7SXiaoyao Li * SPDX-License-Identifier: GPL-2.0-or-later 10756e12e7SXiaoyao Li */ 11756e12e7SXiaoyao Li 12756e12e7SXiaoyao Li #include "qemu/osdep.h" 138eddedc3SXiaoyao Li #include "qemu/error-report.h" 14d05a0858SIsaku Yamahata #include "qemu/base64.h" 154420ba0eSXiaoyao Li #include "qemu/mmap-alloc.h" 168eddedc3SXiaoyao Li #include "qapi/error.h" 17756e12e7SXiaoyao Li #include "qom/object_interfaces.h" 18d05a0858SIsaku Yamahata #include "crypto/hash.h" 19bb45580dSXiaoyao Li #include "system/kvm_int.h" 206e250463SXiaoyao Li #include "system/runstate.h" 214420ba0eSXiaoyao Li #include "system/system.h" 22ebc2d2b4SIsaku Yamahata #include "system/ramblock.h" 23756e12e7SXiaoyao Li 241ff5048dSXiaoyao Li #include <linux/kvm_para.h> 251ff5048dSXiaoyao Li 268c94c84cSXiaoyao Li #include "cpu.h" 278c94c84cSXiaoyao Li #include "cpu-internal.h" 28f18672e4SXiaoyao Li #include "hw/i386/e820_memory_layout.h" 294420ba0eSXiaoyao Li #include "hw/i386/tdvf.h" 30631a2ac5SXiaoyao Li #include "hw/i386/x86.h" 31a7314259SXiaoyao Li #include "hw/i386/tdvf-hob.h" 32b455880eSXiaoyao Li #include "kvm_i386.h" 33756e12e7SXiaoyao Li #include "tdx.h" 34756e12e7SXiaoyao Li 350e73b843SXiaoyao Li #define TDX_MIN_TSC_FREQUENCY_KHZ (100 * 1000) 360e73b843SXiaoyao Li #define TDX_MAX_TSC_FREQUENCY_KHZ (10 * 1000 * 1000) 370e73b843SXiaoyao Li 3853b6f406SXiaoyao Li #define TDX_TD_ATTRIBUTES_DEBUG BIT_ULL(0) 396016e297SXiaoyao Li #define TDX_TD_ATTRIBUTES_SEPT_VE_DISABLE BIT_ULL(28) 40bb3be394SXiaoyao Li #define TDX_TD_ATTRIBUTES_PKS BIT_ULL(30) 41bb3be394SXiaoyao Li #define TDX_TD_ATTRIBUTES_PERFMON BIT_ULL(63) 426016e297SXiaoyao Li 4353b6f406SXiaoyao Li #define TDX_SUPPORTED_TD_ATTRS (TDX_TD_ATTRIBUTES_SEPT_VE_DISABLE |\ 4453b6f406SXiaoyao Li TDX_TD_ATTRIBUTES_PKS | \ 4553b6f406SXiaoyao Li TDX_TD_ATTRIBUTES_PERFMON) 4653b6f406SXiaoyao Li 471619d0e4SXiaoyao Li static TdxGuest *tdx_guest; 481619d0e4SXiaoyao Li 498eddedc3SXiaoyao Li static struct kvm_tdx_capabilities *tdx_caps; 5075ec6189SXiaoyao Li static struct kvm_cpuid2 *tdx_supported_cpuid; 518eddedc3SXiaoyao Li 521619d0e4SXiaoyao Li /* Valid after kvm_arch_init()->confidential_guest_kvm_init()->tdx_kvm_init() */ 531619d0e4SXiaoyao Li bool is_tdx_vm(void) 541619d0e4SXiaoyao Li { 551619d0e4SXiaoyao Li return !!tdx_guest; 561619d0e4SXiaoyao Li } 571619d0e4SXiaoyao Li 588eddedc3SXiaoyao Li enum tdx_ioctl_level { 598eddedc3SXiaoyao Li TDX_VM_IOCTL, 608eddedc3SXiaoyao Li TDX_VCPU_IOCTL, 618eddedc3SXiaoyao Li }; 628eddedc3SXiaoyao Li 638eddedc3SXiaoyao Li static int tdx_ioctl_internal(enum tdx_ioctl_level level, void *state, 648eddedc3SXiaoyao Li int cmd_id, __u32 flags, void *data, 658eddedc3SXiaoyao Li Error **errp) 66631a2ac5SXiaoyao Li { 678eddedc3SXiaoyao Li struct kvm_tdx_cmd tdx_cmd = {}; 688eddedc3SXiaoyao Li int r; 698eddedc3SXiaoyao Li 708eddedc3SXiaoyao Li const char *tdx_ioctl_name[] = { 718eddedc3SXiaoyao Li [KVM_TDX_CAPABILITIES] = "KVM_TDX_CAPABILITIES", 728eddedc3SXiaoyao Li [KVM_TDX_INIT_VM] = "KVM_TDX_INIT_VM", 738eddedc3SXiaoyao Li [KVM_TDX_INIT_VCPU] = "KVM_TDX_INIT_VCPU", 748eddedc3SXiaoyao Li [KVM_TDX_INIT_MEM_REGION] = "KVM_TDX_INIT_MEM_REGION", 758eddedc3SXiaoyao Li [KVM_TDX_FINALIZE_VM] = "KVM_TDX_FINALIZE_VM", 768eddedc3SXiaoyao Li [KVM_TDX_GET_CPUID] = "KVM_TDX_GET_CPUID", 778eddedc3SXiaoyao Li }; 788eddedc3SXiaoyao Li 798eddedc3SXiaoyao Li tdx_cmd.id = cmd_id; 808eddedc3SXiaoyao Li tdx_cmd.flags = flags; 818eddedc3SXiaoyao Li tdx_cmd.data = (__u64)(unsigned long)data; 828eddedc3SXiaoyao Li 838eddedc3SXiaoyao Li switch (level) { 848eddedc3SXiaoyao Li case TDX_VM_IOCTL: 858eddedc3SXiaoyao Li r = kvm_vm_ioctl(kvm_state, KVM_MEMORY_ENCRYPT_OP, &tdx_cmd); 868eddedc3SXiaoyao Li break; 878eddedc3SXiaoyao Li case TDX_VCPU_IOCTL: 888eddedc3SXiaoyao Li r = kvm_vcpu_ioctl(state, KVM_MEMORY_ENCRYPT_OP, &tdx_cmd); 898eddedc3SXiaoyao Li break; 908eddedc3SXiaoyao Li default: 918eddedc3SXiaoyao Li error_setg(errp, "Invalid tdx_ioctl_level %d", level); 928eddedc3SXiaoyao Li return -EINVAL; 938eddedc3SXiaoyao Li } 948eddedc3SXiaoyao Li 958eddedc3SXiaoyao Li if (r < 0) { 968eddedc3SXiaoyao Li error_setg_errno(errp, -r, "TDX ioctl %s failed, hw_errors: 0x%llx", 978eddedc3SXiaoyao Li tdx_ioctl_name[cmd_id], tdx_cmd.hw_error); 988eddedc3SXiaoyao Li } 998eddedc3SXiaoyao Li return r; 1008eddedc3SXiaoyao Li } 1018eddedc3SXiaoyao Li 1028eddedc3SXiaoyao Li static inline int tdx_vm_ioctl(int cmd_id, __u32 flags, void *data, 1038eddedc3SXiaoyao Li Error **errp) 1048eddedc3SXiaoyao Li { 1058eddedc3SXiaoyao Li return tdx_ioctl_internal(TDX_VM_IOCTL, NULL, cmd_id, flags, data, errp); 1068eddedc3SXiaoyao Li } 1078eddedc3SXiaoyao Li 1088eddedc3SXiaoyao Li static inline int tdx_vcpu_ioctl(CPUState *cpu, int cmd_id, __u32 flags, 1098eddedc3SXiaoyao Li void *data, Error **errp) 1108eddedc3SXiaoyao Li { 1118eddedc3SXiaoyao Li return tdx_ioctl_internal(TDX_VCPU_IOCTL, cpu, cmd_id, flags, data, errp); 1128eddedc3SXiaoyao Li } 1138eddedc3SXiaoyao Li 1148eddedc3SXiaoyao Li static int get_tdx_capabilities(Error **errp) 1158eddedc3SXiaoyao Li { 1168eddedc3SXiaoyao Li struct kvm_tdx_capabilities *caps; 1178eddedc3SXiaoyao Li /* 1st generation of TDX reports 6 cpuid configs */ 1188eddedc3SXiaoyao Li int nr_cpuid_configs = 6; 1198eddedc3SXiaoyao Li size_t size; 1208eddedc3SXiaoyao Li int r; 1218eddedc3SXiaoyao Li 1228eddedc3SXiaoyao Li do { 1238eddedc3SXiaoyao Li Error *local_err = NULL; 1248eddedc3SXiaoyao Li size = sizeof(struct kvm_tdx_capabilities) + 1258eddedc3SXiaoyao Li nr_cpuid_configs * sizeof(struct kvm_cpuid_entry2); 1268eddedc3SXiaoyao Li caps = g_malloc0(size); 1278eddedc3SXiaoyao Li caps->cpuid.nent = nr_cpuid_configs; 1288eddedc3SXiaoyao Li 1298eddedc3SXiaoyao Li r = tdx_vm_ioctl(KVM_TDX_CAPABILITIES, 0, caps, &local_err); 1308eddedc3SXiaoyao Li if (r == -E2BIG) { 1318eddedc3SXiaoyao Li g_free(caps); 1328eddedc3SXiaoyao Li nr_cpuid_configs *= 2; 1338eddedc3SXiaoyao Li if (nr_cpuid_configs > KVM_MAX_CPUID_ENTRIES) { 1348eddedc3SXiaoyao Li error_report("KVM TDX seems broken that number of CPUID entries" 1358eddedc3SXiaoyao Li " in kvm_tdx_capabilities exceeds limit: %d", 1368eddedc3SXiaoyao Li KVM_MAX_CPUID_ENTRIES); 1378eddedc3SXiaoyao Li error_propagate(errp, local_err); 1388eddedc3SXiaoyao Li return r; 1398eddedc3SXiaoyao Li } 1408eddedc3SXiaoyao Li error_free(local_err); 1418eddedc3SXiaoyao Li } else if (r < 0) { 1428eddedc3SXiaoyao Li g_free(caps); 1438eddedc3SXiaoyao Li error_propagate(errp, local_err); 1448eddedc3SXiaoyao Li return r; 1458eddedc3SXiaoyao Li } 1468eddedc3SXiaoyao Li } while (r == -E2BIG); 1478eddedc3SXiaoyao Li 1488eddedc3SXiaoyao Li tdx_caps = caps; 149631a2ac5SXiaoyao Li 150631a2ac5SXiaoyao Li return 0; 151631a2ac5SXiaoyao Li } 152631a2ac5SXiaoyao Li 1530dd5fe5eSChao Peng void tdx_set_tdvf_region(MemoryRegion *tdvf_mr) 1540dd5fe5eSChao Peng { 1550dd5fe5eSChao Peng assert(!tdx_guest->tdvf_mr); 1560dd5fe5eSChao Peng tdx_guest->tdvf_mr = tdvf_mr; 1570dd5fe5eSChao Peng } 1580dd5fe5eSChao Peng 159a7314259SXiaoyao Li static TdxFirmwareEntry *tdx_get_hob_entry(TdxGuest *tdx) 160a7314259SXiaoyao Li { 161a7314259SXiaoyao Li TdxFirmwareEntry *entry; 162a7314259SXiaoyao Li 163a7314259SXiaoyao Li for_each_tdx_fw_entry(&tdx->tdvf, entry) { 164a7314259SXiaoyao Li if (entry->type == TDVF_SECTION_TYPE_TD_HOB) { 165a7314259SXiaoyao Li return entry; 166a7314259SXiaoyao Li } 167a7314259SXiaoyao Li } 168a7314259SXiaoyao Li error_report("TDVF metadata doesn't specify TD_HOB location."); 169a7314259SXiaoyao Li exit(1); 170a7314259SXiaoyao Li } 171a7314259SXiaoyao Li 172f18672e4SXiaoyao Li static void tdx_add_ram_entry(uint64_t address, uint64_t length, 173f18672e4SXiaoyao Li enum TdxRamType type) 174f18672e4SXiaoyao Li { 175f18672e4SXiaoyao Li uint32_t nr_entries = tdx_guest->nr_ram_entries; 176f18672e4SXiaoyao Li tdx_guest->ram_entries = g_renew(TdxRamEntry, tdx_guest->ram_entries, 177f18672e4SXiaoyao Li nr_entries + 1); 178f18672e4SXiaoyao Li 179f18672e4SXiaoyao Li tdx_guest->ram_entries[nr_entries].address = address; 180f18672e4SXiaoyao Li tdx_guest->ram_entries[nr_entries].length = length; 181f18672e4SXiaoyao Li tdx_guest->ram_entries[nr_entries].type = type; 182f18672e4SXiaoyao Li tdx_guest->nr_ram_entries++; 183f18672e4SXiaoyao Li } 184f18672e4SXiaoyao Li 185f18672e4SXiaoyao Li static int tdx_accept_ram_range(uint64_t address, uint64_t length) 186f18672e4SXiaoyao Li { 187f18672e4SXiaoyao Li uint64_t head_start, tail_start, head_length, tail_length; 188f18672e4SXiaoyao Li uint64_t tmp_address, tmp_length; 189f18672e4SXiaoyao Li TdxRamEntry *e; 190f18672e4SXiaoyao Li int i = 0; 191f18672e4SXiaoyao Li 192f18672e4SXiaoyao Li do { 193f18672e4SXiaoyao Li if (i == tdx_guest->nr_ram_entries) { 194f18672e4SXiaoyao Li return -1; 195f18672e4SXiaoyao Li } 196f18672e4SXiaoyao Li 197f18672e4SXiaoyao Li e = &tdx_guest->ram_entries[i++]; 198f18672e4SXiaoyao Li } while (address + length <= e->address || address >= e->address + e->length); 199f18672e4SXiaoyao Li 200f18672e4SXiaoyao Li /* 201f18672e4SXiaoyao Li * The to-be-accepted ram range must be fully contained by one 202f18672e4SXiaoyao Li * RAM entry. 203f18672e4SXiaoyao Li */ 204f18672e4SXiaoyao Li if (e->address > address || 205f18672e4SXiaoyao Li e->address + e->length < address + length) { 206f18672e4SXiaoyao Li return -1; 207f18672e4SXiaoyao Li } 208f18672e4SXiaoyao Li 209f18672e4SXiaoyao Li if (e->type == TDX_RAM_ADDED) { 210f18672e4SXiaoyao Li return 0; 211f18672e4SXiaoyao Li } 212f18672e4SXiaoyao Li 213f18672e4SXiaoyao Li tmp_address = e->address; 214f18672e4SXiaoyao Li tmp_length = e->length; 215f18672e4SXiaoyao Li 216f18672e4SXiaoyao Li e->address = address; 217f18672e4SXiaoyao Li e->length = length; 218f18672e4SXiaoyao Li e->type = TDX_RAM_ADDED; 219f18672e4SXiaoyao Li 220f18672e4SXiaoyao Li head_length = address - tmp_address; 221f18672e4SXiaoyao Li if (head_length > 0) { 222f18672e4SXiaoyao Li head_start = tmp_address; 223f18672e4SXiaoyao Li tdx_add_ram_entry(head_start, head_length, TDX_RAM_UNACCEPTED); 224f18672e4SXiaoyao Li } 225f18672e4SXiaoyao Li 226f18672e4SXiaoyao Li tail_start = address + length; 227f18672e4SXiaoyao Li if (tail_start < tmp_address + tmp_length) { 228f18672e4SXiaoyao Li tail_length = tmp_address + tmp_length - tail_start; 229f18672e4SXiaoyao Li tdx_add_ram_entry(tail_start, tail_length, TDX_RAM_UNACCEPTED); 230f18672e4SXiaoyao Li } 231f18672e4SXiaoyao Li 232f18672e4SXiaoyao Li return 0; 233f18672e4SXiaoyao Li } 234f18672e4SXiaoyao Li 235f18672e4SXiaoyao Li static int tdx_ram_entry_compare(const void *lhs_, const void* rhs_) 236f18672e4SXiaoyao Li { 237f18672e4SXiaoyao Li const TdxRamEntry *lhs = lhs_; 238f18672e4SXiaoyao Li const TdxRamEntry *rhs = rhs_; 239f18672e4SXiaoyao Li 240f18672e4SXiaoyao Li if (lhs->address == rhs->address) { 241f18672e4SXiaoyao Li return 0; 242f18672e4SXiaoyao Li } 243f18672e4SXiaoyao Li if (le64_to_cpu(lhs->address) > le64_to_cpu(rhs->address)) { 244f18672e4SXiaoyao Li return 1; 245f18672e4SXiaoyao Li } 246f18672e4SXiaoyao Li return -1; 247f18672e4SXiaoyao Li } 248f18672e4SXiaoyao Li 249f18672e4SXiaoyao Li static void tdx_init_ram_entries(void) 250f18672e4SXiaoyao Li { 251f18672e4SXiaoyao Li unsigned i, j, nr_e820_entries; 252f18672e4SXiaoyao Li 253f18672e4SXiaoyao Li nr_e820_entries = e820_get_table(NULL); 254f18672e4SXiaoyao Li tdx_guest->ram_entries = g_new(TdxRamEntry, nr_e820_entries); 255f18672e4SXiaoyao Li 256f18672e4SXiaoyao Li for (i = 0, j = 0; i < nr_e820_entries; i++) { 257f18672e4SXiaoyao Li uint64_t addr, len; 258f18672e4SXiaoyao Li 259f18672e4SXiaoyao Li if (e820_get_entry(i, E820_RAM, &addr, &len)) { 260f18672e4SXiaoyao Li tdx_guest->ram_entries[j].address = addr; 261f18672e4SXiaoyao Li tdx_guest->ram_entries[j].length = len; 262f18672e4SXiaoyao Li tdx_guest->ram_entries[j].type = TDX_RAM_UNACCEPTED; 263f18672e4SXiaoyao Li j++; 264f18672e4SXiaoyao Li } 265f18672e4SXiaoyao Li } 266f18672e4SXiaoyao Li tdx_guest->nr_ram_entries = j; 267f18672e4SXiaoyao Li } 268f18672e4SXiaoyao Li 26941f7fd22SXiaoyao Li static void tdx_post_init_vcpus(void) 27041f7fd22SXiaoyao Li { 27141f7fd22SXiaoyao Li TdxFirmwareEntry *hob; 27241f7fd22SXiaoyao Li CPUState *cpu; 27341f7fd22SXiaoyao Li 27441f7fd22SXiaoyao Li hob = tdx_get_hob_entry(tdx_guest); 27541f7fd22SXiaoyao Li CPU_FOREACH(cpu) { 27641f7fd22SXiaoyao Li tdx_vcpu_ioctl(cpu, KVM_TDX_INIT_VCPU, 0, (void *)hob->address, 27741f7fd22SXiaoyao Li &error_fatal); 27841f7fd22SXiaoyao Li } 27941f7fd22SXiaoyao Li } 28041f7fd22SXiaoyao Li 2814420ba0eSXiaoyao Li static void tdx_finalize_vm(Notifier *notifier, void *unused) 2824420ba0eSXiaoyao Li { 2834420ba0eSXiaoyao Li TdxFirmware *tdvf = &tdx_guest->tdvf; 2844420ba0eSXiaoyao Li TdxFirmwareEntry *entry; 285ebc2d2b4SIsaku Yamahata RAMBlock *ram_block; 286ebc2d2b4SIsaku Yamahata Error *local_err = NULL; 287ebc2d2b4SIsaku Yamahata int r; 2884420ba0eSXiaoyao Li 289f18672e4SXiaoyao Li tdx_init_ram_entries(); 290f18672e4SXiaoyao Li 2914420ba0eSXiaoyao Li for_each_tdx_fw_entry(tdvf, entry) { 2924420ba0eSXiaoyao Li switch (entry->type) { 2934420ba0eSXiaoyao Li case TDVF_SECTION_TYPE_BFV: 2944420ba0eSXiaoyao Li case TDVF_SECTION_TYPE_CFV: 2954420ba0eSXiaoyao Li entry->mem_ptr = tdvf->mem_ptr + entry->data_offset; 2964420ba0eSXiaoyao Li break; 2974420ba0eSXiaoyao Li case TDVF_SECTION_TYPE_TD_HOB: 2984420ba0eSXiaoyao Li case TDVF_SECTION_TYPE_TEMP_MEM: 2994420ba0eSXiaoyao Li entry->mem_ptr = qemu_ram_mmap(-1, entry->size, 3004420ba0eSXiaoyao Li qemu_real_host_page_size(), 0, 0); 3014420ba0eSXiaoyao Li if (entry->mem_ptr == MAP_FAILED) { 3024420ba0eSXiaoyao Li error_report("Failed to mmap memory for TDVF section %d", 3034420ba0eSXiaoyao Li entry->type); 3044420ba0eSXiaoyao Li exit(1); 3054420ba0eSXiaoyao Li } 306f18672e4SXiaoyao Li if (tdx_accept_ram_range(entry->address, entry->size)) { 307f18672e4SXiaoyao Li error_report("Failed to accept memory for TDVF section %d", 308f18672e4SXiaoyao Li entry->type); 309f18672e4SXiaoyao Li qemu_ram_munmap(-1, entry->mem_ptr, entry->size); 310f18672e4SXiaoyao Li exit(1); 311f18672e4SXiaoyao Li } 3124420ba0eSXiaoyao Li break; 3134420ba0eSXiaoyao Li default: 3144420ba0eSXiaoyao Li error_report("Unsupported TDVF section %d", entry->type); 3154420ba0eSXiaoyao Li exit(1); 3164420ba0eSXiaoyao Li } 3174420ba0eSXiaoyao Li } 318f18672e4SXiaoyao Li 319f18672e4SXiaoyao Li qsort(tdx_guest->ram_entries, tdx_guest->nr_ram_entries, 320f18672e4SXiaoyao Li sizeof(TdxRamEntry), &tdx_ram_entry_compare); 321a7314259SXiaoyao Li 322a7314259SXiaoyao Li tdvf_hob_create(tdx_guest, tdx_get_hob_entry(tdx_guest)); 323ebc2d2b4SIsaku Yamahata 32441f7fd22SXiaoyao Li tdx_post_init_vcpus(); 32541f7fd22SXiaoyao Li 326ebc2d2b4SIsaku Yamahata for_each_tdx_fw_entry(tdvf, entry) { 327ebc2d2b4SIsaku Yamahata struct kvm_tdx_init_mem_region region; 328ebc2d2b4SIsaku Yamahata uint32_t flags; 329ebc2d2b4SIsaku Yamahata 330ebc2d2b4SIsaku Yamahata region = (struct kvm_tdx_init_mem_region) { 331ebc2d2b4SIsaku Yamahata .source_addr = (uint64_t)entry->mem_ptr, 332ebc2d2b4SIsaku Yamahata .gpa = entry->address, 333ebc2d2b4SIsaku Yamahata .nr_pages = entry->size >> 12, 334ebc2d2b4SIsaku Yamahata }; 335ebc2d2b4SIsaku Yamahata 336ebc2d2b4SIsaku Yamahata flags = entry->attributes & TDVF_SECTION_ATTRIBUTES_MR_EXTEND ? 337ebc2d2b4SIsaku Yamahata KVM_TDX_MEASURE_MEMORY_REGION : 0; 338ebc2d2b4SIsaku Yamahata 339ebc2d2b4SIsaku Yamahata do { 340ebc2d2b4SIsaku Yamahata error_free(local_err); 341ebc2d2b4SIsaku Yamahata local_err = NULL; 342ebc2d2b4SIsaku Yamahata r = tdx_vcpu_ioctl(first_cpu, KVM_TDX_INIT_MEM_REGION, flags, 343ebc2d2b4SIsaku Yamahata ®ion, &local_err); 344ebc2d2b4SIsaku Yamahata } while (r == -EAGAIN || r == -EINTR); 345ebc2d2b4SIsaku Yamahata if (r < 0) { 346ebc2d2b4SIsaku Yamahata error_report_err(local_err); 347ebc2d2b4SIsaku Yamahata exit(1); 348ebc2d2b4SIsaku Yamahata } 349ebc2d2b4SIsaku Yamahata 350ebc2d2b4SIsaku Yamahata if (entry->type == TDVF_SECTION_TYPE_TD_HOB || 351ebc2d2b4SIsaku Yamahata entry->type == TDVF_SECTION_TYPE_TEMP_MEM) { 352ebc2d2b4SIsaku Yamahata qemu_ram_munmap(-1, entry->mem_ptr, entry->size); 353ebc2d2b4SIsaku Yamahata entry->mem_ptr = NULL; 354ebc2d2b4SIsaku Yamahata } 355ebc2d2b4SIsaku Yamahata } 356ebc2d2b4SIsaku Yamahata 357ebc2d2b4SIsaku Yamahata /* 358ebc2d2b4SIsaku Yamahata * TDVF image has been copied into private region above via 359ebc2d2b4SIsaku Yamahata * KVM_MEMORY_MAPPING. It becomes useless. 360ebc2d2b4SIsaku Yamahata */ 361ebc2d2b4SIsaku Yamahata ram_block = tdx_guest->tdvf_mr->ram_block; 362ebc2d2b4SIsaku Yamahata ram_block_discard_range(ram_block, 0, ram_block->max_length); 363ae60ff4eSXiaoyao Li 364ae60ff4eSXiaoyao Li tdx_vm_ioctl(KVM_TDX_FINALIZE_VM, 0, NULL, &error_fatal); 365ae60ff4eSXiaoyao Li CONFIDENTIAL_GUEST_SUPPORT(tdx_guest)->ready = true; 3664420ba0eSXiaoyao Li } 3674420ba0eSXiaoyao Li 3684420ba0eSXiaoyao Li static Notifier tdx_machine_done_notify = { 3694420ba0eSXiaoyao Li .notify = tdx_finalize_vm, 3704420ba0eSXiaoyao Li }; 3714420ba0eSXiaoyao Li 3720ba06e46SXiaoyao Li /* 3730ba06e46SXiaoyao Li * Some CPUID bits change from fixed1 to configurable bits when TDX module 3740ba06e46SXiaoyao Li * supports TDX_FEATURES0.VE_REDUCTION. e.g., MCA/MCE/MTRR/CORE_CAPABILITY. 3750ba06e46SXiaoyao Li * 3760ba06e46SXiaoyao Li * To make QEMU work with all the versions of TDX module, keep the fixed1 bits 3770ba06e46SXiaoyao Li * here if they are ever fixed1 bits in any of the version though not fixed1 in 3780ba06e46SXiaoyao Li * the latest version. Otherwise, with the older version of TDX module, QEMU may 3790ba06e46SXiaoyao Li * treat the fixed1 bit as unsupported. 3800ba06e46SXiaoyao Li * 3810ba06e46SXiaoyao Li * For newer TDX module, it does no harm to keep them in tdx_fixed1_bits even 3820ba06e46SXiaoyao Li * though they changed to configurable bits. Because tdx_fixed1_bits is used to 3830ba06e46SXiaoyao Li * setup the supported bits. 3840ba06e46SXiaoyao Li */ 3850ba06e46SXiaoyao Li KvmCpuidInfo tdx_fixed1_bits = { 3860ba06e46SXiaoyao Li .cpuid.nent = 8, 3870ba06e46SXiaoyao Li .entries[0] = { 3880ba06e46SXiaoyao Li .function = 0x1, 3890ba06e46SXiaoyao Li .index = 0, 3900ba06e46SXiaoyao Li .ecx = CPUID_EXT_SSE3 | CPUID_EXT_PCLMULQDQ | CPUID_EXT_DTES64 | 3910ba06e46SXiaoyao Li CPUID_EXT_DSCPL | CPUID_EXT_SSSE3 | CPUID_EXT_CX16 | 3920ba06e46SXiaoyao Li CPUID_EXT_PDCM | CPUID_EXT_PCID | CPUID_EXT_SSE41 | 3930ba06e46SXiaoyao Li CPUID_EXT_SSE42 | CPUID_EXT_X2APIC | CPUID_EXT_MOVBE | 3940ba06e46SXiaoyao Li CPUID_EXT_POPCNT | CPUID_EXT_AES | CPUID_EXT_XSAVE | 3950ba06e46SXiaoyao Li CPUID_EXT_RDRAND | CPUID_EXT_HYPERVISOR, 3960ba06e46SXiaoyao Li .edx = CPUID_FP87 | CPUID_VME | CPUID_DE | CPUID_PSE | CPUID_TSC | 3970ba06e46SXiaoyao Li CPUID_MSR | CPUID_PAE | CPUID_MCE | CPUID_CX8 | CPUID_APIC | 3980ba06e46SXiaoyao Li CPUID_SEP | CPUID_MTRR | CPUID_PGE | CPUID_MCA | CPUID_CMOV | 3990ba06e46SXiaoyao Li CPUID_PAT | CPUID_CLFLUSH | CPUID_DTS | CPUID_MMX | CPUID_FXSR | 4000ba06e46SXiaoyao Li CPUID_SSE | CPUID_SSE2, 4010ba06e46SXiaoyao Li }, 4020ba06e46SXiaoyao Li .entries[1] = { 4030ba06e46SXiaoyao Li .function = 0x6, 4040ba06e46SXiaoyao Li .index = 0, 4050ba06e46SXiaoyao Li .eax = CPUID_6_EAX_ARAT, 4060ba06e46SXiaoyao Li }, 4070ba06e46SXiaoyao Li .entries[2] = { 4080ba06e46SXiaoyao Li .function = 0x7, 4090ba06e46SXiaoyao Li .index = 0, 4100ba06e46SXiaoyao Li .flags = KVM_CPUID_FLAG_SIGNIFCANT_INDEX, 4110ba06e46SXiaoyao Li .ebx = CPUID_7_0_EBX_FSGSBASE | CPUID_7_0_EBX_FDP_EXCPTN_ONLY | 4120ba06e46SXiaoyao Li CPUID_7_0_EBX_SMEP | CPUID_7_0_EBX_INVPCID | 4130ba06e46SXiaoyao Li CPUID_7_0_EBX_ZERO_FCS_FDS | CPUID_7_0_EBX_RDSEED | 4140ba06e46SXiaoyao Li CPUID_7_0_EBX_SMAP | CPUID_7_0_EBX_CLFLUSHOPT | 4150ba06e46SXiaoyao Li CPUID_7_0_EBX_CLWB | CPUID_7_0_EBX_SHA_NI, 4160ba06e46SXiaoyao Li .ecx = CPUID_7_0_ECX_BUS_LOCK_DETECT | CPUID_7_0_ECX_MOVDIRI | 4170ba06e46SXiaoyao Li CPUID_7_0_ECX_MOVDIR64B, 4180ba06e46SXiaoyao Li .edx = CPUID_7_0_EDX_MD_CLEAR | CPUID_7_0_EDX_SPEC_CTRL | 4190ba06e46SXiaoyao Li CPUID_7_0_EDX_STIBP | CPUID_7_0_EDX_FLUSH_L1D | 4200ba06e46SXiaoyao Li CPUID_7_0_EDX_ARCH_CAPABILITIES | CPUID_7_0_EDX_CORE_CAPABILITY | 4210ba06e46SXiaoyao Li CPUID_7_0_EDX_SPEC_CTRL_SSBD, 4220ba06e46SXiaoyao Li }, 4230ba06e46SXiaoyao Li .entries[3] = { 4240ba06e46SXiaoyao Li .function = 0x7, 4250ba06e46SXiaoyao Li .index = 2, 4260ba06e46SXiaoyao Li .flags = KVM_CPUID_FLAG_SIGNIFCANT_INDEX, 4270ba06e46SXiaoyao Li .edx = CPUID_7_2_EDX_PSFD | CPUID_7_2_EDX_IPRED_CTRL | 4280ba06e46SXiaoyao Li CPUID_7_2_EDX_RRSBA_CTRL | CPUID_7_2_EDX_BHI_CTRL, 4290ba06e46SXiaoyao Li }, 4300ba06e46SXiaoyao Li .entries[4] = { 4310ba06e46SXiaoyao Li .function = 0xD, 4320ba06e46SXiaoyao Li .index = 0, 4330ba06e46SXiaoyao Li .flags = KVM_CPUID_FLAG_SIGNIFCANT_INDEX, 4340ba06e46SXiaoyao Li .eax = XSTATE_FP_MASK | XSTATE_SSE_MASK, 4350ba06e46SXiaoyao Li }, 4360ba06e46SXiaoyao Li .entries[5] = { 4370ba06e46SXiaoyao Li .function = 0xD, 4380ba06e46SXiaoyao Li .index = 1, 4390ba06e46SXiaoyao Li .flags = KVM_CPUID_FLAG_SIGNIFCANT_INDEX, 4400ba06e46SXiaoyao Li .eax = CPUID_XSAVE_XSAVEOPT | CPUID_XSAVE_XSAVEC| 4410ba06e46SXiaoyao Li CPUID_XSAVE_XGETBV1 | CPUID_XSAVE_XSAVES, 4420ba06e46SXiaoyao Li }, 4430ba06e46SXiaoyao Li .entries[6] = { 4440ba06e46SXiaoyao Li .function = 0x80000001, 4450ba06e46SXiaoyao Li .index = 0, 4460ba06e46SXiaoyao Li .ecx = CPUID_EXT3_LAHF_LM | CPUID_EXT3_ABM | CPUID_EXT3_3DNOWPREFETCH, 4470ba06e46SXiaoyao Li /* 4480ba06e46SXiaoyao Li * Strictly speaking, SYSCALL is not fixed1 bit since it depends on 4490ba06e46SXiaoyao Li * the CPU to be in 64-bit mode. But here fixed1 is used to serve the 4500ba06e46SXiaoyao Li * purpose of supported bits for TDX. In this sense, SYACALL is always 4510ba06e46SXiaoyao Li * supported. 4520ba06e46SXiaoyao Li */ 4530ba06e46SXiaoyao Li .edx = CPUID_EXT2_SYSCALL | CPUID_EXT2_NX | CPUID_EXT2_PDPE1GB | 4540ba06e46SXiaoyao Li CPUID_EXT2_RDTSCP | CPUID_EXT2_LM, 4550ba06e46SXiaoyao Li }, 4560ba06e46SXiaoyao Li .entries[7] = { 4570ba06e46SXiaoyao Li .function = 0x80000007, 4580ba06e46SXiaoyao Li .index = 0, 4590ba06e46SXiaoyao Li .edx = CPUID_APM_INVTSC, 4600ba06e46SXiaoyao Li }, 4610ba06e46SXiaoyao Li }; 4620ba06e46SXiaoyao Li 46331df29c5SXiaoyao Li typedef struct TdxAttrsMap { 46431df29c5SXiaoyao Li uint32_t attr_index; 46531df29c5SXiaoyao Li uint32_t cpuid_leaf; 46631df29c5SXiaoyao Li uint32_t cpuid_subleaf; 46731df29c5SXiaoyao Li int cpuid_reg; 46831df29c5SXiaoyao Li uint32_t feat_mask; 46931df29c5SXiaoyao Li } TdxAttrsMap; 47031df29c5SXiaoyao Li 47131df29c5SXiaoyao Li static TdxAttrsMap tdx_attrs_maps[] = { 47231df29c5SXiaoyao Li {.attr_index = 27, 47331df29c5SXiaoyao Li .cpuid_leaf = 7, 47431df29c5SXiaoyao Li .cpuid_subleaf = 1, 47531df29c5SXiaoyao Li .cpuid_reg = R_EAX, 47631df29c5SXiaoyao Li .feat_mask = CPUID_7_1_EAX_LASS,}, 47731df29c5SXiaoyao Li 47831df29c5SXiaoyao Li {.attr_index = 30, 47931df29c5SXiaoyao Li .cpuid_leaf = 7, 48031df29c5SXiaoyao Li .cpuid_subleaf = 0, 48131df29c5SXiaoyao Li .cpuid_reg = R_ECX, 48231df29c5SXiaoyao Li .feat_mask = CPUID_7_0_ECX_PKS,}, 48331df29c5SXiaoyao Li 48431df29c5SXiaoyao Li {.attr_index = 31, 48531df29c5SXiaoyao Li .cpuid_leaf = 7, 48631df29c5SXiaoyao Li .cpuid_subleaf = 0, 48731df29c5SXiaoyao Li .cpuid_reg = R_ECX, 48831df29c5SXiaoyao Li .feat_mask = CPUID_7_0_ECX_KeyLocker,}, 48931df29c5SXiaoyao Li }; 49031df29c5SXiaoyao Li 4918c94c84cSXiaoyao Li typedef struct TdxXFAMDep { 4928c94c84cSXiaoyao Li int xfam_bit; 4938c94c84cSXiaoyao Li FeatureMask feat_mask; 4948c94c84cSXiaoyao Li } TdxXFAMDep; 4958c94c84cSXiaoyao Li 4968c94c84cSXiaoyao Li /* 4978c94c84cSXiaoyao Li * Note, only the CPUID bits whose virtualization type are "XFAM & Native" are 4988c94c84cSXiaoyao Li * defiend here. 4998c94c84cSXiaoyao Li * 5008c94c84cSXiaoyao Li * For those whose virtualization type are "XFAM & Configured & Native", they 5018c94c84cSXiaoyao Li * are reported as configurable bits. And they are not supported if not in the 5028c94c84cSXiaoyao Li * configureable bits list from KVM even if the corresponding XFAM bit is 5038c94c84cSXiaoyao Li * supported. 5048c94c84cSXiaoyao Li */ 5058c94c84cSXiaoyao Li TdxXFAMDep tdx_xfam_deps[] = { 5068c94c84cSXiaoyao Li { XSTATE_YMM_BIT, { FEAT_1_ECX, CPUID_EXT_FMA }}, 5078c94c84cSXiaoyao Li { XSTATE_YMM_BIT, { FEAT_7_0_EBX, CPUID_7_0_EBX_AVX2 }}, 5088c94c84cSXiaoyao Li { XSTATE_OPMASK_BIT, { FEAT_7_0_ECX, CPUID_7_0_ECX_AVX512_VBMI}}, 5098c94c84cSXiaoyao Li { XSTATE_OPMASK_BIT, { FEAT_7_0_EDX, CPUID_7_0_EDX_AVX512_FP16}}, 5108c94c84cSXiaoyao Li { XSTATE_PT_BIT, { FEAT_7_0_EBX, CPUID_7_0_EBX_INTEL_PT}}, 5118c94c84cSXiaoyao Li { XSTATE_PKRU_BIT, { FEAT_7_0_ECX, CPUID_7_0_ECX_PKU}}, 5128c94c84cSXiaoyao Li { XSTATE_XTILE_CFG_BIT, { FEAT_7_0_EDX, CPUID_7_0_EDX_AMX_BF16 }}, 5138c94c84cSXiaoyao Li { XSTATE_XTILE_CFG_BIT, { FEAT_7_0_EDX, CPUID_7_0_EDX_AMX_TILE }}, 5148c94c84cSXiaoyao Li { XSTATE_XTILE_CFG_BIT, { FEAT_7_0_EDX, CPUID_7_0_EDX_AMX_INT8 }}, 5158c94c84cSXiaoyao Li }; 5168c94c84cSXiaoyao Li 5170ba06e46SXiaoyao Li static struct kvm_cpuid_entry2 *find_in_supported_entry(uint32_t function, 5180ba06e46SXiaoyao Li uint32_t index) 5190ba06e46SXiaoyao Li { 5200ba06e46SXiaoyao Li struct kvm_cpuid_entry2 *e; 5210ba06e46SXiaoyao Li 5220ba06e46SXiaoyao Li e = cpuid_find_entry(tdx_supported_cpuid, function, index); 5230ba06e46SXiaoyao Li if (!e) { 5240ba06e46SXiaoyao Li if (tdx_supported_cpuid->nent >= KVM_MAX_CPUID_ENTRIES) { 5250ba06e46SXiaoyao Li error_report("tdx_supported_cpuid requries more space than %d entries", 5260ba06e46SXiaoyao Li KVM_MAX_CPUID_ENTRIES); 5270ba06e46SXiaoyao Li exit(1); 5280ba06e46SXiaoyao Li } 5290ba06e46SXiaoyao Li e = &tdx_supported_cpuid->entries[tdx_supported_cpuid->nent++]; 5300ba06e46SXiaoyao Li e->function = function; 5310ba06e46SXiaoyao Li e->index = index; 5320ba06e46SXiaoyao Li } 5330ba06e46SXiaoyao Li 5340ba06e46SXiaoyao Li return e; 5350ba06e46SXiaoyao Li } 5360ba06e46SXiaoyao Li 5370ba06e46SXiaoyao Li static void tdx_add_supported_cpuid_by_fixed1_bits(void) 5380ba06e46SXiaoyao Li { 5390ba06e46SXiaoyao Li struct kvm_cpuid_entry2 *e, *e1; 5400ba06e46SXiaoyao Li int i; 5410ba06e46SXiaoyao Li 5420ba06e46SXiaoyao Li for (i = 0; i < tdx_fixed1_bits.cpuid.nent; i++) { 5430ba06e46SXiaoyao Li e = &tdx_fixed1_bits.entries[i]; 5440ba06e46SXiaoyao Li 5450ba06e46SXiaoyao Li e1 = find_in_supported_entry(e->function, e->index); 5460ba06e46SXiaoyao Li e1->eax |= e->eax; 5470ba06e46SXiaoyao Li e1->ebx |= e->ebx; 5480ba06e46SXiaoyao Li e1->ecx |= e->ecx; 5490ba06e46SXiaoyao Li e1->edx |= e->edx; 5500ba06e46SXiaoyao Li } 5510ba06e46SXiaoyao Li } 5520ba06e46SXiaoyao Li 55331df29c5SXiaoyao Li static void tdx_add_supported_cpuid_by_attrs(void) 55431df29c5SXiaoyao Li { 55531df29c5SXiaoyao Li struct kvm_cpuid_entry2 *e; 55631df29c5SXiaoyao Li TdxAttrsMap *map; 55731df29c5SXiaoyao Li int i; 55831df29c5SXiaoyao Li 55931df29c5SXiaoyao Li for (i = 0; i < ARRAY_SIZE(tdx_attrs_maps); i++) { 56031df29c5SXiaoyao Li map = &tdx_attrs_maps[i]; 56131df29c5SXiaoyao Li if (!((1ULL << map->attr_index) & tdx_caps->supported_attrs)) { 56231df29c5SXiaoyao Li continue; 56331df29c5SXiaoyao Li } 56431df29c5SXiaoyao Li 56531df29c5SXiaoyao Li e = find_in_supported_entry(map->cpuid_leaf, map->cpuid_subleaf); 56631df29c5SXiaoyao Li 56731df29c5SXiaoyao Li switch(map->cpuid_reg) { 56831df29c5SXiaoyao Li case R_EAX: 56931df29c5SXiaoyao Li e->eax |= map->feat_mask; 57031df29c5SXiaoyao Li break; 57131df29c5SXiaoyao Li case R_EBX: 57231df29c5SXiaoyao Li e->ebx |= map->feat_mask; 57331df29c5SXiaoyao Li break; 57431df29c5SXiaoyao Li case R_ECX: 57531df29c5SXiaoyao Li e->ecx |= map->feat_mask; 57631df29c5SXiaoyao Li break; 57731df29c5SXiaoyao Li case R_EDX: 57831df29c5SXiaoyao Li e->edx |= map->feat_mask; 57931df29c5SXiaoyao Li break; 58031df29c5SXiaoyao Li } 58131df29c5SXiaoyao Li } 58231df29c5SXiaoyao Li } 58331df29c5SXiaoyao Li 5848c94c84cSXiaoyao Li static void tdx_add_supported_cpuid_by_xfam(void) 5858c94c84cSXiaoyao Li { 5868c94c84cSXiaoyao Li struct kvm_cpuid_entry2 *e; 5878c94c84cSXiaoyao Li int i; 5888c94c84cSXiaoyao Li 5898c94c84cSXiaoyao Li const TdxXFAMDep *xfam_dep; 5908c94c84cSXiaoyao Li const FeatureWordInfo *f; 5918c94c84cSXiaoyao Li for (i = 0; i < ARRAY_SIZE(tdx_xfam_deps); i++) { 5928c94c84cSXiaoyao Li xfam_dep = &tdx_xfam_deps[i]; 5938c94c84cSXiaoyao Li if (!((1ULL << xfam_dep->xfam_bit) & tdx_caps->supported_xfam)) { 5948c94c84cSXiaoyao Li continue; 5958c94c84cSXiaoyao Li } 5968c94c84cSXiaoyao Li 5978c94c84cSXiaoyao Li f = &feature_word_info[xfam_dep->feat_mask.index]; 5988c94c84cSXiaoyao Li if (f->type != CPUID_FEATURE_WORD) { 5998c94c84cSXiaoyao Li continue; 6008c94c84cSXiaoyao Li } 6018c94c84cSXiaoyao Li 6028c94c84cSXiaoyao Li e = find_in_supported_entry(f->cpuid.eax, f->cpuid.ecx); 6038c94c84cSXiaoyao Li switch(f->cpuid.reg) { 6048c94c84cSXiaoyao Li case R_EAX: 6058c94c84cSXiaoyao Li e->eax |= xfam_dep->feat_mask.mask; 6068c94c84cSXiaoyao Li break; 6078c94c84cSXiaoyao Li case R_EBX: 6088c94c84cSXiaoyao Li e->ebx |= xfam_dep->feat_mask.mask; 6098c94c84cSXiaoyao Li break; 6108c94c84cSXiaoyao Li case R_ECX: 6118c94c84cSXiaoyao Li e->ecx |= xfam_dep->feat_mask.mask; 6128c94c84cSXiaoyao Li break; 6138c94c84cSXiaoyao Li case R_EDX: 6148c94c84cSXiaoyao Li e->edx |= xfam_dep->feat_mask.mask; 6158c94c84cSXiaoyao Li break; 6168c94c84cSXiaoyao Li } 6178c94c84cSXiaoyao Li } 6188c94c84cSXiaoyao Li 6198c94c84cSXiaoyao Li e = find_in_supported_entry(0xd, 0); 6208c94c84cSXiaoyao Li e->eax |= (tdx_caps->supported_xfam & CPUID_XSTATE_XCR0_MASK); 6218c94c84cSXiaoyao Li e->edx |= (tdx_caps->supported_xfam & CPUID_XSTATE_XCR0_MASK) >> 32; 6228c94c84cSXiaoyao Li 6238c94c84cSXiaoyao Li e = find_in_supported_entry(0xd, 1); 624*9f5771c5SXiaoyao Li /* 625*9f5771c5SXiaoyao Li * Mark XFD always support for TDX, it will be cleared finally in 626*9f5771c5SXiaoyao Li * tdx_adjust_cpuid_features() if XFD is unavailable on the hardware 627*9f5771c5SXiaoyao Li * because in this case the original data has it as 0. 628*9f5771c5SXiaoyao Li */ 629*9f5771c5SXiaoyao Li e->eax |= CPUID_XSAVE_XFD; 6308c94c84cSXiaoyao Li e->ecx |= (tdx_caps->supported_xfam & CPUID_XSTATE_XSS_MASK); 6318c94c84cSXiaoyao Li e->edx |= (tdx_caps->supported_xfam & CPUID_XSTATE_XSS_MASK) >> 32; 6328c94c84cSXiaoyao Li } 6338c94c84cSXiaoyao Li 63475ec6189SXiaoyao Li static void tdx_setup_supported_cpuid(void) 63575ec6189SXiaoyao Li { 63675ec6189SXiaoyao Li if (tdx_supported_cpuid) { 63775ec6189SXiaoyao Li return; 63875ec6189SXiaoyao Li } 63975ec6189SXiaoyao Li 64075ec6189SXiaoyao Li tdx_supported_cpuid = g_malloc0(sizeof(*tdx_supported_cpuid) + 64175ec6189SXiaoyao Li KVM_MAX_CPUID_ENTRIES * sizeof(struct kvm_cpuid_entry2)); 64275ec6189SXiaoyao Li 64375ec6189SXiaoyao Li memcpy(tdx_supported_cpuid->entries, tdx_caps->cpuid.entries, 64475ec6189SXiaoyao Li tdx_caps->cpuid.nent * sizeof(struct kvm_cpuid_entry2)); 64575ec6189SXiaoyao Li tdx_supported_cpuid->nent = tdx_caps->cpuid.nent; 6460ba06e46SXiaoyao Li 6470ba06e46SXiaoyao Li tdx_add_supported_cpuid_by_fixed1_bits(); 64831df29c5SXiaoyao Li tdx_add_supported_cpuid_by_attrs(); 6498c94c84cSXiaoyao Li tdx_add_supported_cpuid_by_xfam(); 65075ec6189SXiaoyao Li } 65175ec6189SXiaoyao Li 6528eddedc3SXiaoyao Li static int tdx_kvm_init(ConfidentialGuestSupport *cgs, Error **errp) 6538eddedc3SXiaoyao Li { 654810d4e83SXiaoyao Li MachineState *ms = MACHINE(qdev_get_machine()); 655810d4e83SXiaoyao Li X86MachineState *x86ms = X86_MACHINE(ms); 6561619d0e4SXiaoyao Li TdxGuest *tdx = TDX_GUEST(cgs); 6578eddedc3SXiaoyao Li int r = 0; 6588eddedc3SXiaoyao Li 6598eddedc3SXiaoyao Li kvm_mark_guest_state_protected(); 6608eddedc3SXiaoyao Li 661810d4e83SXiaoyao Li if (x86ms->smm == ON_OFF_AUTO_AUTO) { 662810d4e83SXiaoyao Li x86ms->smm = ON_OFF_AUTO_OFF; 663810d4e83SXiaoyao Li } else if (x86ms->smm == ON_OFF_AUTO_ON) { 664810d4e83SXiaoyao Li error_setg(errp, "TDX VM doesn't support SMM"); 665810d4e83SXiaoyao Li return -EINVAL; 666810d4e83SXiaoyao Li } 667810d4e83SXiaoyao Li 668e7ef6089SXiaoyao Li if (x86ms->pic == ON_OFF_AUTO_AUTO) { 669e7ef6089SXiaoyao Li x86ms->pic = ON_OFF_AUTO_OFF; 670e7ef6089SXiaoyao Li } else if (x86ms->pic == ON_OFF_AUTO_ON) { 671e7ef6089SXiaoyao Li error_setg(errp, "TDX VM doesn't support PIC"); 672e7ef6089SXiaoyao Li return -EINVAL; 673e7ef6089SXiaoyao Li } 674e7ef6089SXiaoyao Li 675bb45580dSXiaoyao Li if (kvm_state->kernel_irqchip_split == ON_OFF_AUTO_AUTO) { 676bb45580dSXiaoyao Li kvm_state->kernel_irqchip_split = ON_OFF_AUTO_ON; 677bb45580dSXiaoyao Li } else if (kvm_state->kernel_irqchip_split != ON_OFF_AUTO_ON) { 678bb45580dSXiaoyao Li error_setg(errp, "TDX VM requires kernel_irqchip to be split"); 679bb45580dSXiaoyao Li return -EINVAL; 680bb45580dSXiaoyao Li } 681bb45580dSXiaoyao Li 6828eddedc3SXiaoyao Li if (!tdx_caps) { 6838eddedc3SXiaoyao Li r = get_tdx_capabilities(errp); 6841619d0e4SXiaoyao Li if (r) { 6851619d0e4SXiaoyao Li return r; 6861619d0e4SXiaoyao Li } 6878eddedc3SXiaoyao Li } 6888eddedc3SXiaoyao Li 68975ec6189SXiaoyao Li tdx_setup_supported_cpuid(); 69075ec6189SXiaoyao Li 6911ff5048dSXiaoyao Li /* TDX relies on KVM_HC_MAP_GPA_RANGE to handle TDG.VP.VMCALL<MapGPA> */ 6921ff5048dSXiaoyao Li if (!kvm_enable_hypercall(BIT_ULL(KVM_HC_MAP_GPA_RANGE))) { 6931ff5048dSXiaoyao Li return -EOPNOTSUPP; 6941ff5048dSXiaoyao Li } 6951ff5048dSXiaoyao Li 696da672865SXiaoyao Li /* 697da672865SXiaoyao Li * Set kvm_readonly_mem_allowed to false, because TDX only supports readonly 698da672865SXiaoyao Li * memory for shared memory but not for private memory. Besides, whether a 699da672865SXiaoyao Li * memslot is private or shared is not determined by QEMU. 700da672865SXiaoyao Li * 701da672865SXiaoyao Li * Thus, just mark readonly memory not supported for simplicity. 702da672865SXiaoyao Li */ 703da672865SXiaoyao Li kvm_readonly_mem_allowed = false; 704da672865SXiaoyao Li 7054420ba0eSXiaoyao Li qemu_add_machine_init_done_notifier(&tdx_machine_done_notify); 7064420ba0eSXiaoyao Li 7071619d0e4SXiaoyao Li tdx_guest = tdx; 7081619d0e4SXiaoyao Li return 0; 7098eddedc3SXiaoyao Li } 7108eddedc3SXiaoyao Li 711b455880eSXiaoyao Li static int tdx_kvm_type(X86ConfidentialGuest *cg) 712b455880eSXiaoyao Li { 713b455880eSXiaoyao Li /* Do the object check */ 714b455880eSXiaoyao Li TDX_GUEST(cg); 715b455880eSXiaoyao Li 716b455880eSXiaoyao Li return KVM_X86_TDX_VM; 717b455880eSXiaoyao Li } 718b455880eSXiaoyao Li 7197c615242SXiaoyao Li static void tdx_cpu_instance_init(X86ConfidentialGuest *cg, CPUState *cpu) 7207c615242SXiaoyao Li { 7219002494fSXiaoyao Li X86CPU *x86cpu = X86_CPU(cpu); 7229002494fSXiaoyao Li 7237c615242SXiaoyao Li object_property_set_bool(OBJECT(cpu), "pmu", false, &error_abort); 7249002494fSXiaoyao Li 7259002494fSXiaoyao Li x86cpu->enable_cpuid_0x1f = true; 7267c615242SXiaoyao Li } 7277c615242SXiaoyao Li 72875ec6189SXiaoyao Li static uint32_t tdx_adjust_cpuid_features(X86ConfidentialGuest *cg, 72975ec6189SXiaoyao Li uint32_t feature, uint32_t index, 73075ec6189SXiaoyao Li int reg, uint32_t value) 73175ec6189SXiaoyao Li { 73275ec6189SXiaoyao Li struct kvm_cpuid_entry2 *e; 73375ec6189SXiaoyao Li 7340ba06e46SXiaoyao Li e = cpuid_find_entry(&tdx_fixed1_bits.cpuid, feature, index); 7350ba06e46SXiaoyao Li if (e) { 7360ba06e46SXiaoyao Li value |= cpuid_entry_get_reg(e, reg); 7370ba06e46SXiaoyao Li } 7380ba06e46SXiaoyao Li 73975ec6189SXiaoyao Li if (is_feature_word_cpuid(feature, index, reg)) { 74075ec6189SXiaoyao Li e = cpuid_find_entry(tdx_supported_cpuid, feature, index); 74175ec6189SXiaoyao Li if (e) { 74275ec6189SXiaoyao Li value &= cpuid_entry_get_reg(e, reg); 74375ec6189SXiaoyao Li } 74475ec6189SXiaoyao Li } 74575ec6189SXiaoyao Li 74675ec6189SXiaoyao Li return value; 74775ec6189SXiaoyao Li } 74875ec6189SXiaoyao Li 74953b6f406SXiaoyao Li static int tdx_validate_attributes(TdxGuest *tdx, Error **errp) 75053b6f406SXiaoyao Li { 75153b6f406SXiaoyao Li if ((tdx->attributes & ~tdx_caps->supported_attrs)) { 75253b6f406SXiaoyao Li error_setg(errp, "Invalid attributes 0x%lx for TDX VM " 75353b6f406SXiaoyao Li "(KVM supported: 0x%llx)", tdx->attributes, 75453b6f406SXiaoyao Li tdx_caps->supported_attrs); 75553b6f406SXiaoyao Li return -1; 75653b6f406SXiaoyao Li } 75753b6f406SXiaoyao Li 75853b6f406SXiaoyao Li if (tdx->attributes & ~TDX_SUPPORTED_TD_ATTRS) { 75953b6f406SXiaoyao Li error_setg(errp, "Some QEMU unsupported TD attribute bits being " 76053b6f406SXiaoyao Li "requested: 0x%lx (QEMU supported: 0x%llx)", 76153b6f406SXiaoyao Li tdx->attributes, TDX_SUPPORTED_TD_ATTRS); 76253b6f406SXiaoyao Li return -1; 76353b6f406SXiaoyao Li } 76453b6f406SXiaoyao Li 76553b6f406SXiaoyao Li return 0; 76653b6f406SXiaoyao Li } 76753b6f406SXiaoyao Li 76853b6f406SXiaoyao Li static int setup_td_guest_attributes(X86CPU *x86cpu, Error **errp) 769bb3be394SXiaoyao Li { 770bb3be394SXiaoyao Li CPUX86State *env = &x86cpu->env; 771bb3be394SXiaoyao Li 772bb3be394SXiaoyao Li tdx_guest->attributes |= (env->features[FEAT_7_0_ECX] & CPUID_7_0_ECX_PKS) ? 773bb3be394SXiaoyao Li TDX_TD_ATTRIBUTES_PKS : 0; 774bb3be394SXiaoyao Li tdx_guest->attributes |= x86cpu->enable_pmu ? TDX_TD_ATTRIBUTES_PERFMON : 0; 77553b6f406SXiaoyao Li 77653b6f406SXiaoyao Li return tdx_validate_attributes(tdx_guest, errp); 777bb3be394SXiaoyao Li } 778bb3be394SXiaoyao Li 779f15898b0SXiaoyao Li static int setup_td_xfam(X86CPU *x86cpu, Error **errp) 780f15898b0SXiaoyao Li { 781f15898b0SXiaoyao Li CPUX86State *env = &x86cpu->env; 782f15898b0SXiaoyao Li uint64_t xfam; 783f15898b0SXiaoyao Li 784f15898b0SXiaoyao Li xfam = env->features[FEAT_XSAVE_XCR0_LO] | 785f15898b0SXiaoyao Li env->features[FEAT_XSAVE_XCR0_HI] | 786f15898b0SXiaoyao Li env->features[FEAT_XSAVE_XSS_LO] | 787f15898b0SXiaoyao Li env->features[FEAT_XSAVE_XSS_HI]; 788f15898b0SXiaoyao Li 789f15898b0SXiaoyao Li if (xfam & ~tdx_caps->supported_xfam) { 790f15898b0SXiaoyao Li error_setg(errp, "Invalid XFAM 0x%lx for TDX VM (supported: 0x%llx))", 791f15898b0SXiaoyao Li xfam, tdx_caps->supported_xfam); 792f15898b0SXiaoyao Li return -1; 793f15898b0SXiaoyao Li } 794f15898b0SXiaoyao Li 795f15898b0SXiaoyao Li tdx_guest->xfam = xfam; 796f15898b0SXiaoyao Li return 0; 797f15898b0SXiaoyao Li } 798f15898b0SXiaoyao Li 799f15898b0SXiaoyao Li static void tdx_filter_cpuid(struct kvm_cpuid2 *cpuids) 800f15898b0SXiaoyao Li { 801f15898b0SXiaoyao Li int i, dest_cnt = 0; 802f15898b0SXiaoyao Li struct kvm_cpuid_entry2 *src, *dest, *conf; 803f15898b0SXiaoyao Li 804f15898b0SXiaoyao Li for (i = 0; i < cpuids->nent; i++) { 805f15898b0SXiaoyao Li src = cpuids->entries + i; 806f15898b0SXiaoyao Li conf = cpuid_find_entry(&tdx_caps->cpuid, src->function, src->index); 807f15898b0SXiaoyao Li if (!conf) { 808f15898b0SXiaoyao Li continue; 809f15898b0SXiaoyao Li } 810f15898b0SXiaoyao Li dest = cpuids->entries + dest_cnt; 811f15898b0SXiaoyao Li 812f15898b0SXiaoyao Li dest->function = src->function; 813f15898b0SXiaoyao Li dest->index = src->index; 814f15898b0SXiaoyao Li dest->flags = src->flags; 815f15898b0SXiaoyao Li dest->eax = src->eax & conf->eax; 816f15898b0SXiaoyao Li dest->ebx = src->ebx & conf->ebx; 817f15898b0SXiaoyao Li dest->ecx = src->ecx & conf->ecx; 818f15898b0SXiaoyao Li dest->edx = src->edx & conf->edx; 819f15898b0SXiaoyao Li 820f15898b0SXiaoyao Li dest_cnt++; 821f15898b0SXiaoyao Li } 822f15898b0SXiaoyao Li cpuids->nent = dest_cnt++; 823f15898b0SXiaoyao Li } 824f15898b0SXiaoyao Li 825f15898b0SXiaoyao Li int tdx_pre_create_vcpu(CPUState *cpu, Error **errp) 826f15898b0SXiaoyao Li { 827f15898b0SXiaoyao Li X86CPU *x86cpu = X86_CPU(cpu); 828f15898b0SXiaoyao Li CPUX86State *env = &x86cpu->env; 829f15898b0SXiaoyao Li g_autofree struct kvm_tdx_init_vm *init_vm = NULL; 830f15898b0SXiaoyao Li Error *local_err = NULL; 831d05a0858SIsaku Yamahata size_t data_len; 832f15898b0SXiaoyao Li int retry = 10000; 833f15898b0SXiaoyao Li int r = 0; 834f15898b0SXiaoyao Li 835f15898b0SXiaoyao Li QEMU_LOCK_GUARD(&tdx_guest->lock); 836f15898b0SXiaoyao Li if (tdx_guest->initialized) { 837f15898b0SXiaoyao Li return r; 838f15898b0SXiaoyao Li } 839f15898b0SXiaoyao Li 840f15898b0SXiaoyao Li init_vm = g_malloc0(sizeof(struct kvm_tdx_init_vm) + 841f15898b0SXiaoyao Li sizeof(struct kvm_cpuid_entry2) * KVM_MAX_CPUID_ENTRIES); 842f15898b0SXiaoyao Li 843d529a2acSXiaoyao Li if (!kvm_check_extension(kvm_state, KVM_CAP_X86_APIC_BUS_CYCLES_NS)) { 844d529a2acSXiaoyao Li error_setg(errp, "KVM doesn't support KVM_CAP_X86_APIC_BUS_CYCLES_NS"); 845d529a2acSXiaoyao Li return -EOPNOTSUPP; 846d529a2acSXiaoyao Li } 847d529a2acSXiaoyao Li 848d529a2acSXiaoyao Li r = kvm_vm_enable_cap(kvm_state, KVM_CAP_X86_APIC_BUS_CYCLES_NS, 849d529a2acSXiaoyao Li 0, TDX_APIC_BUS_CYCLES_NS); 850d529a2acSXiaoyao Li if (r < 0) { 851d529a2acSXiaoyao Li error_setg_errno(errp, -r, 852d529a2acSXiaoyao Li "Unable to set core crystal clock frequency to 25MHz"); 853d529a2acSXiaoyao Li return r; 854d529a2acSXiaoyao Li } 855d529a2acSXiaoyao Li 8560e73b843SXiaoyao Li if (env->tsc_khz && (env->tsc_khz < TDX_MIN_TSC_FREQUENCY_KHZ || 8570e73b843SXiaoyao Li env->tsc_khz > TDX_MAX_TSC_FREQUENCY_KHZ)) { 8580e73b843SXiaoyao Li error_setg(errp, "Invalid TSC %ld KHz, must specify cpu_frequency " 8590e73b843SXiaoyao Li "between [%d, %d] kHz", env->tsc_khz, 8600e73b843SXiaoyao Li TDX_MIN_TSC_FREQUENCY_KHZ, TDX_MAX_TSC_FREQUENCY_KHZ); 8610e73b843SXiaoyao Li return -EINVAL; 8620e73b843SXiaoyao Li } 8630e73b843SXiaoyao Li 8640e73b843SXiaoyao Li if (env->tsc_khz % (25 * 1000)) { 8650e73b843SXiaoyao Li error_setg(errp, "Invalid TSC %ld KHz, it must be multiple of 25MHz", 8660e73b843SXiaoyao Li env->tsc_khz); 8670e73b843SXiaoyao Li return -EINVAL; 8680e73b843SXiaoyao Li } 8690e73b843SXiaoyao Li 8700e73b843SXiaoyao Li /* it's safe even env->tsc_khz is 0. KVM uses host's tsc_khz in this case */ 8710e73b843SXiaoyao Li r = kvm_vm_ioctl(kvm_state, KVM_SET_TSC_KHZ, env->tsc_khz); 8720e73b843SXiaoyao Li if (r < 0) { 8730e73b843SXiaoyao Li error_setg_errno(errp, -r, "Unable to set TSC frequency to %ld kHz", 8740e73b843SXiaoyao Li env->tsc_khz); 8750e73b843SXiaoyao Li return r; 8760e73b843SXiaoyao Li } 8770e73b843SXiaoyao Li 878d05a0858SIsaku Yamahata if (tdx_guest->mrconfigid) { 879d05a0858SIsaku Yamahata g_autofree uint8_t *data = qbase64_decode(tdx_guest->mrconfigid, 880d05a0858SIsaku Yamahata strlen(tdx_guest->mrconfigid), &data_len, errp); 881d05a0858SIsaku Yamahata if (!data) { 882d05a0858SIsaku Yamahata return -1; 883d05a0858SIsaku Yamahata } 884d05a0858SIsaku Yamahata if (data_len != QCRYPTO_HASH_DIGEST_LEN_SHA384) { 885d05a0858SIsaku Yamahata error_setg(errp, "TDX: failed to decode mrconfigid"); 886d05a0858SIsaku Yamahata return -1; 887d05a0858SIsaku Yamahata } 888d05a0858SIsaku Yamahata memcpy(init_vm->mrconfigid, data, data_len); 889d05a0858SIsaku Yamahata } 890d05a0858SIsaku Yamahata 891d05a0858SIsaku Yamahata if (tdx_guest->mrowner) { 892d05a0858SIsaku Yamahata g_autofree uint8_t *data = qbase64_decode(tdx_guest->mrowner, 893d05a0858SIsaku Yamahata strlen(tdx_guest->mrowner), &data_len, errp); 894d05a0858SIsaku Yamahata if (!data) { 895d05a0858SIsaku Yamahata return -1; 896d05a0858SIsaku Yamahata } 897d05a0858SIsaku Yamahata if (data_len != QCRYPTO_HASH_DIGEST_LEN_SHA384) { 898d05a0858SIsaku Yamahata error_setg(errp, "TDX: failed to decode mrowner"); 899d05a0858SIsaku Yamahata return -1; 900d05a0858SIsaku Yamahata } 901d05a0858SIsaku Yamahata memcpy(init_vm->mrowner, data, data_len); 902d05a0858SIsaku Yamahata } 903d05a0858SIsaku Yamahata 904d05a0858SIsaku Yamahata if (tdx_guest->mrownerconfig) { 905d05a0858SIsaku Yamahata g_autofree uint8_t *data = qbase64_decode(tdx_guest->mrownerconfig, 906d05a0858SIsaku Yamahata strlen(tdx_guest->mrownerconfig), &data_len, errp); 907d05a0858SIsaku Yamahata if (!data) { 908d05a0858SIsaku Yamahata return -1; 909d05a0858SIsaku Yamahata } 910d05a0858SIsaku Yamahata if (data_len != QCRYPTO_HASH_DIGEST_LEN_SHA384) { 911d05a0858SIsaku Yamahata error_setg(errp, "TDX: failed to decode mrownerconfig"); 912d05a0858SIsaku Yamahata return -1; 913d05a0858SIsaku Yamahata } 914d05a0858SIsaku Yamahata memcpy(init_vm->mrownerconfig, data, data_len); 915d05a0858SIsaku Yamahata } 916d05a0858SIsaku Yamahata 91753b6f406SXiaoyao Li r = setup_td_guest_attributes(x86cpu, errp); 91853b6f406SXiaoyao Li if (r) { 91953b6f406SXiaoyao Li return r; 92053b6f406SXiaoyao Li } 921bb3be394SXiaoyao Li 922f15898b0SXiaoyao Li r = setup_td_xfam(x86cpu, errp); 923f15898b0SXiaoyao Li if (r) { 924f15898b0SXiaoyao Li return r; 925f15898b0SXiaoyao Li } 926f15898b0SXiaoyao Li 927f15898b0SXiaoyao Li init_vm->cpuid.nent = kvm_x86_build_cpuid(env, init_vm->cpuid.entries, 0); 928f15898b0SXiaoyao Li tdx_filter_cpuid(&init_vm->cpuid); 929f15898b0SXiaoyao Li 930f15898b0SXiaoyao Li init_vm->attributes = tdx_guest->attributes; 931f15898b0SXiaoyao Li init_vm->xfam = tdx_guest->xfam; 932f15898b0SXiaoyao Li 933f15898b0SXiaoyao Li /* 934f15898b0SXiaoyao Li * KVM_TDX_INIT_VM gets -EAGAIN when KVM side SEAMCALL(TDH_MNG_CREATE) 935f15898b0SXiaoyao Li * gets TDX_RND_NO_ENTROPY due to Random number generation (e.g., RDRAND or 936f15898b0SXiaoyao Li * RDSEED) is busy. 937f15898b0SXiaoyao Li * 938f15898b0SXiaoyao Li * Retry for the case. 939f15898b0SXiaoyao Li */ 940f15898b0SXiaoyao Li do { 941f15898b0SXiaoyao Li error_free(local_err); 942f15898b0SXiaoyao Li local_err = NULL; 943f15898b0SXiaoyao Li r = tdx_vm_ioctl(KVM_TDX_INIT_VM, 0, init_vm, &local_err); 944f15898b0SXiaoyao Li } while (r == -EAGAIN && --retry); 945f15898b0SXiaoyao Li 946f15898b0SXiaoyao Li if (r < 0) { 947f15898b0SXiaoyao Li if (!retry) { 948f15898b0SXiaoyao Li error_append_hint(&local_err, "Hardware RNG (Random Number " 949f15898b0SXiaoyao Li "Generator) is busy occupied by someone (via RDRAND/RDSEED) " 950f15898b0SXiaoyao Li "maliciously, which leads to KVM_TDX_INIT_VM keeping failure " 951f15898b0SXiaoyao Li "due to lack of entropy.\n"); 952f15898b0SXiaoyao Li } 953f15898b0SXiaoyao Li error_propagate(errp, local_err); 954f15898b0SXiaoyao Li return r; 955f15898b0SXiaoyao Li } 956f15898b0SXiaoyao Li 957f15898b0SXiaoyao Li tdx_guest->initialized = true; 958f15898b0SXiaoyao Li 959f15898b0SXiaoyao Li return 0; 960f15898b0SXiaoyao Li } 961f15898b0SXiaoyao Li 962cb5d65a8SXiaoyao Li int tdx_parse_tdvf(void *flash_ptr, int size) 963cb5d65a8SXiaoyao Li { 964cb5d65a8SXiaoyao Li return tdvf_parse_metadata(&tdx_guest->tdvf, flash_ptr, size); 965cb5d65a8SXiaoyao Li } 966cb5d65a8SXiaoyao Li 9676e250463SXiaoyao Li static void tdx_panicked_on_fatal_error(X86CPU *cpu, uint64_t error_code, 9686e250463SXiaoyao Li char *message, uint64_t gpa) 9696e250463SXiaoyao Li { 9706e250463SXiaoyao Li GuestPanicInformation *panic_info; 9716e250463SXiaoyao Li 9726e250463SXiaoyao Li panic_info = g_new0(GuestPanicInformation, 1); 9736e250463SXiaoyao Li panic_info->type = GUEST_PANIC_INFORMATION_TYPE_TDX; 9746e250463SXiaoyao Li panic_info->u.tdx.error_code = (uint32_t) error_code; 9756e250463SXiaoyao Li panic_info->u.tdx.message = message; 9766e250463SXiaoyao Li panic_info->u.tdx.gpa = gpa; 9776e250463SXiaoyao Li 9786e250463SXiaoyao Li qemu_system_guest_panicked(panic_info); 9796e250463SXiaoyao Li } 9806e250463SXiaoyao Li 98198dbfd68SXiaoyao Li /* 98298dbfd68SXiaoyao Li * Only 8 registers can contain valid ASCII byte stream to form the fatal 98398dbfd68SXiaoyao Li * message, and their sequence is: R14, R15, RBX, RDI, RSI, R8, R9, RDX 98498dbfd68SXiaoyao Li */ 98598dbfd68SXiaoyao Li #define TDX_FATAL_MESSAGE_MAX 64 98698dbfd68SXiaoyao Li 9876e250463SXiaoyao Li #define TDX_REPORT_FATAL_ERROR_GPA_VALID BIT_ULL(63) 9886e250463SXiaoyao Li 98998dbfd68SXiaoyao Li int tdx_handle_report_fatal_error(X86CPU *cpu, struct kvm_run *run) 99098dbfd68SXiaoyao Li { 99198dbfd68SXiaoyao Li uint64_t error_code = run->system_event.data[R_R12]; 99298dbfd68SXiaoyao Li uint64_t reg_mask = run->system_event.data[R_ECX]; 99398dbfd68SXiaoyao Li char *message = NULL; 99498dbfd68SXiaoyao Li uint64_t *tmp; 9956e250463SXiaoyao Li uint64_t gpa = -1ull; 99698dbfd68SXiaoyao Li 99798dbfd68SXiaoyao Li if (error_code & 0xffff) { 99898dbfd68SXiaoyao Li error_report("TDX: REPORT_FATAL_ERROR: invalid error code: 0x%lx", 99998dbfd68SXiaoyao Li error_code); 100098dbfd68SXiaoyao Li return -1; 100198dbfd68SXiaoyao Li } 100298dbfd68SXiaoyao Li 100398dbfd68SXiaoyao Li if (reg_mask) { 100498dbfd68SXiaoyao Li message = g_malloc0(TDX_FATAL_MESSAGE_MAX + 1); 100598dbfd68SXiaoyao Li tmp = (uint64_t *)message; 100698dbfd68SXiaoyao Li 100798dbfd68SXiaoyao Li #define COPY_REG(REG) \ 100898dbfd68SXiaoyao Li do { \ 100998dbfd68SXiaoyao Li if (reg_mask & BIT_ULL(REG)) { \ 101098dbfd68SXiaoyao Li *(tmp++) = run->system_event.data[REG]; \ 101198dbfd68SXiaoyao Li } \ 101298dbfd68SXiaoyao Li } while (0) 101398dbfd68SXiaoyao Li 101498dbfd68SXiaoyao Li COPY_REG(R_R14); 101598dbfd68SXiaoyao Li COPY_REG(R_R15); 101698dbfd68SXiaoyao Li COPY_REG(R_EBX); 101798dbfd68SXiaoyao Li COPY_REG(R_EDI); 101898dbfd68SXiaoyao Li COPY_REG(R_ESI); 101998dbfd68SXiaoyao Li COPY_REG(R_R8); 102098dbfd68SXiaoyao Li COPY_REG(R_R9); 102198dbfd68SXiaoyao Li COPY_REG(R_EDX); 102298dbfd68SXiaoyao Li *((char *)tmp) = '\0'; 102398dbfd68SXiaoyao Li } 102498dbfd68SXiaoyao Li #undef COPY_REG 102598dbfd68SXiaoyao Li 10266e250463SXiaoyao Li if (error_code & TDX_REPORT_FATAL_ERROR_GPA_VALID) { 10276e250463SXiaoyao Li gpa = run->system_event.data[R_R13]; 10286e250463SXiaoyao Li } 10296e250463SXiaoyao Li 10306e250463SXiaoyao Li tdx_panicked_on_fatal_error(cpu, error_code, message, gpa); 10316e250463SXiaoyao Li 103298dbfd68SXiaoyao Li return -1; 103398dbfd68SXiaoyao Li } 103498dbfd68SXiaoyao Li 10356016e297SXiaoyao Li static bool tdx_guest_get_sept_ve_disable(Object *obj, Error **errp) 10366016e297SXiaoyao Li { 10376016e297SXiaoyao Li TdxGuest *tdx = TDX_GUEST(obj); 10386016e297SXiaoyao Li 10396016e297SXiaoyao Li return !!(tdx->attributes & TDX_TD_ATTRIBUTES_SEPT_VE_DISABLE); 10406016e297SXiaoyao Li } 10416016e297SXiaoyao Li 10426016e297SXiaoyao Li static void tdx_guest_set_sept_ve_disable(Object *obj, bool value, Error **errp) 10436016e297SXiaoyao Li { 10446016e297SXiaoyao Li TdxGuest *tdx = TDX_GUEST(obj); 10456016e297SXiaoyao Li 10466016e297SXiaoyao Li if (value) { 10476016e297SXiaoyao Li tdx->attributes |= TDX_TD_ATTRIBUTES_SEPT_VE_DISABLE; 10486016e297SXiaoyao Li } else { 10496016e297SXiaoyao Li tdx->attributes &= ~TDX_TD_ATTRIBUTES_SEPT_VE_DISABLE; 10506016e297SXiaoyao Li } 10516016e297SXiaoyao Li } 10526016e297SXiaoyao Li 1053d05a0858SIsaku Yamahata static char *tdx_guest_get_mrconfigid(Object *obj, Error **errp) 1054d05a0858SIsaku Yamahata { 1055d05a0858SIsaku Yamahata TdxGuest *tdx = TDX_GUEST(obj); 1056d05a0858SIsaku Yamahata 1057d05a0858SIsaku Yamahata return g_strdup(tdx->mrconfigid); 1058d05a0858SIsaku Yamahata } 1059d05a0858SIsaku Yamahata 1060d05a0858SIsaku Yamahata static void tdx_guest_set_mrconfigid(Object *obj, const char *value, Error **errp) 1061d05a0858SIsaku Yamahata { 1062d05a0858SIsaku Yamahata TdxGuest *tdx = TDX_GUEST(obj); 1063d05a0858SIsaku Yamahata 1064d05a0858SIsaku Yamahata g_free(tdx->mrconfigid); 1065d05a0858SIsaku Yamahata tdx->mrconfigid = g_strdup(value); 1066d05a0858SIsaku Yamahata } 1067d05a0858SIsaku Yamahata 1068d05a0858SIsaku Yamahata static char *tdx_guest_get_mrowner(Object *obj, Error **errp) 1069d05a0858SIsaku Yamahata { 1070d05a0858SIsaku Yamahata TdxGuest *tdx = TDX_GUEST(obj); 1071d05a0858SIsaku Yamahata 1072d05a0858SIsaku Yamahata return g_strdup(tdx->mrowner); 1073d05a0858SIsaku Yamahata } 1074d05a0858SIsaku Yamahata 1075d05a0858SIsaku Yamahata static void tdx_guest_set_mrowner(Object *obj, const char *value, Error **errp) 1076d05a0858SIsaku Yamahata { 1077d05a0858SIsaku Yamahata TdxGuest *tdx = TDX_GUEST(obj); 1078d05a0858SIsaku Yamahata 1079d05a0858SIsaku Yamahata g_free(tdx->mrowner); 1080d05a0858SIsaku Yamahata tdx->mrowner = g_strdup(value); 1081d05a0858SIsaku Yamahata } 1082d05a0858SIsaku Yamahata 1083d05a0858SIsaku Yamahata static char *tdx_guest_get_mrownerconfig(Object *obj, Error **errp) 1084d05a0858SIsaku Yamahata { 1085d05a0858SIsaku Yamahata TdxGuest *tdx = TDX_GUEST(obj); 1086d05a0858SIsaku Yamahata 1087d05a0858SIsaku Yamahata return g_strdup(tdx->mrownerconfig); 1088d05a0858SIsaku Yamahata } 1089d05a0858SIsaku Yamahata 1090d05a0858SIsaku Yamahata static void tdx_guest_set_mrownerconfig(Object *obj, const char *value, Error **errp) 1091d05a0858SIsaku Yamahata { 1092d05a0858SIsaku Yamahata TdxGuest *tdx = TDX_GUEST(obj); 1093d05a0858SIsaku Yamahata 1094d05a0858SIsaku Yamahata g_free(tdx->mrownerconfig); 1095d05a0858SIsaku Yamahata tdx->mrownerconfig = g_strdup(value); 1096d05a0858SIsaku Yamahata } 1097d05a0858SIsaku Yamahata 1098756e12e7SXiaoyao Li /* tdx guest */ 1099756e12e7SXiaoyao Li OBJECT_DEFINE_TYPE_WITH_INTERFACES(TdxGuest, 1100756e12e7SXiaoyao Li tdx_guest, 1101756e12e7SXiaoyao Li TDX_GUEST, 1102756e12e7SXiaoyao Li X86_CONFIDENTIAL_GUEST, 1103756e12e7SXiaoyao Li { TYPE_USER_CREATABLE }, 1104756e12e7SXiaoyao Li { NULL }) 1105756e12e7SXiaoyao Li 1106756e12e7SXiaoyao Li static void tdx_guest_init(Object *obj) 1107756e12e7SXiaoyao Li { 1108756e12e7SXiaoyao Li ConfidentialGuestSupport *cgs = CONFIDENTIAL_GUEST_SUPPORT(obj); 1109756e12e7SXiaoyao Li TdxGuest *tdx = TDX_GUEST(obj); 1110756e12e7SXiaoyao Li 1111f15898b0SXiaoyao Li qemu_mutex_init(&tdx->lock); 1112f15898b0SXiaoyao Li 1113756e12e7SXiaoyao Li cgs->require_guest_memfd = true; 1114714af522SIsaku Yamahata tdx->attributes = TDX_TD_ATTRIBUTES_SEPT_VE_DISABLE; 1115756e12e7SXiaoyao Li 1116756e12e7SXiaoyao Li object_property_add_uint64_ptr(obj, "attributes", &tdx->attributes, 1117756e12e7SXiaoyao Li OBJ_PROP_FLAG_READWRITE); 11186016e297SXiaoyao Li object_property_add_bool(obj, "sept-ve-disable", 11196016e297SXiaoyao Li tdx_guest_get_sept_ve_disable, 11206016e297SXiaoyao Li tdx_guest_set_sept_ve_disable); 1121d05a0858SIsaku Yamahata object_property_add_str(obj, "mrconfigid", 1122d05a0858SIsaku Yamahata tdx_guest_get_mrconfigid, 1123d05a0858SIsaku Yamahata tdx_guest_set_mrconfigid); 1124d05a0858SIsaku Yamahata object_property_add_str(obj, "mrowner", 1125d05a0858SIsaku Yamahata tdx_guest_get_mrowner, tdx_guest_set_mrowner); 1126d05a0858SIsaku Yamahata object_property_add_str(obj, "mrownerconfig", 1127d05a0858SIsaku Yamahata tdx_guest_get_mrownerconfig, 1128d05a0858SIsaku Yamahata tdx_guest_set_mrownerconfig); 1129756e12e7SXiaoyao Li } 1130756e12e7SXiaoyao Li 1131756e12e7SXiaoyao Li static void tdx_guest_finalize(Object *obj) 1132756e12e7SXiaoyao Li { 1133756e12e7SXiaoyao Li } 1134756e12e7SXiaoyao Li 1135756e12e7SXiaoyao Li static void tdx_guest_class_init(ObjectClass *oc, const void *data) 1136756e12e7SXiaoyao Li { 1137631a2ac5SXiaoyao Li ConfidentialGuestSupportClass *klass = CONFIDENTIAL_GUEST_SUPPORT_CLASS(oc); 1138b455880eSXiaoyao Li X86ConfidentialGuestClass *x86_klass = X86_CONFIDENTIAL_GUEST_CLASS(oc); 1139b455880eSXiaoyao Li 1140631a2ac5SXiaoyao Li klass->kvm_init = tdx_kvm_init; 1141b455880eSXiaoyao Li x86_klass->kvm_type = tdx_kvm_type; 11427c615242SXiaoyao Li x86_klass->cpu_instance_init = tdx_cpu_instance_init; 114375ec6189SXiaoyao Li x86_klass->adjust_cpuid_features = tdx_adjust_cpuid_features; 1144756e12e7SXiaoyao Li } 1145