xref: /openbmc/qemu/target/i386/kvm/tdx.c (revision 9f5771c57dbe92d46361afd992a5851c846d0322)
1756e12e7SXiaoyao Li /*
2756e12e7SXiaoyao Li  * QEMU TDX support
3756e12e7SXiaoyao Li  *
4756e12e7SXiaoyao Li  * Copyright (c) 2025 Intel Corporation
5756e12e7SXiaoyao Li  *
6756e12e7SXiaoyao Li  * Author:
7756e12e7SXiaoyao Li  *      Xiaoyao Li <xiaoyao.li@intel.com>
8756e12e7SXiaoyao Li  *
9756e12e7SXiaoyao Li  * SPDX-License-Identifier: GPL-2.0-or-later
10756e12e7SXiaoyao Li  */
11756e12e7SXiaoyao Li 
12756e12e7SXiaoyao Li #include "qemu/osdep.h"
138eddedc3SXiaoyao Li #include "qemu/error-report.h"
14d05a0858SIsaku Yamahata #include "qemu/base64.h"
154420ba0eSXiaoyao Li #include "qemu/mmap-alloc.h"
168eddedc3SXiaoyao Li #include "qapi/error.h"
17756e12e7SXiaoyao Li #include "qom/object_interfaces.h"
18d05a0858SIsaku Yamahata #include "crypto/hash.h"
19bb45580dSXiaoyao Li #include "system/kvm_int.h"
206e250463SXiaoyao Li #include "system/runstate.h"
214420ba0eSXiaoyao Li #include "system/system.h"
22ebc2d2b4SIsaku Yamahata #include "system/ramblock.h"
23756e12e7SXiaoyao Li 
241ff5048dSXiaoyao Li #include <linux/kvm_para.h>
251ff5048dSXiaoyao Li 
268c94c84cSXiaoyao Li #include "cpu.h"
278c94c84cSXiaoyao Li #include "cpu-internal.h"
28f18672e4SXiaoyao Li #include "hw/i386/e820_memory_layout.h"
294420ba0eSXiaoyao Li #include "hw/i386/tdvf.h"
30631a2ac5SXiaoyao Li #include "hw/i386/x86.h"
31a7314259SXiaoyao Li #include "hw/i386/tdvf-hob.h"
32b455880eSXiaoyao Li #include "kvm_i386.h"
33756e12e7SXiaoyao Li #include "tdx.h"
34756e12e7SXiaoyao Li 
/* Bounds for a TD's TSC frequency, in kHz (100 MHz and 10 GHz). */
#define TDX_MIN_TSC_FREQUENCY_KHZ   (100 * 1000)
#define TDX_MAX_TSC_FREQUENCY_KHZ   (10 * 1000 * 1000)

/* Individual bits of the 64-bit TD attributes word. */
#define TDX_TD_ATTRIBUTES_DEBUG             BIT_ULL(0)
#define TDX_TD_ATTRIBUTES_SEPT_VE_DISABLE   BIT_ULL(28)
#define TDX_TD_ATTRIBUTES_PKS               BIT_ULL(30)
#define TDX_TD_ATTRIBUTES_PERFMON           BIT_ULL(63)

/*
 * Mask of the TD attribute bits listed as supported here.
 * Note that TDX_TD_ATTRIBUTES_DEBUG is not part of this mask.
 */
#define TDX_SUPPORTED_TD_ATTRS  (TDX_TD_ATTRIBUTES_SEPT_VE_DISABLE |\
                                 TDX_TD_ATTRIBUTES_PKS | \
                                 TDX_TD_ATTRIBUTES_PERFMON)

/* The TDX guest object of this VM; is_tdx_vm() reports whether it is set. */
static TdxGuest *tdx_guest;

/* Capabilities buffer stored by get_tdx_capabilities() on success. */
static struct kvm_tdx_capabilities *tdx_caps;
/* CPUID entries looked up and extended by find_in_supported_entry(). */
static struct kvm_cpuid2 *tdx_supported_cpuid;
518eddedc3SXiaoyao Li 
521619d0e4SXiaoyao Li /* Valid after kvm_arch_init()->confidential_guest_kvm_init()->tdx_kvm_init() */
531619d0e4SXiaoyao Li bool is_tdx_vm(void)
541619d0e4SXiaoyao Li {
551619d0e4SXiaoyao Li     return !!tdx_guest;
561619d0e4SXiaoyao Li }
571619d0e4SXiaoyao Li 
/*
 * Selects which KVM object tdx_ioctl_internal() sends a TDX command to.
 */
enum tdx_ioctl_level {
    /* Issue the command with kvm_vm_ioctl() on kvm_state. */
    TDX_VM_IOCTL,
    /* Issue the command with kvm_vcpu_ioctl() on the caller-supplied state. */
    TDX_VCPU_IOCTL,
};
628eddedc3SXiaoyao Li 
638eddedc3SXiaoyao Li static int tdx_ioctl_internal(enum tdx_ioctl_level level, void *state,
648eddedc3SXiaoyao Li                               int cmd_id, __u32 flags, void *data,
658eddedc3SXiaoyao Li                               Error **errp)
66631a2ac5SXiaoyao Li {
678eddedc3SXiaoyao Li     struct kvm_tdx_cmd tdx_cmd = {};
688eddedc3SXiaoyao Li     int r;
698eddedc3SXiaoyao Li 
708eddedc3SXiaoyao Li     const char *tdx_ioctl_name[] = {
718eddedc3SXiaoyao Li         [KVM_TDX_CAPABILITIES] = "KVM_TDX_CAPABILITIES",
728eddedc3SXiaoyao Li         [KVM_TDX_INIT_VM] = "KVM_TDX_INIT_VM",
738eddedc3SXiaoyao Li         [KVM_TDX_INIT_VCPU] = "KVM_TDX_INIT_VCPU",
748eddedc3SXiaoyao Li         [KVM_TDX_INIT_MEM_REGION] = "KVM_TDX_INIT_MEM_REGION",
758eddedc3SXiaoyao Li         [KVM_TDX_FINALIZE_VM] = "KVM_TDX_FINALIZE_VM",
768eddedc3SXiaoyao Li         [KVM_TDX_GET_CPUID] = "KVM_TDX_GET_CPUID",
778eddedc3SXiaoyao Li     };
788eddedc3SXiaoyao Li 
798eddedc3SXiaoyao Li     tdx_cmd.id = cmd_id;
808eddedc3SXiaoyao Li     tdx_cmd.flags = flags;
818eddedc3SXiaoyao Li     tdx_cmd.data = (__u64)(unsigned long)data;
828eddedc3SXiaoyao Li 
838eddedc3SXiaoyao Li     switch (level) {
848eddedc3SXiaoyao Li     case TDX_VM_IOCTL:
858eddedc3SXiaoyao Li         r = kvm_vm_ioctl(kvm_state, KVM_MEMORY_ENCRYPT_OP, &tdx_cmd);
868eddedc3SXiaoyao Li         break;
878eddedc3SXiaoyao Li     case TDX_VCPU_IOCTL:
888eddedc3SXiaoyao Li         r = kvm_vcpu_ioctl(state, KVM_MEMORY_ENCRYPT_OP, &tdx_cmd);
898eddedc3SXiaoyao Li         break;
908eddedc3SXiaoyao Li     default:
918eddedc3SXiaoyao Li         error_setg(errp, "Invalid tdx_ioctl_level %d", level);
928eddedc3SXiaoyao Li         return -EINVAL;
938eddedc3SXiaoyao Li     }
948eddedc3SXiaoyao Li 
958eddedc3SXiaoyao Li     if (r < 0) {
968eddedc3SXiaoyao Li         error_setg_errno(errp, -r, "TDX ioctl %s failed, hw_errors: 0x%llx",
978eddedc3SXiaoyao Li                          tdx_ioctl_name[cmd_id], tdx_cmd.hw_error);
988eddedc3SXiaoyao Li     }
998eddedc3SXiaoyao Li     return r;
1008eddedc3SXiaoyao Li }
1018eddedc3SXiaoyao Li 
1028eddedc3SXiaoyao Li static inline int tdx_vm_ioctl(int cmd_id, __u32 flags, void *data,
1038eddedc3SXiaoyao Li                                Error **errp)
1048eddedc3SXiaoyao Li {
1058eddedc3SXiaoyao Li     return tdx_ioctl_internal(TDX_VM_IOCTL, NULL, cmd_id, flags, data, errp);
1068eddedc3SXiaoyao Li }
1078eddedc3SXiaoyao Li 
1088eddedc3SXiaoyao Li static inline int tdx_vcpu_ioctl(CPUState *cpu, int cmd_id, __u32 flags,
1098eddedc3SXiaoyao Li                                  void *data, Error **errp)
1108eddedc3SXiaoyao Li {
1118eddedc3SXiaoyao Li     return  tdx_ioctl_internal(TDX_VCPU_IOCTL, cpu, cmd_id, flags, data, errp);
1128eddedc3SXiaoyao Li }
1138eddedc3SXiaoyao Li 
1148eddedc3SXiaoyao Li static int get_tdx_capabilities(Error **errp)
1158eddedc3SXiaoyao Li {
1168eddedc3SXiaoyao Li     struct kvm_tdx_capabilities *caps;
1178eddedc3SXiaoyao Li     /* 1st generation of TDX reports 6 cpuid configs */
1188eddedc3SXiaoyao Li     int nr_cpuid_configs = 6;
1198eddedc3SXiaoyao Li     size_t size;
1208eddedc3SXiaoyao Li     int r;
1218eddedc3SXiaoyao Li 
1228eddedc3SXiaoyao Li     do {
1238eddedc3SXiaoyao Li         Error *local_err = NULL;
1248eddedc3SXiaoyao Li         size = sizeof(struct kvm_tdx_capabilities) +
1258eddedc3SXiaoyao Li                       nr_cpuid_configs * sizeof(struct kvm_cpuid_entry2);
1268eddedc3SXiaoyao Li         caps = g_malloc0(size);
1278eddedc3SXiaoyao Li         caps->cpuid.nent = nr_cpuid_configs;
1288eddedc3SXiaoyao Li 
1298eddedc3SXiaoyao Li         r = tdx_vm_ioctl(KVM_TDX_CAPABILITIES, 0, caps, &local_err);
1308eddedc3SXiaoyao Li         if (r == -E2BIG) {
1318eddedc3SXiaoyao Li             g_free(caps);
1328eddedc3SXiaoyao Li             nr_cpuid_configs *= 2;
1338eddedc3SXiaoyao Li             if (nr_cpuid_configs > KVM_MAX_CPUID_ENTRIES) {
1348eddedc3SXiaoyao Li                 error_report("KVM TDX seems broken that number of CPUID entries"
1358eddedc3SXiaoyao Li                              " in kvm_tdx_capabilities exceeds limit: %d",
1368eddedc3SXiaoyao Li                              KVM_MAX_CPUID_ENTRIES);
1378eddedc3SXiaoyao Li                 error_propagate(errp, local_err);
1388eddedc3SXiaoyao Li                 return r;
1398eddedc3SXiaoyao Li             }
1408eddedc3SXiaoyao Li             error_free(local_err);
1418eddedc3SXiaoyao Li         } else if (r < 0) {
1428eddedc3SXiaoyao Li             g_free(caps);
1438eddedc3SXiaoyao Li             error_propagate(errp, local_err);
1448eddedc3SXiaoyao Li             return r;
1458eddedc3SXiaoyao Li         }
1468eddedc3SXiaoyao Li     } while (r == -E2BIG);
1478eddedc3SXiaoyao Li 
1488eddedc3SXiaoyao Li     tdx_caps = caps;
149631a2ac5SXiaoyao Li 
150631a2ac5SXiaoyao Li     return 0;
151631a2ac5SXiaoyao Li }
152631a2ac5SXiaoyao Li 
1530dd5fe5eSChao Peng void tdx_set_tdvf_region(MemoryRegion *tdvf_mr)
1540dd5fe5eSChao Peng {
1550dd5fe5eSChao Peng     assert(!tdx_guest->tdvf_mr);
1560dd5fe5eSChao Peng     tdx_guest->tdvf_mr = tdvf_mr;
1570dd5fe5eSChao Peng }
1580dd5fe5eSChao Peng 
159a7314259SXiaoyao Li static TdxFirmwareEntry *tdx_get_hob_entry(TdxGuest *tdx)
160a7314259SXiaoyao Li {
161a7314259SXiaoyao Li     TdxFirmwareEntry *entry;
162a7314259SXiaoyao Li 
163a7314259SXiaoyao Li     for_each_tdx_fw_entry(&tdx->tdvf, entry) {
164a7314259SXiaoyao Li         if (entry->type == TDVF_SECTION_TYPE_TD_HOB) {
165a7314259SXiaoyao Li             return entry;
166a7314259SXiaoyao Li         }
167a7314259SXiaoyao Li     }
168a7314259SXiaoyao Li     error_report("TDVF metadata doesn't specify TD_HOB location.");
169a7314259SXiaoyao Li     exit(1);
170a7314259SXiaoyao Li }
171a7314259SXiaoyao Li 
172f18672e4SXiaoyao Li static void tdx_add_ram_entry(uint64_t address, uint64_t length,
173f18672e4SXiaoyao Li                               enum TdxRamType type)
174f18672e4SXiaoyao Li {
175f18672e4SXiaoyao Li     uint32_t nr_entries = tdx_guest->nr_ram_entries;
176f18672e4SXiaoyao Li     tdx_guest->ram_entries = g_renew(TdxRamEntry, tdx_guest->ram_entries,
177f18672e4SXiaoyao Li                                      nr_entries + 1);
178f18672e4SXiaoyao Li 
179f18672e4SXiaoyao Li     tdx_guest->ram_entries[nr_entries].address = address;
180f18672e4SXiaoyao Li     tdx_guest->ram_entries[nr_entries].length = length;
181f18672e4SXiaoyao Li     tdx_guest->ram_entries[nr_entries].type = type;
182f18672e4SXiaoyao Li     tdx_guest->nr_ram_entries++;
183f18672e4SXiaoyao Li }
184f18672e4SXiaoyao Li 
185f18672e4SXiaoyao Li static int tdx_accept_ram_range(uint64_t address, uint64_t length)
186f18672e4SXiaoyao Li {
187f18672e4SXiaoyao Li     uint64_t head_start, tail_start, head_length, tail_length;
188f18672e4SXiaoyao Li     uint64_t tmp_address, tmp_length;
189f18672e4SXiaoyao Li     TdxRamEntry *e;
190f18672e4SXiaoyao Li     int i = 0;
191f18672e4SXiaoyao Li 
192f18672e4SXiaoyao Li     do {
193f18672e4SXiaoyao Li         if (i == tdx_guest->nr_ram_entries) {
194f18672e4SXiaoyao Li             return -1;
195f18672e4SXiaoyao Li         }
196f18672e4SXiaoyao Li 
197f18672e4SXiaoyao Li         e = &tdx_guest->ram_entries[i++];
198f18672e4SXiaoyao Li     } while (address + length <= e->address || address >= e->address + e->length);
199f18672e4SXiaoyao Li 
200f18672e4SXiaoyao Li     /*
201f18672e4SXiaoyao Li      * The to-be-accepted ram range must be fully contained by one
202f18672e4SXiaoyao Li      * RAM entry.
203f18672e4SXiaoyao Li      */
204f18672e4SXiaoyao Li     if (e->address > address ||
205f18672e4SXiaoyao Li         e->address + e->length < address + length) {
206f18672e4SXiaoyao Li         return -1;
207f18672e4SXiaoyao Li     }
208f18672e4SXiaoyao Li 
209f18672e4SXiaoyao Li     if (e->type == TDX_RAM_ADDED) {
210f18672e4SXiaoyao Li         return 0;
211f18672e4SXiaoyao Li     }
212f18672e4SXiaoyao Li 
213f18672e4SXiaoyao Li     tmp_address = e->address;
214f18672e4SXiaoyao Li     tmp_length = e->length;
215f18672e4SXiaoyao Li 
216f18672e4SXiaoyao Li     e->address = address;
217f18672e4SXiaoyao Li     e->length = length;
218f18672e4SXiaoyao Li     e->type = TDX_RAM_ADDED;
219f18672e4SXiaoyao Li 
220f18672e4SXiaoyao Li     head_length = address - tmp_address;
221f18672e4SXiaoyao Li     if (head_length > 0) {
222f18672e4SXiaoyao Li         head_start = tmp_address;
223f18672e4SXiaoyao Li         tdx_add_ram_entry(head_start, head_length, TDX_RAM_UNACCEPTED);
224f18672e4SXiaoyao Li     }
225f18672e4SXiaoyao Li 
226f18672e4SXiaoyao Li     tail_start = address + length;
227f18672e4SXiaoyao Li     if (tail_start < tmp_address + tmp_length) {
228f18672e4SXiaoyao Li         tail_length = tmp_address + tmp_length - tail_start;
229f18672e4SXiaoyao Li         tdx_add_ram_entry(tail_start, tail_length, TDX_RAM_UNACCEPTED);
230f18672e4SXiaoyao Li     }
231f18672e4SXiaoyao Li 
232f18672e4SXiaoyao Li     return 0;
233f18672e4SXiaoyao Li }
234f18672e4SXiaoyao Li 
235f18672e4SXiaoyao Li static int tdx_ram_entry_compare(const void *lhs_, const void* rhs_)
236f18672e4SXiaoyao Li {
237f18672e4SXiaoyao Li     const TdxRamEntry *lhs = lhs_;
238f18672e4SXiaoyao Li     const TdxRamEntry *rhs = rhs_;
239f18672e4SXiaoyao Li 
240f18672e4SXiaoyao Li     if (lhs->address == rhs->address) {
241f18672e4SXiaoyao Li         return 0;
242f18672e4SXiaoyao Li     }
243f18672e4SXiaoyao Li     if (le64_to_cpu(lhs->address) > le64_to_cpu(rhs->address)) {
244f18672e4SXiaoyao Li         return 1;
245f18672e4SXiaoyao Li     }
246f18672e4SXiaoyao Li     return -1;
247f18672e4SXiaoyao Li }
248f18672e4SXiaoyao Li 
249f18672e4SXiaoyao Li static void tdx_init_ram_entries(void)
250f18672e4SXiaoyao Li {
251f18672e4SXiaoyao Li     unsigned i, j, nr_e820_entries;
252f18672e4SXiaoyao Li 
253f18672e4SXiaoyao Li     nr_e820_entries = e820_get_table(NULL);
254f18672e4SXiaoyao Li     tdx_guest->ram_entries = g_new(TdxRamEntry, nr_e820_entries);
255f18672e4SXiaoyao Li 
256f18672e4SXiaoyao Li     for (i = 0, j = 0; i < nr_e820_entries; i++) {
257f18672e4SXiaoyao Li         uint64_t addr, len;
258f18672e4SXiaoyao Li 
259f18672e4SXiaoyao Li         if (e820_get_entry(i, E820_RAM, &addr, &len)) {
260f18672e4SXiaoyao Li             tdx_guest->ram_entries[j].address = addr;
261f18672e4SXiaoyao Li             tdx_guest->ram_entries[j].length = len;
262f18672e4SXiaoyao Li             tdx_guest->ram_entries[j].type = TDX_RAM_UNACCEPTED;
263f18672e4SXiaoyao Li             j++;
264f18672e4SXiaoyao Li         }
265f18672e4SXiaoyao Li     }
266f18672e4SXiaoyao Li     tdx_guest->nr_ram_entries = j;
267f18672e4SXiaoyao Li }
268f18672e4SXiaoyao Li 
26941f7fd22SXiaoyao Li static void tdx_post_init_vcpus(void)
27041f7fd22SXiaoyao Li {
27141f7fd22SXiaoyao Li     TdxFirmwareEntry *hob;
27241f7fd22SXiaoyao Li     CPUState *cpu;
27341f7fd22SXiaoyao Li 
27441f7fd22SXiaoyao Li     hob = tdx_get_hob_entry(tdx_guest);
27541f7fd22SXiaoyao Li     CPU_FOREACH(cpu) {
27641f7fd22SXiaoyao Li         tdx_vcpu_ioctl(cpu, KVM_TDX_INIT_VCPU, 0, (void *)hob->address,
27741f7fd22SXiaoyao Li                        &error_fatal);
27841f7fd22SXiaoyao Li     }
27941f7fd22SXiaoyao Li }
28041f7fd22SXiaoyao Li 
/*
 * Notifier callback (installed via tdx_machine_done_notify) that loads the
 * TDVF sections into the TD and finalizes it.
 *
 * Steps, in order:
 *   1. build the RAM entry list from e820;
 *   2. give every TDVF section a host source buffer, and mark the TD_HOB /
 *      TEMP_MEM ranges as accepted RAM;
 *   3. sort the RAM entries by address and create the TD HOB;
 *   4. run KVM_TDX_INIT_VCPU on all vCPUs;
 *   5. hand each section to KVM with KVM_TDX_INIT_MEM_REGION;
 *   6. discard the TDVF RAM block and issue KVM_TDX_FINALIZE_VM.
 *
 * Both parameters are unused. Every failure path terminates QEMU.
 */
static void tdx_finalize_vm(Notifier *notifier, void *unused)
{
    TdxFirmware *tdvf = &tdx_guest->tdvf;
    TdxFirmwareEntry *entry;
    RAMBlock *ram_block;
    Error *local_err = NULL;
    int r;

    tdx_init_ram_entries();

    for_each_tdx_fw_entry(tdvf, entry) {
        switch (entry->type) {
        case TDVF_SECTION_TYPE_BFV:
        case TDVF_SECTION_TYPE_CFV:
            /* These sections are sourced directly from the TDVF image. */
            entry->mem_ptr = tdvf->mem_ptr + entry->data_offset;
            break;
        case TDVF_SECTION_TYPE_TD_HOB:
        case TDVF_SECTION_TYPE_TEMP_MEM:
            /*
             * These sections get a temporary host mapping (fd -1) as their
             * source buffer; it is unmapped again after INIT_MEM_REGION.
             */
            entry->mem_ptr = qemu_ram_mmap(-1, entry->size,
                                           qemu_real_host_page_size(), 0, 0);
            if (entry->mem_ptr == MAP_FAILED) {
                error_report("Failed to mmap memory for TDVF section %d",
                             entry->type);
                exit(1);
            }
            if (tdx_accept_ram_range(entry->address, entry->size)) {
                error_report("Failed to accept memory for TDVF section %d",
                             entry->type);
                qemu_ram_munmap(-1, entry->mem_ptr, entry->size);
                exit(1);
            }
            break;
        default:
            error_report("Unsupported TDVF section %d", entry->type);
            exit(1);
        }
    }

    /* tdx_accept_ram_range() appends split-off pieces; restore address order. */
    qsort(tdx_guest->ram_entries, tdx_guest->nr_ram_entries,
          sizeof(TdxRamEntry), &tdx_ram_entry_compare);

    tdvf_hob_create(tdx_guest, tdx_get_hob_entry(tdx_guest));

    tdx_post_init_vcpus();

    for_each_tdx_fw_entry(tdvf, entry) {
        struct kvm_tdx_init_mem_region region;
        uint32_t flags;

        region = (struct kvm_tdx_init_mem_region) {
            .source_addr = (uint64_t)entry->mem_ptr,
            .gpa = entry->address,
            /* Section size expressed in 4 KiB pages. */
            .nr_pages = entry->size >> 12,
        };

        /* Only sections flagged MR_EXTEND are added to the measurement. */
        flags = entry->attributes & TDVF_SECTION_ATTRIBUTES_MR_EXTEND ?
                KVM_TDX_MEASURE_MEMORY_REGION : 0;

        /* Retry while interrupted; drop the error of each failed attempt. */
        do {
            error_free(local_err);
            local_err = NULL;
            r = tdx_vcpu_ioctl(first_cpu, KVM_TDX_INIT_MEM_REGION, flags,
                               &region, &local_err);
        } while (r == -EAGAIN || r == -EINTR);
        if (r < 0) {
            error_report_err(local_err);
            exit(1);
        }

        /* The temporary source buffer is no longer needed. */
        if (entry->type == TDVF_SECTION_TYPE_TD_HOB ||
            entry->type == TDVF_SECTION_TYPE_TEMP_MEM) {
            qemu_ram_munmap(-1, entry->mem_ptr, entry->size);
            entry->mem_ptr = NULL;
        }
    }

    /*
     * TDVF image has been copied into private region above via
     * KVM_TDX_INIT_MEM_REGION. It becomes useless.
     */
    ram_block = tdx_guest->tdvf_mr->ram_block;
    ram_block_discard_range(ram_block, 0, ram_block->max_length);

    tdx_vm_ioctl(KVM_TDX_FINALIZE_VM, 0, NULL, &error_fatal);
    /* Mark the confidential guest as ready once the TD is finalized. */
    CONFIDENTIAL_GUEST_SUPPORT(tdx_guest)->ready = true;
}
3674420ba0eSXiaoyao Li 
/*
 * Notifier whose callback is tdx_finalize_vm().
 * NOTE(review): going by the name it is registered as a machine-done
 * notifier elsewhere in this file - confirm at the registration site.
 */
static Notifier tdx_machine_done_notify = {
    .notify = tdx_finalize_vm,
};
3714420ba0eSXiaoyao Li 
/*
 * Some CPUID bits change from fixed1 to configurable bits when the TDX module
 * supports TDX_FEATURES0.VE_REDUCTION, e.g. MCA/MCE/MTRR/CORE_CAPABILITY.
 *
 * To make QEMU work with all versions of the TDX module, a bit is kept here
 * if it has ever been a fixed1 bit in any version, even if it is no longer
 * fixed1 in the latest version. Otherwise, with an older version of the TDX
 * module, QEMU may treat the fixed1 bit as unsupported.
 *
 * For a newer TDX module it does no harm to keep such bits in tdx_fixed1_bits
 * even though they changed to configurable bits, because tdx_fixed1_bits is
 * only used to set up the supported bits.
 */
KvmCpuidInfo tdx_fixed1_bits = {
    /* Must match the number of .entries[] initialized below. */
    .cpuid.nent = 8,
    .entries[0] = {
        .function = 0x1,
        .index = 0,
        .ecx = CPUID_EXT_SSE3 | CPUID_EXT_PCLMULQDQ | CPUID_EXT_DTES64 |
               CPUID_EXT_DSCPL | CPUID_EXT_SSSE3 | CPUID_EXT_CX16 |
               CPUID_EXT_PDCM | CPUID_EXT_PCID | CPUID_EXT_SSE41 |
               CPUID_EXT_SSE42 | CPUID_EXT_X2APIC | CPUID_EXT_MOVBE |
               CPUID_EXT_POPCNT | CPUID_EXT_AES | CPUID_EXT_XSAVE |
               CPUID_EXT_RDRAND | CPUID_EXT_HYPERVISOR,
        .edx = CPUID_FP87 | CPUID_VME | CPUID_DE | CPUID_PSE | CPUID_TSC |
               CPUID_MSR | CPUID_PAE | CPUID_MCE | CPUID_CX8 | CPUID_APIC |
               CPUID_SEP | CPUID_MTRR | CPUID_PGE | CPUID_MCA | CPUID_CMOV |
               CPUID_PAT | CPUID_CLFLUSH | CPUID_DTS | CPUID_MMX | CPUID_FXSR |
               CPUID_SSE | CPUID_SSE2,
    },
    .entries[1] = {
        .function = 0x6,
        .index = 0,
        .eax = CPUID_6_EAX_ARAT,
    },
    .entries[2] = {
        .function = 0x7,
        .index = 0,
        .flags = KVM_CPUID_FLAG_SIGNIFCANT_INDEX,
        .ebx = CPUID_7_0_EBX_FSGSBASE | CPUID_7_0_EBX_FDP_EXCPTN_ONLY |
               CPUID_7_0_EBX_SMEP | CPUID_7_0_EBX_INVPCID |
               CPUID_7_0_EBX_ZERO_FCS_FDS | CPUID_7_0_EBX_RDSEED |
               CPUID_7_0_EBX_SMAP | CPUID_7_0_EBX_CLFLUSHOPT |
               CPUID_7_0_EBX_CLWB | CPUID_7_0_EBX_SHA_NI,
        .ecx = CPUID_7_0_ECX_BUS_LOCK_DETECT | CPUID_7_0_ECX_MOVDIRI |
               CPUID_7_0_ECX_MOVDIR64B,
        .edx = CPUID_7_0_EDX_MD_CLEAR | CPUID_7_0_EDX_SPEC_CTRL |
               CPUID_7_0_EDX_STIBP | CPUID_7_0_EDX_FLUSH_L1D |
               CPUID_7_0_EDX_ARCH_CAPABILITIES | CPUID_7_0_EDX_CORE_CAPABILITY |
               CPUID_7_0_EDX_SPEC_CTRL_SSBD,
    },
    .entries[3] = {
        .function = 0x7,
        .index = 2,
        .flags = KVM_CPUID_FLAG_SIGNIFCANT_INDEX,
        .edx = CPUID_7_2_EDX_PSFD | CPUID_7_2_EDX_IPRED_CTRL |
               CPUID_7_2_EDX_RRSBA_CTRL | CPUID_7_2_EDX_BHI_CTRL,
    },
    .entries[4] = {
        .function = 0xD,
        .index = 0,
        .flags = KVM_CPUID_FLAG_SIGNIFCANT_INDEX,
        .eax = XSTATE_FP_MASK | XSTATE_SSE_MASK,
    },
    .entries[5] = {
        .function = 0xD,
        .index = 1,
        .flags = KVM_CPUID_FLAG_SIGNIFCANT_INDEX,
        .eax = CPUID_XSAVE_XSAVEOPT | CPUID_XSAVE_XSAVEC|
               CPUID_XSAVE_XGETBV1 | CPUID_XSAVE_XSAVES,
    },
    .entries[6] = {
        .function = 0x80000001,
        .index = 0,
        .ecx = CPUID_EXT3_LAHF_LM | CPUID_EXT3_ABM | CPUID_EXT3_3DNOWPREFETCH,
        /*
         * Strictly speaking, SYSCALL is not a fixed1 bit since it depends on
         * the CPU being in 64-bit mode. But here fixed1 serves the purpose of
         * describing the supported bits for TDX. In this sense, SYSCALL is
         * always supported.
         */
        .edx = CPUID_EXT2_SYSCALL | CPUID_EXT2_NX | CPUID_EXT2_PDPE1GB |
               CPUID_EXT2_RDTSCP | CPUID_EXT2_LM,
    },
    .entries[7] = {
        .function = 0x80000007,
        .index = 0,
        .edx = CPUID_APM_INVTSC,
    },
};
4620ba06e46SXiaoyao Li 
/*
 * Maps one TD attribute bit to the CPUID feature bit that is reported as
 * supported when tdx_caps->supported_attrs has that attribute bit set.
 */
typedef struct TdxAttrsMap {
    /* Bit position within the 64-bit attributes word. */
    uint32_t attr_index;
    /* CPUID leaf (function) holding the feature bit. */
    uint32_t cpuid_leaf;
    /* CPUID sub-leaf (index) holding the feature bit. */
    uint32_t cpuid_subleaf;
    /* Output register selector: R_EAX, R_EBX, R_ECX or R_EDX. */
    int cpuid_reg;
    /* Feature bit mask within that register. */
    uint32_t feat_mask;
} TdxAttrsMap;
47031df29c5SXiaoyao Li 
/*
 * TD attribute bit -> CPUID feature bit table, consumed by
 * tdx_add_supported_cpuid_by_attrs().
 */
static TdxAttrsMap tdx_attrs_maps[] = {
    /* Attribute bit 27 <-> CPUID.(7,1):EAX LASS */
    {.attr_index = 27,
     .cpuid_leaf = 7,
     .cpuid_subleaf = 1,
     .cpuid_reg = R_EAX,
     .feat_mask = CPUID_7_1_EAX_LASS,},

    /* Attribute bit 30 (TDX_TD_ATTRIBUTES_PKS) <-> CPUID.(7,0):ECX PKS */
    {.attr_index = 30,
     .cpuid_leaf = 7,
     .cpuid_subleaf = 0,
     .cpuid_reg = R_ECX,
     .feat_mask = CPUID_7_0_ECX_PKS,},

    /* Attribute bit 31 <-> CPUID.(7,0):ECX KeyLocker */
    {.attr_index = 31,
     .cpuid_leaf = 7,
     .cpuid_subleaf = 0,
     .cpuid_reg = R_ECX,
     .feat_mask = CPUID_7_0_ECX_KeyLocker,},
};
49031df29c5SXiaoyao Li 
/*
 * Ties one CPUID feature bit to the XFAM bit it depends on: the feature is
 * reported as supported when tdx_caps->supported_xfam has that bit set.
 */
typedef struct TdxXFAMDep {
    /* Bit position within supported_xfam (an XSTATE_*_BIT value). */
    int xfam_bit;
    /* Feature word index plus bit mask of the dependent CPUID feature. */
    FeatureMask feat_mask;
} TdxXFAMDep;
4958c94c84cSXiaoyao Li 
/*
 * Note, only the CPUID bits whose virtualization type is "XFAM & Native" are
 * defined here.
 *
 * Bits whose virtualization type is "XFAM & Configured & Native" are
 * reported as configurable bits. They are not supported if they are missing
 * from the configurable bits list from KVM, even if the corresponding XFAM
 * bit is supported.
 */
TdxXFAMDep tdx_xfam_deps[] = {
    { XSTATE_YMM_BIT,       { FEAT_1_ECX, CPUID_EXT_FMA }},
    { XSTATE_YMM_BIT,       { FEAT_7_0_EBX, CPUID_7_0_EBX_AVX2 }},
    { XSTATE_OPMASK_BIT,    { FEAT_7_0_ECX, CPUID_7_0_ECX_AVX512_VBMI}},
    { XSTATE_OPMASK_BIT,    { FEAT_7_0_EDX, CPUID_7_0_EDX_AVX512_FP16}},
    { XSTATE_PT_BIT,        { FEAT_7_0_EBX, CPUID_7_0_EBX_INTEL_PT}},
    { XSTATE_PKRU_BIT,      { FEAT_7_0_ECX, CPUID_7_0_ECX_PKU}},
    { XSTATE_XTILE_CFG_BIT, { FEAT_7_0_EDX, CPUID_7_0_EDX_AMX_BF16 }},
    { XSTATE_XTILE_CFG_BIT, { FEAT_7_0_EDX, CPUID_7_0_EDX_AMX_TILE }},
    { XSTATE_XTILE_CFG_BIT, { FEAT_7_0_EDX, CPUID_7_0_EDX_AMX_INT8 }},
};
5168c94c84cSXiaoyao Li 
5170ba06e46SXiaoyao Li static struct kvm_cpuid_entry2 *find_in_supported_entry(uint32_t function,
5180ba06e46SXiaoyao Li                                                         uint32_t index)
5190ba06e46SXiaoyao Li {
5200ba06e46SXiaoyao Li     struct kvm_cpuid_entry2 *e;
5210ba06e46SXiaoyao Li 
5220ba06e46SXiaoyao Li     e = cpuid_find_entry(tdx_supported_cpuid, function, index);
5230ba06e46SXiaoyao Li     if (!e) {
5240ba06e46SXiaoyao Li         if (tdx_supported_cpuid->nent >= KVM_MAX_CPUID_ENTRIES) {
5250ba06e46SXiaoyao Li             error_report("tdx_supported_cpuid requries more space than %d entries",
5260ba06e46SXiaoyao Li                           KVM_MAX_CPUID_ENTRIES);
5270ba06e46SXiaoyao Li             exit(1);
5280ba06e46SXiaoyao Li         }
5290ba06e46SXiaoyao Li         e = &tdx_supported_cpuid->entries[tdx_supported_cpuid->nent++];
5300ba06e46SXiaoyao Li         e->function = function;
5310ba06e46SXiaoyao Li         e->index = index;
5320ba06e46SXiaoyao Li     }
5330ba06e46SXiaoyao Li 
5340ba06e46SXiaoyao Li     return e;
5350ba06e46SXiaoyao Li }
5360ba06e46SXiaoyao Li 
5370ba06e46SXiaoyao Li static void tdx_add_supported_cpuid_by_fixed1_bits(void)
5380ba06e46SXiaoyao Li {
5390ba06e46SXiaoyao Li     struct kvm_cpuid_entry2 *e, *e1;
5400ba06e46SXiaoyao Li     int i;
5410ba06e46SXiaoyao Li 
5420ba06e46SXiaoyao Li     for (i = 0; i < tdx_fixed1_bits.cpuid.nent; i++) {
5430ba06e46SXiaoyao Li         e = &tdx_fixed1_bits.entries[i];
5440ba06e46SXiaoyao Li 
5450ba06e46SXiaoyao Li         e1 = find_in_supported_entry(e->function, e->index);
5460ba06e46SXiaoyao Li         e1->eax |= e->eax;
5470ba06e46SXiaoyao Li         e1->ebx |= e->ebx;
5480ba06e46SXiaoyao Li         e1->ecx |= e->ecx;
5490ba06e46SXiaoyao Li         e1->edx |= e->edx;
5500ba06e46SXiaoyao Li     }
5510ba06e46SXiaoyao Li }
5520ba06e46SXiaoyao Li 
55331df29c5SXiaoyao Li static void tdx_add_supported_cpuid_by_attrs(void)
55431df29c5SXiaoyao Li {
55531df29c5SXiaoyao Li     struct kvm_cpuid_entry2 *e;
55631df29c5SXiaoyao Li     TdxAttrsMap *map;
55731df29c5SXiaoyao Li     int i;
55831df29c5SXiaoyao Li 
55931df29c5SXiaoyao Li     for (i = 0; i < ARRAY_SIZE(tdx_attrs_maps); i++) {
56031df29c5SXiaoyao Li         map = &tdx_attrs_maps[i];
56131df29c5SXiaoyao Li         if (!((1ULL << map->attr_index) & tdx_caps->supported_attrs)) {
56231df29c5SXiaoyao Li             continue;
56331df29c5SXiaoyao Li         }
56431df29c5SXiaoyao Li 
56531df29c5SXiaoyao Li         e = find_in_supported_entry(map->cpuid_leaf, map->cpuid_subleaf);
56631df29c5SXiaoyao Li 
56731df29c5SXiaoyao Li         switch(map->cpuid_reg) {
56831df29c5SXiaoyao Li         case R_EAX:
56931df29c5SXiaoyao Li             e->eax |= map->feat_mask;
57031df29c5SXiaoyao Li             break;
57131df29c5SXiaoyao Li         case R_EBX:
57231df29c5SXiaoyao Li             e->ebx |= map->feat_mask;
57331df29c5SXiaoyao Li             break;
57431df29c5SXiaoyao Li         case R_ECX:
57531df29c5SXiaoyao Li             e->ecx |= map->feat_mask;
57631df29c5SXiaoyao Li             break;
57731df29c5SXiaoyao Li         case R_EDX:
57831df29c5SXiaoyao Li             e->edx |= map->feat_mask;
57931df29c5SXiaoyao Li             break;
58031df29c5SXiaoyao Li         }
58131df29c5SXiaoyao Li     }
58231df29c5SXiaoyao Li }
58331df29c5SXiaoyao Li 
5848c94c84cSXiaoyao Li static void tdx_add_supported_cpuid_by_xfam(void)
5858c94c84cSXiaoyao Li {
5868c94c84cSXiaoyao Li     struct kvm_cpuid_entry2 *e;
5878c94c84cSXiaoyao Li     int i;
5888c94c84cSXiaoyao Li 
5898c94c84cSXiaoyao Li     const TdxXFAMDep *xfam_dep;
5908c94c84cSXiaoyao Li     const FeatureWordInfo *f;
5918c94c84cSXiaoyao Li     for (i = 0; i < ARRAY_SIZE(tdx_xfam_deps); i++) {
5928c94c84cSXiaoyao Li         xfam_dep = &tdx_xfam_deps[i];
5938c94c84cSXiaoyao Li         if (!((1ULL << xfam_dep->xfam_bit) & tdx_caps->supported_xfam)) {
5948c94c84cSXiaoyao Li             continue;
5958c94c84cSXiaoyao Li         }
5968c94c84cSXiaoyao Li 
5978c94c84cSXiaoyao Li         f = &feature_word_info[xfam_dep->feat_mask.index];
5988c94c84cSXiaoyao Li         if (f->type != CPUID_FEATURE_WORD) {
5998c94c84cSXiaoyao Li             continue;
6008c94c84cSXiaoyao Li         }
6018c94c84cSXiaoyao Li 
6028c94c84cSXiaoyao Li         e = find_in_supported_entry(f->cpuid.eax, f->cpuid.ecx);
6038c94c84cSXiaoyao Li         switch(f->cpuid.reg) {
6048c94c84cSXiaoyao Li         case R_EAX:
6058c94c84cSXiaoyao Li             e->eax |= xfam_dep->feat_mask.mask;
6068c94c84cSXiaoyao Li             break;
6078c94c84cSXiaoyao Li         case R_EBX:
6088c94c84cSXiaoyao Li             e->ebx |= xfam_dep->feat_mask.mask;
6098c94c84cSXiaoyao Li             break;
6108c94c84cSXiaoyao Li         case R_ECX:
6118c94c84cSXiaoyao Li             e->ecx |= xfam_dep->feat_mask.mask;
6128c94c84cSXiaoyao Li             break;
6138c94c84cSXiaoyao Li         case R_EDX:
6148c94c84cSXiaoyao Li             e->edx |= xfam_dep->feat_mask.mask;
6158c94c84cSXiaoyao Li             break;
6168c94c84cSXiaoyao Li         }
6178c94c84cSXiaoyao Li     }
6188c94c84cSXiaoyao Li 
6198c94c84cSXiaoyao Li     e = find_in_supported_entry(0xd, 0);
6208c94c84cSXiaoyao Li     e->eax |= (tdx_caps->supported_xfam & CPUID_XSTATE_XCR0_MASK);
6218c94c84cSXiaoyao Li     e->edx |= (tdx_caps->supported_xfam & CPUID_XSTATE_XCR0_MASK) >> 32;
6228c94c84cSXiaoyao Li 
6238c94c84cSXiaoyao Li     e = find_in_supported_entry(0xd, 1);
624*9f5771c5SXiaoyao Li     /*
625*9f5771c5SXiaoyao Li      * Mark XFD always support for TDX, it will be cleared finally in
626*9f5771c5SXiaoyao Li      * tdx_adjust_cpuid_features() if XFD is unavailable on the hardware
627*9f5771c5SXiaoyao Li      * because in this case the original data has it as 0.
628*9f5771c5SXiaoyao Li      */
629*9f5771c5SXiaoyao Li     e->eax |= CPUID_XSAVE_XFD;
6308c94c84cSXiaoyao Li     e->ecx |= (tdx_caps->supported_xfam & CPUID_XSTATE_XSS_MASK);
6318c94c84cSXiaoyao Li     e->edx |= (tdx_caps->supported_xfam & CPUID_XSTATE_XSS_MASK) >> 32;
6328c94c84cSXiaoyao Li }
6338c94c84cSXiaoyao Li 
63475ec6189SXiaoyao Li static void tdx_setup_supported_cpuid(void)
63575ec6189SXiaoyao Li {
63675ec6189SXiaoyao Li     if (tdx_supported_cpuid) {
63775ec6189SXiaoyao Li         return;
63875ec6189SXiaoyao Li     }
63975ec6189SXiaoyao Li 
64075ec6189SXiaoyao Li     tdx_supported_cpuid = g_malloc0(sizeof(*tdx_supported_cpuid) +
64175ec6189SXiaoyao Li                     KVM_MAX_CPUID_ENTRIES * sizeof(struct kvm_cpuid_entry2));
64275ec6189SXiaoyao Li 
64375ec6189SXiaoyao Li     memcpy(tdx_supported_cpuid->entries, tdx_caps->cpuid.entries,
64475ec6189SXiaoyao Li            tdx_caps->cpuid.nent * sizeof(struct kvm_cpuid_entry2));
64575ec6189SXiaoyao Li     tdx_supported_cpuid->nent = tdx_caps->cpuid.nent;
6460ba06e46SXiaoyao Li 
6470ba06e46SXiaoyao Li     tdx_add_supported_cpuid_by_fixed1_bits();
64831df29c5SXiaoyao Li     tdx_add_supported_cpuid_by_attrs();
6498c94c84cSXiaoyao Li     tdx_add_supported_cpuid_by_xfam();
65075ec6189SXiaoyao Li }
65175ec6189SXiaoyao Li 
6528eddedc3SXiaoyao Li static int tdx_kvm_init(ConfidentialGuestSupport *cgs, Error **errp)
6538eddedc3SXiaoyao Li {
654810d4e83SXiaoyao Li     MachineState *ms = MACHINE(qdev_get_machine());
655810d4e83SXiaoyao Li     X86MachineState *x86ms = X86_MACHINE(ms);
6561619d0e4SXiaoyao Li     TdxGuest *tdx = TDX_GUEST(cgs);
6578eddedc3SXiaoyao Li     int r = 0;
6588eddedc3SXiaoyao Li 
6598eddedc3SXiaoyao Li     kvm_mark_guest_state_protected();
6608eddedc3SXiaoyao Li 
661810d4e83SXiaoyao Li     if (x86ms->smm == ON_OFF_AUTO_AUTO) {
662810d4e83SXiaoyao Li         x86ms->smm = ON_OFF_AUTO_OFF;
663810d4e83SXiaoyao Li     } else if (x86ms->smm == ON_OFF_AUTO_ON) {
664810d4e83SXiaoyao Li         error_setg(errp, "TDX VM doesn't support SMM");
665810d4e83SXiaoyao Li         return -EINVAL;
666810d4e83SXiaoyao Li     }
667810d4e83SXiaoyao Li 
668e7ef6089SXiaoyao Li     if (x86ms->pic == ON_OFF_AUTO_AUTO) {
669e7ef6089SXiaoyao Li         x86ms->pic = ON_OFF_AUTO_OFF;
670e7ef6089SXiaoyao Li     } else if (x86ms->pic == ON_OFF_AUTO_ON) {
671e7ef6089SXiaoyao Li         error_setg(errp, "TDX VM doesn't support PIC");
672e7ef6089SXiaoyao Li         return -EINVAL;
673e7ef6089SXiaoyao Li     }
674e7ef6089SXiaoyao Li 
675bb45580dSXiaoyao Li     if (kvm_state->kernel_irqchip_split == ON_OFF_AUTO_AUTO) {
676bb45580dSXiaoyao Li         kvm_state->kernel_irqchip_split = ON_OFF_AUTO_ON;
677bb45580dSXiaoyao Li     } else if (kvm_state->kernel_irqchip_split != ON_OFF_AUTO_ON) {
678bb45580dSXiaoyao Li         error_setg(errp, "TDX VM requires kernel_irqchip to be split");
679bb45580dSXiaoyao Li         return -EINVAL;
680bb45580dSXiaoyao Li     }
681bb45580dSXiaoyao Li 
6828eddedc3SXiaoyao Li     if (!tdx_caps) {
6838eddedc3SXiaoyao Li         r = get_tdx_capabilities(errp);
6841619d0e4SXiaoyao Li         if (r) {
6851619d0e4SXiaoyao Li             return r;
6861619d0e4SXiaoyao Li         }
6878eddedc3SXiaoyao Li     }
6888eddedc3SXiaoyao Li 
68975ec6189SXiaoyao Li     tdx_setup_supported_cpuid();
69075ec6189SXiaoyao Li 
6911ff5048dSXiaoyao Li     /* TDX relies on KVM_HC_MAP_GPA_RANGE to handle TDG.VP.VMCALL<MapGPA> */
6921ff5048dSXiaoyao Li     if (!kvm_enable_hypercall(BIT_ULL(KVM_HC_MAP_GPA_RANGE))) {
6931ff5048dSXiaoyao Li         return -EOPNOTSUPP;
6941ff5048dSXiaoyao Li     }
6951ff5048dSXiaoyao Li 
696da672865SXiaoyao Li     /*
697da672865SXiaoyao Li      * Set kvm_readonly_mem_allowed to false, because TDX only supports readonly
698da672865SXiaoyao Li      * memory for shared memory but not for private memory. Besides, whether a
699da672865SXiaoyao Li      * memslot is private or shared is not determined by QEMU.
700da672865SXiaoyao Li      *
701da672865SXiaoyao Li      * Thus, just mark readonly memory not supported for simplicity.
702da672865SXiaoyao Li      */
703da672865SXiaoyao Li     kvm_readonly_mem_allowed = false;
704da672865SXiaoyao Li 
7054420ba0eSXiaoyao Li     qemu_add_machine_init_done_notifier(&tdx_machine_done_notify);
7064420ba0eSXiaoyao Li 
7071619d0e4SXiaoyao Li     tdx_guest = tdx;
7081619d0e4SXiaoyao Li     return 0;
7098eddedc3SXiaoyao Li }
7108eddedc3SXiaoyao Li 
711b455880eSXiaoyao Li static int tdx_kvm_type(X86ConfidentialGuest *cg)
712b455880eSXiaoyao Li {
713b455880eSXiaoyao Li     /* Do the object check */
714b455880eSXiaoyao Li     TDX_GUEST(cg);
715b455880eSXiaoyao Li 
716b455880eSXiaoyao Li     return KVM_X86_TDX_VM;
717b455880eSXiaoyao Li }
718b455880eSXiaoyao Li 
7197c615242SXiaoyao Li static void tdx_cpu_instance_init(X86ConfidentialGuest *cg, CPUState *cpu)
7207c615242SXiaoyao Li {
7219002494fSXiaoyao Li     X86CPU *x86cpu = X86_CPU(cpu);
7229002494fSXiaoyao Li 
7237c615242SXiaoyao Li     object_property_set_bool(OBJECT(cpu), "pmu", false, &error_abort);
7249002494fSXiaoyao Li 
7259002494fSXiaoyao Li     x86cpu->enable_cpuid_0x1f = true;
7267c615242SXiaoyao Li }
7277c615242SXiaoyao Li 
72875ec6189SXiaoyao Li static uint32_t tdx_adjust_cpuid_features(X86ConfidentialGuest *cg,
72975ec6189SXiaoyao Li                                           uint32_t feature, uint32_t index,
73075ec6189SXiaoyao Li                                           int reg, uint32_t value)
73175ec6189SXiaoyao Li {
73275ec6189SXiaoyao Li     struct kvm_cpuid_entry2 *e;
73375ec6189SXiaoyao Li 
7340ba06e46SXiaoyao Li     e = cpuid_find_entry(&tdx_fixed1_bits.cpuid, feature, index);
7350ba06e46SXiaoyao Li     if (e) {
7360ba06e46SXiaoyao Li         value |= cpuid_entry_get_reg(e, reg);
7370ba06e46SXiaoyao Li     }
7380ba06e46SXiaoyao Li 
73975ec6189SXiaoyao Li     if (is_feature_word_cpuid(feature, index, reg)) {
74075ec6189SXiaoyao Li         e = cpuid_find_entry(tdx_supported_cpuid, feature, index);
74175ec6189SXiaoyao Li         if (e) {
74275ec6189SXiaoyao Li             value &= cpuid_entry_get_reg(e, reg);
74375ec6189SXiaoyao Li         }
74475ec6189SXiaoyao Li     }
74575ec6189SXiaoyao Li 
74675ec6189SXiaoyao Li     return value;
74775ec6189SXiaoyao Li }
74875ec6189SXiaoyao Li 
74953b6f406SXiaoyao Li static int tdx_validate_attributes(TdxGuest *tdx, Error **errp)
75053b6f406SXiaoyao Li {
75153b6f406SXiaoyao Li     if ((tdx->attributes & ~tdx_caps->supported_attrs)) {
75253b6f406SXiaoyao Li         error_setg(errp, "Invalid attributes 0x%lx for TDX VM "
75353b6f406SXiaoyao Li                    "(KVM supported: 0x%llx)", tdx->attributes,
75453b6f406SXiaoyao Li                    tdx_caps->supported_attrs);
75553b6f406SXiaoyao Li         return -1;
75653b6f406SXiaoyao Li     }
75753b6f406SXiaoyao Li 
75853b6f406SXiaoyao Li     if (tdx->attributes & ~TDX_SUPPORTED_TD_ATTRS) {
75953b6f406SXiaoyao Li         error_setg(errp, "Some QEMU unsupported TD attribute bits being "
76053b6f406SXiaoyao Li                     "requested: 0x%lx (QEMU supported: 0x%llx)",
76153b6f406SXiaoyao Li                     tdx->attributes, TDX_SUPPORTED_TD_ATTRS);
76253b6f406SXiaoyao Li         return -1;
76353b6f406SXiaoyao Li     }
76453b6f406SXiaoyao Li 
76553b6f406SXiaoyao Li     return 0;
76653b6f406SXiaoyao Li }
76753b6f406SXiaoyao Li 
76853b6f406SXiaoyao Li static int setup_td_guest_attributes(X86CPU *x86cpu, Error **errp)
769bb3be394SXiaoyao Li {
770bb3be394SXiaoyao Li     CPUX86State *env = &x86cpu->env;
771bb3be394SXiaoyao Li 
772bb3be394SXiaoyao Li     tdx_guest->attributes |= (env->features[FEAT_7_0_ECX] & CPUID_7_0_ECX_PKS) ?
773bb3be394SXiaoyao Li                              TDX_TD_ATTRIBUTES_PKS : 0;
774bb3be394SXiaoyao Li     tdx_guest->attributes |= x86cpu->enable_pmu ? TDX_TD_ATTRIBUTES_PERFMON : 0;
77553b6f406SXiaoyao Li 
77653b6f406SXiaoyao Li     return tdx_validate_attributes(tdx_guest, errp);
777bb3be394SXiaoyao Li }
778bb3be394SXiaoyao Li 
779f15898b0SXiaoyao Li static int setup_td_xfam(X86CPU *x86cpu, Error **errp)
780f15898b0SXiaoyao Li {
781f15898b0SXiaoyao Li     CPUX86State *env = &x86cpu->env;
782f15898b0SXiaoyao Li     uint64_t xfam;
783f15898b0SXiaoyao Li 
784f15898b0SXiaoyao Li     xfam = env->features[FEAT_XSAVE_XCR0_LO] |
785f15898b0SXiaoyao Li            env->features[FEAT_XSAVE_XCR0_HI] |
786f15898b0SXiaoyao Li            env->features[FEAT_XSAVE_XSS_LO] |
787f15898b0SXiaoyao Li            env->features[FEAT_XSAVE_XSS_HI];
788f15898b0SXiaoyao Li 
789f15898b0SXiaoyao Li     if (xfam & ~tdx_caps->supported_xfam) {
790f15898b0SXiaoyao Li         error_setg(errp, "Invalid XFAM 0x%lx for TDX VM (supported: 0x%llx))",
791f15898b0SXiaoyao Li                    xfam, tdx_caps->supported_xfam);
792f15898b0SXiaoyao Li         return -1;
793f15898b0SXiaoyao Li     }
794f15898b0SXiaoyao Li 
795f15898b0SXiaoyao Li     tdx_guest->xfam = xfam;
796f15898b0SXiaoyao Li     return 0;
797f15898b0SXiaoyao Li }
798f15898b0SXiaoyao Li 
799f15898b0SXiaoyao Li static void tdx_filter_cpuid(struct kvm_cpuid2 *cpuids)
800f15898b0SXiaoyao Li {
801f15898b0SXiaoyao Li     int i, dest_cnt = 0;
802f15898b0SXiaoyao Li     struct kvm_cpuid_entry2 *src, *dest, *conf;
803f15898b0SXiaoyao Li 
804f15898b0SXiaoyao Li     for (i = 0; i < cpuids->nent; i++) {
805f15898b0SXiaoyao Li         src = cpuids->entries + i;
806f15898b0SXiaoyao Li         conf = cpuid_find_entry(&tdx_caps->cpuid, src->function, src->index);
807f15898b0SXiaoyao Li         if (!conf) {
808f15898b0SXiaoyao Li             continue;
809f15898b0SXiaoyao Li         }
810f15898b0SXiaoyao Li         dest = cpuids->entries + dest_cnt;
811f15898b0SXiaoyao Li 
812f15898b0SXiaoyao Li         dest->function = src->function;
813f15898b0SXiaoyao Li         dest->index = src->index;
814f15898b0SXiaoyao Li         dest->flags = src->flags;
815f15898b0SXiaoyao Li         dest->eax = src->eax & conf->eax;
816f15898b0SXiaoyao Li         dest->ebx = src->ebx & conf->ebx;
817f15898b0SXiaoyao Li         dest->ecx = src->ecx & conf->ecx;
818f15898b0SXiaoyao Li         dest->edx = src->edx & conf->edx;
819f15898b0SXiaoyao Li 
820f15898b0SXiaoyao Li         dest_cnt++;
821f15898b0SXiaoyao Li     }
822f15898b0SXiaoyao Li     cpuids->nent = dest_cnt++;
823f15898b0SXiaoyao Li }
824f15898b0SXiaoyao Li 
825f15898b0SXiaoyao Li int tdx_pre_create_vcpu(CPUState *cpu, Error **errp)
826f15898b0SXiaoyao Li {
827f15898b0SXiaoyao Li     X86CPU *x86cpu = X86_CPU(cpu);
828f15898b0SXiaoyao Li     CPUX86State *env = &x86cpu->env;
829f15898b0SXiaoyao Li     g_autofree struct kvm_tdx_init_vm *init_vm = NULL;
830f15898b0SXiaoyao Li     Error *local_err = NULL;
831d05a0858SIsaku Yamahata     size_t data_len;
832f15898b0SXiaoyao Li     int retry = 10000;
833f15898b0SXiaoyao Li     int r = 0;
834f15898b0SXiaoyao Li 
835f15898b0SXiaoyao Li     QEMU_LOCK_GUARD(&tdx_guest->lock);
836f15898b0SXiaoyao Li     if (tdx_guest->initialized) {
837f15898b0SXiaoyao Li         return r;
838f15898b0SXiaoyao Li     }
839f15898b0SXiaoyao Li 
840f15898b0SXiaoyao Li     init_vm = g_malloc0(sizeof(struct kvm_tdx_init_vm) +
841f15898b0SXiaoyao Li                         sizeof(struct kvm_cpuid_entry2) * KVM_MAX_CPUID_ENTRIES);
842f15898b0SXiaoyao Li 
843d529a2acSXiaoyao Li     if (!kvm_check_extension(kvm_state, KVM_CAP_X86_APIC_BUS_CYCLES_NS)) {
844d529a2acSXiaoyao Li         error_setg(errp, "KVM doesn't support KVM_CAP_X86_APIC_BUS_CYCLES_NS");
845d529a2acSXiaoyao Li         return -EOPNOTSUPP;
846d529a2acSXiaoyao Li     }
847d529a2acSXiaoyao Li 
848d529a2acSXiaoyao Li     r = kvm_vm_enable_cap(kvm_state, KVM_CAP_X86_APIC_BUS_CYCLES_NS,
849d529a2acSXiaoyao Li                           0, TDX_APIC_BUS_CYCLES_NS);
850d529a2acSXiaoyao Li     if (r < 0) {
851d529a2acSXiaoyao Li         error_setg_errno(errp, -r,
852d529a2acSXiaoyao Li                          "Unable to set core crystal clock frequency to 25MHz");
853d529a2acSXiaoyao Li         return r;
854d529a2acSXiaoyao Li     }
855d529a2acSXiaoyao Li 
8560e73b843SXiaoyao Li     if (env->tsc_khz && (env->tsc_khz < TDX_MIN_TSC_FREQUENCY_KHZ ||
8570e73b843SXiaoyao Li                          env->tsc_khz > TDX_MAX_TSC_FREQUENCY_KHZ)) {
8580e73b843SXiaoyao Li         error_setg(errp, "Invalid TSC %ld KHz, must specify cpu_frequency "
8590e73b843SXiaoyao Li                          "between [%d, %d] kHz", env->tsc_khz,
8600e73b843SXiaoyao Li                          TDX_MIN_TSC_FREQUENCY_KHZ, TDX_MAX_TSC_FREQUENCY_KHZ);
8610e73b843SXiaoyao Li        return -EINVAL;
8620e73b843SXiaoyao Li     }
8630e73b843SXiaoyao Li 
8640e73b843SXiaoyao Li     if (env->tsc_khz % (25 * 1000)) {
8650e73b843SXiaoyao Li         error_setg(errp, "Invalid TSC %ld KHz, it must be multiple of 25MHz",
8660e73b843SXiaoyao Li                    env->tsc_khz);
8670e73b843SXiaoyao Li         return -EINVAL;
8680e73b843SXiaoyao Li     }
8690e73b843SXiaoyao Li 
8700e73b843SXiaoyao Li     /* it's safe even env->tsc_khz is 0. KVM uses host's tsc_khz in this case */
8710e73b843SXiaoyao Li     r = kvm_vm_ioctl(kvm_state, KVM_SET_TSC_KHZ, env->tsc_khz);
8720e73b843SXiaoyao Li     if (r < 0) {
8730e73b843SXiaoyao Li         error_setg_errno(errp, -r, "Unable to set TSC frequency to %ld kHz",
8740e73b843SXiaoyao Li                          env->tsc_khz);
8750e73b843SXiaoyao Li         return r;
8760e73b843SXiaoyao Li     }
8770e73b843SXiaoyao Li 
878d05a0858SIsaku Yamahata     if (tdx_guest->mrconfigid) {
879d05a0858SIsaku Yamahata         g_autofree uint8_t *data = qbase64_decode(tdx_guest->mrconfigid,
880d05a0858SIsaku Yamahata                               strlen(tdx_guest->mrconfigid), &data_len, errp);
881d05a0858SIsaku Yamahata         if (!data) {
882d05a0858SIsaku Yamahata             return -1;
883d05a0858SIsaku Yamahata         }
884d05a0858SIsaku Yamahata         if (data_len != QCRYPTO_HASH_DIGEST_LEN_SHA384) {
885d05a0858SIsaku Yamahata             error_setg(errp, "TDX: failed to decode mrconfigid");
886d05a0858SIsaku Yamahata             return -1;
887d05a0858SIsaku Yamahata         }
888d05a0858SIsaku Yamahata         memcpy(init_vm->mrconfigid, data, data_len);
889d05a0858SIsaku Yamahata     }
890d05a0858SIsaku Yamahata 
891d05a0858SIsaku Yamahata     if (tdx_guest->mrowner) {
892d05a0858SIsaku Yamahata         g_autofree uint8_t *data = qbase64_decode(tdx_guest->mrowner,
893d05a0858SIsaku Yamahata                               strlen(tdx_guest->mrowner), &data_len, errp);
894d05a0858SIsaku Yamahata         if (!data) {
895d05a0858SIsaku Yamahata             return -1;
896d05a0858SIsaku Yamahata         }
897d05a0858SIsaku Yamahata         if (data_len != QCRYPTO_HASH_DIGEST_LEN_SHA384) {
898d05a0858SIsaku Yamahata             error_setg(errp, "TDX: failed to decode mrowner");
899d05a0858SIsaku Yamahata             return -1;
900d05a0858SIsaku Yamahata         }
901d05a0858SIsaku Yamahata         memcpy(init_vm->mrowner, data, data_len);
902d05a0858SIsaku Yamahata     }
903d05a0858SIsaku Yamahata 
904d05a0858SIsaku Yamahata     if (tdx_guest->mrownerconfig) {
905d05a0858SIsaku Yamahata         g_autofree uint8_t *data = qbase64_decode(tdx_guest->mrownerconfig,
906d05a0858SIsaku Yamahata                             strlen(tdx_guest->mrownerconfig), &data_len, errp);
907d05a0858SIsaku Yamahata         if (!data) {
908d05a0858SIsaku Yamahata             return -1;
909d05a0858SIsaku Yamahata         }
910d05a0858SIsaku Yamahata         if (data_len != QCRYPTO_HASH_DIGEST_LEN_SHA384) {
911d05a0858SIsaku Yamahata             error_setg(errp, "TDX: failed to decode mrownerconfig");
912d05a0858SIsaku Yamahata             return -1;
913d05a0858SIsaku Yamahata         }
914d05a0858SIsaku Yamahata         memcpy(init_vm->mrownerconfig, data, data_len);
915d05a0858SIsaku Yamahata     }
916d05a0858SIsaku Yamahata 
91753b6f406SXiaoyao Li     r = setup_td_guest_attributes(x86cpu, errp);
91853b6f406SXiaoyao Li     if (r) {
91953b6f406SXiaoyao Li         return r;
92053b6f406SXiaoyao Li     }
921bb3be394SXiaoyao Li 
922f15898b0SXiaoyao Li     r = setup_td_xfam(x86cpu, errp);
923f15898b0SXiaoyao Li     if (r) {
924f15898b0SXiaoyao Li         return r;
925f15898b0SXiaoyao Li     }
926f15898b0SXiaoyao Li 
927f15898b0SXiaoyao Li     init_vm->cpuid.nent = kvm_x86_build_cpuid(env, init_vm->cpuid.entries, 0);
928f15898b0SXiaoyao Li     tdx_filter_cpuid(&init_vm->cpuid);
929f15898b0SXiaoyao Li 
930f15898b0SXiaoyao Li     init_vm->attributes = tdx_guest->attributes;
931f15898b0SXiaoyao Li     init_vm->xfam = tdx_guest->xfam;
932f15898b0SXiaoyao Li 
933f15898b0SXiaoyao Li     /*
934f15898b0SXiaoyao Li      * KVM_TDX_INIT_VM gets -EAGAIN when KVM side SEAMCALL(TDH_MNG_CREATE)
935f15898b0SXiaoyao Li      * gets TDX_RND_NO_ENTROPY due to Random number generation (e.g., RDRAND or
936f15898b0SXiaoyao Li      * RDSEED) is busy.
937f15898b0SXiaoyao Li      *
938f15898b0SXiaoyao Li      * Retry for the case.
939f15898b0SXiaoyao Li      */
940f15898b0SXiaoyao Li     do {
941f15898b0SXiaoyao Li         error_free(local_err);
942f15898b0SXiaoyao Li         local_err = NULL;
943f15898b0SXiaoyao Li         r = tdx_vm_ioctl(KVM_TDX_INIT_VM, 0, init_vm, &local_err);
944f15898b0SXiaoyao Li     } while (r == -EAGAIN && --retry);
945f15898b0SXiaoyao Li 
946f15898b0SXiaoyao Li     if (r < 0) {
947f15898b0SXiaoyao Li         if (!retry) {
948f15898b0SXiaoyao Li             error_append_hint(&local_err, "Hardware RNG (Random Number "
949f15898b0SXiaoyao Li             "Generator) is busy occupied by someone (via RDRAND/RDSEED) "
950f15898b0SXiaoyao Li             "maliciously, which leads to KVM_TDX_INIT_VM keeping failure "
951f15898b0SXiaoyao Li             "due to lack of entropy.\n");
952f15898b0SXiaoyao Li         }
953f15898b0SXiaoyao Li         error_propagate(errp, local_err);
954f15898b0SXiaoyao Li         return r;
955f15898b0SXiaoyao Li     }
956f15898b0SXiaoyao Li 
957f15898b0SXiaoyao Li     tdx_guest->initialized = true;
958f15898b0SXiaoyao Li 
959f15898b0SXiaoyao Li     return 0;
960f15898b0SXiaoyao Li }
961f15898b0SXiaoyao Li 
962cb5d65a8SXiaoyao Li int tdx_parse_tdvf(void *flash_ptr, int size)
963cb5d65a8SXiaoyao Li {
964cb5d65a8SXiaoyao Li     return tdvf_parse_metadata(&tdx_guest->tdvf, flash_ptr, size);
965cb5d65a8SXiaoyao Li }
966cb5d65a8SXiaoyao Li 
9676e250463SXiaoyao Li static void tdx_panicked_on_fatal_error(X86CPU *cpu, uint64_t error_code,
9686e250463SXiaoyao Li                                         char *message, uint64_t gpa)
9696e250463SXiaoyao Li {
9706e250463SXiaoyao Li     GuestPanicInformation *panic_info;
9716e250463SXiaoyao Li 
9726e250463SXiaoyao Li     panic_info = g_new0(GuestPanicInformation, 1);
9736e250463SXiaoyao Li     panic_info->type = GUEST_PANIC_INFORMATION_TYPE_TDX;
9746e250463SXiaoyao Li     panic_info->u.tdx.error_code = (uint32_t) error_code;
9756e250463SXiaoyao Li     panic_info->u.tdx.message = message;
9766e250463SXiaoyao Li     panic_info->u.tdx.gpa = gpa;
9776e250463SXiaoyao Li 
9786e250463SXiaoyao Li     qemu_system_guest_panicked(panic_info);
9796e250463SXiaoyao Li }
9806e250463SXiaoyao Li 
98198dbfd68SXiaoyao Li /*
98298dbfd68SXiaoyao Li  * Only 8 registers can contain valid ASCII byte stream to form the fatal
98398dbfd68SXiaoyao Li  * message, and their sequence is: R14, R15, RBX, RDI, RSI, R8, R9, RDX
98498dbfd68SXiaoyao Li  */
98598dbfd68SXiaoyao Li #define TDX_FATAL_MESSAGE_MAX        64
98698dbfd68SXiaoyao Li 
9876e250463SXiaoyao Li #define TDX_REPORT_FATAL_ERROR_GPA_VALID    BIT_ULL(63)
9886e250463SXiaoyao Li 
98998dbfd68SXiaoyao Li int tdx_handle_report_fatal_error(X86CPU *cpu, struct kvm_run *run)
99098dbfd68SXiaoyao Li {
99198dbfd68SXiaoyao Li     uint64_t error_code = run->system_event.data[R_R12];
99298dbfd68SXiaoyao Li     uint64_t reg_mask = run->system_event.data[R_ECX];
99398dbfd68SXiaoyao Li     char *message = NULL;
99498dbfd68SXiaoyao Li     uint64_t *tmp;
9956e250463SXiaoyao Li     uint64_t gpa = -1ull;
99698dbfd68SXiaoyao Li 
99798dbfd68SXiaoyao Li     if (error_code & 0xffff) {
99898dbfd68SXiaoyao Li         error_report("TDX: REPORT_FATAL_ERROR: invalid error code: 0x%lx",
99998dbfd68SXiaoyao Li                      error_code);
100098dbfd68SXiaoyao Li         return -1;
100198dbfd68SXiaoyao Li     }
100298dbfd68SXiaoyao Li 
100398dbfd68SXiaoyao Li     if (reg_mask) {
100498dbfd68SXiaoyao Li         message = g_malloc0(TDX_FATAL_MESSAGE_MAX + 1);
100598dbfd68SXiaoyao Li         tmp = (uint64_t *)message;
100698dbfd68SXiaoyao Li 
100798dbfd68SXiaoyao Li #define COPY_REG(REG)                               \
100898dbfd68SXiaoyao Li     do {                                            \
100998dbfd68SXiaoyao Li         if (reg_mask & BIT_ULL(REG)) {              \
101098dbfd68SXiaoyao Li             *(tmp++) = run->system_event.data[REG]; \
101198dbfd68SXiaoyao Li         }                                           \
101298dbfd68SXiaoyao Li     } while (0)
101398dbfd68SXiaoyao Li 
101498dbfd68SXiaoyao Li         COPY_REG(R_R14);
101598dbfd68SXiaoyao Li         COPY_REG(R_R15);
101698dbfd68SXiaoyao Li         COPY_REG(R_EBX);
101798dbfd68SXiaoyao Li         COPY_REG(R_EDI);
101898dbfd68SXiaoyao Li         COPY_REG(R_ESI);
101998dbfd68SXiaoyao Li         COPY_REG(R_R8);
102098dbfd68SXiaoyao Li         COPY_REG(R_R9);
102198dbfd68SXiaoyao Li         COPY_REG(R_EDX);
102298dbfd68SXiaoyao Li         *((char *)tmp) = '\0';
102398dbfd68SXiaoyao Li     }
102498dbfd68SXiaoyao Li #undef COPY_REG
102598dbfd68SXiaoyao Li 
10266e250463SXiaoyao Li     if (error_code & TDX_REPORT_FATAL_ERROR_GPA_VALID) {
10276e250463SXiaoyao Li         gpa = run->system_event.data[R_R13];
10286e250463SXiaoyao Li     }
10296e250463SXiaoyao Li 
10306e250463SXiaoyao Li     tdx_panicked_on_fatal_error(cpu, error_code, message, gpa);
10316e250463SXiaoyao Li 
103298dbfd68SXiaoyao Li     return -1;
103398dbfd68SXiaoyao Li }
103498dbfd68SXiaoyao Li 
10356016e297SXiaoyao Li static bool tdx_guest_get_sept_ve_disable(Object *obj, Error **errp)
10366016e297SXiaoyao Li {
10376016e297SXiaoyao Li     TdxGuest *tdx = TDX_GUEST(obj);
10386016e297SXiaoyao Li 
10396016e297SXiaoyao Li     return !!(tdx->attributes & TDX_TD_ATTRIBUTES_SEPT_VE_DISABLE);
10406016e297SXiaoyao Li }
10416016e297SXiaoyao Li 
10426016e297SXiaoyao Li static void tdx_guest_set_sept_ve_disable(Object *obj, bool value, Error **errp)
10436016e297SXiaoyao Li {
10446016e297SXiaoyao Li     TdxGuest *tdx = TDX_GUEST(obj);
10456016e297SXiaoyao Li 
10466016e297SXiaoyao Li     if (value) {
10476016e297SXiaoyao Li         tdx->attributes |= TDX_TD_ATTRIBUTES_SEPT_VE_DISABLE;
10486016e297SXiaoyao Li     } else {
10496016e297SXiaoyao Li         tdx->attributes &= ~TDX_TD_ATTRIBUTES_SEPT_VE_DISABLE;
10506016e297SXiaoyao Li     }
10516016e297SXiaoyao Li }
10526016e297SXiaoyao Li 
1053d05a0858SIsaku Yamahata static char *tdx_guest_get_mrconfigid(Object *obj, Error **errp)
1054d05a0858SIsaku Yamahata {
1055d05a0858SIsaku Yamahata     TdxGuest *tdx = TDX_GUEST(obj);
1056d05a0858SIsaku Yamahata 
1057d05a0858SIsaku Yamahata     return g_strdup(tdx->mrconfigid);
1058d05a0858SIsaku Yamahata }
1059d05a0858SIsaku Yamahata 
1060d05a0858SIsaku Yamahata static void tdx_guest_set_mrconfigid(Object *obj, const char *value, Error **errp)
1061d05a0858SIsaku Yamahata {
1062d05a0858SIsaku Yamahata     TdxGuest *tdx = TDX_GUEST(obj);
1063d05a0858SIsaku Yamahata 
1064d05a0858SIsaku Yamahata     g_free(tdx->mrconfigid);
1065d05a0858SIsaku Yamahata     tdx->mrconfigid = g_strdup(value);
1066d05a0858SIsaku Yamahata }
1067d05a0858SIsaku Yamahata 
1068d05a0858SIsaku Yamahata static char *tdx_guest_get_mrowner(Object *obj, Error **errp)
1069d05a0858SIsaku Yamahata {
1070d05a0858SIsaku Yamahata     TdxGuest *tdx = TDX_GUEST(obj);
1071d05a0858SIsaku Yamahata 
1072d05a0858SIsaku Yamahata     return g_strdup(tdx->mrowner);
1073d05a0858SIsaku Yamahata }
1074d05a0858SIsaku Yamahata 
1075d05a0858SIsaku Yamahata static void tdx_guest_set_mrowner(Object *obj, const char *value, Error **errp)
1076d05a0858SIsaku Yamahata {
1077d05a0858SIsaku Yamahata     TdxGuest *tdx = TDX_GUEST(obj);
1078d05a0858SIsaku Yamahata 
1079d05a0858SIsaku Yamahata     g_free(tdx->mrowner);
1080d05a0858SIsaku Yamahata     tdx->mrowner = g_strdup(value);
1081d05a0858SIsaku Yamahata }
1082d05a0858SIsaku Yamahata 
1083d05a0858SIsaku Yamahata static char *tdx_guest_get_mrownerconfig(Object *obj, Error **errp)
1084d05a0858SIsaku Yamahata {
1085d05a0858SIsaku Yamahata     TdxGuest *tdx = TDX_GUEST(obj);
1086d05a0858SIsaku Yamahata 
1087d05a0858SIsaku Yamahata     return g_strdup(tdx->mrownerconfig);
1088d05a0858SIsaku Yamahata }
1089d05a0858SIsaku Yamahata 
1090d05a0858SIsaku Yamahata static void tdx_guest_set_mrownerconfig(Object *obj, const char *value, Error **errp)
1091d05a0858SIsaku Yamahata {
1092d05a0858SIsaku Yamahata     TdxGuest *tdx = TDX_GUEST(obj);
1093d05a0858SIsaku Yamahata 
1094d05a0858SIsaku Yamahata     g_free(tdx->mrownerconfig);
1095d05a0858SIsaku Yamahata     tdx->mrownerconfig = g_strdup(value);
1096d05a0858SIsaku Yamahata }
1097d05a0858SIsaku Yamahata 
1098756e12e7SXiaoyao Li /* tdx guest */
1099756e12e7SXiaoyao Li OBJECT_DEFINE_TYPE_WITH_INTERFACES(TdxGuest,
1100756e12e7SXiaoyao Li                                    tdx_guest,
1101756e12e7SXiaoyao Li                                    TDX_GUEST,
1102756e12e7SXiaoyao Li                                    X86_CONFIDENTIAL_GUEST,
1103756e12e7SXiaoyao Li                                    { TYPE_USER_CREATABLE },
1104756e12e7SXiaoyao Li                                    { NULL })
1105756e12e7SXiaoyao Li 
1106756e12e7SXiaoyao Li static void tdx_guest_init(Object *obj)
1107756e12e7SXiaoyao Li {
1108756e12e7SXiaoyao Li     ConfidentialGuestSupport *cgs = CONFIDENTIAL_GUEST_SUPPORT(obj);
1109756e12e7SXiaoyao Li     TdxGuest *tdx = TDX_GUEST(obj);
1110756e12e7SXiaoyao Li 
1111f15898b0SXiaoyao Li     qemu_mutex_init(&tdx->lock);
1112f15898b0SXiaoyao Li 
1113756e12e7SXiaoyao Li     cgs->require_guest_memfd = true;
1114714af522SIsaku Yamahata     tdx->attributes = TDX_TD_ATTRIBUTES_SEPT_VE_DISABLE;
1115756e12e7SXiaoyao Li 
1116756e12e7SXiaoyao Li     object_property_add_uint64_ptr(obj, "attributes", &tdx->attributes,
1117756e12e7SXiaoyao Li                                    OBJ_PROP_FLAG_READWRITE);
11186016e297SXiaoyao Li     object_property_add_bool(obj, "sept-ve-disable",
11196016e297SXiaoyao Li                              tdx_guest_get_sept_ve_disable,
11206016e297SXiaoyao Li                              tdx_guest_set_sept_ve_disable);
1121d05a0858SIsaku Yamahata     object_property_add_str(obj, "mrconfigid",
1122d05a0858SIsaku Yamahata                             tdx_guest_get_mrconfigid,
1123d05a0858SIsaku Yamahata                             tdx_guest_set_mrconfigid);
1124d05a0858SIsaku Yamahata     object_property_add_str(obj, "mrowner",
1125d05a0858SIsaku Yamahata                             tdx_guest_get_mrowner, tdx_guest_set_mrowner);
1126d05a0858SIsaku Yamahata     object_property_add_str(obj, "mrownerconfig",
1127d05a0858SIsaku Yamahata                             tdx_guest_get_mrownerconfig,
1128d05a0858SIsaku Yamahata                             tdx_guest_set_mrownerconfig);
1129756e12e7SXiaoyao Li }
1130756e12e7SXiaoyao Li 
1131756e12e7SXiaoyao Li static void tdx_guest_finalize(Object *obj)
1132756e12e7SXiaoyao Li {
1133756e12e7SXiaoyao Li }
1134756e12e7SXiaoyao Li 
1135756e12e7SXiaoyao Li static void tdx_guest_class_init(ObjectClass *oc, const void *data)
1136756e12e7SXiaoyao Li {
1137631a2ac5SXiaoyao Li     ConfidentialGuestSupportClass *klass = CONFIDENTIAL_GUEST_SUPPORT_CLASS(oc);
1138b455880eSXiaoyao Li     X86ConfidentialGuestClass *x86_klass = X86_CONFIDENTIAL_GUEST_CLASS(oc);
1139b455880eSXiaoyao Li 
1140631a2ac5SXiaoyao Li     klass->kvm_init = tdx_kvm_init;
1141b455880eSXiaoyao Li     x86_klass->kvm_type = tdx_kvm_type;
11427c615242SXiaoyao Li     x86_klass->cpu_instance_init = tdx_cpu_instance_init;
114375ec6189SXiaoyao Li     x86_klass->adjust_cpuid_features = tdx_adjust_cpuid_features;
1144756e12e7SXiaoyao Li }
1145