xref: /openbmc/qemu/target/riscv/kvm/kvm-cpu.c (revision d74169e09e1d424aaca138966f460520a0d4dd0d)
1 /*
2  * RISC-V implementation of KVM hooks
3  *
4  * Copyright (c) 2020 Huawei Technologies Co., Ltd
5  *
6  * This program is free software; you can redistribute it and/or modify it
7  * under the terms and conditions of the GNU General Public License,
8  * version 2 or later, as published by the Free Software Foundation.
9  *
10  * This program is distributed in the hope it will be useful, but WITHOUT
11  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
12  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
13  * more details.
14  *
15  * You should have received a copy of the GNU General Public License along with
16  * this program.  If not, see <http://www.gnu.org/licenses/>.
17  */
18 
19 #include "qemu/osdep.h"
20 #include <sys/ioctl.h>
21 #include <sys/prctl.h>
22 
23 #include <linux/kvm.h>
24 
25 #include "qemu/timer.h"
26 #include "qapi/error.h"
27 #include "qemu/error-report.h"
28 #include "qemu/main-loop.h"
29 #include "qapi/visitor.h"
30 #include "system/system.h"
31 #include "system/kvm.h"
32 #include "system/kvm_int.h"
33 #include "cpu.h"
34 #include "trace.h"
35 #include "accel/accel-cpu-target.h"
36 #include "hw/pci/pci.h"
37 #include "exec/memattrs.h"
38 #include "system/address-spaces.h"
39 #include "hw/boards.h"
40 #include "hw/irq.h"
41 #include "hw/intc/riscv_imsic.h"
42 #include "qemu/log.h"
43 #include "hw/loader.h"
44 #include "kvm_riscv.h"
45 #include "sbi_ecall_interface.h"
46 #include "chardev/char-fe.h"
47 #include "migration/misc.h"
48 #include "system/runstate.h"
49 #include "hw/riscv/numa.h"
50 
51 #define PR_RISCV_V_SET_CONTROL            69
52 #define PR_RISCV_V_VSTATE_CTRL_ON          2
53 
54 void riscv_kvm_aplic_request(void *opaque, int irq, int level)
55 {
56     kvm_set_irq(kvm_state, irq, !!level);
57 }
58 
59 static bool cap_has_mp_state;
60 
61 #define KVM_RISCV_REG_ID_U32(type, idx) (KVM_REG_RISCV | KVM_REG_SIZE_U32 | \
62                                          type | idx)
63 
64 #define KVM_RISCV_REG_ID_U64(type, idx) (KVM_REG_RISCV | KVM_REG_SIZE_U64 | \
65                                          type | idx)
66 
67 #if defined(TARGET_RISCV64)
68 #define KVM_RISCV_REG_ID_ULONG(type, idx) KVM_RISCV_REG_ID_U64(type, idx)
69 #else
70 #define KVM_RISCV_REG_ID_ULONG(type, idx) KVM_RISCV_REG_ID_U32(type, idx)
71 #endif
72 
73 static uint64_t kvm_encode_reg_size_id(uint64_t id, size_t size_b)
74 {
75     uint64_t size_ctz = __builtin_ctz(size_b);
76 
77     return id | (size_ctz << KVM_REG_SIZE_SHIFT);
78 }
79 
80 static uint64_t kvm_riscv_vector_reg_id(RISCVCPU *cpu,
81                                         uint64_t idx)
82 {
83     uint64_t id;
84     size_t size_b;
85 
86     g_assert(idx < 32);
87 
88     id = KVM_REG_RISCV | KVM_REG_RISCV_VECTOR | KVM_REG_RISCV_VECTOR_REG(idx);
89     size_b = cpu->cfg.vlenb;
90 
91     return kvm_encode_reg_size_id(id, size_b);
92 }
93 
94 #define RISCV_CORE_REG(name) \
95     KVM_RISCV_REG_ID_ULONG(KVM_REG_RISCV_CORE, \
96                            KVM_REG_RISCV_CORE_REG(name))
97 
98 #define RISCV_CSR_REG(name) \
99     KVM_RISCV_REG_ID_ULONG(KVM_REG_RISCV_CSR, \
100                            KVM_REG_RISCV_CSR_REG(name))
101 
102 #define RISCV_CONFIG_REG(name) \
103     KVM_RISCV_REG_ID_ULONG(KVM_REG_RISCV_CONFIG, \
104                            KVM_REG_RISCV_CONFIG_REG(name))
105 
106 #define RISCV_TIMER_REG(name)  KVM_RISCV_REG_ID_U64(KVM_REG_RISCV_TIMER, \
107                  KVM_REG_RISCV_TIMER_REG(name))
108 
109 #define RISCV_FP_F_REG(idx)  KVM_RISCV_REG_ID_U32(KVM_REG_RISCV_FP_F, idx)
110 
111 #define RISCV_FP_D_REG(idx)  KVM_RISCV_REG_ID_U64(KVM_REG_RISCV_FP_D, idx)
112 
113 #define RISCV_VECTOR_CSR_REG(name) \
114     KVM_RISCV_REG_ID_ULONG(KVM_REG_RISCV_VECTOR, \
115                            KVM_REG_RISCV_VECTOR_CSR_REG(name))
116 
117 #define KVM_RISCV_GET_TIMER(cs, name, reg) \
118     do { \
119         int ret = kvm_get_one_reg(cs, RISCV_TIMER_REG(name), &reg); \
120         if (ret) { \
121             abort(); \
122         } \
123     } while (0)
124 
125 #define KVM_RISCV_SET_TIMER(cs, name, reg) \
126     do { \
127         int ret = kvm_set_one_reg(cs, RISCV_TIMER_REG(name), &reg); \
128         if (ret) { \
129             abort(); \
130         } \
131     } while (0)
132 
133 typedef struct KVMCPUConfig {
134     const char *name;
135     const char *description;
136     target_ulong offset;
137     uint64_t kvm_reg_id;
138     uint32_t prop_size;
139     bool user_set;
140     bool supported;
141 } KVMCPUConfig;
142 
143 #define KVM_MISA_CFG(_bit, _reg_id) \
144     {.offset = _bit, .kvm_reg_id = _reg_id}
145 
146 /* KVM ISA extensions */
147 static KVMCPUConfig kvm_misa_ext_cfgs[] = {
148     KVM_MISA_CFG(RVA, KVM_RISCV_ISA_EXT_A),
149     KVM_MISA_CFG(RVC, KVM_RISCV_ISA_EXT_C),
150     KVM_MISA_CFG(RVD, KVM_RISCV_ISA_EXT_D),
151     KVM_MISA_CFG(RVF, KVM_RISCV_ISA_EXT_F),
152     KVM_MISA_CFG(RVH, KVM_RISCV_ISA_EXT_H),
153     KVM_MISA_CFG(RVI, KVM_RISCV_ISA_EXT_I),
154     KVM_MISA_CFG(RVM, KVM_RISCV_ISA_EXT_M),
155     KVM_MISA_CFG(RVV, KVM_RISCV_ISA_EXT_V),
156 };
157 
158 static void kvm_cpu_get_misa_ext_cfg(Object *obj, Visitor *v,
159                                      const char *name,
160                                      void *opaque, Error **errp)
161 {
162     KVMCPUConfig *misa_ext_cfg = opaque;
163     target_ulong misa_bit = misa_ext_cfg->offset;
164     RISCVCPU *cpu = RISCV_CPU(obj);
165     CPURISCVState *env = &cpu->env;
166     bool value = env->misa_ext_mask & misa_bit;
167 
168     visit_type_bool(v, name, &value, errp);
169 }
170 
171 static void kvm_cpu_set_misa_ext_cfg(Object *obj, Visitor *v,
172                                      const char *name,
173                                      void *opaque, Error **errp)
174 {
175     KVMCPUConfig *misa_ext_cfg = opaque;
176     target_ulong misa_bit = misa_ext_cfg->offset;
177     RISCVCPU *cpu = RISCV_CPU(obj);
178     CPURISCVState *env = &cpu->env;
179     bool value, host_bit;
180 
181     if (!visit_type_bool(v, name, &value, errp)) {
182         return;
183     }
184 
185     host_bit = env->misa_ext_mask & misa_bit;
186 
187     if (value == host_bit) {
188         return;
189     }
190 
191     if (!value) {
192         misa_ext_cfg->user_set = true;
193         return;
194     }
195 
196     /*
197      * Forbid users to enable extensions that aren't
198      * available in the hart.
199      */
200     error_setg(errp, "Enabling MISA bit '%s' is not allowed: it's not "
201                "enabled in the host", misa_ext_cfg->name);
202 }
203 
204 static void kvm_riscv_update_cpu_misa_ext(RISCVCPU *cpu, CPUState *cs)
205 {
206     CPURISCVState *env = &cpu->env;
207     uint64_t id, reg;
208     int i, ret;
209 
210     for (i = 0; i < ARRAY_SIZE(kvm_misa_ext_cfgs); i++) {
211         KVMCPUConfig *misa_cfg = &kvm_misa_ext_cfgs[i];
212         target_ulong misa_bit = misa_cfg->offset;
213 
214         if (!misa_cfg->user_set) {
215             continue;
216         }
217 
218         /* If we're here we're going to disable the MISA bit */
219         reg = 0;
220         id = KVM_RISCV_REG_ID_ULONG(KVM_REG_RISCV_ISA_EXT,
221                                     misa_cfg->kvm_reg_id);
222         ret = kvm_set_one_reg(cs, id, &reg);
223         if (ret != 0) {
224             /*
225              * We're not checking for -EINVAL because if the bit is about
226              * to be disabled, it means that it was already enabled by
227              * KVM. We determined that by fetching the 'isa' register
228              * during init() time. Any error at this point is worth
229              * aborting.
230              */
231             error_report("Unable to set KVM reg %s, error %d",
232                          misa_cfg->name, ret);
233             exit(EXIT_FAILURE);
234         }
235         env->misa_ext &= ~misa_bit;
236     }
237 }
238 
239 #define KVM_CSR_CFG(_name, _env_prop, reg_id) \
240     {.name = _name, .offset = ENV_CSR_OFFSET(_env_prop), \
241      .prop_size = sizeof(((CPURISCVState *)0)->_env_prop), \
242      .kvm_reg_id = reg_id}
243 
244 static KVMCPUConfig kvm_csr_cfgs[] = {
245     KVM_CSR_CFG("sstatus",    mstatus,    RISCV_CSR_REG(sstatus)),
246     KVM_CSR_CFG("sie",        mie,        RISCV_CSR_REG(sie)),
247     KVM_CSR_CFG("stvec",      stvec,      RISCV_CSR_REG(stvec)),
248     KVM_CSR_CFG("sscratch",   sscratch,   RISCV_CSR_REG(sscratch)),
249     KVM_CSR_CFG("sepc",       sepc,       RISCV_CSR_REG(sepc)),
250     KVM_CSR_CFG("scause",     scause,     RISCV_CSR_REG(scause)),
251     KVM_CSR_CFG("stval",      stval,      RISCV_CSR_REG(stval)),
252     KVM_CSR_CFG("sip",        mip,        RISCV_CSR_REG(sip)),
253     KVM_CSR_CFG("satp",       satp,       RISCV_CSR_REG(satp)),
254     KVM_CSR_CFG("scounteren", scounteren, RISCV_CSR_REG(scounteren)),
255     KVM_CSR_CFG("senvcfg",    senvcfg,    RISCV_CSR_REG(senvcfg)),
256 };
257 
258 static void *kvmconfig_get_env_addr(RISCVCPU *cpu, KVMCPUConfig *csr_cfg)
259 {
260     return (void *)&cpu->env + csr_cfg->offset;
261 }
262 
263 static uint32_t kvm_cpu_csr_get_u32(RISCVCPU *cpu, KVMCPUConfig *csr_cfg)
264 {
265     uint32_t *val32 = kvmconfig_get_env_addr(cpu, csr_cfg);
266     return *val32;
267 }
268 
269 static uint64_t kvm_cpu_csr_get_u64(RISCVCPU *cpu, KVMCPUConfig *csr_cfg)
270 {
271     uint64_t *val64 = kvmconfig_get_env_addr(cpu, csr_cfg);
272     return *val64;
273 }
274 
275 static void kvm_cpu_csr_set_u32(RISCVCPU *cpu, KVMCPUConfig *csr_cfg,
276                                 uint32_t val)
277 {
278     uint32_t *val32 = kvmconfig_get_env_addr(cpu, csr_cfg);
279     *val32 = val;
280 }
281 
282 static void kvm_cpu_csr_set_u64(RISCVCPU *cpu, KVMCPUConfig *csr_cfg,
283                                 uint64_t val)
284 {
285     uint64_t *val64 = kvmconfig_get_env_addr(cpu, csr_cfg);
286     *val64 = val;
287 }
288 
289 #define KVM_EXT_CFG(_name, _prop, _reg_id) \
290     {.name = _name, .offset = CPU_CFG_OFFSET(_prop), \
291      .kvm_reg_id = _reg_id}
292 
293 static KVMCPUConfig kvm_multi_ext_cfgs[] = {
294     KVM_EXT_CFG("zicbom", ext_zicbom, KVM_RISCV_ISA_EXT_ZICBOM),
295     KVM_EXT_CFG("zicboz", ext_zicboz, KVM_RISCV_ISA_EXT_ZICBOZ),
296     KVM_EXT_CFG("ziccrse", ext_ziccrse, KVM_RISCV_ISA_EXT_ZICCRSE),
297     KVM_EXT_CFG("zicntr", ext_zicntr, KVM_RISCV_ISA_EXT_ZICNTR),
298     KVM_EXT_CFG("zicond", ext_zicond, KVM_RISCV_ISA_EXT_ZICOND),
299     KVM_EXT_CFG("zicsr", ext_zicsr, KVM_RISCV_ISA_EXT_ZICSR),
300     KVM_EXT_CFG("zifencei", ext_zifencei, KVM_RISCV_ISA_EXT_ZIFENCEI),
301     KVM_EXT_CFG("zihintntl", ext_zihintntl, KVM_RISCV_ISA_EXT_ZIHINTNTL),
302     KVM_EXT_CFG("zihintpause", ext_zihintpause, KVM_RISCV_ISA_EXT_ZIHINTPAUSE),
303     KVM_EXT_CFG("zihpm", ext_zihpm, KVM_RISCV_ISA_EXT_ZIHPM),
304     KVM_EXT_CFG("zimop", ext_zimop, KVM_RISCV_ISA_EXT_ZIMOP),
305     KVM_EXT_CFG("zcmop", ext_zcmop, KVM_RISCV_ISA_EXT_ZCMOP),
306     KVM_EXT_CFG("zabha", ext_zabha, KVM_RISCV_ISA_EXT_ZABHA),
307     KVM_EXT_CFG("zacas", ext_zacas, KVM_RISCV_ISA_EXT_ZACAS),
308     KVM_EXT_CFG("zawrs", ext_zawrs, KVM_RISCV_ISA_EXT_ZAWRS),
309     KVM_EXT_CFG("zfa", ext_zfa, KVM_RISCV_ISA_EXT_ZFA),
310     KVM_EXT_CFG("zfh", ext_zfh, KVM_RISCV_ISA_EXT_ZFH),
311     KVM_EXT_CFG("zfhmin", ext_zfhmin, KVM_RISCV_ISA_EXT_ZFHMIN),
312     KVM_EXT_CFG("zba", ext_zba, KVM_RISCV_ISA_EXT_ZBA),
313     KVM_EXT_CFG("zbb", ext_zbb, KVM_RISCV_ISA_EXT_ZBB),
314     KVM_EXT_CFG("zbc", ext_zbc, KVM_RISCV_ISA_EXT_ZBC),
315     KVM_EXT_CFG("zbkb", ext_zbkb, KVM_RISCV_ISA_EXT_ZBKB),
316     KVM_EXT_CFG("zbkc", ext_zbkc, KVM_RISCV_ISA_EXT_ZBKC),
317     KVM_EXT_CFG("zbkx", ext_zbkx, KVM_RISCV_ISA_EXT_ZBKX),
318     KVM_EXT_CFG("zbs", ext_zbs, KVM_RISCV_ISA_EXT_ZBS),
319     KVM_EXT_CFG("zca", ext_zca, KVM_RISCV_ISA_EXT_ZCA),
320     KVM_EXT_CFG("zcb", ext_zcb, KVM_RISCV_ISA_EXT_ZCB),
321     KVM_EXT_CFG("zcd", ext_zcd, KVM_RISCV_ISA_EXT_ZCD),
322     KVM_EXT_CFG("zcf", ext_zcf, KVM_RISCV_ISA_EXT_ZCF),
323     KVM_EXT_CFG("zknd", ext_zknd, KVM_RISCV_ISA_EXT_ZKND),
324     KVM_EXT_CFG("zkne", ext_zkne, KVM_RISCV_ISA_EXT_ZKNE),
325     KVM_EXT_CFG("zknh", ext_zknh, KVM_RISCV_ISA_EXT_ZKNH),
326     KVM_EXT_CFG("zkr", ext_zkr, KVM_RISCV_ISA_EXT_ZKR),
327     KVM_EXT_CFG("zksed", ext_zksed, KVM_RISCV_ISA_EXT_ZKSED),
328     KVM_EXT_CFG("zksh", ext_zksh, KVM_RISCV_ISA_EXT_ZKSH),
329     KVM_EXT_CFG("zkt", ext_zkt, KVM_RISCV_ISA_EXT_ZKT),
330     KVM_EXT_CFG("ztso", ext_ztso, KVM_RISCV_ISA_EXT_ZTSO),
331     KVM_EXT_CFG("zvbb", ext_zvbb, KVM_RISCV_ISA_EXT_ZVBB),
332     KVM_EXT_CFG("zvbc", ext_zvbc, KVM_RISCV_ISA_EXT_ZVBC),
333     KVM_EXT_CFG("zvfh", ext_zvfh, KVM_RISCV_ISA_EXT_ZVFH),
334     KVM_EXT_CFG("zvfhmin", ext_zvfhmin, KVM_RISCV_ISA_EXT_ZVFHMIN),
335     KVM_EXT_CFG("zvkb", ext_zvkb, KVM_RISCV_ISA_EXT_ZVKB),
336     KVM_EXT_CFG("zvkg", ext_zvkg, KVM_RISCV_ISA_EXT_ZVKG),
337     KVM_EXT_CFG("zvkned", ext_zvkned, KVM_RISCV_ISA_EXT_ZVKNED),
338     KVM_EXT_CFG("zvknha", ext_zvknha, KVM_RISCV_ISA_EXT_ZVKNHA),
339     KVM_EXT_CFG("zvknhb", ext_zvknhb, KVM_RISCV_ISA_EXT_ZVKNHB),
340     KVM_EXT_CFG("zvksed", ext_zvksed, KVM_RISCV_ISA_EXT_ZVKSED),
341     KVM_EXT_CFG("zvksh", ext_zvksh, KVM_RISCV_ISA_EXT_ZVKSH),
342     KVM_EXT_CFG("zvkt", ext_zvkt, KVM_RISCV_ISA_EXT_ZVKT),
343     KVM_EXT_CFG("smnpm", ext_smnpm, KVM_RISCV_ISA_EXT_SMNPM),
344     KVM_EXT_CFG("smstateen", ext_smstateen, KVM_RISCV_ISA_EXT_SMSTATEEN),
345     KVM_EXT_CFG("ssaia", ext_ssaia, KVM_RISCV_ISA_EXT_SSAIA),
346     KVM_EXT_CFG("sscofpmf", ext_sscofpmf, KVM_RISCV_ISA_EXT_SSCOFPMF),
347     KVM_EXT_CFG("ssnpm", ext_ssnpm, KVM_RISCV_ISA_EXT_SSNPM),
348     KVM_EXT_CFG("sstc", ext_sstc, KVM_RISCV_ISA_EXT_SSTC),
349     KVM_EXT_CFG("svade", ext_svade, KVM_RISCV_ISA_EXT_SVADE),
350     KVM_EXT_CFG("svadu", ext_svadu, KVM_RISCV_ISA_EXT_SVADU),
351     KVM_EXT_CFG("svinval", ext_svinval, KVM_RISCV_ISA_EXT_SVINVAL),
352     KVM_EXT_CFG("svnapot", ext_svnapot, KVM_RISCV_ISA_EXT_SVNAPOT),
353     KVM_EXT_CFG("svpbmt", ext_svpbmt, KVM_RISCV_ISA_EXT_SVPBMT),
354     KVM_EXT_CFG("svvptc", ext_svvptc, KVM_RISCV_ISA_EXT_SVVPTC),
355 };
356 
357 static void *kvmconfig_get_cfg_addr(RISCVCPU *cpu, KVMCPUConfig *kvmcfg)
358 {
359     return (void *)&cpu->cfg + kvmcfg->offset;
360 }
361 
362 static void kvm_cpu_cfg_set(RISCVCPU *cpu, KVMCPUConfig *multi_ext,
363                             uint32_t val)
364 {
365     bool *ext_enabled = kvmconfig_get_cfg_addr(cpu, multi_ext);
366 
367     *ext_enabled = val;
368 }
369 
370 static uint32_t kvm_cpu_cfg_get(RISCVCPU *cpu,
371                                 KVMCPUConfig *multi_ext)
372 {
373     bool *ext_enabled = kvmconfig_get_cfg_addr(cpu, multi_ext);
374 
375     return *ext_enabled;
376 }
377 
378 static void kvm_cpu_get_multi_ext_cfg(Object *obj, Visitor *v,
379                                       const char *name,
380                                       void *opaque, Error **errp)
381 {
382     KVMCPUConfig *multi_ext_cfg = opaque;
383     RISCVCPU *cpu = RISCV_CPU(obj);
384     bool value = kvm_cpu_cfg_get(cpu, multi_ext_cfg);
385 
386     visit_type_bool(v, name, &value, errp);
387 }
388 
389 static void kvm_cpu_set_multi_ext_cfg(Object *obj, Visitor *v,
390                                       const char *name,
391                                       void *opaque, Error **errp)
392 {
393     KVMCPUConfig *multi_ext_cfg = opaque;
394     RISCVCPU *cpu = RISCV_CPU(obj);
395     bool value, host_val;
396 
397     if (!visit_type_bool(v, name, &value, errp)) {
398         return;
399     }
400 
401     host_val = kvm_cpu_cfg_get(cpu, multi_ext_cfg);
402 
403     /*
404      * Ignore if the user is setting the same value
405      * as the host.
406      */
407     if (value == host_val) {
408         return;
409     }
410 
411     if (!multi_ext_cfg->supported) {
412         /*
413          * Error out if the user is trying to enable an
414          * extension that KVM doesn't support. Ignore
415          * option otherwise.
416          */
417         if (value) {
418             error_setg(errp, "KVM does not support disabling extension %s",
419                        multi_ext_cfg->name);
420         }
421 
422         return;
423     }
424 
425     multi_ext_cfg->user_set = true;
426     kvm_cpu_cfg_set(cpu, multi_ext_cfg, value);
427 }
428 
429 static KVMCPUConfig kvm_cbom_blocksize = {
430     .name = "cbom_blocksize",
431     .offset = CPU_CFG_OFFSET(cbom_blocksize),
432     .kvm_reg_id = KVM_REG_RISCV_CONFIG_REG(zicbom_block_size)
433 };
434 
435 static KVMCPUConfig kvm_cboz_blocksize = {
436     .name = "cboz_blocksize",
437     .offset = CPU_CFG_OFFSET(cboz_blocksize),
438     .kvm_reg_id = KVM_REG_RISCV_CONFIG_REG(zicboz_block_size)
439 };
440 
441 static KVMCPUConfig kvm_v_vlenb = {
442     .name = "vlenb",
443     .offset = CPU_CFG_OFFSET(vlenb),
444     .kvm_reg_id =  KVM_REG_RISCV | KVM_REG_SIZE_U64 | KVM_REG_RISCV_VECTOR |
445                    KVM_REG_RISCV_VECTOR_CSR_REG(vlenb)
446 };
447 
448 static KVMCPUConfig kvm_sbi_dbcn = {
449     .name = "sbi_dbcn",
450     .kvm_reg_id = KVM_REG_RISCV | KVM_REG_SIZE_U64 |
451                   KVM_REG_RISCV_SBI_EXT | KVM_RISCV_SBI_EXT_DBCN
452 };
453 
454 static void kvm_riscv_update_cpu_cfg_isa_ext(RISCVCPU *cpu, CPUState *cs)
455 {
456     uint64_t id, reg;
457     int i, ret;
458 
459     for (i = 0; i < ARRAY_SIZE(kvm_multi_ext_cfgs); i++) {
460         KVMCPUConfig *multi_ext_cfg = &kvm_multi_ext_cfgs[i];
461 
462         if (!multi_ext_cfg->user_set) {
463             continue;
464         }
465 
466         id = KVM_RISCV_REG_ID_ULONG(KVM_REG_RISCV_ISA_EXT,
467                                     multi_ext_cfg->kvm_reg_id);
468         reg = kvm_cpu_cfg_get(cpu, multi_ext_cfg);
469         ret = kvm_set_one_reg(cs, id, &reg);
470         if (ret != 0) {
471             if (!reg && ret == -EINVAL) {
472                 warn_report("KVM cannot disable extension %s",
473                             multi_ext_cfg->name);
474             } else {
475                 error_report("Unable to enable extension %s in KVM, error %d",
476                              multi_ext_cfg->name, ret);
477                 exit(EXIT_FAILURE);
478             }
479         }
480     }
481 }
482 
483 static void cpu_get_cfg_unavailable(Object *obj, Visitor *v,
484                                     const char *name,
485                                     void *opaque, Error **errp)
486 {
487     bool value = false;
488 
489     visit_type_bool(v, name, &value, errp);
490 }
491 
492 static void cpu_set_cfg_unavailable(Object *obj, Visitor *v,
493                                     const char *name,
494                                     void *opaque, Error **errp)
495 {
496     const char *propname = opaque;
497     bool value;
498 
499     if (!visit_type_bool(v, name, &value, errp)) {
500         return;
501     }
502 
503     if (value) {
504         error_setg(errp, "'%s' is not available with KVM",
505                    propname);
506     }
507 }
508 
509 static void riscv_cpu_add_kvm_unavail_prop(Object *obj, const char *prop_name)
510 {
511     /* Check if KVM created the property already */
512     if (object_property_find(obj, prop_name)) {
513         return;
514     }
515 
516     /*
517      * Set the default to disabled for every extension
518      * unknown to KVM and error out if the user attempts
519      * to enable any of them.
520      */
521     object_property_add(obj, prop_name, "bool",
522                         cpu_get_cfg_unavailable,
523                         cpu_set_cfg_unavailable,
524                         NULL, (void *)prop_name);
525 }
526 
527 static void riscv_cpu_add_kvm_unavail_prop_array(Object *obj,
528                                         const RISCVCPUMultiExtConfig *array)
529 {
530     const RISCVCPUMultiExtConfig *prop;
531 
532     g_assert(array);
533 
534     for (prop = array; prop && prop->name; prop++) {
535         riscv_cpu_add_kvm_unavail_prop(obj, prop->name);
536     }
537 }
538 
539 static void kvm_riscv_add_cpu_user_properties(Object *cpu_obj)
540 {
541     int i;
542 
543     riscv_add_satp_mode_properties(cpu_obj);
544 
545     for (i = 0; i < ARRAY_SIZE(kvm_misa_ext_cfgs); i++) {
546         KVMCPUConfig *misa_cfg = &kvm_misa_ext_cfgs[i];
547         int bit = misa_cfg->offset;
548 
549         misa_cfg->name = riscv_get_misa_ext_name(bit);
550         misa_cfg->description = riscv_get_misa_ext_description(bit);
551 
552         object_property_add(cpu_obj, misa_cfg->name, "bool",
553                             kvm_cpu_get_misa_ext_cfg,
554                             kvm_cpu_set_misa_ext_cfg,
555                             NULL, misa_cfg);
556         object_property_set_description(cpu_obj, misa_cfg->name,
557                                         misa_cfg->description);
558     }
559 
560     for (i = 0; misa_bits[i] != 0; i++) {
561         const char *ext_name = riscv_get_misa_ext_name(misa_bits[i]);
562         riscv_cpu_add_kvm_unavail_prop(cpu_obj, ext_name);
563     }
564 
565     for (i = 0; i < ARRAY_SIZE(kvm_multi_ext_cfgs); i++) {
566         KVMCPUConfig *multi_cfg = &kvm_multi_ext_cfgs[i];
567 
568         object_property_add(cpu_obj, multi_cfg->name, "bool",
569                             kvm_cpu_get_multi_ext_cfg,
570                             kvm_cpu_set_multi_ext_cfg,
571                             NULL, multi_cfg);
572     }
573 
574     riscv_cpu_add_kvm_unavail_prop_array(cpu_obj, riscv_cpu_extensions);
575     riscv_cpu_add_kvm_unavail_prop_array(cpu_obj, riscv_cpu_vendor_exts);
576     riscv_cpu_add_kvm_unavail_prop_array(cpu_obj, riscv_cpu_experimental_exts);
577 
578    /* We don't have the needed KVM support for profiles */
579     for (i = 0; riscv_profiles[i] != NULL; i++) {
580         riscv_cpu_add_kvm_unavail_prop(cpu_obj, riscv_profiles[i]->name);
581     }
582 }
583 
584 static int kvm_riscv_get_regs_core(CPUState *cs)
585 {
586     int ret = 0;
587     int i;
588     target_ulong reg;
589     CPURISCVState *env = &RISCV_CPU(cs)->env;
590 
591     ret = kvm_get_one_reg(cs, RISCV_CORE_REG(regs.pc), &reg);
592     if (ret) {
593         return ret;
594     }
595     env->pc = reg;
596 
597     for (i = 1; i < 32; i++) {
598         uint64_t id = KVM_RISCV_REG_ID_ULONG(KVM_REG_RISCV_CORE, i);
599         ret = kvm_get_one_reg(cs, id, &reg);
600         if (ret) {
601             return ret;
602         }
603         env->gpr[i] = reg;
604     }
605 
606     return ret;
607 }
608 
609 static int kvm_riscv_put_regs_core(CPUState *cs)
610 {
611     int ret = 0;
612     int i;
613     target_ulong reg;
614     CPURISCVState *env = &RISCV_CPU(cs)->env;
615 
616     reg = env->pc;
617     ret = kvm_set_one_reg(cs, RISCV_CORE_REG(regs.pc), &reg);
618     if (ret) {
619         return ret;
620     }
621 
622     for (i = 1; i < 32; i++) {
623         uint64_t id = KVM_RISCV_REG_ID_ULONG(KVM_REG_RISCV_CORE, i);
624         reg = env->gpr[i];
625         ret = kvm_set_one_reg(cs, id, &reg);
626         if (ret) {
627             return ret;
628         }
629     }
630 
631     return ret;
632 }
633 
634 static int kvm_riscv_get_regs_csr(CPUState *cs)
635 {
636     RISCVCPU *cpu = RISCV_CPU(cs);
637     uint64_t reg;
638     int i, ret;
639 
640     for (i = 0; i < ARRAY_SIZE(kvm_csr_cfgs); i++) {
641         KVMCPUConfig *csr_cfg = &kvm_csr_cfgs[i];
642 
643         if (!csr_cfg->supported) {
644             continue;
645         }
646 
647         ret = kvm_get_one_reg(cs, csr_cfg->kvm_reg_id, &reg);
648         if (ret) {
649             return ret;
650         }
651 
652         if (csr_cfg->prop_size == sizeof(uint32_t)) {
653             kvm_cpu_csr_set_u32(cpu, csr_cfg, (uint32_t)reg);
654         } else if (csr_cfg->prop_size == sizeof(uint64_t)) {
655             kvm_cpu_csr_set_u64(cpu, csr_cfg, reg);
656         } else {
657             g_assert_not_reached();
658         }
659     }
660 
661     return 0;
662 }
663 
664 static int kvm_riscv_put_regs_csr(CPUState *cs)
665 {
666     RISCVCPU *cpu = RISCV_CPU(cs);
667     uint64_t reg;
668     int i, ret;
669 
670     for (i = 0; i < ARRAY_SIZE(kvm_csr_cfgs); i++) {
671         KVMCPUConfig *csr_cfg = &kvm_csr_cfgs[i];
672 
673         if (!csr_cfg->supported) {
674             continue;
675         }
676 
677         if (csr_cfg->prop_size == sizeof(uint32_t)) {
678             reg = kvm_cpu_csr_get_u32(cpu, csr_cfg);
679         } else if (csr_cfg->prop_size == sizeof(uint64_t)) {
680             reg = kvm_cpu_csr_get_u64(cpu, csr_cfg);
681         } else {
682             g_assert_not_reached();
683         }
684 
685         ret = kvm_set_one_reg(cs, csr_cfg->kvm_reg_id, &reg);
686         if (ret) {
687             return ret;
688         }
689     }
690 
691     return 0;
692 }
693 
694 static void kvm_riscv_reset_regs_csr(CPURISCVState *env)
695 {
696     env->mstatus = 0;
697     env->mie = 0;
698     env->stvec = 0;
699     env->sscratch = 0;
700     env->sepc = 0;
701     env->scause = 0;
702     env->stval = 0;
703     env->mip = 0;
704     env->satp = 0;
705     env->scounteren = 0;
706     env->senvcfg = 0;
707 }
708 
709 static int kvm_riscv_get_regs_fp(CPUState *cs)
710 {
711     int ret = 0;
712     int i;
713     CPURISCVState *env = &RISCV_CPU(cs)->env;
714 
715     if (riscv_has_ext(env, RVD)) {
716         uint64_t reg;
717         for (i = 0; i < 32; i++) {
718             ret = kvm_get_one_reg(cs, RISCV_FP_D_REG(i), &reg);
719             if (ret) {
720                 return ret;
721             }
722             env->fpr[i] = reg;
723         }
724         return ret;
725     }
726 
727     if (riscv_has_ext(env, RVF)) {
728         uint32_t reg;
729         for (i = 0; i < 32; i++) {
730             ret = kvm_get_one_reg(cs, RISCV_FP_F_REG(i), &reg);
731             if (ret) {
732                 return ret;
733             }
734             env->fpr[i] = reg;
735         }
736         return ret;
737     }
738 
739     return ret;
740 }
741 
742 static int kvm_riscv_put_regs_fp(CPUState *cs)
743 {
744     int ret = 0;
745     int i;
746     CPURISCVState *env = &RISCV_CPU(cs)->env;
747 
748     if (riscv_has_ext(env, RVD)) {
749         uint64_t reg;
750         for (i = 0; i < 32; i++) {
751             reg = env->fpr[i];
752             ret = kvm_set_one_reg(cs, RISCV_FP_D_REG(i), &reg);
753             if (ret) {
754                 return ret;
755             }
756         }
757         return ret;
758     }
759 
760     if (riscv_has_ext(env, RVF)) {
761         uint32_t reg;
762         for (i = 0; i < 32; i++) {
763             reg = env->fpr[i];
764             ret = kvm_set_one_reg(cs, RISCV_FP_F_REG(i), &reg);
765             if (ret) {
766                 return ret;
767             }
768         }
769         return ret;
770     }
771 
772     return ret;
773 }
774 
775 static void kvm_riscv_get_regs_timer(CPUState *cs)
776 {
777     CPURISCVState *env = &RISCV_CPU(cs)->env;
778 
779     if (env->kvm_timer_dirty) {
780         return;
781     }
782 
783     KVM_RISCV_GET_TIMER(cs, time, env->kvm_timer_time);
784     KVM_RISCV_GET_TIMER(cs, compare, env->kvm_timer_compare);
785     KVM_RISCV_GET_TIMER(cs, state, env->kvm_timer_state);
786     KVM_RISCV_GET_TIMER(cs, frequency, env->kvm_timer_frequency);
787 
788     env->kvm_timer_dirty = true;
789 }
790 
791 static void kvm_riscv_put_regs_timer(CPUState *cs)
792 {
793     uint64_t reg;
794     CPURISCVState *env = &RISCV_CPU(cs)->env;
795 
796     if (!env->kvm_timer_dirty) {
797         return;
798     }
799 
800     KVM_RISCV_SET_TIMER(cs, time, env->kvm_timer_time);
801     KVM_RISCV_SET_TIMER(cs, compare, env->kvm_timer_compare);
802 
803     /*
804      * To set register of RISCV_TIMER_REG(state) will occur a error from KVM
805      * on env->kvm_timer_state == 0, It's better to adapt in KVM, but it
806      * doesn't matter that adaping in QEMU now.
807      * TODO If KVM changes, adapt here.
808      */
809     if (env->kvm_timer_state) {
810         KVM_RISCV_SET_TIMER(cs, state, env->kvm_timer_state);
811     }
812 
813     /*
814      * For now, migration will not work between Hosts with different timer
815      * frequency. Therefore, we should check whether they are the same here
816      * during the migration.
817      */
818     if (migration_is_running()) {
819         KVM_RISCV_GET_TIMER(cs, frequency, reg);
820         if (reg != env->kvm_timer_frequency) {
821             error_report("Dst Hosts timer frequency != Src Hosts");
822         }
823     }
824 
825     env->kvm_timer_dirty = false;
826 }
827 
828 uint64_t kvm_riscv_get_timebase_frequency(RISCVCPU *cpu)
829 {
830     uint64_t reg;
831 
832     KVM_RISCV_GET_TIMER(CPU(cpu), frequency, reg);
833 
834     return reg;
835 }
836 
837 static int kvm_riscv_get_regs_vector(CPUState *cs)
838 {
839     RISCVCPU *cpu = RISCV_CPU(cs);
840     CPURISCVState *env = &cpu->env;
841     target_ulong reg;
842     uint64_t vreg_id;
843     int vreg_idx, ret = 0;
844 
845     if (!riscv_has_ext(env, RVV)) {
846         return 0;
847     }
848 
849     ret = kvm_get_one_reg(cs, RISCV_VECTOR_CSR_REG(vstart), &reg);
850     if (ret) {
851         return ret;
852     }
853     env->vstart = reg;
854 
855     ret = kvm_get_one_reg(cs, RISCV_VECTOR_CSR_REG(vl), &reg);
856     if (ret) {
857         return ret;
858     }
859     env->vl = reg;
860 
861     ret = kvm_get_one_reg(cs, RISCV_VECTOR_CSR_REG(vtype), &reg);
862     if (ret) {
863         return ret;
864     }
865     env->vtype = reg;
866 
867     if (kvm_v_vlenb.supported) {
868         ret = kvm_get_one_reg(cs, RISCV_VECTOR_CSR_REG(vlenb), &reg);
869         if (ret) {
870             return ret;
871         }
872         cpu->cfg.vlenb = reg;
873 
874         for (int i = 0; i < 32; i++) {
875             /*
876              * vreg[] is statically allocated using RV_VLEN_MAX.
877              * Use it instead of vlenb to calculate vreg_idx for
878              * simplicity.
879              */
880             vreg_idx = i * RV_VLEN_MAX / 64;
881             vreg_id = kvm_riscv_vector_reg_id(cpu, i);
882 
883             ret = kvm_get_one_reg(cs, vreg_id, &env->vreg[vreg_idx]);
884             if (ret) {
885                 return ret;
886             }
887         }
888     }
889 
890     return 0;
891 }
892 
893 static int kvm_riscv_put_regs_vector(CPUState *cs)
894 {
895     RISCVCPU *cpu = RISCV_CPU(cs);
896     CPURISCVState *env = &cpu->env;
897     target_ulong reg;
898     uint64_t vreg_id;
899     int vreg_idx, ret = 0;
900 
901     if (!riscv_has_ext(env, RVV)) {
902         return 0;
903     }
904 
905     reg = env->vstart;
906     ret = kvm_set_one_reg(cs, RISCV_VECTOR_CSR_REG(vstart), &reg);
907     if (ret) {
908         return ret;
909     }
910 
911     reg = env->vl;
912     ret = kvm_set_one_reg(cs, RISCV_VECTOR_CSR_REG(vl), &reg);
913     if (ret) {
914         return ret;
915     }
916 
917     reg = env->vtype;
918     ret = kvm_set_one_reg(cs, RISCV_VECTOR_CSR_REG(vtype), &reg);
919     if (ret) {
920         return ret;
921     }
922 
923     if (kvm_v_vlenb.supported) {
924         reg = cpu->cfg.vlenb;
925         ret = kvm_set_one_reg(cs, RISCV_VECTOR_CSR_REG(vlenb), &reg);
926 
927         for (int i = 0; i < 32; i++) {
928             /*
929              * vreg[] is statically allocated using RV_VLEN_MAX.
930              * Use it instead of vlenb to calculate vreg_idx for
931              * simplicity.
932              */
933             vreg_idx = i * RV_VLEN_MAX / 64;
934             vreg_id = kvm_riscv_vector_reg_id(cpu, i);
935 
936             ret = kvm_set_one_reg(cs, vreg_id, &env->vreg[vreg_idx]);
937             if (ret) {
938                 return ret;
939             }
940         }
941     }
942 
943     return ret;
944 }
945 
946 typedef struct KVMScratchCPU {
947     int kvmfd;
948     int vmfd;
949     int cpufd;
950 } KVMScratchCPU;
951 
952 /*
953  * Heavily inspired by kvm_arm_create_scratch_host_vcpu()
954  * from target/arm/kvm.c.
955  */
956 static bool kvm_riscv_create_scratch_vcpu(KVMScratchCPU *scratch)
957 {
958     int kvmfd = -1, vmfd = -1, cpufd = -1;
959 
960     kvmfd = qemu_open_old("/dev/kvm", O_RDWR);
961     if (kvmfd < 0) {
962         goto err;
963     }
964     do {
965         vmfd = ioctl(kvmfd, KVM_CREATE_VM, 0);
966     } while (vmfd == -1 && errno == EINTR);
967     if (vmfd < 0) {
968         goto err;
969     }
970     cpufd = ioctl(vmfd, KVM_CREATE_VCPU, 0);
971     if (cpufd < 0) {
972         goto err;
973     }
974 
975     scratch->kvmfd =  kvmfd;
976     scratch->vmfd = vmfd;
977     scratch->cpufd = cpufd;
978 
979     return true;
980 
981  err:
982     if (cpufd >= 0) {
983         close(cpufd);
984     }
985     if (vmfd >= 0) {
986         close(vmfd);
987     }
988     if (kvmfd >= 0) {
989         close(kvmfd);
990     }
991 
992     return false;
993 }
994 
995 static void kvm_riscv_destroy_scratch_vcpu(KVMScratchCPU *scratch)
996 {
997     close(scratch->cpufd);
998     close(scratch->vmfd);
999     close(scratch->kvmfd);
1000 }
1001 
1002 static void kvm_riscv_init_machine_ids(RISCVCPU *cpu, KVMScratchCPU *kvmcpu)
1003 {
1004     struct kvm_one_reg reg;
1005     int ret;
1006 
1007     reg.id = RISCV_CONFIG_REG(mvendorid);
1008     reg.addr = (uint64_t)&cpu->cfg.mvendorid;
1009     ret = ioctl(kvmcpu->cpufd, KVM_GET_ONE_REG, &reg);
1010     if (ret != 0) {
1011         error_report("Unable to retrieve mvendorid from host, error %d", ret);
1012     }
1013 
1014     reg.id = RISCV_CONFIG_REG(marchid);
1015     reg.addr = (uint64_t)&cpu->cfg.marchid;
1016     ret = ioctl(kvmcpu->cpufd, KVM_GET_ONE_REG, &reg);
1017     if (ret != 0) {
1018         error_report("Unable to retrieve marchid from host, error %d", ret);
1019     }
1020 
1021     reg.id = RISCV_CONFIG_REG(mimpid);
1022     reg.addr = (uint64_t)&cpu->cfg.mimpid;
1023     ret = ioctl(kvmcpu->cpufd, KVM_GET_ONE_REG, &reg);
1024     if (ret != 0) {
1025         error_report("Unable to retrieve mimpid from host, error %d", ret);
1026     }
1027 }
1028 
1029 static void kvm_riscv_init_misa_ext_mask(RISCVCPU *cpu,
1030                                          KVMScratchCPU *kvmcpu)
1031 {
1032     CPURISCVState *env = &cpu->env;
1033     struct kvm_one_reg reg;
1034     int ret;
1035 
1036     reg.id = RISCV_CONFIG_REG(isa);
1037     reg.addr = (uint64_t)&env->misa_ext_mask;
1038     ret = ioctl(kvmcpu->cpufd, KVM_GET_ONE_REG, &reg);
1039 
1040     if (ret) {
1041         error_report("Unable to fetch ISA register from KVM, "
1042                      "error %d", ret);
1043         kvm_riscv_destroy_scratch_vcpu(kvmcpu);
1044         exit(EXIT_FAILURE);
1045     }
1046 
1047     env->misa_ext = env->misa_ext_mask;
1048 }
1049 
1050 static void kvm_riscv_read_cbomz_blksize(RISCVCPU *cpu, KVMScratchCPU *kvmcpu,
1051                                          KVMCPUConfig *cbomz_cfg)
1052 {
1053     struct kvm_one_reg reg;
1054     int ret;
1055 
1056     reg.id = KVM_RISCV_REG_ID_ULONG(KVM_REG_RISCV_CONFIG,
1057                                     cbomz_cfg->kvm_reg_id);
1058     reg.addr = (uint64_t)kvmconfig_get_cfg_addr(cpu, cbomz_cfg);
1059     ret = ioctl(kvmcpu->cpufd, KVM_GET_ONE_REG, &reg);
1060     if (ret != 0) {
1061         error_report("Unable to read KVM reg %s, error %d",
1062                      cbomz_cfg->name, ret);
1063         exit(EXIT_FAILURE);
1064     }
1065 }
1066 
1067 static void kvm_riscv_read_multiext_legacy(RISCVCPU *cpu,
1068                                            KVMScratchCPU *kvmcpu)
1069 {
1070     uint64_t val;
1071     int i, ret;
1072 
1073     for (i = 0; i < ARRAY_SIZE(kvm_multi_ext_cfgs); i++) {
1074         KVMCPUConfig *multi_ext_cfg = &kvm_multi_ext_cfgs[i];
1075         struct kvm_one_reg reg;
1076 
1077         reg.id = KVM_RISCV_REG_ID_ULONG(KVM_REG_RISCV_ISA_EXT,
1078                                         multi_ext_cfg->kvm_reg_id);
1079         reg.addr = (uint64_t)&val;
1080         ret = ioctl(kvmcpu->cpufd, KVM_GET_ONE_REG, &reg);
1081         if (ret != 0) {
1082             if (errno == EINVAL) {
1083                 /* Silently default to 'false' if KVM does not support it. */
1084                 multi_ext_cfg->supported = false;
1085                 val = false;
1086             } else {
1087                 error_report("Unable to read ISA_EXT KVM register %s: %s",
1088                              multi_ext_cfg->name, strerror(errno));
1089                 exit(EXIT_FAILURE);
1090             }
1091         } else {
1092             multi_ext_cfg->supported = true;
1093         }
1094 
1095         kvm_cpu_cfg_set(cpu, multi_ext_cfg, val);
1096     }
1097 
1098     if (cpu->cfg.ext_zicbom) {
1099         kvm_riscv_read_cbomz_blksize(cpu, kvmcpu, &kvm_cbom_blocksize);
1100     }
1101 
1102     if (cpu->cfg.ext_zicboz) {
1103         kvm_riscv_read_cbomz_blksize(cpu, kvmcpu, &kvm_cboz_blocksize);
1104     }
1105 }
1106 
1107 static void kvm_riscv_read_csr_cfg_legacy(KVMScratchCPU *kvmcpu)
1108 {
1109     uint64_t val;
1110     int i, ret;
1111 
1112     for (i = 0; i < ARRAY_SIZE(kvm_csr_cfgs); i++) {
1113         KVMCPUConfig *csr_cfg = &kvm_csr_cfgs[i];
1114         struct kvm_one_reg reg;
1115 
1116         reg.id = csr_cfg->kvm_reg_id;
1117         reg.addr = (uint64_t)&val;
1118         ret = ioctl(kvmcpu->cpufd, KVM_GET_ONE_REG, &reg);
1119         if (ret != 0) {
1120             if (errno == EINVAL) {
1121                 csr_cfg->supported = false;
1122             } else {
1123                 error_report("Unable to read KVM CSR %s: %s",
1124                              csr_cfg->name, strerror(errno));
1125                 exit(EXIT_FAILURE);
1126             }
1127         } else {
1128             csr_cfg->supported = true;
1129         }
1130     }
1131 }
1132 
1133 static int uint64_cmp(const void *a, const void *b)
1134 {
1135     uint64_t val1 = *(const uint64_t *)a;
1136     uint64_t val2 = *(const uint64_t *)b;
1137 
1138     if (val1 < val2) {
1139         return -1;
1140     }
1141 
1142     if (val1 > val2) {
1143         return 1;
1144     }
1145 
1146     return 0;
1147 }
1148 
1149 static void kvm_riscv_check_sbi_dbcn_support(RISCVCPU *cpu,
1150                                              struct kvm_reg_list *reglist)
1151 {
1152     struct kvm_reg_list *reg_search;
1153 
1154     reg_search = bsearch(&kvm_sbi_dbcn.kvm_reg_id, reglist->reg, reglist->n,
1155                          sizeof(uint64_t), uint64_cmp);
1156 
1157     if (reg_search) {
1158         kvm_sbi_dbcn.supported = true;
1159     }
1160 }
1161 
1162 static void kvm_riscv_read_vlenb(RISCVCPU *cpu, KVMScratchCPU *kvmcpu,
1163                                  struct kvm_reg_list *reglist)
1164 {
1165     struct kvm_one_reg reg;
1166     struct kvm_reg_list *reg_search;
1167     uint64_t val;
1168     int ret;
1169 
1170     reg_search = bsearch(&kvm_v_vlenb.kvm_reg_id, reglist->reg, reglist->n,
1171                          sizeof(uint64_t), uint64_cmp);
1172 
1173     if (reg_search) {
1174         reg.id = kvm_v_vlenb.kvm_reg_id;
1175         reg.addr = (uint64_t)&val;
1176 
1177         ret = ioctl(kvmcpu->cpufd, KVM_GET_ONE_REG, &reg);
1178         if (ret != 0) {
1179             error_report("Unable to read vlenb register, error code: %d",
1180                          errno);
1181             exit(EXIT_FAILURE);
1182         }
1183 
1184         kvm_v_vlenb.supported = true;
1185         cpu->cfg.vlenb = val;
1186     }
1187 }
1188 
1189 static void kvm_riscv_read_csr_cfg(struct kvm_reg_list *reglist)
1190 {
1191     struct kvm_reg_list *reg_search;
1192     uint64_t reg_id;
1193 
1194     for (int i = 0; i < ARRAY_SIZE(kvm_csr_cfgs); i++) {
1195         KVMCPUConfig *csr_cfg = &kvm_csr_cfgs[i];
1196 
1197         reg_id = csr_cfg->kvm_reg_id;
1198         reg_search = bsearch(&reg_id, reglist->reg, reglist->n,
1199                              sizeof(uint64_t), uint64_cmp);
1200         if (!reg_search) {
1201             continue;
1202         }
1203 
1204         csr_cfg->supported = true;
1205     }
1206 }
1207 
1208 static void kvm_riscv_init_cfg(RISCVCPU *cpu, KVMScratchCPU *kvmcpu)
1209 {
1210     g_autofree struct kvm_reg_list *reglist = NULL;
1211     KVMCPUConfig *multi_ext_cfg;
1212     struct kvm_one_reg reg;
1213     struct kvm_reg_list rl_struct;
1214     uint64_t val, reg_id, *reg_search;
1215     int i, ret;
1216 
1217     rl_struct.n = 0;
1218     ret = ioctl(kvmcpu->cpufd, KVM_GET_REG_LIST, &rl_struct);
1219 
1220     /*
1221      * If KVM_GET_REG_LIST isn't supported we'll get errno 22
1222      * (EINVAL). Use read_legacy() in this case.
1223      */
1224     if (errno == EINVAL) {
1225         kvm_riscv_read_multiext_legacy(cpu, kvmcpu);
1226         kvm_riscv_read_csr_cfg_legacy(kvmcpu);
1227         return;
1228     } else if (errno != E2BIG) {
1229         /*
1230          * E2BIG is an expected error message for the API since we
1231          * don't know the number of registers. The right amount will
1232          * be written in rl_struct.n.
1233          *
1234          * Error out if we get any other errno.
1235          */
1236         error_report("Error when accessing get-reg-list: %s",
1237                      strerror(errno));
1238         exit(EXIT_FAILURE);
1239     }
1240 
1241     reglist = g_malloc(sizeof(struct kvm_reg_list) +
1242                        rl_struct.n * sizeof(uint64_t));
1243     reglist->n = rl_struct.n;
1244     ret = ioctl(kvmcpu->cpufd, KVM_GET_REG_LIST, reglist);
1245     if (ret) {
1246         error_report("Error when reading KVM_GET_REG_LIST: %s",
1247                      strerror(errno));
1248         exit(EXIT_FAILURE);
1249     }
1250 
1251     /* sort reglist to use bsearch() */
1252     qsort(&reglist->reg, reglist->n, sizeof(uint64_t), uint64_cmp);
1253 
1254     for (i = 0; i < ARRAY_SIZE(kvm_multi_ext_cfgs); i++) {
1255         multi_ext_cfg = &kvm_multi_ext_cfgs[i];
1256         reg_id = KVM_RISCV_REG_ID_ULONG(KVM_REG_RISCV_ISA_EXT,
1257                                         multi_ext_cfg->kvm_reg_id);
1258         reg_search = bsearch(&reg_id, reglist->reg, reglist->n,
1259                              sizeof(uint64_t), uint64_cmp);
1260         if (!reg_search) {
1261             continue;
1262         }
1263 
1264         reg.id = reg_id;
1265         reg.addr = (uint64_t)&val;
1266         ret = ioctl(kvmcpu->cpufd, KVM_GET_ONE_REG, &reg);
1267         if (ret != 0) {
1268             error_report("Unable to read ISA_EXT KVM register %s: %s",
1269                          multi_ext_cfg->name, strerror(errno));
1270             exit(EXIT_FAILURE);
1271         }
1272 
1273         multi_ext_cfg->supported = true;
1274         kvm_cpu_cfg_set(cpu, multi_ext_cfg, val);
1275     }
1276 
1277     if (cpu->cfg.ext_zicbom) {
1278         kvm_riscv_read_cbomz_blksize(cpu, kvmcpu, &kvm_cbom_blocksize);
1279     }
1280 
1281     if (cpu->cfg.ext_zicboz) {
1282         kvm_riscv_read_cbomz_blksize(cpu, kvmcpu, &kvm_cboz_blocksize);
1283     }
1284 
1285     if (riscv_has_ext(&cpu->env, RVV)) {
1286         kvm_riscv_read_vlenb(cpu, kvmcpu, reglist);
1287     }
1288 
1289     kvm_riscv_check_sbi_dbcn_support(cpu, reglist);
1290     kvm_riscv_read_csr_cfg(reglist);
1291 }
1292 
1293 static void riscv_init_kvm_registers(Object *cpu_obj)
1294 {
1295     RISCVCPU *cpu = RISCV_CPU(cpu_obj);
1296     KVMScratchCPU kvmcpu;
1297 
1298     if (!kvm_riscv_create_scratch_vcpu(&kvmcpu)) {
1299         return;
1300     }
1301 
1302     kvm_riscv_init_machine_ids(cpu, &kvmcpu);
1303     kvm_riscv_init_misa_ext_mask(cpu, &kvmcpu);
1304     kvm_riscv_init_cfg(cpu, &kvmcpu);
1305 
1306     kvm_riscv_destroy_scratch_vcpu(&kvmcpu);
1307 }
1308 
1309 const KVMCapabilityInfo kvm_arch_required_capabilities[] = {
1310     KVM_CAP_LAST_INFO
1311 };
1312 
1313 int kvm_arch_get_registers(CPUState *cs, Error **errp)
1314 {
1315     int ret = 0;
1316 
1317     ret = kvm_riscv_get_regs_core(cs);
1318     if (ret) {
1319         return ret;
1320     }
1321 
1322     ret = kvm_riscv_get_regs_csr(cs);
1323     if (ret) {
1324         return ret;
1325     }
1326 
1327     ret = kvm_riscv_get_regs_fp(cs);
1328     if (ret) {
1329         return ret;
1330     }
1331 
1332     ret = kvm_riscv_get_regs_vector(cs);
1333     if (ret) {
1334         return ret;
1335     }
1336 
1337     return ret;
1338 }
1339 
1340 int kvm_riscv_sync_mpstate_to_kvm(RISCVCPU *cpu, int state)
1341 {
1342     if (cap_has_mp_state) {
1343         struct kvm_mp_state mp_state = {
1344             .mp_state = state
1345         };
1346 
1347         int ret = kvm_vcpu_ioctl(CPU(cpu), KVM_SET_MP_STATE, &mp_state);
1348         if (ret) {
1349             fprintf(stderr, "%s: failed to sync MP_STATE %d/%s\n",
1350                     __func__, ret, strerror(-ret));
1351             return -1;
1352         }
1353     }
1354 
1355     return 0;
1356 }
1357 
1358 int kvm_arch_put_registers(CPUState *cs, int level, Error **errp)
1359 {
1360     int ret = 0;
1361 
1362     ret = kvm_riscv_put_regs_core(cs);
1363     if (ret) {
1364         return ret;
1365     }
1366 
1367     ret = kvm_riscv_put_regs_csr(cs);
1368     if (ret) {
1369         return ret;
1370     }
1371 
1372     ret = kvm_riscv_put_regs_fp(cs);
1373     if (ret) {
1374         return ret;
1375     }
1376 
1377     ret = kvm_riscv_put_regs_vector(cs);
1378     if (ret) {
1379         return ret;
1380     }
1381 
1382     if (KVM_PUT_RESET_STATE == level) {
1383         RISCVCPU *cpu = RISCV_CPU(cs);
1384         if (cs->cpu_index == 0) {
1385             ret = kvm_riscv_sync_mpstate_to_kvm(cpu, KVM_MP_STATE_RUNNABLE);
1386         } else {
1387             ret = kvm_riscv_sync_mpstate_to_kvm(cpu, KVM_MP_STATE_STOPPED);
1388         }
1389         if (ret) {
1390             return ret;
1391         }
1392     }
1393 
1394     return ret;
1395 }
1396 
1397 int kvm_arch_release_virq_post(int virq)
1398 {
1399     return 0;
1400 }
1401 
1402 int kvm_arch_fixup_msi_route(struct kvm_irq_routing_entry *route,
1403                              uint64_t address, uint32_t data, PCIDevice *dev)
1404 {
1405     return 0;
1406 }
1407 
1408 int kvm_arch_destroy_vcpu(CPUState *cs)
1409 {
1410     return 0;
1411 }
1412 
1413 unsigned long kvm_arch_vcpu_id(CPUState *cpu)
1414 {
1415     return cpu->cpu_index;
1416 }
1417 
1418 static void kvm_riscv_vm_state_change(void *opaque, bool running,
1419                                       RunState state)
1420 {
1421     CPUState *cs = opaque;
1422 
1423     if (running) {
1424         kvm_riscv_put_regs_timer(cs);
1425     } else {
1426         kvm_riscv_get_regs_timer(cs);
1427     }
1428 }
1429 
1430 void kvm_arch_init_irq_routing(KVMState *s)
1431 {
1432 }
1433 
1434 static int kvm_vcpu_set_machine_ids(RISCVCPU *cpu, CPUState *cs)
1435 {
1436     target_ulong reg;
1437     uint64_t id;
1438     int ret;
1439 
1440     id = RISCV_CONFIG_REG(mvendorid);
1441     /*
1442      * cfg.mvendorid is an uint32 but a target_ulong will
1443      * be written. Assign it to a target_ulong var to avoid
1444      * writing pieces of other cpu->cfg fields in the reg.
1445      */
1446     reg = cpu->cfg.mvendorid;
1447     ret = kvm_set_one_reg(cs, id, &reg);
1448     if (ret != 0) {
1449         return ret;
1450     }
1451 
1452     id = RISCV_CONFIG_REG(marchid);
1453     ret = kvm_set_one_reg(cs, id, &cpu->cfg.marchid);
1454     if (ret != 0) {
1455         return ret;
1456     }
1457 
1458     id = RISCV_CONFIG_REG(mimpid);
1459     ret = kvm_set_one_reg(cs, id, &cpu->cfg.mimpid);
1460 
1461     return ret;
1462 }
1463 
1464 static int kvm_vcpu_enable_sbi_dbcn(RISCVCPU *cpu, CPUState *cs)
1465 {
1466     target_ulong reg = 1;
1467 
1468     if (!kvm_sbi_dbcn.supported) {
1469         return 0;
1470     }
1471 
1472     return kvm_set_one_reg(cs, kvm_sbi_dbcn.kvm_reg_id, &reg);
1473 }
1474 
1475 int kvm_arch_init_vcpu(CPUState *cs)
1476 {
1477     int ret = 0;
1478     RISCVCPU *cpu = RISCV_CPU(cs);
1479 
1480     qemu_add_vm_change_state_handler(kvm_riscv_vm_state_change, cs);
1481 
1482     if (!object_dynamic_cast(OBJECT(cpu), TYPE_RISCV_CPU_HOST)) {
1483         ret = kvm_vcpu_set_machine_ids(cpu, cs);
1484         if (ret != 0) {
1485             return ret;
1486         }
1487     }
1488 
1489     kvm_riscv_update_cpu_misa_ext(cpu, cs);
1490     kvm_riscv_update_cpu_cfg_isa_ext(cpu, cs);
1491 
1492     ret = kvm_vcpu_enable_sbi_dbcn(cpu, cs);
1493 
1494     return ret;
1495 }
1496 
1497 int kvm_arch_msi_data_to_gsi(uint32_t data)
1498 {
1499     abort();
1500 }
1501 
1502 int kvm_arch_add_msi_route_post(struct kvm_irq_routing_entry *route,
1503                                 int vector, PCIDevice *dev)
1504 {
1505     return 0;
1506 }
1507 
1508 int kvm_arch_get_default_type(MachineState *ms)
1509 {
1510     return 0;
1511 }
1512 
1513 int kvm_arch_init(MachineState *ms, KVMState *s)
1514 {
1515     cap_has_mp_state = kvm_check_extension(s, KVM_CAP_MP_STATE);
1516     return 0;
1517 }
1518 
1519 int kvm_arch_irqchip_create(KVMState *s)
1520 {
1521     /*
1522      * We can create the VAIA using the newer device control API.
1523      */
1524     return kvm_check_extension(s, KVM_CAP_DEVICE_CTRL);
1525 }
1526 
1527 int kvm_arch_process_async_events(CPUState *cs)
1528 {
1529     return 0;
1530 }
1531 
1532 void kvm_arch_pre_run(CPUState *cs, struct kvm_run *run)
1533 {
1534 }
1535 
1536 MemTxAttrs kvm_arch_post_run(CPUState *cs, struct kvm_run *run)
1537 {
1538     return MEMTXATTRS_UNSPECIFIED;
1539 }
1540 
1541 bool kvm_arch_stop_on_emulation_error(CPUState *cs)
1542 {
1543     return true;
1544 }
1545 
1546 static void kvm_riscv_handle_sbi_dbcn(CPUState *cs, struct kvm_run *run)
1547 {
1548     g_autofree uint8_t *buf = NULL;
1549     RISCVCPU *cpu = RISCV_CPU(cs);
1550     target_ulong num_bytes;
1551     uint64_t addr;
1552     unsigned char ch;
1553     int ret;
1554 
1555     switch (run->riscv_sbi.function_id) {
1556     case SBI_EXT_DBCN_CONSOLE_READ:
1557     case SBI_EXT_DBCN_CONSOLE_WRITE:
1558         num_bytes = run->riscv_sbi.args[0];
1559 
1560         if (num_bytes == 0) {
1561             run->riscv_sbi.ret[0] = SBI_SUCCESS;
1562             run->riscv_sbi.ret[1] = 0;
1563             break;
1564         }
1565 
1566         addr = run->riscv_sbi.args[1];
1567 
1568         /*
1569          * Handle the case where a 32 bit CPU is running in a
1570          * 64 bit addressing env.
1571          */
1572         if (riscv_cpu_mxl(&cpu->env) == MXL_RV32) {
1573             addr |= (uint64_t)run->riscv_sbi.args[2] << 32;
1574         }
1575 
1576         buf = g_malloc0(num_bytes);
1577 
1578         if (run->riscv_sbi.function_id == SBI_EXT_DBCN_CONSOLE_READ) {
1579             ret = qemu_chr_fe_read_all(serial_hd(0)->be, buf, num_bytes);
1580             if (ret < 0) {
1581                 error_report("SBI_EXT_DBCN_CONSOLE_READ: error when "
1582                              "reading chardev");
1583                 exit(1);
1584             }
1585 
1586             cpu_physical_memory_write(addr, buf, ret);
1587         } else {
1588             cpu_physical_memory_read(addr, buf, num_bytes);
1589 
1590             ret = qemu_chr_fe_write_all(serial_hd(0)->be, buf, num_bytes);
1591             if (ret < 0) {
1592                 error_report("SBI_EXT_DBCN_CONSOLE_WRITE: error when "
1593                              "writing chardev");
1594                 exit(1);
1595             }
1596         }
1597 
1598         run->riscv_sbi.ret[0] = SBI_SUCCESS;
1599         run->riscv_sbi.ret[1] = ret;
1600         break;
1601     case SBI_EXT_DBCN_CONSOLE_WRITE_BYTE:
1602         ch = run->riscv_sbi.args[0];
1603         ret = qemu_chr_fe_write(serial_hd(0)->be, &ch, sizeof(ch));
1604 
1605         if (ret < 0) {
1606             error_report("SBI_EXT_DBCN_CONSOLE_WRITE_BYTE: error when "
1607                          "writing chardev");
1608             exit(1);
1609         }
1610 
1611         run->riscv_sbi.ret[0] = SBI_SUCCESS;
1612         run->riscv_sbi.ret[1] = 0;
1613         break;
1614     default:
1615         run->riscv_sbi.ret[0] = SBI_ERR_NOT_SUPPORTED;
1616     }
1617 }
1618 
1619 static int kvm_riscv_handle_sbi(CPUState *cs, struct kvm_run *run)
1620 {
1621     int ret = 0;
1622     unsigned char ch;
1623     switch (run->riscv_sbi.extension_id) {
1624     case SBI_EXT_0_1_CONSOLE_PUTCHAR:
1625         ch = run->riscv_sbi.args[0];
1626         qemu_chr_fe_write(serial_hd(0)->be, &ch, sizeof(ch));
1627         break;
1628     case SBI_EXT_0_1_CONSOLE_GETCHAR:
1629         ret = qemu_chr_fe_read_all(serial_hd(0)->be, &ch, sizeof(ch));
1630         if (ret == sizeof(ch)) {
1631             run->riscv_sbi.ret[0] = ch;
1632         } else {
1633             run->riscv_sbi.ret[0] = -1;
1634         }
1635         ret = 0;
1636         break;
1637     case SBI_EXT_DBCN:
1638         kvm_riscv_handle_sbi_dbcn(cs, run);
1639         break;
1640     default:
1641         qemu_log_mask(LOG_UNIMP,
1642                       "%s: un-handled SBI EXIT, specific reasons is %lu\n",
1643                       __func__, run->riscv_sbi.extension_id);
1644         ret = -1;
1645         break;
1646     }
1647     return ret;
1648 }
1649 
1650 static int kvm_riscv_handle_csr(CPUState *cs, struct kvm_run *run)
1651 {
1652     target_ulong csr_num = run->riscv_csr.csr_num;
1653     target_ulong new_value = run->riscv_csr.new_value;
1654     target_ulong write_mask = run->riscv_csr.write_mask;
1655     int ret = 0;
1656 
1657     switch (csr_num) {
1658     case CSR_SEED:
1659         run->riscv_csr.ret_value = riscv_new_csr_seed(new_value, write_mask);
1660         break;
1661     default:
1662         qemu_log_mask(LOG_UNIMP,
1663                       "%s: un-handled CSR EXIT for CSR %lx\n",
1664                       __func__, csr_num);
1665         ret = -1;
1666         break;
1667     }
1668 
1669     return ret;
1670 }
1671 
1672 static bool kvm_riscv_handle_debug(CPUState *cs)
1673 {
1674     RISCVCPU *cpu = RISCV_CPU(cs);
1675     CPURISCVState *env = &cpu->env;
1676 
1677     /* Ensure PC is synchronised */
1678     kvm_cpu_synchronize_state(cs);
1679 
1680     if (kvm_find_sw_breakpoint(cs, env->pc)) {
1681         return true;
1682     }
1683 
1684     return false;
1685 }
1686 
1687 int kvm_arch_handle_exit(CPUState *cs, struct kvm_run *run)
1688 {
1689     int ret = 0;
1690     switch (run->exit_reason) {
1691     case KVM_EXIT_RISCV_SBI:
1692         ret = kvm_riscv_handle_sbi(cs, run);
1693         break;
1694     case KVM_EXIT_RISCV_CSR:
1695         ret = kvm_riscv_handle_csr(cs, run);
1696         break;
1697     case KVM_EXIT_DEBUG:
1698         if (kvm_riscv_handle_debug(cs)) {
1699             ret = EXCP_DEBUG;
1700         }
1701         break;
1702     default:
1703         qemu_log_mask(LOG_UNIMP, "%s: un-handled exit reason %d\n",
1704                       __func__, run->exit_reason);
1705         ret = -1;
1706         break;
1707     }
1708     return ret;
1709 }
1710 
1711 void kvm_riscv_reset_vcpu(RISCVCPU *cpu)
1712 {
1713     CPURISCVState *env = &cpu->env;
1714     int i;
1715 
1716     for (i = 0; i < 32; i++) {
1717         env->gpr[i] = 0;
1718     }
1719     env->pc = cpu->env.kernel_addr;
1720     env->gpr[10] = kvm_arch_vcpu_id(CPU(cpu)); /* a0 */
1721     env->gpr[11] = cpu->env.fdt_addr;          /* a1 */
1722 
1723     kvm_riscv_reset_regs_csr(env);
1724 }
1725 
1726 void kvm_riscv_set_irq(RISCVCPU *cpu, int irq, int level)
1727 {
1728     int ret;
1729     unsigned virq = level ? KVM_INTERRUPT_SET : KVM_INTERRUPT_UNSET;
1730 
1731     if (irq != IRQ_S_EXT) {
1732         perror("kvm riscv set irq != IRQ_S_EXT\n");
1733         abort();
1734     }
1735 
1736     ret = kvm_vcpu_ioctl(CPU(cpu), KVM_INTERRUPT, &virq);
1737     if (ret < 0) {
1738         perror("Set irq failed");
1739         abort();
1740     }
1741 }
1742 
1743 static int aia_mode;
1744 
1745 static const char *kvm_aia_mode_str(uint64_t mode)
1746 {
1747     switch (mode) {
1748     case KVM_DEV_RISCV_AIA_MODE_EMUL:
1749         return "emul";
1750     case KVM_DEV_RISCV_AIA_MODE_HWACCEL:
1751         return "hwaccel";
1752     case KVM_DEV_RISCV_AIA_MODE_AUTO:
1753     default:
1754         return "auto";
1755     };
1756 }
1757 
1758 static char *riscv_get_kvm_aia(Object *obj, Error **errp)
1759 {
1760     return g_strdup(kvm_aia_mode_str(aia_mode));
1761 }
1762 
1763 static void riscv_set_kvm_aia(Object *obj, const char *val, Error **errp)
1764 {
1765     if (!strcmp(val, "emul")) {
1766         aia_mode = KVM_DEV_RISCV_AIA_MODE_EMUL;
1767     } else if (!strcmp(val, "hwaccel")) {
1768         aia_mode = KVM_DEV_RISCV_AIA_MODE_HWACCEL;
1769     } else if (!strcmp(val, "auto")) {
1770         aia_mode = KVM_DEV_RISCV_AIA_MODE_AUTO;
1771     } else {
1772         error_setg(errp, "Invalid KVM AIA mode");
1773         error_append_hint(errp, "Valid values are emul, hwaccel, and auto.\n");
1774     }
1775 }
1776 
1777 void kvm_arch_accel_class_init(ObjectClass *oc)
1778 {
1779     object_class_property_add_str(oc, "riscv-aia", riscv_get_kvm_aia,
1780                                   riscv_set_kvm_aia);
1781     object_class_property_set_description(oc, "riscv-aia",
1782         "Set KVM AIA mode. Valid values are 'emul', 'hwaccel' and 'auto'. "
1783         "Changing KVM AIA modes relies on host support. Defaults to 'auto' "
1784         "if the host supports it");
1785     object_property_set_default_str(object_class_property_find(oc, "riscv-aia"),
1786                                     "auto");
1787 }
1788 
1789 void kvm_riscv_aia_create(MachineState *machine, uint64_t group_shift,
1790                           uint64_t aia_irq_num, uint64_t aia_msi_num,
1791                           uint64_t aplic_base, uint64_t imsic_base,
1792                           uint64_t guest_num)
1793 {
1794     int ret, i;
1795     int aia_fd = -1;
1796     uint64_t default_aia_mode;
1797     uint64_t socket_count = riscv_socket_count(machine);
1798     uint64_t max_hart_per_socket = 0;
1799     uint64_t socket, base_hart, hart_count, socket_imsic_base, imsic_addr;
1800     uint64_t socket_bits, hart_bits, guest_bits;
1801     uint64_t max_group_id;
1802 
1803     aia_fd = kvm_create_device(kvm_state, KVM_DEV_TYPE_RISCV_AIA, false);
1804 
1805     if (aia_fd < 0) {
1806         error_report("Unable to create in-kernel irqchip");
1807         exit(1);
1808     }
1809 
1810     ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_CONFIG,
1811                             KVM_DEV_RISCV_AIA_CONFIG_MODE,
1812                             &default_aia_mode, false, NULL);
1813     if (ret < 0) {
1814         error_report("KVM AIA: failed to get current KVM AIA mode");
1815         exit(1);
1816     }
1817 
1818     if (default_aia_mode != aia_mode) {
1819         ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_CONFIG,
1820                                 KVM_DEV_RISCV_AIA_CONFIG_MODE,
1821                                 &aia_mode, true, NULL);
1822         if (ret < 0) {
1823             warn_report("KVM AIA: failed to set KVM AIA mode '%s', using "
1824                         "default host mode '%s'",
1825                         kvm_aia_mode_str(aia_mode),
1826                         kvm_aia_mode_str(default_aia_mode));
1827 
1828             /* failed to change AIA mode, use default */
1829             aia_mode = default_aia_mode;
1830         }
1831     }
1832 
1833     /*
1834      * Skip APLIC creation in KVM if we're running split mode.
1835      * This is done by leaving KVM_DEV_RISCV_AIA_CONFIG_SRCS
1836      * unset. We can also skip KVM_DEV_RISCV_AIA_ADDR_APLIC
1837      * since KVM won't be using it.
1838      */
1839     if (!kvm_kernel_irqchip_split()) {
1840         ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_CONFIG,
1841                                 KVM_DEV_RISCV_AIA_CONFIG_SRCS,
1842                                 &aia_irq_num, true, NULL);
1843         if (ret < 0) {
1844             error_report("KVM AIA: failed to set number of input irq lines");
1845             exit(1);
1846         }
1847 
1848         ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_ADDR,
1849                                 KVM_DEV_RISCV_AIA_ADDR_APLIC,
1850                                 &aplic_base, true, NULL);
1851         if (ret < 0) {
1852             error_report("KVM AIA: failed to set the base address of APLIC");
1853             exit(1);
1854         }
1855      }
1856 
1857     ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_CONFIG,
1858                             KVM_DEV_RISCV_AIA_CONFIG_IDS,
1859                             &aia_msi_num, true, NULL);
1860     if (ret < 0) {
1861         error_report("KVM AIA: failed to set number of msi");
1862         exit(1);
1863     }
1864 
1865 
1866     if (socket_count > 1) {
1867         max_group_id = socket_count - 1;
1868         socket_bits = find_last_bit(&max_group_id, BITS_PER_LONG) + 1;
1869         ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_CONFIG,
1870                                 KVM_DEV_RISCV_AIA_CONFIG_GROUP_BITS,
1871                                 &socket_bits, true, NULL);
1872         if (ret < 0) {
1873             error_report("KVM AIA: failed to set group_bits");
1874             exit(1);
1875         }
1876 
1877         ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_CONFIG,
1878                                 KVM_DEV_RISCV_AIA_CONFIG_GROUP_SHIFT,
1879                                 &group_shift, true, NULL);
1880         if (ret < 0) {
1881             error_report("KVM AIA: failed to set group_shift");
1882             exit(1);
1883         }
1884     }
1885 
1886     guest_bits = guest_num == 0 ? 0 :
1887                  find_last_bit(&guest_num, BITS_PER_LONG) + 1;
1888     ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_CONFIG,
1889                             KVM_DEV_RISCV_AIA_CONFIG_GUEST_BITS,
1890                             &guest_bits, true, NULL);
1891     if (ret < 0) {
1892         error_report("KVM AIA: failed to set guest_bits");
1893         exit(1);
1894     }
1895 
1896     for (socket = 0; socket < socket_count; socket++) {
1897         socket_imsic_base = imsic_base + socket * (1U << group_shift);
1898         hart_count = riscv_socket_hart_count(machine, socket);
1899         base_hart = riscv_socket_first_hartid(machine, socket);
1900 
1901         if (max_hart_per_socket < hart_count) {
1902             max_hart_per_socket = hart_count;
1903         }
1904 
1905         for (i = 0; i < hart_count; i++) {
1906             imsic_addr = socket_imsic_base + i * IMSIC_HART_SIZE(guest_bits);
1907             ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_ADDR,
1908                                     KVM_DEV_RISCV_AIA_ADDR_IMSIC(i + base_hart),
1909                                     &imsic_addr, true, NULL);
1910             if (ret < 0) {
1911                 error_report("KVM AIA: failed to set the IMSIC address for hart %d", i);
1912                 exit(1);
1913             }
1914         }
1915     }
1916 
1917 
1918     if (max_hart_per_socket > 1) {
1919         max_hart_per_socket--;
1920         hart_bits = find_last_bit(&max_hart_per_socket, BITS_PER_LONG) + 1;
1921     } else {
1922         hart_bits = 0;
1923     }
1924 
1925     ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_CONFIG,
1926                             KVM_DEV_RISCV_AIA_CONFIG_HART_BITS,
1927                             &hart_bits, true, NULL);
1928     if (ret < 0) {
1929         error_report("KVM AIA: failed to set hart_bits");
1930         exit(1);
1931     }
1932 
1933     if (kvm_has_gsi_routing()) {
1934         for (uint64_t idx = 0; idx < aia_irq_num + 1; ++idx) {
1935             /* KVM AIA only has one APLIC instance */
1936             kvm_irqchip_add_irq_route(kvm_state, idx, 0, idx);
1937         }
1938         kvm_gsi_routing_allowed = true;
1939         kvm_irqchip_commit_routes(kvm_state);
1940     }
1941 
1942     ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_CTRL,
1943                             KVM_DEV_RISCV_AIA_CTRL_INIT,
1944                             NULL, true, NULL);
1945     if (ret < 0) {
1946         error_report("KVM AIA: initialized fail");
1947         exit(1);
1948     }
1949 
1950     kvm_msi_via_irqfd_allowed = true;
1951 }
1952 
1953 static void kvm_cpu_instance_init(CPUState *cs)
1954 {
1955     Object *obj = OBJECT(RISCV_CPU(cs));
1956 
1957     riscv_init_kvm_registers(obj);
1958 
1959     kvm_riscv_add_cpu_user_properties(obj);
1960 }
1961 
1962 /*
1963  * We'll get here via the following path:
1964  *
1965  * riscv_cpu_realize()
1966  *   -> cpu_exec_realizefn()
1967  *      -> kvm_cpu_realize() (via accel_cpu_common_realize())
1968  */
1969 static bool kvm_cpu_realize(CPUState *cs, Error **errp)
1970 {
1971     RISCVCPU *cpu = RISCV_CPU(cs);
1972     int ret;
1973 
1974     if (riscv_has_ext(&cpu->env, RVV)) {
1975         ret = prctl(PR_RISCV_V_SET_CONTROL, PR_RISCV_V_VSTATE_CTRL_ON);
1976         if (ret) {
1977             error_setg(errp, "Error in prctl PR_RISCV_V_SET_CONTROL, code: %s",
1978                        strerrorname_np(errno));
1979             return false;
1980         }
1981     }
1982 
1983    return true;
1984 }
1985 
1986 void riscv_kvm_cpu_finalize_features(RISCVCPU *cpu, Error **errp)
1987 {
1988     CPURISCVState *env = &cpu->env;
1989     KVMScratchCPU kvmcpu;
1990     struct kvm_one_reg reg;
1991     uint64_t val;
1992     int ret;
1993 
1994     /* short-circuit without spinning the scratch CPU */
1995     if (!cpu->cfg.ext_zicbom && !cpu->cfg.ext_zicboz &&
1996         !riscv_has_ext(env, RVV)) {
1997         return;
1998     }
1999 
2000     if (!kvm_riscv_create_scratch_vcpu(&kvmcpu)) {
2001         error_setg(errp, "Unable to create scratch KVM cpu");
2002         return;
2003     }
2004 
2005     if (cpu->cfg.ext_zicbom &&
2006         riscv_cpu_option_set(kvm_cbom_blocksize.name)) {
2007 
2008         reg.id = KVM_RISCV_REG_ID_ULONG(KVM_REG_RISCV_CONFIG,
2009                                         kvm_cbom_blocksize.kvm_reg_id);
2010         reg.addr = (uint64_t)&val;
2011         ret = ioctl(kvmcpu.cpufd, KVM_GET_ONE_REG, &reg);
2012         if (ret != 0) {
2013             error_setg(errp, "Unable to read cbom_blocksize, error %d", errno);
2014             return;
2015         }
2016 
2017         if (cpu->cfg.cbom_blocksize != val) {
2018             error_setg(errp, "Unable to set cbom_blocksize to a different "
2019                        "value than the host (%lu)", val);
2020             return;
2021         }
2022     }
2023 
2024     if (cpu->cfg.ext_zicboz &&
2025         riscv_cpu_option_set(kvm_cboz_blocksize.name)) {
2026 
2027         reg.id = KVM_RISCV_REG_ID_ULONG(KVM_REG_RISCV_CONFIG,
2028                                         kvm_cboz_blocksize.kvm_reg_id);
2029         reg.addr = (uint64_t)&val;
2030         ret = ioctl(kvmcpu.cpufd, KVM_GET_ONE_REG, &reg);
2031         if (ret != 0) {
2032             error_setg(errp, "Unable to read cboz_blocksize, error %d", errno);
2033             return;
2034         }
2035 
2036         if (cpu->cfg.cboz_blocksize != val) {
2037             error_setg(errp, "Unable to set cboz_blocksize to a different "
2038                        "value than the host (%lu)", val);
2039             return;
2040         }
2041     }
2042 
2043     /* Users are setting vlen, not vlenb */
2044     if (riscv_has_ext(env, RVV) && riscv_cpu_option_set("vlen")) {
2045         if (!kvm_v_vlenb.supported) {
2046             error_setg(errp, "Unable to set 'vlenb': register not supported");
2047             return;
2048         }
2049 
2050         reg.id = kvm_v_vlenb.kvm_reg_id;
2051         reg.addr = (uint64_t)&val;
2052         ret = ioctl(kvmcpu.cpufd, KVM_GET_ONE_REG, &reg);
2053         if (ret != 0) {
2054             error_setg(errp, "Unable to read vlenb register, error %d", errno);
2055             return;
2056         }
2057 
2058         if (cpu->cfg.vlenb != val) {
2059             error_setg(errp, "Unable to set 'vlen' to a different "
2060                        "value than the host (%lu)", val * 8);
2061             return;
2062         }
2063     }
2064 
2065     kvm_riscv_destroy_scratch_vcpu(&kvmcpu);
2066 }
2067 
2068 static void kvm_cpu_accel_class_init(ObjectClass *oc, const void *data)
2069 {
2070     AccelCPUClass *acc = ACCEL_CPU_CLASS(oc);
2071 
2072     acc->cpu_instance_init = kvm_cpu_instance_init;
2073     acc->cpu_target_realize = kvm_cpu_realize;
2074 }
2075 
2076 static const TypeInfo kvm_cpu_accel_type_info = {
2077     .name = ACCEL_CPU_NAME("kvm"),
2078 
2079     .parent = TYPE_ACCEL_CPU,
2080     .class_init = kvm_cpu_accel_class_init,
2081     .abstract = true,
2082 };
2083 static void kvm_cpu_accel_register_types(void)
2084 {
2085     type_register_static(&kvm_cpu_accel_type_info);
2086 }
2087 type_init(kvm_cpu_accel_register_types);
2088 
2089 static const TypeInfo riscv_kvm_cpu_type_infos[] = {
2090     {
2091         .name = TYPE_RISCV_CPU_HOST,
2092         .parent = TYPE_RISCV_CPU,
2093 #if defined(TARGET_RISCV32)
2094         .class_data = &(const RISCVCPUDef) {
2095             .misa_mxl_max = MXL_RV32,
2096             .priv_spec = RISCV_PROFILE_ATTR_UNUSED,
2097             .vext_spec = RISCV_PROFILE_ATTR_UNUSED,
2098             .cfg.max_satp_mode = -1,
2099         },
2100 #elif defined(TARGET_RISCV64)
2101         .class_data = &(const RISCVCPUDef) {
2102             .misa_mxl_max = MXL_RV64,
2103             .priv_spec = RISCV_PROFILE_ATTR_UNUSED,
2104             .vext_spec = RISCV_PROFILE_ATTR_UNUSED,
2105             .cfg.max_satp_mode = -1,
2106         },
2107 #endif
2108     }
2109 };
2110 
2111 DEFINE_TYPES(riscv_kvm_cpu_type_infos)
2112 
2113 static const uint32_t ebreak_insn = 0x00100073;
2114 static const uint16_t c_ebreak_insn = 0x9002;
2115 
2116 int kvm_arch_insert_sw_breakpoint(CPUState *cs, struct kvm_sw_breakpoint *bp)
2117 {
2118     if (cpu_memory_rw_debug(cs, bp->pc, (uint8_t *)&bp->saved_insn, 2, 0)) {
2119         return -EINVAL;
2120     }
2121 
2122     if ((bp->saved_insn & 0x3) == 0x3) {
2123         if (cpu_memory_rw_debug(cs, bp->pc, (uint8_t *)&bp->saved_insn, 4, 0)
2124             || cpu_memory_rw_debug(cs, bp->pc, (uint8_t *)&ebreak_insn, 4, 1)) {
2125             return -EINVAL;
2126         }
2127     } else {
2128         if (cpu_memory_rw_debug(cs, bp->pc, (uint8_t *)&c_ebreak_insn, 2, 1)) {
2129             return -EINVAL;
2130         }
2131     }
2132 
2133     return 0;
2134 }
2135 
2136 int kvm_arch_remove_sw_breakpoint(CPUState *cs, struct kvm_sw_breakpoint *bp)
2137 {
2138     uint32_t ebreak;
2139     uint16_t c_ebreak;
2140 
2141     if ((bp->saved_insn & 0x3) == 0x3) {
2142         if (cpu_memory_rw_debug(cs, bp->pc, (uint8_t *)&ebreak, 4, 0) ||
2143             ebreak != ebreak_insn ||
2144             cpu_memory_rw_debug(cs, bp->pc, (uint8_t *)&bp->saved_insn, 4, 1)) {
2145             return -EINVAL;
2146         }
2147     } else {
2148         if (cpu_memory_rw_debug(cs, bp->pc, (uint8_t *)&c_ebreak, 2, 0) ||
2149             c_ebreak != c_ebreak_insn ||
2150             cpu_memory_rw_debug(cs, bp->pc, (uint8_t *)&bp->saved_insn, 2, 1)) {
2151             return -EINVAL;
2152         }
2153     }
2154 
2155     return 0;
2156 }
2157 
2158 int kvm_arch_insert_hw_breakpoint(vaddr addr, vaddr len, int type)
2159 {
2160     /* TODO; To be implemented later. */
2161     return -EINVAL;
2162 }
2163 
2164 int kvm_arch_remove_hw_breakpoint(vaddr addr, vaddr len, int type)
2165 {
2166     /* TODO; To be implemented later. */
2167     return -EINVAL;
2168 }
2169 
2170 void kvm_arch_remove_all_hw_breakpoints(void)
2171 {
2172     /* TODO; To be implemented later. */
2173 }
2174 
2175 void kvm_arch_update_guest_debug(CPUState *cs, struct kvm_guest_debug *dbg)
2176 {
2177     if (kvm_sw_breakpoints_active(cs)) {
2178         dbg->control |= KVM_GUESTDBG_ENABLE;
2179     }
2180 }
2181