xref: /openbmc/qemu/hw/ppc/spapr.c (revision ae4de14c)
153018216SPaolo Bonzini /*
253018216SPaolo Bonzini  * QEMU PowerPC pSeries Logical Partition (aka sPAPR) hardware System Emulator
353018216SPaolo Bonzini  *
453018216SPaolo Bonzini  * Copyright (c) 2004-2007 Fabrice Bellard
553018216SPaolo Bonzini  * Copyright (c) 2007 Jocelyn Mayer
653018216SPaolo Bonzini  * Copyright (c) 2010 David Gibson, IBM Corporation.
753018216SPaolo Bonzini  *
853018216SPaolo Bonzini  * Permission is hereby granted, free of charge, to any person obtaining a copy
953018216SPaolo Bonzini  * of this software and associated documentation files (the "Software"), to deal
1053018216SPaolo Bonzini  * in the Software without restriction, including without limitation the rights
1153018216SPaolo Bonzini  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
1253018216SPaolo Bonzini  * copies of the Software, and to permit persons to whom the Software is
1353018216SPaolo Bonzini  * furnished to do so, subject to the following conditions:
1453018216SPaolo Bonzini  *
1553018216SPaolo Bonzini  * The above copyright notice and this permission notice shall be included in
1653018216SPaolo Bonzini  * all copies or substantial portions of the Software.
1753018216SPaolo Bonzini  *
1853018216SPaolo Bonzini  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
1953018216SPaolo Bonzini  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
2053018216SPaolo Bonzini  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
2153018216SPaolo Bonzini  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
2253018216SPaolo Bonzini  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
2353018216SPaolo Bonzini  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
2453018216SPaolo Bonzini  * THE SOFTWARE.
2553018216SPaolo Bonzini  *
2653018216SPaolo Bonzini  */
270d75590dSPeter Maydell #include "qemu/osdep.h"
28da34e65cSMarkus Armbruster #include "qapi/error.h"
2953018216SPaolo Bonzini #include "sysemu/sysemu.h"
30e35704baSEduardo Habkost #include "sysemu/numa.h"
3153018216SPaolo Bonzini #include "hw/hw.h"
3203dd024fSPaolo Bonzini #include "qemu/log.h"
3371461b0fSAlexey Kardashevskiy #include "hw/fw-path-provider.h"
3453018216SPaolo Bonzini #include "elf.h"
3553018216SPaolo Bonzini #include "net/net.h"
36ad440b4aSAndrew Jones #include "sysemu/device_tree.h"
37fa1d36dfSMarkus Armbruster #include "sysemu/block-backend.h"
3853018216SPaolo Bonzini #include "sysemu/cpus.h"
3953018216SPaolo Bonzini #include "sysemu/kvm.h"
40c20d332aSBharata B Rao #include "sysemu/device_tree.h"
4153018216SPaolo Bonzini #include "kvm_ppc.h"
42ff14e817SDr. David Alan Gilbert #include "migration/migration.h"
434be21d56SDavid Gibson #include "mmu-hash64.h"
443794d548SAlexey Kardashevskiy #include "qom/cpu.h"
4553018216SPaolo Bonzini 
4653018216SPaolo Bonzini #include "hw/boards.h"
470d09e41aSPaolo Bonzini #include "hw/ppc/ppc.h"
4853018216SPaolo Bonzini #include "hw/loader.h"
4953018216SPaolo Bonzini 
500d09e41aSPaolo Bonzini #include "hw/ppc/spapr.h"
510d09e41aSPaolo Bonzini #include "hw/ppc/spapr_vio.h"
520d09e41aSPaolo Bonzini #include "hw/pci-host/spapr.h"
530d09e41aSPaolo Bonzini #include "hw/ppc/xics.h"
5453018216SPaolo Bonzini #include "hw/pci/msi.h"
5553018216SPaolo Bonzini 
5653018216SPaolo Bonzini #include "hw/pci/pci.h"
5771461b0fSAlexey Kardashevskiy #include "hw/scsi/scsi.h"
5871461b0fSAlexey Kardashevskiy #include "hw/virtio/virtio-scsi.h"
5953018216SPaolo Bonzini 
6053018216SPaolo Bonzini #include "exec/address-spaces.h"
6153018216SPaolo Bonzini #include "hw/usb.h"
6253018216SPaolo Bonzini #include "qemu/config-file.h"
63135a129aSAneesh Kumar K.V #include "qemu/error-report.h"
642a6593cbSAlexey Kardashevskiy #include "trace.h"
6534316482SAlexey Kardashevskiy #include "hw/nmi.h"
6653018216SPaolo Bonzini 
6768a27b20SMichael S. Tsirkin #include "hw/compat.h"
68f348b6d1SVeronia Bahaa #include "qemu/cutils.h"
6994a94e4cSBharata B Rao #include "hw/ppc/spapr_cpu_core.h"
702474bfd4SIgor Mammedov #include "qmp-commands.h"
7168a27b20SMichael S. Tsirkin 
7253018216SPaolo Bonzini #include <libfdt.h>
7353018216SPaolo Bonzini 
/* SLOF memory layout:
 *
 * The SLOF raw image is loaded at 0; it copies its romfs right below the
 * flat device-tree, then positions SLOF itself 31M below that.
 *
 * So we set FW_OVERHEAD to 40MB, which should account for all of that
 * and more.
 *
 * We load our kernel at 4M, leaving space for the SLOF initial image.
 */
#define FDT_MAX_SIZE            0x100000 /* 1 MiB: size of the buffer the FDT is built in */
#define RTAS_MAX_SIZE           0x10000 /* 64 KiB */
#define RTAS_MAX_ADDR           0x80000000 /* RTAS must stay below that */
#define FW_MAX_SIZE             0x400000 /* 4 MiB */
#define FW_FILE_NAME            "slof.bin" /* presumably the default firmware image name */
#define FW_OVERHEAD             0x2800000 /* 40 MiB, see the layout note above */
#define KERNEL_LOAD_ADDR        FW_MAX_SIZE /* kernel goes right after the firmware area */

/* NOTE(review): unit is not visible here, presumably MiB - confirm at the use site */
#define MIN_RMA_SLOF            128UL

/* phandle value given to the interrupt-controller node of the device tree */
#define PHANDLE_XICP            0x00001111

/* Hash page table size in bytes, derived from the machine's htab_shift */
#define HTAB_SIZE(spapr)        (1ULL << ((spapr)->htab_shift))
9753018216SPaolo Bonzini 
98c04d6cfaSAnthony Liguori static XICSState *try_create_xics(const char *type, int nr_servers,
9934f2af3dSMarkus Armbruster                                   int nr_irqs, Error **errp)
100c04d6cfaSAnthony Liguori {
10134f2af3dSMarkus Armbruster     Error *err = NULL;
102c04d6cfaSAnthony Liguori     DeviceState *dev;
103c04d6cfaSAnthony Liguori 
104c04d6cfaSAnthony Liguori     dev = qdev_create(NULL, type);
105c04d6cfaSAnthony Liguori     qdev_prop_set_uint32(dev, "nr_servers", nr_servers);
106c04d6cfaSAnthony Liguori     qdev_prop_set_uint32(dev, "nr_irqs", nr_irqs);
10734f2af3dSMarkus Armbruster     object_property_set_bool(OBJECT(dev), true, "realized", &err);
10834f2af3dSMarkus Armbruster     if (err) {
10934f2af3dSMarkus Armbruster         error_propagate(errp, err);
11034f2af3dSMarkus Armbruster         object_unparent(OBJECT(dev));
111c04d6cfaSAnthony Liguori         return NULL;
112c04d6cfaSAnthony Liguori     }
1135a3d7b23SAlexey Kardashevskiy     return XICS_COMMON(dev);
114c04d6cfaSAnthony Liguori }
115c04d6cfaSAnthony Liguori 
116446f16a6SMarcel Apfelbaum static XICSState *xics_system_init(MachineState *machine,
1171e49182dSDavid Gibson                                    int nr_servers, int nr_irqs, Error **errp)
118c04d6cfaSAnthony Liguori {
11927f24582SBenjamin Herrenschmidt     XICSState *xics = NULL;
120c04d6cfaSAnthony Liguori 
12111ad93f6SDavid Gibson     if (kvm_enabled()) {
12234f2af3dSMarkus Armbruster         Error *err = NULL;
12334f2af3dSMarkus Armbruster 
124446f16a6SMarcel Apfelbaum         if (machine_kernel_irqchip_allowed(machine)) {
12527f24582SBenjamin Herrenschmidt             xics = try_create_xics(TYPE_XICS_SPAPR_KVM, nr_servers, nr_irqs,
126161deaf2SBenjamin Herrenschmidt                                    &err);
12711ad93f6SDavid Gibson         }
12827f24582SBenjamin Herrenschmidt         if (machine_kernel_irqchip_required(machine) && !xics) {
129b83baa60SMarkus Armbruster             error_reportf_err(err,
130b83baa60SMarkus Armbruster                               "kernel_irqchip requested but unavailable: ");
131b83baa60SMarkus Armbruster         } else {
132903a41d3SStefano Dong (董兴水)             error_free(err);
13311ad93f6SDavid Gibson         }
134b83baa60SMarkus Armbruster     }
13511ad93f6SDavid Gibson 
13627f24582SBenjamin Herrenschmidt     if (!xics) {
13727f24582SBenjamin Herrenschmidt         xics = try_create_xics(TYPE_XICS_SPAPR, nr_servers, nr_irqs, errp);
138c04d6cfaSAnthony Liguori     }
139c04d6cfaSAnthony Liguori 
14027f24582SBenjamin Herrenschmidt     return xics;
141c04d6cfaSAnthony Liguori }
142c04d6cfaSAnthony Liguori 
143833d4668SAlexey Kardashevskiy static int spapr_fixup_cpu_smt_dt(void *fdt, int offset, PowerPCCPU *cpu,
144833d4668SAlexey Kardashevskiy                                   int smt_threads)
145833d4668SAlexey Kardashevskiy {
146833d4668SAlexey Kardashevskiy     int i, ret = 0;
147833d4668SAlexey Kardashevskiy     uint32_t servers_prop[smt_threads];
148833d4668SAlexey Kardashevskiy     uint32_t gservers_prop[smt_threads * 2];
149833d4668SAlexey Kardashevskiy     int index = ppc_get_vcpu_dt_id(cpu);
150833d4668SAlexey Kardashevskiy 
1516d9412eaSAlexey Kardashevskiy     if (cpu->cpu_version) {
1524bce526eSLaurent Dufour         ret = fdt_setprop_cell(fdt, offset, "cpu-version", cpu->cpu_version);
1536d9412eaSAlexey Kardashevskiy         if (ret < 0) {
1546d9412eaSAlexey Kardashevskiy             return ret;
1556d9412eaSAlexey Kardashevskiy         }
1566d9412eaSAlexey Kardashevskiy     }
1576d9412eaSAlexey Kardashevskiy 
158833d4668SAlexey Kardashevskiy     /* Build interrupt servers and gservers properties */
159833d4668SAlexey Kardashevskiy     for (i = 0; i < smt_threads; i++) {
160833d4668SAlexey Kardashevskiy         servers_prop[i] = cpu_to_be32(index + i);
161833d4668SAlexey Kardashevskiy         /* Hack, direct the group queues back to cpu 0 */
162833d4668SAlexey Kardashevskiy         gservers_prop[i*2] = cpu_to_be32(index + i);
163833d4668SAlexey Kardashevskiy         gservers_prop[i*2 + 1] = 0;
164833d4668SAlexey Kardashevskiy     }
165833d4668SAlexey Kardashevskiy     ret = fdt_setprop(fdt, offset, "ibm,ppc-interrupt-server#s",
166833d4668SAlexey Kardashevskiy                       servers_prop, sizeof(servers_prop));
167833d4668SAlexey Kardashevskiy     if (ret < 0) {
168833d4668SAlexey Kardashevskiy         return ret;
169833d4668SAlexey Kardashevskiy     }
170833d4668SAlexey Kardashevskiy     ret = fdt_setprop(fdt, offset, "ibm,ppc-interrupt-gserver#s",
171833d4668SAlexey Kardashevskiy                       gservers_prop, sizeof(gservers_prop));
172833d4668SAlexey Kardashevskiy 
173833d4668SAlexey Kardashevskiy     return ret;
174833d4668SAlexey Kardashevskiy }
175833d4668SAlexey Kardashevskiy 
1760da6f3feSBharata B Rao static int spapr_fixup_cpu_numa_dt(void *fdt, int offset, CPUState *cs)
1770da6f3feSBharata B Rao {
1780da6f3feSBharata B Rao     int ret = 0;
1790da6f3feSBharata B Rao     PowerPCCPU *cpu = POWERPC_CPU(cs);
1800da6f3feSBharata B Rao     int index = ppc_get_vcpu_dt_id(cpu);
1810da6f3feSBharata B Rao     uint32_t associativity[] = {cpu_to_be32(0x5),
1820da6f3feSBharata B Rao                                 cpu_to_be32(0x0),
1830da6f3feSBharata B Rao                                 cpu_to_be32(0x0),
1840da6f3feSBharata B Rao                                 cpu_to_be32(0x0),
1850da6f3feSBharata B Rao                                 cpu_to_be32(cs->numa_node),
1860da6f3feSBharata B Rao                                 cpu_to_be32(index)};
1870da6f3feSBharata B Rao 
1880da6f3feSBharata B Rao     /* Advertise NUMA via ibm,associativity */
1890da6f3feSBharata B Rao     if (nb_numa_nodes > 1) {
1900da6f3feSBharata B Rao         ret = fdt_setprop(fdt, offset, "ibm,associativity", associativity,
1910da6f3feSBharata B Rao                           sizeof(associativity));
1920da6f3feSBharata B Rao     }
1930da6f3feSBharata B Rao 
1940da6f3feSBharata B Rao     return ret;
1950da6f3feSBharata B Rao }
1960da6f3feSBharata B Rao 
19728e02042SDavid Gibson static int spapr_fixup_cpu_dt(void *fdt, sPAPRMachineState *spapr)
19853018216SPaolo Bonzini {
19982677ed2SAlexey Kardashevskiy     int ret = 0, offset, cpus_offset;
20082677ed2SAlexey Kardashevskiy     CPUState *cs;
20153018216SPaolo Bonzini     char cpu_model[32];
20253018216SPaolo Bonzini     int smt = kvmppc_smt_threads();
20353018216SPaolo Bonzini     uint32_t pft_size_prop[] = {0, cpu_to_be32(spapr->htab_shift)};
20453018216SPaolo Bonzini 
20582677ed2SAlexey Kardashevskiy     CPU_FOREACH(cs) {
20682677ed2SAlexey Kardashevskiy         PowerPCCPU *cpu = POWERPC_CPU(cs);
20782677ed2SAlexey Kardashevskiy         DeviceClass *dc = DEVICE_GET_CLASS(cs);
20882677ed2SAlexey Kardashevskiy         int index = ppc_get_vcpu_dt_id(cpu);
20953018216SPaolo Bonzini 
2100f20ba62SAlexey Kardashevskiy         if ((index % smt) != 0) {
21153018216SPaolo Bonzini             continue;
21253018216SPaolo Bonzini         }
21353018216SPaolo Bonzini 
21482677ed2SAlexey Kardashevskiy         snprintf(cpu_model, 32, "%s@%x", dc->fw_name, index);
21553018216SPaolo Bonzini 
21682677ed2SAlexey Kardashevskiy         cpus_offset = fdt_path_offset(fdt, "/cpus");
21782677ed2SAlexey Kardashevskiy         if (cpus_offset < 0) {
21882677ed2SAlexey Kardashevskiy             cpus_offset = fdt_add_subnode(fdt, fdt_path_offset(fdt, "/"),
21982677ed2SAlexey Kardashevskiy                                           "cpus");
22082677ed2SAlexey Kardashevskiy             if (cpus_offset < 0) {
22182677ed2SAlexey Kardashevskiy                 return cpus_offset;
22282677ed2SAlexey Kardashevskiy             }
22382677ed2SAlexey Kardashevskiy         }
22482677ed2SAlexey Kardashevskiy         offset = fdt_subnode_offset(fdt, cpus_offset, cpu_model);
22582677ed2SAlexey Kardashevskiy         if (offset < 0) {
22682677ed2SAlexey Kardashevskiy             offset = fdt_add_subnode(fdt, cpus_offset, cpu_model);
22753018216SPaolo Bonzini             if (offset < 0) {
22853018216SPaolo Bonzini                 return offset;
22953018216SPaolo Bonzini             }
23082677ed2SAlexey Kardashevskiy         }
23153018216SPaolo Bonzini 
2320da6f3feSBharata B Rao         ret = fdt_setprop(fdt, offset, "ibm,pft-size",
2330da6f3feSBharata B Rao                           pft_size_prop, sizeof(pft_size_prop));
23453018216SPaolo Bonzini         if (ret < 0) {
23553018216SPaolo Bonzini             return ret;
23653018216SPaolo Bonzini         }
23753018216SPaolo Bonzini 
2380da6f3feSBharata B Rao         ret = spapr_fixup_cpu_numa_dt(fdt, offset, cs);
23953018216SPaolo Bonzini         if (ret < 0) {
24053018216SPaolo Bonzini             return ret;
24153018216SPaolo Bonzini         }
242833d4668SAlexey Kardashevskiy 
24382677ed2SAlexey Kardashevskiy         ret = spapr_fixup_cpu_smt_dt(fdt, offset, cpu,
2442a48d993SAlexey Kardashevskiy                                      ppc_get_compat_smt_threads(cpu));
245833d4668SAlexey Kardashevskiy         if (ret < 0) {
246833d4668SAlexey Kardashevskiy             return ret;
247833d4668SAlexey Kardashevskiy         }
24853018216SPaolo Bonzini     }
24953018216SPaolo Bonzini     return ret;
25053018216SPaolo Bonzini }
25153018216SPaolo Bonzini 
25253018216SPaolo Bonzini 
25353018216SPaolo Bonzini static size_t create_page_sizes_prop(CPUPPCState *env, uint32_t *prop,
25453018216SPaolo Bonzini                                      size_t maxsize)
25553018216SPaolo Bonzini {
25653018216SPaolo Bonzini     size_t maxcells = maxsize / sizeof(uint32_t);
25753018216SPaolo Bonzini     int i, j, count;
25853018216SPaolo Bonzini     uint32_t *p = prop;
25953018216SPaolo Bonzini 
26053018216SPaolo Bonzini     for (i = 0; i < PPC_PAGE_SIZES_MAX_SZ; i++) {
26153018216SPaolo Bonzini         struct ppc_one_seg_page_size *sps = &env->sps.sps[i];
26253018216SPaolo Bonzini 
26353018216SPaolo Bonzini         if (!sps->page_shift) {
26453018216SPaolo Bonzini             break;
26553018216SPaolo Bonzini         }
26653018216SPaolo Bonzini         for (count = 0; count < PPC_PAGE_SIZES_MAX_SZ; count++) {
26753018216SPaolo Bonzini             if (sps->enc[count].page_shift == 0) {
26853018216SPaolo Bonzini                 break;
26953018216SPaolo Bonzini             }
27053018216SPaolo Bonzini         }
27153018216SPaolo Bonzini         if ((p - prop) >= (maxcells - 3 - count * 2)) {
27253018216SPaolo Bonzini             break;
27353018216SPaolo Bonzini         }
27453018216SPaolo Bonzini         *(p++) = cpu_to_be32(sps->page_shift);
27553018216SPaolo Bonzini         *(p++) = cpu_to_be32(sps->slb_enc);
27653018216SPaolo Bonzini         *(p++) = cpu_to_be32(count);
27753018216SPaolo Bonzini         for (j = 0; j < count; j++) {
27853018216SPaolo Bonzini             *(p++) = cpu_to_be32(sps->enc[j].page_shift);
27953018216SPaolo Bonzini             *(p++) = cpu_to_be32(sps->enc[j].pte_enc);
28053018216SPaolo Bonzini         }
28153018216SPaolo Bonzini     }
28253018216SPaolo Bonzini 
28353018216SPaolo Bonzini     return (p - prop) * sizeof(uint32_t);
28453018216SPaolo Bonzini }
28553018216SPaolo Bonzini 
286b082d65aSAlexey Kardashevskiy static hwaddr spapr_node0_size(void)
287b082d65aSAlexey Kardashevskiy {
288fb164994SDavid Gibson     MachineState *machine = MACHINE(qdev_get_machine());
289fb164994SDavid Gibson 
290b082d65aSAlexey Kardashevskiy     if (nb_numa_nodes) {
291b082d65aSAlexey Kardashevskiy         int i;
292b082d65aSAlexey Kardashevskiy         for (i = 0; i < nb_numa_nodes; ++i) {
293b082d65aSAlexey Kardashevskiy             if (numa_info[i].node_mem) {
294fb164994SDavid Gibson                 return MIN(pow2floor(numa_info[i].node_mem),
295fb164994SDavid Gibson                            machine->ram_size);
296b082d65aSAlexey Kardashevskiy             }
297b082d65aSAlexey Kardashevskiy         }
298b082d65aSAlexey Kardashevskiy     }
299fb164994SDavid Gibson     return machine->ram_size;
300b082d65aSAlexey Kardashevskiy }
301b082d65aSAlexey Kardashevskiy 
/*
 * Evaluate a libfdt expression once and abort QEMU if it failed.
 *
 * A negative result is reported on stderr together with the stringified
 * expression and fdt_strerror(), then the process exits with status 1.
 *
 * The temporary has a deliberately unusual name so that it cannot shadow a
 * variable (commonly "ret") referenced inside @exp.
 */
#define _FDT(exp) \
    do { \
        int fdt_ret_ = (exp);                                      \
        if (fdt_ret_ < 0) {                                        \
            fprintf(stderr, "qemu: error creating device tree: %s: %s\n", \
                    #exp, fdt_strerror(fdt_ret_));                 \
            exit(1);                                               \
        }                                                          \
    } while (0)
31153018216SPaolo Bonzini 
312a1d59c0fSAlexey Kardashevskiy static void add_str(GString *s, const gchar *s1)
313a1d59c0fSAlexey Kardashevskiy {
314a1d59c0fSAlexey Kardashevskiy     g_string_append_len(s, s1, strlen(s1) + 1);
315a1d59c0fSAlexey Kardashevskiy }
31653018216SPaolo Bonzini 
/*
 * Build the skeleton flattened device tree for the machine.
 *
 * The tree is written into a freshly allocated, zeroed buffer of
 * FDT_MAX_SIZE bytes; nodes are emitted in this order: root properties,
 * /chosen, /rtas, /interrupt-controller, /vdevice, the event sources
 * (via spapr_events_fdt_skel()) and, under KVM only, /hypervisor.
 *
 * @initrd_base:    guest address of the initrd
 * @initrd_size:    size of the initrd; 0 means no reserve-map entry
 * @kernel_size:    size of the kernel; 0 means no reserve-map entry and no
 *                  "qemu,boot-kernel" property
 * @little_endian:  adds "qemu,boot-kernel-le" when a kernel is present
 * @kernel_cmdline: value of the "bootargs" property
 * @epow_irq:       passed through to spapr_events_fdt_skel()
 *
 * Any libfdt failure terminates the process through _FDT().
 * Returns the buffer holding the finished tree; it is not freed here.
 */
static void *spapr_create_fdt_skel(hwaddr initrd_base,
                                   hwaddr initrd_size,
                                   hwaddr kernel_size,
                                   bool little_endian,
                                   const char *kernel_cmdline,
                                   uint32_t epow_irq)
{
    void *fdt;
    /* The initrd bounds are stored as single 32-bit big-endian cells. */
    uint32_t start_prop = cpu_to_be32(initrd_base);
    uint32_t end_prop = cpu_to_be32(initrd_base + initrd_size);
    GString *hypertas = g_string_sized_new(256);
    GString *qemu_hypertas = g_string_sized_new(256);
    uint32_t refpoints[] = {cpu_to_be32(0x4), cpu_to_be32(0x4)};
    uint32_t interrupt_server_ranges_prop[] = {0, cpu_to_be32(max_cpus)};
    unsigned char vec5[] = {0x0, 0x0, 0x0, 0x0, 0x0, 0x80};
    char *buf;

    /*
     * Each add_str() appends the name plus its NUL, producing the string
     * lists later stored in the *hypertas-functions properties.
     */
    add_str(hypertas, "hcall-pft");
    add_str(hypertas, "hcall-term");
    add_str(hypertas, "hcall-dabr");
    add_str(hypertas, "hcall-interrupt");
    add_str(hypertas, "hcall-tce");
    add_str(hypertas, "hcall-vio");
    add_str(hypertas, "hcall-splpar");
    add_str(hypertas, "hcall-bulk");
    add_str(hypertas, "hcall-set-mode");
    add_str(hypertas, "hcall-sprg0");
    add_str(hypertas, "hcall-copy");
    add_str(hypertas, "hcall-debug");
    add_str(qemu_hypertas, "hcall-memop1");

    fdt = g_malloc0(FDT_MAX_SIZE);
    _FDT((fdt_create(fdt, FDT_MAX_SIZE)));

    /* Reserve the memory occupied by the kernel and the initrd, if any. */
    if (kernel_size) {
        _FDT((fdt_add_reservemap_entry(fdt, KERNEL_LOAD_ADDR, kernel_size)));
    }
    if (initrd_size) {
        _FDT((fdt_add_reservemap_entry(fdt, initrd_base, initrd_size)));
    }
    _FDT((fdt_finish_reservemap(fdt)));

    /* Root node */
    _FDT((fdt_begin_node(fdt, "")));
    _FDT((fdt_property_string(fdt, "device_type", "chrp")));
    _FDT((fdt_property_string(fdt, "model", "IBM pSeries (emulated by qemu)")));
    _FDT((fdt_property_string(fdt, "compatible", "qemu,pseries")));

    /*
     * Add info for the guest to identify which host it is running on
     * and what the UUID of the guest is
     */
    if (kvmppc_get_host_model(&buf)) {
        _FDT((fdt_property_string(fdt, "host-model", buf)));
        g_free(buf);
    }
    if (kvmppc_get_host_serial(&buf)) {
        _FDT((fdt_property_string(fdt, "host-serial", buf)));
        g_free(buf);
    }

    buf = g_strdup_printf(UUID_FMT, qemu_uuid[0], qemu_uuid[1],
                          qemu_uuid[2], qemu_uuid[3], qemu_uuid[4],
                          qemu_uuid[5], qemu_uuid[6], qemu_uuid[7],
                          qemu_uuid[8], qemu_uuid[9], qemu_uuid[10],
                          qemu_uuid[11], qemu_uuid[12], qemu_uuid[13],
                          qemu_uuid[14], qemu_uuid[15]);

    /* "vm,uuid" is always present; "system-id" only if a UUID was set. */
    _FDT((fdt_property_string(fdt, "vm,uuid", buf)));
    if (qemu_uuid_set) {
        _FDT((fdt_property_string(fdt, "system-id", buf)));
    }
    g_free(buf);

    if (qemu_get_vm_name()) {
        _FDT((fdt_property_string(fdt, "ibm,partition-name",
                                  qemu_get_vm_name())));
    }

    _FDT((fdt_property_cell(fdt, "#address-cells", 0x2)));
    _FDT((fdt_property_cell(fdt, "#size-cells", 0x2)));

    /* /chosen */
    _FDT((fdt_begin_node(fdt, "chosen")));

    /* Set Form1_affinity */
    _FDT((fdt_property(fdt, "ibm,architecture-vec-5", vec5, sizeof(vec5))));

    _FDT((fdt_property_string(fdt, "bootargs", kernel_cmdline)));
    /* The initrd properties are written even when initrd_size is 0. */
    _FDT((fdt_property(fdt, "linux,initrd-start",
                       &start_prop, sizeof(start_prop))));
    _FDT((fdt_property(fdt, "linux,initrd-end",
                       &end_prop, sizeof(end_prop))));
    if (kernel_size) {
        /* Pair of 64-bit big-endian values: load address, then size. */
        uint64_t kprop[2] = { cpu_to_be64(KERNEL_LOAD_ADDR),
                              cpu_to_be64(kernel_size) };

        _FDT((fdt_property(fdt, "qemu,boot-kernel", &kprop, sizeof(kprop))));
        if (little_endian) {
            _FDT((fdt_property(fdt, "qemu,boot-kernel-le", NULL, 0)));
        }
    }
    if (boot_menu) {
        _FDT((fdt_property_cell(fdt, "qemu,boot-menu", boot_menu)));
    }
    _FDT((fdt_property_cell(fdt, "qemu,graphic-width", graphic_width)));
    _FDT((fdt_property_cell(fdt, "qemu,graphic-height", graphic_height)));
    _FDT((fdt_property_cell(fdt, "qemu,graphic-depth", graphic_depth)));

    _FDT((fdt_end_node(fdt)));

    /* RTAS */
    _FDT((fdt_begin_node(fdt, "rtas")));

    /* Advertised without KVM, or when KVM reports multi-TCE support. */
    if (!kvm_enabled() || kvmppc_spapr_use_multitce()) {
        add_str(hypertas, "hcall-multi-tce");
    }
    _FDT((fdt_property(fdt, "ibm,hypertas-functions", hypertas->str,
                       hypertas->len)));
    g_string_free(hypertas, TRUE);
    _FDT((fdt_property(fdt, "qemu,hypertas-functions", qemu_hypertas->str,
                       qemu_hypertas->len)));
    g_string_free(qemu_hypertas, TRUE);

    _FDT((fdt_property(fdt, "ibm,associativity-reference-points",
        refpoints, sizeof(refpoints))));

    _FDT((fdt_property_cell(fdt, "rtas-error-log-max", RTAS_ERROR_LOG_MAX)));
    _FDT((fdt_property_cell(fdt, "rtas-event-scan-rate",
                            RTAS_EVENT_SCAN_RATE)));

    if (msi_nonbroken) {
        _FDT((fdt_property(fdt, "ibm,change-msix-capable", NULL, 0)));
    }

    /*
     * According to PAPR, rtas ibm,os-term does not guarantee a return
     * back to the guest cpu.
     *
     * While an additional ibm,extended-os-term property indicates that
     * rtas call return will always occur. Set this property.
     */
    _FDT((fdt_property(fdt, "ibm,extended-os-term", NULL, 0)));

    _FDT((fdt_end_node(fdt)));

    /* interrupt controller */
    _FDT((fdt_begin_node(fdt, "interrupt-controller")));

    _FDT((fdt_property_string(fdt, "device_type",
                              "PowerPC-External-Interrupt-Presentation")));
    _FDT((fdt_property_string(fdt, "compatible", "IBM,ppc-xicp")));
    _FDT((fdt_property(fdt, "interrupt-controller", NULL, 0)));
    _FDT((fdt_property(fdt, "ibm,interrupt-server-ranges",
                       interrupt_server_ranges_prop,
                       sizeof(interrupt_server_ranges_prop))));
    _FDT((fdt_property_cell(fdt, "#interrupt-cells", 2)));
    /* Both phandle spellings carry the same value. */
    _FDT((fdt_property_cell(fdt, "linux,phandle", PHANDLE_XICP)));
    _FDT((fdt_property_cell(fdt, "phandle", PHANDLE_XICP)));

    _FDT((fdt_end_node(fdt)));

    /* vdevice */
    _FDT((fdt_begin_node(fdt, "vdevice")));

    _FDT((fdt_property_string(fdt, "device_type", "vdevice")));
    _FDT((fdt_property_string(fdt, "compatible", "IBM,vdevice")));
    _FDT((fdt_property_cell(fdt, "#address-cells", 0x1)));
    _FDT((fdt_property_cell(fdt, "#size-cells", 0x0)));
    _FDT((fdt_property_cell(fdt, "#interrupt-cells", 0x2)));
    _FDT((fdt_property(fdt, "interrupt-controller", NULL, 0)));

    _FDT((fdt_end_node(fdt)));

    /* event-sources */
    spapr_events_fdt_skel(fdt, epow_irq);

    /* /hypervisor node */
    if (kvm_enabled()) {
        uint8_t hypercall[16];

        /* indicate KVM hypercall interface */
        _FDT((fdt_begin_node(fdt, "hypervisor")));
        _FDT((fdt_property_string(fdt, "compatible", "linux,kvm")));
        if (kvmppc_has_cap_fixup_hcalls()) {
            /*
             * Older KVM versions with older guest kernels were broken with the
             * magic page, don't allow the guest to map it.
             */
            /* The property is only added when the call returns 0. */
            if (!kvmppc_get_hypercall(first_cpu->env_ptr, hypercall,
                                      sizeof(hypercall))) {
                _FDT((fdt_property(fdt, "hcall-instructions", hypercall,
                                   sizeof(hypercall))));
            }
        }
        _FDT((fdt_end_node(fdt)));
    }

    _FDT((fdt_end_node(fdt))); /* close root node */
    _FDT((fdt_finish(fdt)));

    return fdt;
}
52053018216SPaolo Bonzini 
52103d196b7SBharata B Rao static int spapr_populate_memory_node(void *fdt, int nodeid, hwaddr start,
52226a8c353SAlexey Kardashevskiy                                        hwaddr size)
52326a8c353SAlexey Kardashevskiy {
52426a8c353SAlexey Kardashevskiy     uint32_t associativity[] = {
52526a8c353SAlexey Kardashevskiy         cpu_to_be32(0x4), /* length */
52626a8c353SAlexey Kardashevskiy         cpu_to_be32(0x0), cpu_to_be32(0x0),
527c3b4f589SAlexey Kardashevskiy         cpu_to_be32(0x0), cpu_to_be32(nodeid)
52826a8c353SAlexey Kardashevskiy     };
52926a8c353SAlexey Kardashevskiy     char mem_name[32];
53026a8c353SAlexey Kardashevskiy     uint64_t mem_reg_property[2];
53126a8c353SAlexey Kardashevskiy     int off;
53226a8c353SAlexey Kardashevskiy 
53326a8c353SAlexey Kardashevskiy     mem_reg_property[0] = cpu_to_be64(start);
53426a8c353SAlexey Kardashevskiy     mem_reg_property[1] = cpu_to_be64(size);
53526a8c353SAlexey Kardashevskiy 
53626a8c353SAlexey Kardashevskiy     sprintf(mem_name, "memory@" TARGET_FMT_lx, start);
53726a8c353SAlexey Kardashevskiy     off = fdt_add_subnode(fdt, 0, mem_name);
53826a8c353SAlexey Kardashevskiy     _FDT(off);
53926a8c353SAlexey Kardashevskiy     _FDT((fdt_setprop_string(fdt, off, "device_type", "memory")));
54026a8c353SAlexey Kardashevskiy     _FDT((fdt_setprop(fdt, off, "reg", mem_reg_property,
54126a8c353SAlexey Kardashevskiy                       sizeof(mem_reg_property))));
54226a8c353SAlexey Kardashevskiy     _FDT((fdt_setprop(fdt, off, "ibm,associativity", associativity,
54326a8c353SAlexey Kardashevskiy                       sizeof(associativity))));
54403d196b7SBharata B Rao     return off;
54526a8c353SAlexey Kardashevskiy }
54626a8c353SAlexey Kardashevskiy 
54728e02042SDavid Gibson static int spapr_populate_memory(sPAPRMachineState *spapr, void *fdt)
54853018216SPaolo Bonzini {
549fb164994SDavid Gibson     MachineState *machine = MACHINE(spapr);
5507db8a127SAlexey Kardashevskiy     hwaddr mem_start, node_size;
5517db8a127SAlexey Kardashevskiy     int i, nb_nodes = nb_numa_nodes;
5527db8a127SAlexey Kardashevskiy     NodeInfo *nodes = numa_info;
5537db8a127SAlexey Kardashevskiy     NodeInfo ramnode;
55453018216SPaolo Bonzini 
5557db8a127SAlexey Kardashevskiy     /* No NUMA nodes, assume there is just one node with whole RAM */
5567db8a127SAlexey Kardashevskiy     if (!nb_numa_nodes) {
5577db8a127SAlexey Kardashevskiy         nb_nodes = 1;
558fb164994SDavid Gibson         ramnode.node_mem = machine->ram_size;
5597db8a127SAlexey Kardashevskiy         nodes = &ramnode;
5605fe269b1SPaul Mackerras     }
56153018216SPaolo Bonzini 
5627db8a127SAlexey Kardashevskiy     for (i = 0, mem_start = 0; i < nb_nodes; ++i) {
5637db8a127SAlexey Kardashevskiy         if (!nodes[i].node_mem) {
5647db8a127SAlexey Kardashevskiy             continue;
56553018216SPaolo Bonzini         }
566fb164994SDavid Gibson         if (mem_start >= machine->ram_size) {
5675fe269b1SPaul Mackerras             node_size = 0;
5685fe269b1SPaul Mackerras         } else {
5697db8a127SAlexey Kardashevskiy             node_size = nodes[i].node_mem;
570fb164994SDavid Gibson             if (node_size > machine->ram_size - mem_start) {
571fb164994SDavid Gibson                 node_size = machine->ram_size - mem_start;
5725fe269b1SPaul Mackerras             }
5735fe269b1SPaul Mackerras         }
5747db8a127SAlexey Kardashevskiy         if (!mem_start) {
5757db8a127SAlexey Kardashevskiy             /* ppc_spapr_init() checks for rma_size <= node0_size already */
576e8f986fcSBharata B Rao             spapr_populate_memory_node(fdt, i, 0, spapr->rma_size);
5777db8a127SAlexey Kardashevskiy             mem_start += spapr->rma_size;
5787db8a127SAlexey Kardashevskiy             node_size -= spapr->rma_size;
5797db8a127SAlexey Kardashevskiy         }
5806010818cSAlexey Kardashevskiy         for ( ; node_size; ) {
5816010818cSAlexey Kardashevskiy             hwaddr sizetmp = pow2floor(node_size);
5826010818cSAlexey Kardashevskiy 
5836010818cSAlexey Kardashevskiy             /* mem_start != 0 here */
5846010818cSAlexey Kardashevskiy             if (ctzl(mem_start) < ctzl(sizetmp)) {
5856010818cSAlexey Kardashevskiy                 sizetmp = 1ULL << ctzl(mem_start);
5866010818cSAlexey Kardashevskiy             }
5876010818cSAlexey Kardashevskiy 
5886010818cSAlexey Kardashevskiy             spapr_populate_memory_node(fdt, i, mem_start, sizetmp);
5896010818cSAlexey Kardashevskiy             node_size -= sizetmp;
5906010818cSAlexey Kardashevskiy             mem_start += sizetmp;
5916010818cSAlexey Kardashevskiy         }
59253018216SPaolo Bonzini     }
59353018216SPaolo Bonzini 
59453018216SPaolo Bonzini     return 0;
59553018216SPaolo Bonzini }
59653018216SPaolo Bonzini 
5970da6f3feSBharata B Rao static void spapr_populate_cpu_dt(CPUState *cs, void *fdt, int offset,
5980da6f3feSBharata B Rao                                   sPAPRMachineState *spapr)
5990da6f3feSBharata B Rao {
6000da6f3feSBharata B Rao     PowerPCCPU *cpu = POWERPC_CPU(cs);
6010da6f3feSBharata B Rao     CPUPPCState *env = &cpu->env;
6020da6f3feSBharata B Rao     PowerPCCPUClass *pcc = POWERPC_CPU_GET_CLASS(cs);
6030da6f3feSBharata B Rao     int index = ppc_get_vcpu_dt_id(cpu);
6040da6f3feSBharata B Rao     uint32_t segs[] = {cpu_to_be32(28), cpu_to_be32(40),
6050da6f3feSBharata B Rao                        0xffffffff, 0xffffffff};
606afd10a0fSBharata B Rao     uint32_t tbfreq = kvm_enabled() ? kvmppc_get_tbfreq()
607afd10a0fSBharata B Rao         : SPAPR_TIMEBASE_FREQ;
6080da6f3feSBharata B Rao     uint32_t cpufreq = kvm_enabled() ? kvmppc_get_clockfreq() : 1000000000;
6090da6f3feSBharata B Rao     uint32_t page_sizes_prop[64];
6100da6f3feSBharata B Rao     size_t page_sizes_prop_size;
61122419c2aSDavid Gibson     uint32_t vcpus_per_socket = smp_threads * smp_cores;
6120da6f3feSBharata B Rao     uint32_t pft_size_prop[] = {0, cpu_to_be32(spapr->htab_shift)};
613af81cf32SBharata B Rao     sPAPRDRConnector *drc;
614af81cf32SBharata B Rao     sPAPRDRConnectorClass *drck;
615af81cf32SBharata B Rao     int drc_index;
616af81cf32SBharata B Rao 
617af81cf32SBharata B Rao     drc = spapr_dr_connector_by_id(SPAPR_DR_CONNECTOR_TYPE_CPU, index);
618af81cf32SBharata B Rao     if (drc) {
619af81cf32SBharata B Rao         drck = SPAPR_DR_CONNECTOR_GET_CLASS(drc);
620af81cf32SBharata B Rao         drc_index = drck->get_index(drc);
621af81cf32SBharata B Rao         _FDT((fdt_setprop_cell(fdt, offset, "ibm,my-drc-index", drc_index)));
622af81cf32SBharata B Rao     }
6230da6f3feSBharata B Rao 
62490da0d5aSBenjamin Herrenschmidt     /* Note: we keep CI large pages off for now because a 64K capable guest
62590da0d5aSBenjamin Herrenschmidt      * provisioned with large pages might otherwise try to map a qemu
62690da0d5aSBenjamin Herrenschmidt      * framebuffer (or other kind of memory mapped PCI BAR) using 64K pages
62790da0d5aSBenjamin Herrenschmidt      * even if that qemu runs on a 4k host.
62890da0d5aSBenjamin Herrenschmidt      *
62990da0d5aSBenjamin Herrenschmidt      * We can later add this bit back when we are confident this is not
63090da0d5aSBenjamin Herrenschmidt      * an issue (!HV KVM or 64K host)
63190da0d5aSBenjamin Herrenschmidt      */
63290da0d5aSBenjamin Herrenschmidt     uint8_t pa_features_206[] = { 6, 0,
63390da0d5aSBenjamin Herrenschmidt         0xf6, 0x1f, 0xc7, 0x00, 0x80, 0xc0 };
63490da0d5aSBenjamin Herrenschmidt     uint8_t pa_features_207[] = { 24, 0,
63590da0d5aSBenjamin Herrenschmidt         0xf6, 0x1f, 0xc7, 0xc0, 0x80, 0xf0,
63690da0d5aSBenjamin Herrenschmidt         0x80, 0x00, 0x00, 0x00, 0x00, 0x00,
63790da0d5aSBenjamin Herrenschmidt         0x00, 0x00, 0x00, 0x00, 0x80, 0x00,
63890da0d5aSBenjamin Herrenschmidt         0x80, 0x00, 0x80, 0x00, 0x80, 0x00 };
63990da0d5aSBenjamin Herrenschmidt     uint8_t *pa_features;
64090da0d5aSBenjamin Herrenschmidt     size_t pa_size;
64190da0d5aSBenjamin Herrenschmidt 
6420da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "reg", index)));
6430da6f3feSBharata B Rao     _FDT((fdt_setprop_string(fdt, offset, "device_type", "cpu")));
6440da6f3feSBharata B Rao 
6450da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "cpu-version", env->spr[SPR_PVR])));
6460da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "d-cache-block-size",
6470da6f3feSBharata B Rao                            env->dcache_line_size)));
6480da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "d-cache-line-size",
6490da6f3feSBharata B Rao                            env->dcache_line_size)));
6500da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "i-cache-block-size",
6510da6f3feSBharata B Rao                            env->icache_line_size)));
6520da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "i-cache-line-size",
6530da6f3feSBharata B Rao                            env->icache_line_size)));
6540da6f3feSBharata B Rao 
6550da6f3feSBharata B Rao     if (pcc->l1_dcache_size) {
6560da6f3feSBharata B Rao         _FDT((fdt_setprop_cell(fdt, offset, "d-cache-size",
6570da6f3feSBharata B Rao                                pcc->l1_dcache_size)));
6580da6f3feSBharata B Rao     } else {
6590da6f3feSBharata B Rao         fprintf(stderr, "Warning: Unknown L1 dcache size for cpu\n");
6600da6f3feSBharata B Rao     }
6610da6f3feSBharata B Rao     if (pcc->l1_icache_size) {
6620da6f3feSBharata B Rao         _FDT((fdt_setprop_cell(fdt, offset, "i-cache-size",
6630da6f3feSBharata B Rao                                pcc->l1_icache_size)));
6640da6f3feSBharata B Rao     } else {
6650da6f3feSBharata B Rao         fprintf(stderr, "Warning: Unknown L1 icache size for cpu\n");
6660da6f3feSBharata B Rao     }
6670da6f3feSBharata B Rao 
6680da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "timebase-frequency", tbfreq)));
6690da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "clock-frequency", cpufreq)));
670fd5da5c4SThomas Huth     _FDT((fdt_setprop_cell(fdt, offset, "slb-size", env->slb_nr)));
6710da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "ibm,slb-size", env->slb_nr)));
6720da6f3feSBharata B Rao     _FDT((fdt_setprop_string(fdt, offset, "status", "okay")));
6730da6f3feSBharata B Rao     _FDT((fdt_setprop(fdt, offset, "64-bit", NULL, 0)));
6740da6f3feSBharata B Rao 
6750da6f3feSBharata B Rao     if (env->spr_cb[SPR_PURR].oea_read) {
6760da6f3feSBharata B Rao         _FDT((fdt_setprop(fdt, offset, "ibm,purr", NULL, 0)));
6770da6f3feSBharata B Rao     }
6780da6f3feSBharata B Rao 
6790da6f3feSBharata B Rao     if (env->mmu_model & POWERPC_MMU_1TSEG) {
6800da6f3feSBharata B Rao         _FDT((fdt_setprop(fdt, offset, "ibm,processor-segment-sizes",
6810da6f3feSBharata B Rao                           segs, sizeof(segs))));
6820da6f3feSBharata B Rao     }
6830da6f3feSBharata B Rao 
6840da6f3feSBharata B Rao     /* Advertise VMX/VSX (vector extensions) if available
6850da6f3feSBharata B Rao      *   0 / no property == no vector extensions
6860da6f3feSBharata B Rao      *   1               == VMX / Altivec available
6870da6f3feSBharata B Rao      *   2               == VSX available */
6880da6f3feSBharata B Rao     if (env->insns_flags & PPC_ALTIVEC) {
6890da6f3feSBharata B Rao         uint32_t vmx = (env->insns_flags2 & PPC2_VSX) ? 2 : 1;
6900da6f3feSBharata B Rao 
6910da6f3feSBharata B Rao         _FDT((fdt_setprop_cell(fdt, offset, "ibm,vmx", vmx)));
6920da6f3feSBharata B Rao     }
6930da6f3feSBharata B Rao 
6940da6f3feSBharata B Rao     /* Advertise DFP (Decimal Floating Point) if available
6950da6f3feSBharata B Rao      *   0 / no property == no DFP
6960da6f3feSBharata B Rao      *   1               == DFP available */
6970da6f3feSBharata B Rao     if (env->insns_flags2 & PPC2_DFP) {
6980da6f3feSBharata B Rao         _FDT((fdt_setprop_cell(fdt, offset, "ibm,dfp", 1)));
6990da6f3feSBharata B Rao     }
7000da6f3feSBharata B Rao 
7010da6f3feSBharata B Rao     page_sizes_prop_size = create_page_sizes_prop(env, page_sizes_prop,
7020da6f3feSBharata B Rao                                                   sizeof(page_sizes_prop));
7030da6f3feSBharata B Rao     if (page_sizes_prop_size) {
7040da6f3feSBharata B Rao         _FDT((fdt_setprop(fdt, offset, "ibm,segment-page-sizes",
7050da6f3feSBharata B Rao                           page_sizes_prop, page_sizes_prop_size)));
7060da6f3feSBharata B Rao     }
7070da6f3feSBharata B Rao 
70890da0d5aSBenjamin Herrenschmidt     /* Do the ibm,pa-features property, adjust it for ci-large-pages */
70990da0d5aSBenjamin Herrenschmidt     if (env->mmu_model == POWERPC_MMU_2_06) {
71090da0d5aSBenjamin Herrenschmidt         pa_features = pa_features_206;
71190da0d5aSBenjamin Herrenschmidt         pa_size = sizeof(pa_features_206);
71290da0d5aSBenjamin Herrenschmidt     } else /* env->mmu_model == POWERPC_MMU_2_07 */ {
71390da0d5aSBenjamin Herrenschmidt         pa_features = pa_features_207;
71490da0d5aSBenjamin Herrenschmidt         pa_size = sizeof(pa_features_207);
71590da0d5aSBenjamin Herrenschmidt     }
71690da0d5aSBenjamin Herrenschmidt     if (env->ci_large_pages) {
71790da0d5aSBenjamin Herrenschmidt         pa_features[3] |= 0x20;
71890da0d5aSBenjamin Herrenschmidt     }
71990da0d5aSBenjamin Herrenschmidt     _FDT((fdt_setprop(fdt, offset, "ibm,pa-features", pa_features, pa_size)));
72090da0d5aSBenjamin Herrenschmidt 
7210da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "ibm,chip-id",
72222419c2aSDavid Gibson                            cs->cpu_index / vcpus_per_socket)));
7230da6f3feSBharata B Rao 
7240da6f3feSBharata B Rao     _FDT((fdt_setprop(fdt, offset, "ibm,pft-size",
7250da6f3feSBharata B Rao                       pft_size_prop, sizeof(pft_size_prop))));
7260da6f3feSBharata B Rao 
7270da6f3feSBharata B Rao     _FDT(spapr_fixup_cpu_numa_dt(fdt, offset, cs));
7280da6f3feSBharata B Rao 
7290da6f3feSBharata B Rao     _FDT(spapr_fixup_cpu_smt_dt(fdt, offset, cpu,
7300da6f3feSBharata B Rao                                 ppc_get_compat_smt_threads(cpu)));
7310da6f3feSBharata B Rao }
7320da6f3feSBharata B Rao 
7330da6f3feSBharata B Rao static void spapr_populate_cpus_dt_node(void *fdt, sPAPRMachineState *spapr)
7340da6f3feSBharata B Rao {
7350da6f3feSBharata B Rao     CPUState *cs;
7360da6f3feSBharata B Rao     int cpus_offset;
7370da6f3feSBharata B Rao     char *nodename;
7380da6f3feSBharata B Rao     int smt = kvmppc_smt_threads();
7390da6f3feSBharata B Rao 
7400da6f3feSBharata B Rao     cpus_offset = fdt_add_subnode(fdt, 0, "cpus");
7410da6f3feSBharata B Rao     _FDT(cpus_offset);
7420da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, cpus_offset, "#address-cells", 0x1)));
7430da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, cpus_offset, "#size-cells", 0x0)));
7440da6f3feSBharata B Rao 
7450da6f3feSBharata B Rao     /*
7460da6f3feSBharata B Rao      * We walk the CPUs in reverse order to ensure that CPU DT nodes
7470da6f3feSBharata B Rao      * created by fdt_add_subnode() end up in the right order in FDT
7480da6f3feSBharata B Rao      * for the guest kernel the enumerate the CPUs correctly.
7490da6f3feSBharata B Rao      */
7500da6f3feSBharata B Rao     CPU_FOREACH_REVERSE(cs) {
7510da6f3feSBharata B Rao         PowerPCCPU *cpu = POWERPC_CPU(cs);
7520da6f3feSBharata B Rao         int index = ppc_get_vcpu_dt_id(cpu);
7530da6f3feSBharata B Rao         DeviceClass *dc = DEVICE_GET_CLASS(cs);
7540da6f3feSBharata B Rao         int offset;
7550da6f3feSBharata B Rao 
7560da6f3feSBharata B Rao         if ((index % smt) != 0) {
7570da6f3feSBharata B Rao             continue;
7580da6f3feSBharata B Rao         }
7590da6f3feSBharata B Rao 
7600da6f3feSBharata B Rao         nodename = g_strdup_printf("%s@%x", dc->fw_name, index);
7610da6f3feSBharata B Rao         offset = fdt_add_subnode(fdt, cpus_offset, nodename);
7620da6f3feSBharata B Rao         g_free(nodename);
7630da6f3feSBharata B Rao         _FDT(offset);
7640da6f3feSBharata B Rao         spapr_populate_cpu_dt(cs, fdt, offset, spapr);
7650da6f3feSBharata B Rao     }
7660da6f3feSBharata B Rao 
7670da6f3feSBharata B Rao }
7680da6f3feSBharata B Rao 
76903d196b7SBharata B Rao /*
77003d196b7SBharata B Rao  * Adds ibm,dynamic-reconfiguration-memory node.
77103d196b7SBharata B Rao  * Refer to docs/specs/ppc-spapr-hotplug.txt for the documentation
77203d196b7SBharata B Rao  * of this device tree node.
77303d196b7SBharata B Rao  */
77403d196b7SBharata B Rao static int spapr_populate_drconf_memory(sPAPRMachineState *spapr, void *fdt)
77503d196b7SBharata B Rao {
77603d196b7SBharata B Rao     MachineState *machine = MACHINE(spapr);
77703d196b7SBharata B Rao     int ret, i, offset;
77803d196b7SBharata B Rao     uint64_t lmb_size = SPAPR_MEMORY_BLOCK_SIZE;
77903d196b7SBharata B Rao     uint32_t prop_lmb_size[] = {0, cpu_to_be32(lmb_size)};
780d0e5a8f2SBharata B Rao     uint32_t hotplug_lmb_start = spapr->hotplug_memory.base / lmb_size;
781d0e5a8f2SBharata B Rao     uint32_t nr_lmbs = (spapr->hotplug_memory.base +
782d0e5a8f2SBharata B Rao                        memory_region_size(&spapr->hotplug_memory.mr)) /
783d0e5a8f2SBharata B Rao                        lmb_size;
78403d196b7SBharata B Rao     uint32_t *int_buf, *cur_index, buf_len;
7856663864eSBharata B Rao     int nr_nodes = nb_numa_nodes ? nb_numa_nodes : 1;
78603d196b7SBharata B Rao 
787ef001f06SThomas Huth     /*
788d0e5a8f2SBharata B Rao      * Don't create the node if there is no hotpluggable memory
78916c25aefSBharata B Rao      */
790d0e5a8f2SBharata B Rao     if (machine->ram_size == machine->maxram_size) {
79116c25aefSBharata B Rao         return 0;
79216c25aefSBharata B Rao     }
79316c25aefSBharata B Rao 
79416c25aefSBharata B Rao     /*
795ef001f06SThomas Huth      * Allocate enough buffer size to fit in ibm,dynamic-memory
796ef001f06SThomas Huth      * or ibm,associativity-lookup-arrays
797ef001f06SThomas Huth      */
798ef001f06SThomas Huth     buf_len = MAX(nr_lmbs * SPAPR_DR_LMB_LIST_ENTRY_SIZE + 1, nr_nodes * 4 + 2)
799ef001f06SThomas Huth               * sizeof(uint32_t);
80003d196b7SBharata B Rao     cur_index = int_buf = g_malloc0(buf_len);
80103d196b7SBharata B Rao 
80203d196b7SBharata B Rao     offset = fdt_add_subnode(fdt, 0, "ibm,dynamic-reconfiguration-memory");
80303d196b7SBharata B Rao 
80403d196b7SBharata B Rao     ret = fdt_setprop(fdt, offset, "ibm,lmb-size", prop_lmb_size,
80503d196b7SBharata B Rao                     sizeof(prop_lmb_size));
80603d196b7SBharata B Rao     if (ret < 0) {
80703d196b7SBharata B Rao         goto out;
80803d196b7SBharata B Rao     }
80903d196b7SBharata B Rao 
81003d196b7SBharata B Rao     ret = fdt_setprop_cell(fdt, offset, "ibm,memory-flags-mask", 0xff);
81103d196b7SBharata B Rao     if (ret < 0) {
81203d196b7SBharata B Rao         goto out;
81303d196b7SBharata B Rao     }
81403d196b7SBharata B Rao 
81503d196b7SBharata B Rao     ret = fdt_setprop_cell(fdt, offset, "ibm,memory-preservation-time", 0x0);
81603d196b7SBharata B Rao     if (ret < 0) {
81703d196b7SBharata B Rao         goto out;
81803d196b7SBharata B Rao     }
81903d196b7SBharata B Rao 
82003d196b7SBharata B Rao     /* ibm,dynamic-memory */
82103d196b7SBharata B Rao     int_buf[0] = cpu_to_be32(nr_lmbs);
82203d196b7SBharata B Rao     cur_index++;
82303d196b7SBharata B Rao     for (i = 0; i < nr_lmbs; i++) {
824d0e5a8f2SBharata B Rao         uint64_t addr = i * lmb_size;
82503d196b7SBharata B Rao         uint32_t *dynamic_memory = cur_index;
82603d196b7SBharata B Rao 
827d0e5a8f2SBharata B Rao         if (i >= hotplug_lmb_start) {
828d0e5a8f2SBharata B Rao             sPAPRDRConnector *drc;
829d0e5a8f2SBharata B Rao             sPAPRDRConnectorClass *drck;
830d0e5a8f2SBharata B Rao 
831d0e5a8f2SBharata B Rao             drc = spapr_dr_connector_by_id(SPAPR_DR_CONNECTOR_TYPE_LMB, i);
83203d196b7SBharata B Rao             g_assert(drc);
83303d196b7SBharata B Rao             drck = SPAPR_DR_CONNECTOR_GET_CLASS(drc);
83403d196b7SBharata B Rao 
83503d196b7SBharata B Rao             dynamic_memory[0] = cpu_to_be32(addr >> 32);
83603d196b7SBharata B Rao             dynamic_memory[1] = cpu_to_be32(addr & 0xffffffff);
83703d196b7SBharata B Rao             dynamic_memory[2] = cpu_to_be32(drck->get_index(drc));
83803d196b7SBharata B Rao             dynamic_memory[3] = cpu_to_be32(0); /* reserved */
83903d196b7SBharata B Rao             dynamic_memory[4] = cpu_to_be32(numa_get_node(addr, NULL));
840d0e5a8f2SBharata B Rao             if (memory_region_present(get_system_memory(), addr)) {
84103d196b7SBharata B Rao                 dynamic_memory[5] = cpu_to_be32(SPAPR_LMB_FLAGS_ASSIGNED);
84203d196b7SBharata B Rao             } else {
84303d196b7SBharata B Rao                 dynamic_memory[5] = cpu_to_be32(0);
84403d196b7SBharata B Rao             }
845d0e5a8f2SBharata B Rao         } else {
846d0e5a8f2SBharata B Rao             /*
847d0e5a8f2SBharata B Rao              * LMB information for RMA, boot time RAM and gap b/n RAM and
848d0e5a8f2SBharata B Rao              * hotplug memory region -- all these are marked as reserved
849d0e5a8f2SBharata B Rao              * and as having no valid DRC.
850d0e5a8f2SBharata B Rao              */
851d0e5a8f2SBharata B Rao             dynamic_memory[0] = cpu_to_be32(addr >> 32);
852d0e5a8f2SBharata B Rao             dynamic_memory[1] = cpu_to_be32(addr & 0xffffffff);
853d0e5a8f2SBharata B Rao             dynamic_memory[2] = cpu_to_be32(0);
854d0e5a8f2SBharata B Rao             dynamic_memory[3] = cpu_to_be32(0); /* reserved */
855d0e5a8f2SBharata B Rao             dynamic_memory[4] = cpu_to_be32(-1);
856d0e5a8f2SBharata B Rao             dynamic_memory[5] = cpu_to_be32(SPAPR_LMB_FLAGS_RESERVED |
857d0e5a8f2SBharata B Rao                                             SPAPR_LMB_FLAGS_DRC_INVALID);
858d0e5a8f2SBharata B Rao         }
85903d196b7SBharata B Rao 
86003d196b7SBharata B Rao         cur_index += SPAPR_DR_LMB_LIST_ENTRY_SIZE;
86103d196b7SBharata B Rao     }
86203d196b7SBharata B Rao     ret = fdt_setprop(fdt, offset, "ibm,dynamic-memory", int_buf, buf_len);
86303d196b7SBharata B Rao     if (ret < 0) {
86403d196b7SBharata B Rao         goto out;
86503d196b7SBharata B Rao     }
86603d196b7SBharata B Rao 
86703d196b7SBharata B Rao     /* ibm,associativity-lookup-arrays */
86803d196b7SBharata B Rao     cur_index = int_buf;
8696663864eSBharata B Rao     int_buf[0] = cpu_to_be32(nr_nodes);
87003d196b7SBharata B Rao     int_buf[1] = cpu_to_be32(4); /* Number of entries per associativity list */
87103d196b7SBharata B Rao     cur_index += 2;
8726663864eSBharata B Rao     for (i = 0; i < nr_nodes; i++) {
87303d196b7SBharata B Rao         uint32_t associativity[] = {
87403d196b7SBharata B Rao             cpu_to_be32(0x0),
87503d196b7SBharata B Rao             cpu_to_be32(0x0),
87603d196b7SBharata B Rao             cpu_to_be32(0x0),
87703d196b7SBharata B Rao             cpu_to_be32(i)
87803d196b7SBharata B Rao         };
87903d196b7SBharata B Rao         memcpy(cur_index, associativity, sizeof(associativity));
88003d196b7SBharata B Rao         cur_index += 4;
88103d196b7SBharata B Rao     }
88203d196b7SBharata B Rao     ret = fdt_setprop(fdt, offset, "ibm,associativity-lookup-arrays", int_buf,
88303d196b7SBharata B Rao             (cur_index - int_buf) * sizeof(uint32_t));
88403d196b7SBharata B Rao out:
88503d196b7SBharata B Rao     g_free(int_buf);
88603d196b7SBharata B Rao     return ret;
88703d196b7SBharata B Rao }
88803d196b7SBharata B Rao 
88903d196b7SBharata B Rao int spapr_h_cas_compose_response(sPAPRMachineState *spapr,
89003d196b7SBharata B Rao                                  target_ulong addr, target_ulong size,
89103d196b7SBharata B Rao                                  bool cpu_update, bool memory_update)
89203d196b7SBharata B Rao {
89303d196b7SBharata B Rao     void *fdt, *fdt_skel;
89403d196b7SBharata B Rao     sPAPRDeviceTreeUpdateHeader hdr = { .version_id = 1 };
89503d196b7SBharata B Rao     sPAPRMachineClass *smc = SPAPR_MACHINE_GET_CLASS(qdev_get_machine());
89603d196b7SBharata B Rao 
89703d196b7SBharata B Rao     size -= sizeof(hdr);
89803d196b7SBharata B Rao 
89903d196b7SBharata B Rao     /* Create sceleton */
90003d196b7SBharata B Rao     fdt_skel = g_malloc0(size);
90103d196b7SBharata B Rao     _FDT((fdt_create(fdt_skel, size)));
90203d196b7SBharata B Rao     _FDT((fdt_begin_node(fdt_skel, "")));
90303d196b7SBharata B Rao     _FDT((fdt_end_node(fdt_skel)));
90403d196b7SBharata B Rao     _FDT((fdt_finish(fdt_skel)));
90503d196b7SBharata B Rao     fdt = g_malloc0(size);
90603d196b7SBharata B Rao     _FDT((fdt_open_into(fdt_skel, fdt, size)));
90703d196b7SBharata B Rao     g_free(fdt_skel);
90803d196b7SBharata B Rao 
90903d196b7SBharata B Rao     /* Fixup cpu nodes */
91003d196b7SBharata B Rao     if (cpu_update) {
91103d196b7SBharata B Rao         _FDT((spapr_fixup_cpu_dt(fdt, spapr)));
91203d196b7SBharata B Rao     }
91303d196b7SBharata B Rao 
91416c25aefSBharata B Rao     /* Generate ibm,dynamic-reconfiguration-memory node if required */
91503d196b7SBharata B Rao     if (memory_update && smc->dr_lmb_enabled) {
91603d196b7SBharata B Rao         _FDT((spapr_populate_drconf_memory(spapr, fdt)));
91703d196b7SBharata B Rao     }
91803d196b7SBharata B Rao 
91903d196b7SBharata B Rao     /* Pack resulting tree */
92003d196b7SBharata B Rao     _FDT((fdt_pack(fdt)));
92103d196b7SBharata B Rao 
92203d196b7SBharata B Rao     if (fdt_totalsize(fdt) + sizeof(hdr) > size) {
92303d196b7SBharata B Rao         trace_spapr_cas_failed(size);
92403d196b7SBharata B Rao         return -1;
92503d196b7SBharata B Rao     }
92603d196b7SBharata B Rao 
92703d196b7SBharata B Rao     cpu_physical_memory_write(addr, &hdr, sizeof(hdr));
92803d196b7SBharata B Rao     cpu_physical_memory_write(addr + sizeof(hdr), fdt, fdt_totalsize(fdt));
92903d196b7SBharata B Rao     trace_spapr_cas_continue(fdt_totalsize(fdt) + sizeof(hdr));
93003d196b7SBharata B Rao     g_free(fdt);
93103d196b7SBharata B Rao 
93203d196b7SBharata B Rao     return 0;
93303d196b7SBharata B Rao }
93403d196b7SBharata B Rao 
93528e02042SDavid Gibson static void spapr_finalize_fdt(sPAPRMachineState *spapr,
93653018216SPaolo Bonzini                                hwaddr fdt_addr,
93753018216SPaolo Bonzini                                hwaddr rtas_addr,
93853018216SPaolo Bonzini                                hwaddr rtas_size)
93953018216SPaolo Bonzini {
9405b2128d2SAlexander Graf     MachineState *machine = MACHINE(qdev_get_machine());
941c20d332aSBharata B Rao     sPAPRMachineClass *smc = SPAPR_MACHINE_GET_CLASS(machine);
9425b2128d2SAlexander Graf     const char *boot_device = machine->boot_order;
94371461b0fSAlexey Kardashevskiy     int ret, i;
94471461b0fSAlexey Kardashevskiy     size_t cb = 0;
94571461b0fSAlexey Kardashevskiy     char *bootlist;
94653018216SPaolo Bonzini     void *fdt;
94753018216SPaolo Bonzini     sPAPRPHBState *phb;
94853018216SPaolo Bonzini 
94953018216SPaolo Bonzini     fdt = g_malloc(FDT_MAX_SIZE);
95053018216SPaolo Bonzini 
95153018216SPaolo Bonzini     /* open out the base tree into a temp buffer for the final tweaks */
95253018216SPaolo Bonzini     _FDT((fdt_open_into(spapr->fdt_skel, fdt, FDT_MAX_SIZE)));
95353018216SPaolo Bonzini 
954e8f986fcSBharata B Rao     ret = spapr_populate_memory(spapr, fdt);
955e8f986fcSBharata B Rao     if (ret < 0) {
956e8f986fcSBharata B Rao         fprintf(stderr, "couldn't setup memory nodes in fdt\n");
957e8f986fcSBharata B Rao         exit(1);
95853018216SPaolo Bonzini     }
95953018216SPaolo Bonzini 
96053018216SPaolo Bonzini     ret = spapr_populate_vdevice(spapr->vio_bus, fdt);
96153018216SPaolo Bonzini     if (ret < 0) {
96253018216SPaolo Bonzini         fprintf(stderr, "couldn't setup vio devices in fdt\n");
96353018216SPaolo Bonzini         exit(1);
96453018216SPaolo Bonzini     }
96553018216SPaolo Bonzini 
9664d9392beSThomas Huth     if (object_resolve_path_type("", TYPE_SPAPR_RNG, NULL)) {
9674d9392beSThomas Huth         ret = spapr_rng_populate_dt(fdt);
9684d9392beSThomas Huth         if (ret < 0) {
9694d9392beSThomas Huth             fprintf(stderr, "could not set up rng device in the fdt\n");
9704d9392beSThomas Huth             exit(1);
9714d9392beSThomas Huth         }
9724d9392beSThomas Huth     }
9734d9392beSThomas Huth 
97453018216SPaolo Bonzini     QLIST_FOREACH(phb, &spapr->phbs, list) {
97553018216SPaolo Bonzini         ret = spapr_populate_pci_dt(phb, PHANDLE_XICP, fdt);
97653018216SPaolo Bonzini         if (ret < 0) {
977da34fed7SThomas Huth             error_report("couldn't setup PCI devices in fdt");
97853018216SPaolo Bonzini             exit(1);
97953018216SPaolo Bonzini         }
980da34fed7SThomas Huth     }
98153018216SPaolo Bonzini 
98253018216SPaolo Bonzini     /* RTAS */
98353018216SPaolo Bonzini     ret = spapr_rtas_device_tree_setup(fdt, rtas_addr, rtas_size);
98453018216SPaolo Bonzini     if (ret < 0) {
98553018216SPaolo Bonzini         fprintf(stderr, "Couldn't set up RTAS device tree properties\n");
98653018216SPaolo Bonzini     }
98753018216SPaolo Bonzini 
9880da6f3feSBharata B Rao     /* cpus */
9890da6f3feSBharata B Rao     spapr_populate_cpus_dt_node(fdt, spapr);
99053018216SPaolo Bonzini 
99171461b0fSAlexey Kardashevskiy     bootlist = get_boot_devices_list(&cb, true);
99271461b0fSAlexey Kardashevskiy     if (cb && bootlist) {
99371461b0fSAlexey Kardashevskiy         int offset = fdt_path_offset(fdt, "/chosen");
99471461b0fSAlexey Kardashevskiy         if (offset < 0) {
99571461b0fSAlexey Kardashevskiy             exit(1);
99671461b0fSAlexey Kardashevskiy         }
99771461b0fSAlexey Kardashevskiy         for (i = 0; i < cb; i++) {
99871461b0fSAlexey Kardashevskiy             if (bootlist[i] == '\n') {
99971461b0fSAlexey Kardashevskiy                 bootlist[i] = ' ';
100071461b0fSAlexey Kardashevskiy             }
100171461b0fSAlexey Kardashevskiy 
100271461b0fSAlexey Kardashevskiy         }
100371461b0fSAlexey Kardashevskiy         ret = fdt_setprop_string(fdt, offset, "qemu,boot-list", bootlist);
100471461b0fSAlexey Kardashevskiy     }
100571461b0fSAlexey Kardashevskiy 
10065b2128d2SAlexander Graf     if (boot_device && strlen(boot_device)) {
10075b2128d2SAlexander Graf         int offset = fdt_path_offset(fdt, "/chosen");
10085b2128d2SAlexander Graf 
10095b2128d2SAlexander Graf         if (offset < 0) {
10105b2128d2SAlexander Graf             exit(1);
10115b2128d2SAlexander Graf         }
10125b2128d2SAlexander Graf         fdt_setprop_string(fdt, offset, "qemu,boot-device", boot_device);
10135b2128d2SAlexander Graf     }
10145b2128d2SAlexander Graf 
101553018216SPaolo Bonzini     if (!spapr->has_graphics) {
101653018216SPaolo Bonzini         spapr_populate_chosen_stdout(fdt, spapr->vio_bus);
101753018216SPaolo Bonzini     }
101853018216SPaolo Bonzini 
1019c20d332aSBharata B Rao     if (smc->dr_lmb_enabled) {
1020c20d332aSBharata B Rao         _FDT(spapr_drc_populate_dt(fdt, 0, NULL, SPAPR_DR_CONNECTOR_TYPE_LMB));
1021c20d332aSBharata B Rao     }
1022c20d332aSBharata B Rao 
1023af81cf32SBharata B Rao     if (smc->dr_cpu_enabled) {
1024af81cf32SBharata B Rao         int offset = fdt_path_offset(fdt, "/cpus");
1025af81cf32SBharata B Rao         ret = spapr_drc_populate_dt(fdt, offset, NULL,
1026af81cf32SBharata B Rao                                     SPAPR_DR_CONNECTOR_TYPE_CPU);
1027af81cf32SBharata B Rao         if (ret < 0) {
1028af81cf32SBharata B Rao             error_report("Couldn't set up CPU DR device tree properties");
1029af81cf32SBharata B Rao             exit(1);
1030af81cf32SBharata B Rao         }
1031af81cf32SBharata B Rao     }
1032af81cf32SBharata B Rao 
103353018216SPaolo Bonzini     _FDT((fdt_pack(fdt)));
103453018216SPaolo Bonzini 
103553018216SPaolo Bonzini     if (fdt_totalsize(fdt) > FDT_MAX_SIZE) {
1036730fce59SThomas Huth         error_report("FDT too big ! 0x%x bytes (max is 0x%x)",
103753018216SPaolo Bonzini                      fdt_totalsize(fdt), FDT_MAX_SIZE);
103853018216SPaolo Bonzini         exit(1);
103953018216SPaolo Bonzini     }
104053018216SPaolo Bonzini 
1041ad440b4aSAndrew Jones     qemu_fdt_dumpdtb(fdt, fdt_totalsize(fdt));
104253018216SPaolo Bonzini     cpu_physical_memory_write(fdt_addr, fdt, fdt_totalsize(fdt));
104353018216SPaolo Bonzini 
1044a21a7a70SGonglei     g_free(bootlist);
104553018216SPaolo Bonzini     g_free(fdt);
104653018216SPaolo Bonzini }
104753018216SPaolo Bonzini 
104853018216SPaolo Bonzini static uint64_t translate_kernel_address(void *opaque, uint64_t addr)
104953018216SPaolo Bonzini {
105053018216SPaolo Bonzini     return (addr & 0x0fffffff) + KERNEL_LOAD_ADDR;
105153018216SPaolo Bonzini }
105253018216SPaolo Bonzini 
105353018216SPaolo Bonzini static void emulate_spapr_hypercall(PowerPCCPU *cpu)
105453018216SPaolo Bonzini {
105553018216SPaolo Bonzini     CPUPPCState *env = &cpu->env;
105653018216SPaolo Bonzini 
105753018216SPaolo Bonzini     if (msr_pr) {
105853018216SPaolo Bonzini         hcall_dprintf("Hypercall made with MSR[PR]=1\n");
105953018216SPaolo Bonzini         env->gpr[3] = H_PRIVILEGE;
106053018216SPaolo Bonzini     } else {
106153018216SPaolo Bonzini         env->gpr[3] = spapr_hypercall(cpu, env->gpr[3], &env->gpr[4]);
106253018216SPaolo Bonzini     }
106353018216SPaolo Bonzini }
106453018216SPaolo Bonzini 
/*
 * Accessors for a hash page table kept in QEMU memory.
 *
 * HPTE() yields a pointer to entry _i, entries being two 64-bit words
 * each.  The whole expansion is parenthesised so that the cast cannot be
 * split from its operand by a neighbouring operator (e.g. sizeof or a
 * postfix operator applied to the macro result).
 *
 * The remaining helpers test or update flag bits in the first 64-bit
 * word of an entry; the word is passed through tswap64() before being
 * compared with the HPTE64_V_* masks.
 */
#define HPTE(_table, _i)   ((void *)(((uint64_t *)(_table)) + ((_i) * 2)))
#define HPTE_VALID(_hpte)  (tswap64(*((uint64_t *)(_hpte))) & HPTE64_V_VALID)
#define HPTE_DIRTY(_hpte)  (tswap64(*((uint64_t *)(_hpte))) & HPTE64_V_HPTE_DIRTY)
#define CLEAN_HPTE(_hpte)  ((*(uint64_t *)(_hpte)) &= tswap64(~HPTE64_V_HPTE_DIRTY))
#define DIRTY_HPTE(_hpte)  ((*(uint64_t *)(_hpte)) |= tswap64(HPTE64_V_HPTE_DIRTY))
1070e6b8fd24SSamuel Mendoza-Jonas 
1071715c5407SDavid Gibson /*
1072715c5407SDavid Gibson  * Get the fd to access the kernel htab, re-opening it if necessary
1073715c5407SDavid Gibson  */
1074715c5407SDavid Gibson static int get_htab_fd(sPAPRMachineState *spapr)
1075715c5407SDavid Gibson {
1076715c5407SDavid Gibson     if (spapr->htab_fd >= 0) {
1077715c5407SDavid Gibson         return spapr->htab_fd;
1078715c5407SDavid Gibson     }
1079715c5407SDavid Gibson 
1080715c5407SDavid Gibson     spapr->htab_fd = kvmppc_get_htab_fd(false);
1081715c5407SDavid Gibson     if (spapr->htab_fd < 0) {
1082715c5407SDavid Gibson         error_report("Unable to open fd for reading hash table from KVM: %s",
1083715c5407SDavid Gibson                      strerror(errno));
1084715c5407SDavid Gibson     }
1085715c5407SDavid Gibson 
1086715c5407SDavid Gibson     return spapr->htab_fd;
1087715c5407SDavid Gibson }
1088715c5407SDavid Gibson 
1089715c5407SDavid Gibson static void close_htab_fd(sPAPRMachineState *spapr)
1090715c5407SDavid Gibson {
1091715c5407SDavid Gibson     if (spapr->htab_fd >= 0) {
1092715c5407SDavid Gibson         close(spapr->htab_fd);
1093715c5407SDavid Gibson     }
1094715c5407SDavid Gibson     spapr->htab_fd = -1;
1095715c5407SDavid Gibson }
1096715c5407SDavid Gibson 
/*
 * Pick the hash page table order (log2 of its size in bytes) for a
 * guest with @ramsize bytes of RAM.
 *
 * The target is 1/128 of RAM rounded up to a power of two.  PAPR
 * recommends 1/64, but that is much more than Linux guests need.  The
 * result is clamped to the architected range of 18..46.
 */
static int spapr_hpt_shift_for_ramsize(uint64_t ramsize)
{
    int order = ctz64(pow2ceil(ramsize)) - 7;

    if (order < 18) {
        return 18; /* Minimum architected size */
    }
    if (order > 46) {
        return 46; /* Maximum architected size */
    }
    return order;
}
11098dfe8e7fSDavid Gibson 
1110c5f54f3eSDavid Gibson static void spapr_reallocate_hpt(sPAPRMachineState *spapr, int shift,
1111c5f54f3eSDavid Gibson                                  Error **errp)
111253018216SPaolo Bonzini {
1113c5f54f3eSDavid Gibson     long rc;
111453018216SPaolo Bonzini 
1115c5f54f3eSDavid Gibson     /* Clean up any HPT info from a previous boot */
1116c5f54f3eSDavid Gibson     g_free(spapr->htab);
1117c5f54f3eSDavid Gibson     spapr->htab = NULL;
1118c5f54f3eSDavid Gibson     spapr->htab_shift = 0;
1119c5f54f3eSDavid Gibson     close_htab_fd(spapr);
112053018216SPaolo Bonzini 
1121c5f54f3eSDavid Gibson     rc = kvmppc_reset_htab(shift);
1122c5f54f3eSDavid Gibson     if (rc < 0) {
1123c5f54f3eSDavid Gibson         /* kernel-side HPT needed, but couldn't allocate one */
1124c5f54f3eSDavid Gibson         error_setg_errno(errp, errno,
1125c5f54f3eSDavid Gibson                          "Failed to allocate KVM HPT of order %d (try smaller maxmem?)",
1126c5f54f3eSDavid Gibson                          shift);
1127c5f54f3eSDavid Gibson         /* This is almost certainly fatal, but if the caller really
1128c5f54f3eSDavid Gibson          * wants to carry on with shift == 0, it's welcome to try */
1129c5f54f3eSDavid Gibson     } else if (rc > 0) {
1130c5f54f3eSDavid Gibson         /* kernel-side HPT allocated */
1131c5f54f3eSDavid Gibson         if (rc != shift) {
1132c5f54f3eSDavid Gibson             error_setg(errp,
1133c5f54f3eSDavid Gibson                        "Requested order %d HPT, but kernel allocated order %ld (try smaller maxmem?)",
1134c5f54f3eSDavid Gibson                        shift, rc);
11357735fedaSBharata B Rao         }
11367735fedaSBharata B Rao 
113753018216SPaolo Bonzini         spapr->htab_shift = shift;
1138c18ad9a5SDavid Gibson         spapr->htab = NULL;
1139b817772aSBharata B Rao     } else {
1140c5f54f3eSDavid Gibson         /* kernel-side HPT not needed, allocate in userspace instead */
1141c5f54f3eSDavid Gibson         size_t size = 1ULL << shift;
1142c5f54f3eSDavid Gibson         int i;
114301a57972SSamuel Mendoza-Jonas 
1144c5f54f3eSDavid Gibson         spapr->htab = qemu_memalign(size, size);
1145c5f54f3eSDavid Gibson         if (!spapr->htab) {
1146c5f54f3eSDavid Gibson             error_setg_errno(errp, errno,
1147c5f54f3eSDavid Gibson                              "Could not allocate HPT of order %d", shift);
1148c5f54f3eSDavid Gibson             return;
1149b817772aSBharata B Rao         }
1150b817772aSBharata B Rao 
1151c5f54f3eSDavid Gibson         memset(spapr->htab, 0, size);
1152c5f54f3eSDavid Gibson         spapr->htab_shift = shift;
1153b817772aSBharata B Rao 
1154c5f54f3eSDavid Gibson         for (i = 0; i < size / HASH_PTE_SIZE_64; i++) {
1155c5f54f3eSDavid Gibson             DIRTY_HPTE(HPTE(spapr->htab, i));
11567735fedaSBharata B Rao         }
115753018216SPaolo Bonzini     }
115853018216SPaolo Bonzini }
115953018216SPaolo Bonzini 
11609e3f9733SAlexander Graf static int find_unknown_sysbus_device(SysBusDevice *sbdev, void *opaque)
11619e3f9733SAlexander Graf {
11629e3f9733SAlexander Graf     bool matched = false;
11639e3f9733SAlexander Graf 
11649e3f9733SAlexander Graf     if (object_dynamic_cast(OBJECT(sbdev), TYPE_SPAPR_PCI_HOST_BRIDGE)) {
11659e3f9733SAlexander Graf         matched = true;
11669e3f9733SAlexander Graf     }
11679e3f9733SAlexander Graf 
11689e3f9733SAlexander Graf     if (!matched) {
11699e3f9733SAlexander Graf         error_report("Device %s is not supported by this machine yet.",
11709e3f9733SAlexander Graf                      qdev_fw_name(DEVICE(sbdev)));
11719e3f9733SAlexander Graf         exit(1);
11729e3f9733SAlexander Graf     }
11739e3f9733SAlexander Graf 
11749e3f9733SAlexander Graf     return 0;
11759e3f9733SAlexander Graf }
11769e3f9733SAlexander Graf 
117753018216SPaolo Bonzini static void ppc_spapr_reset(void)
117853018216SPaolo Bonzini {
1179c5f54f3eSDavid Gibson     MachineState *machine = MACHINE(qdev_get_machine());
1180c5f54f3eSDavid Gibson     sPAPRMachineState *spapr = SPAPR_MACHINE(machine);
1181182735efSAndreas Färber     PowerPCCPU *first_ppc_cpu;
1182b7d1f77aSBenjamin Herrenschmidt     uint32_t rtas_limit;
1183259186a7SAndreas Färber 
11849e3f9733SAlexander Graf     /* Check for unknown sysbus devices */
11859e3f9733SAlexander Graf     foreach_dynamic_sysbus_device(find_unknown_sysbus_device, NULL);
11869e3f9733SAlexander Graf 
1187c5f54f3eSDavid Gibson     /* Allocate and/or reset the hash page table */
1188c5f54f3eSDavid Gibson     spapr_reallocate_hpt(spapr,
1189c5f54f3eSDavid Gibson                          spapr_hpt_shift_for_ramsize(machine->maxram_size),
1190c5f54f3eSDavid Gibson                          &error_fatal);
1191c5f54f3eSDavid Gibson 
1192c5f54f3eSDavid Gibson     /* Update the RMA size if necessary */
1193c5f54f3eSDavid Gibson     if (spapr->vrma_adjust) {
1194c5f54f3eSDavid Gibson         spapr->rma_size = kvmppc_rma_size(spapr_node0_size(),
1195c5f54f3eSDavid Gibson                                           spapr->htab_shift);
1196c5f54f3eSDavid Gibson     }
119753018216SPaolo Bonzini 
119853018216SPaolo Bonzini     qemu_devices_reset();
119953018216SPaolo Bonzini 
1200b7d1f77aSBenjamin Herrenschmidt     /*
1201b7d1f77aSBenjamin Herrenschmidt      * We place the device tree and RTAS just below either the top of the RMA,
1202b7d1f77aSBenjamin Herrenschmidt      * or just below 2GB, whichever is lowere, so that it can be
1203b7d1f77aSBenjamin Herrenschmidt      * processed with 32-bit real mode code if necessary
1204b7d1f77aSBenjamin Herrenschmidt      */
1205b7d1f77aSBenjamin Herrenschmidt     rtas_limit = MIN(spapr->rma_size, RTAS_MAX_ADDR);
1206b7d1f77aSBenjamin Herrenschmidt     spapr->rtas_addr = rtas_limit - RTAS_MAX_SIZE;
1207b7d1f77aSBenjamin Herrenschmidt     spapr->fdt_addr = spapr->rtas_addr - FDT_MAX_SIZE;
1208b7d1f77aSBenjamin Herrenschmidt 
120953018216SPaolo Bonzini     /* Load the fdt */
121053018216SPaolo Bonzini     spapr_finalize_fdt(spapr, spapr->fdt_addr, spapr->rtas_addr,
121153018216SPaolo Bonzini                        spapr->rtas_size);
121253018216SPaolo Bonzini 
1213b7d1f77aSBenjamin Herrenschmidt     /* Copy RTAS over */
1214b7d1f77aSBenjamin Herrenschmidt     cpu_physical_memory_write(spapr->rtas_addr, spapr->rtas_blob,
1215b7d1f77aSBenjamin Herrenschmidt                               spapr->rtas_size);
1216b7d1f77aSBenjamin Herrenschmidt 
121753018216SPaolo Bonzini     /* Set up the entry state */
1218182735efSAndreas Färber     first_ppc_cpu = POWERPC_CPU(first_cpu);
1219182735efSAndreas Färber     first_ppc_cpu->env.gpr[3] = spapr->fdt_addr;
1220182735efSAndreas Färber     first_ppc_cpu->env.gpr[5] = 0;
1221182735efSAndreas Färber     first_cpu->halted = 0;
12221b718907SDavid Gibson     first_ppc_cpu->env.nip = SPAPR_ENTRY_POINT;
122353018216SPaolo Bonzini 
122453018216SPaolo Bonzini }
122553018216SPaolo Bonzini 
122628e02042SDavid Gibson static void spapr_create_nvram(sPAPRMachineState *spapr)
122753018216SPaolo Bonzini {
12282ff3de68SMarkus Armbruster     DeviceState *dev = qdev_create(&spapr->vio_bus->bus, "spapr-nvram");
12293978b863SPaolo Bonzini     DriveInfo *dinfo = drive_get(IF_PFLASH, 0, 0);
123053018216SPaolo Bonzini 
12313978b863SPaolo Bonzini     if (dinfo) {
12326231a6daSMarkus Armbruster         qdev_prop_set_drive(dev, "drive", blk_by_legacy_dinfo(dinfo),
12336231a6daSMarkus Armbruster                             &error_fatal);
123453018216SPaolo Bonzini     }
123553018216SPaolo Bonzini 
123653018216SPaolo Bonzini     qdev_init_nofail(dev);
123753018216SPaolo Bonzini 
123853018216SPaolo Bonzini     spapr->nvram = (struct sPAPRNVRAM *)dev;
123953018216SPaolo Bonzini }
124053018216SPaolo Bonzini 
124128e02042SDavid Gibson static void spapr_rtc_create(sPAPRMachineState *spapr)
124228df36a1SDavid Gibson {
124328df36a1SDavid Gibson     DeviceState *dev = qdev_create(NULL, TYPE_SPAPR_RTC);
124428df36a1SDavid Gibson 
124528df36a1SDavid Gibson     qdev_init_nofail(dev);
124628df36a1SDavid Gibson     spapr->rtc = dev;
124774e5ae28SDavid Gibson 
124874e5ae28SDavid Gibson     object_property_add_alias(qdev_get_machine(), "rtc-time",
124974e5ae28SDavid Gibson                               OBJECT(spapr->rtc), "date", NULL);
125028df36a1SDavid Gibson }
125128df36a1SDavid Gibson 
125253018216SPaolo Bonzini /* Returns whether we want to use VGA or not */
125314c6a894SDavid Gibson static bool spapr_vga_init(PCIBus *pci_bus, Error **errp)
125453018216SPaolo Bonzini {
125553018216SPaolo Bonzini     switch (vga_interface_type) {
125653018216SPaolo Bonzini     case VGA_NONE:
12577effdaa3SMark Wu         return false;
12587effdaa3SMark Wu     case VGA_DEVICE:
12597effdaa3SMark Wu         return true;
126053018216SPaolo Bonzini     case VGA_STD:
1261b798c190SBenjamin Herrenschmidt     case VGA_VIRTIO:
126253018216SPaolo Bonzini         return pci_vga_init(pci_bus) != NULL;
126353018216SPaolo Bonzini     default:
126414c6a894SDavid Gibson         error_setg(errp,
126514c6a894SDavid Gibson                    "Unsupported VGA mode, only -vga std or -vga virtio is supported");
126614c6a894SDavid Gibson         return false;
126753018216SPaolo Bonzini     }
126853018216SPaolo Bonzini }
126953018216SPaolo Bonzini 
1270880ae7deSDavid Gibson static int spapr_post_load(void *opaque, int version_id)
1271880ae7deSDavid Gibson {
127228e02042SDavid Gibson     sPAPRMachineState *spapr = (sPAPRMachineState *)opaque;
1273880ae7deSDavid Gibson     int err = 0;
1274880ae7deSDavid Gibson 
1275631b22eaSStefan Weil     /* In earlier versions, there was no separate qdev for the PAPR
1276880ae7deSDavid Gibson      * RTC, so the RTC offset was stored directly in sPAPREnvironment.
1277880ae7deSDavid Gibson      * So when migrating from those versions, poke the incoming offset
1278880ae7deSDavid Gibson      * value into the RTC device */
1279880ae7deSDavid Gibson     if (version_id < 3) {
1280880ae7deSDavid Gibson         err = spapr_rtc_import_offset(spapr->rtc, spapr->rtc_offset);
1281880ae7deSDavid Gibson     }
1282880ae7deSDavid Gibson 
1283880ae7deSDavid Gibson     return err;
1284880ae7deSDavid Gibson }
1285880ae7deSDavid Gibson 
/* Field test: true when the stream version is older than 3. */
static bool version_before_3(void *opaque, int version_id)
{
    bool is_old = version_id <= 2;

    return is_old;
}
1290880ae7deSDavid Gibson 
12914be21d56SDavid Gibson static const VMStateDescription vmstate_spapr = {
12924be21d56SDavid Gibson     .name = "spapr",
1293880ae7deSDavid Gibson     .version_id = 3,
12944be21d56SDavid Gibson     .minimum_version_id = 1,
1295880ae7deSDavid Gibson     .post_load = spapr_post_load,
12964be21d56SDavid Gibson     .fields = (VMStateField[]) {
1297880ae7deSDavid Gibson         /* used to be @next_irq */
1298880ae7deSDavid Gibson         VMSTATE_UNUSED_BUFFER(version_before_3, 0, 4),
12994be21d56SDavid Gibson 
13004be21d56SDavid Gibson         /* RTC offset */
130128e02042SDavid Gibson         VMSTATE_UINT64_TEST(rtc_offset, sPAPRMachineState, version_before_3),
1302880ae7deSDavid Gibson 
130328e02042SDavid Gibson         VMSTATE_PPC_TIMEBASE_V(tb, sPAPRMachineState, 2),
13044be21d56SDavid Gibson         VMSTATE_END_OF_LIST()
13054be21d56SDavid Gibson     },
13064be21d56SDavid Gibson };
13074be21d56SDavid Gibson 
13084be21d56SDavid Gibson static int htab_save_setup(QEMUFile *f, void *opaque)
13094be21d56SDavid Gibson {
131028e02042SDavid Gibson     sPAPRMachineState *spapr = opaque;
13114be21d56SDavid Gibson 
13124be21d56SDavid Gibson     /* "Iteration" header */
13134be21d56SDavid Gibson     qemu_put_be32(f, spapr->htab_shift);
13144be21d56SDavid Gibson 
1315e68cb8b4SAlexey Kardashevskiy     if (spapr->htab) {
1316e68cb8b4SAlexey Kardashevskiy         spapr->htab_save_index = 0;
1317e68cb8b4SAlexey Kardashevskiy         spapr->htab_first_pass = true;
1318e68cb8b4SAlexey Kardashevskiy     } else {
1319e68cb8b4SAlexey Kardashevskiy         assert(kvm_enabled());
13204be21d56SDavid Gibson     }
13214be21d56SDavid Gibson 
1322e68cb8b4SAlexey Kardashevskiy 
1323e68cb8b4SAlexey Kardashevskiy     return 0;
1324e68cb8b4SAlexey Kardashevskiy }
13254be21d56SDavid Gibson 
132628e02042SDavid Gibson static void htab_save_first_pass(QEMUFile *f, sPAPRMachineState *spapr,
13274be21d56SDavid Gibson                                  int64_t max_ns)
13284be21d56SDavid Gibson {
1329378bc217SDavid Gibson     bool has_timeout = max_ns != -1;
13304be21d56SDavid Gibson     int htabslots = HTAB_SIZE(spapr) / HASH_PTE_SIZE_64;
13314be21d56SDavid Gibson     int index = spapr->htab_save_index;
1332bc72ad67SAlex Bligh     int64_t starttime = qemu_clock_get_ns(QEMU_CLOCK_REALTIME);
13334be21d56SDavid Gibson 
13344be21d56SDavid Gibson     assert(spapr->htab_first_pass);
13354be21d56SDavid Gibson 
13364be21d56SDavid Gibson     do {
13374be21d56SDavid Gibson         int chunkstart;
13384be21d56SDavid Gibson 
13394be21d56SDavid Gibson         /* Consume invalid HPTEs */
13404be21d56SDavid Gibson         while ((index < htabslots)
13414be21d56SDavid Gibson                && !HPTE_VALID(HPTE(spapr->htab, index))) {
13424be21d56SDavid Gibson             index++;
13434be21d56SDavid Gibson             CLEAN_HPTE(HPTE(spapr->htab, index));
13444be21d56SDavid Gibson         }
13454be21d56SDavid Gibson 
13464be21d56SDavid Gibson         /* Consume valid HPTEs */
13474be21d56SDavid Gibson         chunkstart = index;
1348338c25b6SSamuel Mendoza-Jonas         while ((index < htabslots) && (index - chunkstart < USHRT_MAX)
13494be21d56SDavid Gibson                && HPTE_VALID(HPTE(spapr->htab, index))) {
13504be21d56SDavid Gibson             index++;
13514be21d56SDavid Gibson             CLEAN_HPTE(HPTE(spapr->htab, index));
13524be21d56SDavid Gibson         }
13534be21d56SDavid Gibson 
13544be21d56SDavid Gibson         if (index > chunkstart) {
13554be21d56SDavid Gibson             int n_valid = index - chunkstart;
13564be21d56SDavid Gibson 
13574be21d56SDavid Gibson             qemu_put_be32(f, chunkstart);
13584be21d56SDavid Gibson             qemu_put_be16(f, n_valid);
13594be21d56SDavid Gibson             qemu_put_be16(f, 0);
13604be21d56SDavid Gibson             qemu_put_buffer(f, HPTE(spapr->htab, chunkstart),
13614be21d56SDavid Gibson                             HASH_PTE_SIZE_64 * n_valid);
13624be21d56SDavid Gibson 
1363378bc217SDavid Gibson             if (has_timeout &&
1364378bc217SDavid Gibson                 (qemu_clock_get_ns(QEMU_CLOCK_REALTIME) - starttime) > max_ns) {
13654be21d56SDavid Gibson                 break;
13664be21d56SDavid Gibson             }
13674be21d56SDavid Gibson         }
13684be21d56SDavid Gibson     } while ((index < htabslots) && !qemu_file_rate_limit(f));
13694be21d56SDavid Gibson 
13704be21d56SDavid Gibson     if (index >= htabslots) {
13714be21d56SDavid Gibson         assert(index == htabslots);
13724be21d56SDavid Gibson         index = 0;
13734be21d56SDavid Gibson         spapr->htab_first_pass = false;
13744be21d56SDavid Gibson     }
13754be21d56SDavid Gibson     spapr->htab_save_index = index;
13764be21d56SDavid Gibson }
13774be21d56SDavid Gibson 
137828e02042SDavid Gibson static int htab_save_later_pass(QEMUFile *f, sPAPRMachineState *spapr,
13794be21d56SDavid Gibson                                 int64_t max_ns)
13804be21d56SDavid Gibson {
13814be21d56SDavid Gibson     bool final = max_ns < 0;
13824be21d56SDavid Gibson     int htabslots = HTAB_SIZE(spapr) / HASH_PTE_SIZE_64;
13834be21d56SDavid Gibson     int examined = 0, sent = 0;
13844be21d56SDavid Gibson     int index = spapr->htab_save_index;
1385bc72ad67SAlex Bligh     int64_t starttime = qemu_clock_get_ns(QEMU_CLOCK_REALTIME);
13864be21d56SDavid Gibson 
13874be21d56SDavid Gibson     assert(!spapr->htab_first_pass);
13884be21d56SDavid Gibson 
13894be21d56SDavid Gibson     do {
13904be21d56SDavid Gibson         int chunkstart, invalidstart;
13914be21d56SDavid Gibson 
13924be21d56SDavid Gibson         /* Consume non-dirty HPTEs */
13934be21d56SDavid Gibson         while ((index < htabslots)
13944be21d56SDavid Gibson                && !HPTE_DIRTY(HPTE(spapr->htab, index))) {
13954be21d56SDavid Gibson             index++;
13964be21d56SDavid Gibson             examined++;
13974be21d56SDavid Gibson         }
13984be21d56SDavid Gibson 
13994be21d56SDavid Gibson         chunkstart = index;
14004be21d56SDavid Gibson         /* Consume valid dirty HPTEs */
1401338c25b6SSamuel Mendoza-Jonas         while ((index < htabslots) && (index - chunkstart < USHRT_MAX)
14024be21d56SDavid Gibson                && HPTE_DIRTY(HPTE(spapr->htab, index))
14034be21d56SDavid Gibson                && HPTE_VALID(HPTE(spapr->htab, index))) {
14044be21d56SDavid Gibson             CLEAN_HPTE(HPTE(spapr->htab, index));
14054be21d56SDavid Gibson             index++;
14064be21d56SDavid Gibson             examined++;
14074be21d56SDavid Gibson         }
14084be21d56SDavid Gibson 
14094be21d56SDavid Gibson         invalidstart = index;
14104be21d56SDavid Gibson         /* Consume invalid dirty HPTEs */
1411338c25b6SSamuel Mendoza-Jonas         while ((index < htabslots) && (index - invalidstart < USHRT_MAX)
14124be21d56SDavid Gibson                && HPTE_DIRTY(HPTE(spapr->htab, index))
14134be21d56SDavid Gibson                && !HPTE_VALID(HPTE(spapr->htab, index))) {
14144be21d56SDavid Gibson             CLEAN_HPTE(HPTE(spapr->htab, index));
14154be21d56SDavid Gibson             index++;
14164be21d56SDavid Gibson             examined++;
14174be21d56SDavid Gibson         }
14184be21d56SDavid Gibson 
14194be21d56SDavid Gibson         if (index > chunkstart) {
14204be21d56SDavid Gibson             int n_valid = invalidstart - chunkstart;
14214be21d56SDavid Gibson             int n_invalid = index - invalidstart;
14224be21d56SDavid Gibson 
14234be21d56SDavid Gibson             qemu_put_be32(f, chunkstart);
14244be21d56SDavid Gibson             qemu_put_be16(f, n_valid);
14254be21d56SDavid Gibson             qemu_put_be16(f, n_invalid);
14264be21d56SDavid Gibson             qemu_put_buffer(f, HPTE(spapr->htab, chunkstart),
14274be21d56SDavid Gibson                             HASH_PTE_SIZE_64 * n_valid);
14284be21d56SDavid Gibson             sent += index - chunkstart;
14294be21d56SDavid Gibson 
1430bc72ad67SAlex Bligh             if (!final && (qemu_clock_get_ns(QEMU_CLOCK_REALTIME) - starttime) > max_ns) {
14314be21d56SDavid Gibson                 break;
14324be21d56SDavid Gibson             }
14334be21d56SDavid Gibson         }
14344be21d56SDavid Gibson 
14354be21d56SDavid Gibson         if (examined >= htabslots) {
14364be21d56SDavid Gibson             break;
14374be21d56SDavid Gibson         }
14384be21d56SDavid Gibson 
14394be21d56SDavid Gibson         if (index >= htabslots) {
14404be21d56SDavid Gibson             assert(index == htabslots);
14414be21d56SDavid Gibson             index = 0;
14424be21d56SDavid Gibson         }
14434be21d56SDavid Gibson     } while ((examined < htabslots) && (!qemu_file_rate_limit(f) || final));
14444be21d56SDavid Gibson 
14454be21d56SDavid Gibson     if (index >= htabslots) {
14464be21d56SDavid Gibson         assert(index == htabslots);
14474be21d56SDavid Gibson         index = 0;
14484be21d56SDavid Gibson     }
14494be21d56SDavid Gibson 
14504be21d56SDavid Gibson     spapr->htab_save_index = index;
14514be21d56SDavid Gibson 
1452e68cb8b4SAlexey Kardashevskiy     return (examined >= htabslots) && (sent == 0) ? 1 : 0;
14534be21d56SDavid Gibson }
14544be21d56SDavid Gibson 
1455e68cb8b4SAlexey Kardashevskiy #define MAX_ITERATION_NS    5000000 /* 5 ms */
1456e68cb8b4SAlexey Kardashevskiy #define MAX_KVM_BUF_SIZE    2048
1457e68cb8b4SAlexey Kardashevskiy 
14584be21d56SDavid Gibson static int htab_save_iterate(QEMUFile *f, void *opaque)
14594be21d56SDavid Gibson {
146028e02042SDavid Gibson     sPAPRMachineState *spapr = opaque;
1461715c5407SDavid Gibson     int fd;
1462e68cb8b4SAlexey Kardashevskiy     int rc = 0;
14634be21d56SDavid Gibson 
14644be21d56SDavid Gibson     /* Iteration header */
14654be21d56SDavid Gibson     qemu_put_be32(f, 0);
14664be21d56SDavid Gibson 
1467e68cb8b4SAlexey Kardashevskiy     if (!spapr->htab) {
1468e68cb8b4SAlexey Kardashevskiy         assert(kvm_enabled());
1469e68cb8b4SAlexey Kardashevskiy 
1470715c5407SDavid Gibson         fd = get_htab_fd(spapr);
1471715c5407SDavid Gibson         if (fd < 0) {
1472715c5407SDavid Gibson             return fd;
147301a57972SSamuel Mendoza-Jonas         }
147401a57972SSamuel Mendoza-Jonas 
1475715c5407SDavid Gibson         rc = kvmppc_save_htab(f, fd, MAX_KVM_BUF_SIZE, MAX_ITERATION_NS);
1476e68cb8b4SAlexey Kardashevskiy         if (rc < 0) {
1477e68cb8b4SAlexey Kardashevskiy             return rc;
1478e68cb8b4SAlexey Kardashevskiy         }
1479e68cb8b4SAlexey Kardashevskiy     } else  if (spapr->htab_first_pass) {
14804be21d56SDavid Gibson         htab_save_first_pass(f, spapr, MAX_ITERATION_NS);
14814be21d56SDavid Gibson     } else {
1482e68cb8b4SAlexey Kardashevskiy         rc = htab_save_later_pass(f, spapr, MAX_ITERATION_NS);
14834be21d56SDavid Gibson     }
14844be21d56SDavid Gibson 
14854be21d56SDavid Gibson     /* End marker */
14864be21d56SDavid Gibson     qemu_put_be32(f, 0);
14874be21d56SDavid Gibson     qemu_put_be16(f, 0);
14884be21d56SDavid Gibson     qemu_put_be16(f, 0);
14894be21d56SDavid Gibson 
1490e68cb8b4SAlexey Kardashevskiy     return rc;
14914be21d56SDavid Gibson }
14924be21d56SDavid Gibson 
14934be21d56SDavid Gibson static int htab_save_complete(QEMUFile *f, void *opaque)
14944be21d56SDavid Gibson {
149528e02042SDavid Gibson     sPAPRMachineState *spapr = opaque;
1496715c5407SDavid Gibson     int fd;
14974be21d56SDavid Gibson 
14984be21d56SDavid Gibson     /* Iteration header */
14994be21d56SDavid Gibson     qemu_put_be32(f, 0);
15004be21d56SDavid Gibson 
1501e68cb8b4SAlexey Kardashevskiy     if (!spapr->htab) {
1502e68cb8b4SAlexey Kardashevskiy         int rc;
1503e68cb8b4SAlexey Kardashevskiy 
1504e68cb8b4SAlexey Kardashevskiy         assert(kvm_enabled());
1505e68cb8b4SAlexey Kardashevskiy 
1506715c5407SDavid Gibson         fd = get_htab_fd(spapr);
1507715c5407SDavid Gibson         if (fd < 0) {
1508715c5407SDavid Gibson             return fd;
150901a57972SSamuel Mendoza-Jonas         }
151001a57972SSamuel Mendoza-Jonas 
1511715c5407SDavid Gibson         rc = kvmppc_save_htab(f, fd, MAX_KVM_BUF_SIZE, -1);
1512e68cb8b4SAlexey Kardashevskiy         if (rc < 0) {
1513e68cb8b4SAlexey Kardashevskiy             return rc;
1514e68cb8b4SAlexey Kardashevskiy         }
1515715c5407SDavid Gibson         close_htab_fd(spapr);
1516e68cb8b4SAlexey Kardashevskiy     } else {
1517378bc217SDavid Gibson         if (spapr->htab_first_pass) {
1518378bc217SDavid Gibson             htab_save_first_pass(f, spapr, -1);
1519378bc217SDavid Gibson         }
15204be21d56SDavid Gibson         htab_save_later_pass(f, spapr, -1);
1521e68cb8b4SAlexey Kardashevskiy     }
15224be21d56SDavid Gibson 
15234be21d56SDavid Gibson     /* End marker */
15244be21d56SDavid Gibson     qemu_put_be32(f, 0);
15254be21d56SDavid Gibson     qemu_put_be16(f, 0);
15264be21d56SDavid Gibson     qemu_put_be16(f, 0);
15274be21d56SDavid Gibson 
15284be21d56SDavid Gibson     return 0;
15294be21d56SDavid Gibson }
15304be21d56SDavid Gibson 
15314be21d56SDavid Gibson static int htab_load(QEMUFile *f, void *opaque, int version_id)
15324be21d56SDavid Gibson {
153328e02042SDavid Gibson     sPAPRMachineState *spapr = opaque;
15344be21d56SDavid Gibson     uint32_t section_hdr;
1535e68cb8b4SAlexey Kardashevskiy     int fd = -1;
15364be21d56SDavid Gibson 
15374be21d56SDavid Gibson     if (version_id < 1 || version_id > 1) {
153898a5d100SDavid Gibson         error_report("htab_load() bad version");
15394be21d56SDavid Gibson         return -EINVAL;
15404be21d56SDavid Gibson     }
15414be21d56SDavid Gibson 
15424be21d56SDavid Gibson     section_hdr = qemu_get_be32(f);
15434be21d56SDavid Gibson 
15444be21d56SDavid Gibson     if (section_hdr) {
15459897e462SGreg Kurz         Error *local_err = NULL;
1546c5f54f3eSDavid Gibson 
1547c5f54f3eSDavid Gibson         /* First section gives the htab size */
1548c5f54f3eSDavid Gibson         spapr_reallocate_hpt(spapr, section_hdr, &local_err);
1549c5f54f3eSDavid Gibson         if (local_err) {
1550c5f54f3eSDavid Gibson             error_report_err(local_err);
15514be21d56SDavid Gibson             return -EINVAL;
15524be21d56SDavid Gibson         }
15534be21d56SDavid Gibson         return 0;
15544be21d56SDavid Gibson     }
15554be21d56SDavid Gibson 
1556e68cb8b4SAlexey Kardashevskiy     if (!spapr->htab) {
1557e68cb8b4SAlexey Kardashevskiy         assert(kvm_enabled());
1558e68cb8b4SAlexey Kardashevskiy 
1559e68cb8b4SAlexey Kardashevskiy         fd = kvmppc_get_htab_fd(true);
1560e68cb8b4SAlexey Kardashevskiy         if (fd < 0) {
156198a5d100SDavid Gibson             error_report("Unable to open fd to restore KVM hash table: %s",
1562e68cb8b4SAlexey Kardashevskiy                          strerror(errno));
1563e68cb8b4SAlexey Kardashevskiy         }
1564e68cb8b4SAlexey Kardashevskiy     }
1565e68cb8b4SAlexey Kardashevskiy 
15664be21d56SDavid Gibson     while (true) {
15674be21d56SDavid Gibson         uint32_t index;
15684be21d56SDavid Gibson         uint16_t n_valid, n_invalid;
15694be21d56SDavid Gibson 
15704be21d56SDavid Gibson         index = qemu_get_be32(f);
15714be21d56SDavid Gibson         n_valid = qemu_get_be16(f);
15724be21d56SDavid Gibson         n_invalid = qemu_get_be16(f);
15734be21d56SDavid Gibson 
15744be21d56SDavid Gibson         if ((index == 0) && (n_valid == 0) && (n_invalid == 0)) {
15754be21d56SDavid Gibson             /* End of Stream */
15764be21d56SDavid Gibson             break;
15774be21d56SDavid Gibson         }
15784be21d56SDavid Gibson 
1579e68cb8b4SAlexey Kardashevskiy         if ((index + n_valid + n_invalid) >
15804be21d56SDavid Gibson             (HTAB_SIZE(spapr) / HASH_PTE_SIZE_64)) {
15814be21d56SDavid Gibson             /* Bad index in stream */
158298a5d100SDavid Gibson             error_report(
158398a5d100SDavid Gibson                 "htab_load() bad index %d (%hd+%hd entries) in htab stream (htab_shift=%d)",
158498a5d100SDavid Gibson                 index, n_valid, n_invalid, spapr->htab_shift);
15854be21d56SDavid Gibson             return -EINVAL;
15864be21d56SDavid Gibson         }
15874be21d56SDavid Gibson 
1588e68cb8b4SAlexey Kardashevskiy         if (spapr->htab) {
15894be21d56SDavid Gibson             if (n_valid) {
15904be21d56SDavid Gibson                 qemu_get_buffer(f, HPTE(spapr->htab, index),
15914be21d56SDavid Gibson                                 HASH_PTE_SIZE_64 * n_valid);
15924be21d56SDavid Gibson             }
15934be21d56SDavid Gibson             if (n_invalid) {
15944be21d56SDavid Gibson                 memset(HPTE(spapr->htab, index + n_valid), 0,
15954be21d56SDavid Gibson                        HASH_PTE_SIZE_64 * n_invalid);
15964be21d56SDavid Gibson             }
1597e68cb8b4SAlexey Kardashevskiy         } else {
1598e68cb8b4SAlexey Kardashevskiy             int rc;
1599e68cb8b4SAlexey Kardashevskiy 
1600e68cb8b4SAlexey Kardashevskiy             assert(fd >= 0);
1601e68cb8b4SAlexey Kardashevskiy 
1602e68cb8b4SAlexey Kardashevskiy             rc = kvmppc_load_htab_chunk(f, fd, index, n_valid, n_invalid);
1603e68cb8b4SAlexey Kardashevskiy             if (rc < 0) {
1604e68cb8b4SAlexey Kardashevskiy                 return rc;
1605e68cb8b4SAlexey Kardashevskiy             }
1606e68cb8b4SAlexey Kardashevskiy         }
1607e68cb8b4SAlexey Kardashevskiy     }
1608e68cb8b4SAlexey Kardashevskiy 
1609e68cb8b4SAlexey Kardashevskiy     if (!spapr->htab) {
1610e68cb8b4SAlexey Kardashevskiy         assert(fd >= 0);
1611e68cb8b4SAlexey Kardashevskiy         close(fd);
16124be21d56SDavid Gibson     }
16134be21d56SDavid Gibson 
16144be21d56SDavid Gibson     return 0;
16154be21d56SDavid Gibson }
16164be21d56SDavid Gibson 
16174be21d56SDavid Gibson static SaveVMHandlers savevm_htab_handlers = {
16184be21d56SDavid Gibson     .save_live_setup = htab_save_setup,
16194be21d56SDavid Gibson     .save_live_iterate = htab_save_iterate,
1620a3e06c3dSDr. David Alan Gilbert     .save_live_complete_precopy = htab_save_complete,
16214be21d56SDavid Gibson     .load_state = htab_load,
16224be21d56SDavid Gibson };
16234be21d56SDavid Gibson 
16245b2128d2SAlexander Graf static void spapr_boot_set(void *opaque, const char *boot_device,
16255b2128d2SAlexander Graf                            Error **errp)
16265b2128d2SAlexander Graf {
16275b2128d2SAlexander Graf     MachineState *machine = MACHINE(qdev_get_machine());
16285b2128d2SAlexander Graf     machine->boot_order = g_strdup(boot_device);
16295b2128d2SAlexander Graf }
16305b2128d2SAlexander Graf 
1631224245bfSDavid Gibson /*
1632224245bfSDavid Gibson  * Reset routine for LMB DR devices.
1633224245bfSDavid Gibson  *
1634224245bfSDavid Gibson  * Unlike PCI DR devices, LMB DR devices explicitly register this reset
1635224245bfSDavid Gibson  * routine. Reset for PCI DR devices will be handled by PHB reset routine
1636224245bfSDavid Gibson  * when it walks all its children devices. LMB devices reset occurs
1637224245bfSDavid Gibson  * as part of spapr_ppc_reset().
1638224245bfSDavid Gibson  */
1639224245bfSDavid Gibson static void spapr_drc_reset(void *opaque)
1640224245bfSDavid Gibson {
1641224245bfSDavid Gibson     sPAPRDRConnector *drc = opaque;
1642224245bfSDavid Gibson     DeviceState *d = DEVICE(drc);
1643224245bfSDavid Gibson 
1644224245bfSDavid Gibson     if (d) {
1645224245bfSDavid Gibson         device_reset(d);
1646224245bfSDavid Gibson     }
1647224245bfSDavid Gibson }
1648224245bfSDavid Gibson 
1649224245bfSDavid Gibson static void spapr_create_lmb_dr_connectors(sPAPRMachineState *spapr)
1650224245bfSDavid Gibson {
1651224245bfSDavid Gibson     MachineState *machine = MACHINE(spapr);
1652224245bfSDavid Gibson     uint64_t lmb_size = SPAPR_MEMORY_BLOCK_SIZE;
1653e8f986fcSBharata B Rao     uint32_t nr_lmbs = (machine->maxram_size - machine->ram_size)/lmb_size;
1654224245bfSDavid Gibson     int i;
1655224245bfSDavid Gibson 
1656224245bfSDavid Gibson     for (i = 0; i < nr_lmbs; i++) {
1657224245bfSDavid Gibson         sPAPRDRConnector *drc;
1658224245bfSDavid Gibson         uint64_t addr;
1659224245bfSDavid Gibson 
1660e8f986fcSBharata B Rao         addr = i * lmb_size + spapr->hotplug_memory.base;
1661224245bfSDavid Gibson         drc = spapr_dr_connector_new(OBJECT(spapr), SPAPR_DR_CONNECTOR_TYPE_LMB,
1662224245bfSDavid Gibson                                      addr/lmb_size);
1663224245bfSDavid Gibson         qemu_register_reset(spapr_drc_reset, drc);
1664224245bfSDavid Gibson     }
1665224245bfSDavid Gibson }
1666224245bfSDavid Gibson 
1667224245bfSDavid Gibson /*
1668224245bfSDavid Gibson  * If RAM size, maxmem size and individual node mem sizes aren't aligned
1669224245bfSDavid Gibson  * to SPAPR_MEMORY_BLOCK_SIZE(256MB), then refuse to start the guest
1670224245bfSDavid Gibson  * since we can't support such unaligned sizes with DRCONF_MEMORY.
1671224245bfSDavid Gibson  */
16727c150d6fSDavid Gibson static void spapr_validate_node_memory(MachineState *machine, Error **errp)
1673224245bfSDavid Gibson {
1674224245bfSDavid Gibson     int i;
1675224245bfSDavid Gibson 
16767c150d6fSDavid Gibson     if (machine->ram_size % SPAPR_MEMORY_BLOCK_SIZE) {
16777c150d6fSDavid Gibson         error_setg(errp, "Memory size 0x" RAM_ADDR_FMT
16787c150d6fSDavid Gibson                    " is not aligned to %llu MiB",
16797c150d6fSDavid Gibson                    machine->ram_size,
1680224245bfSDavid Gibson                    SPAPR_MEMORY_BLOCK_SIZE / M_BYTE);
16817c150d6fSDavid Gibson         return;
16827c150d6fSDavid Gibson     }
16837c150d6fSDavid Gibson 
16847c150d6fSDavid Gibson     if (machine->maxram_size % SPAPR_MEMORY_BLOCK_SIZE) {
16857c150d6fSDavid Gibson         error_setg(errp, "Maximum memory size 0x" RAM_ADDR_FMT
16867c150d6fSDavid Gibson                    " is not aligned to %llu MiB",
16877c150d6fSDavid Gibson                    machine->ram_size,
16887c150d6fSDavid Gibson                    SPAPR_MEMORY_BLOCK_SIZE / M_BYTE);
16897c150d6fSDavid Gibson         return;
1690224245bfSDavid Gibson     }
1691224245bfSDavid Gibson 
1692224245bfSDavid Gibson     for (i = 0; i < nb_numa_nodes; i++) {
1693224245bfSDavid Gibson         if (numa_info[i].node_mem % SPAPR_MEMORY_BLOCK_SIZE) {
16947c150d6fSDavid Gibson             error_setg(errp,
16957c150d6fSDavid Gibson                        "Node %d memory size 0x%" PRIx64
16967c150d6fSDavid Gibson                        " is not aligned to %llu MiB",
16977c150d6fSDavid Gibson                        i, numa_info[i].node_mem,
1698224245bfSDavid Gibson                        SPAPR_MEMORY_BLOCK_SIZE / M_BYTE);
16997c150d6fSDavid Gibson             return;
1700224245bfSDavid Gibson         }
1701224245bfSDavid Gibson     }
1702224245bfSDavid Gibson }
1703224245bfSDavid Gibson 
170453018216SPaolo Bonzini /* pSeries LPAR / sPAPR hardware init */
17053ef96221SMarcel Apfelbaum static void ppc_spapr_init(MachineState *machine)
170653018216SPaolo Bonzini {
170728e02042SDavid Gibson     sPAPRMachineState *spapr = SPAPR_MACHINE(machine);
1708224245bfSDavid Gibson     sPAPRMachineClass *smc = SPAPR_MACHINE_GET_CLASS(machine);
17093ef96221SMarcel Apfelbaum     const char *kernel_filename = machine->kernel_filename;
17103ef96221SMarcel Apfelbaum     const char *kernel_cmdline = machine->kernel_cmdline;
17113ef96221SMarcel Apfelbaum     const char *initrd_filename = machine->initrd_filename;
171253018216SPaolo Bonzini     PCIHostState *phb;
171353018216SPaolo Bonzini     int i;
171453018216SPaolo Bonzini     MemoryRegion *sysmem = get_system_memory();
171553018216SPaolo Bonzini     MemoryRegion *ram = g_new(MemoryRegion, 1);
1716658fa66bSAlexey Kardashevskiy     MemoryRegion *rma_region;
1717658fa66bSAlexey Kardashevskiy     void *rma = NULL;
171853018216SPaolo Bonzini     hwaddr rma_alloc_size;
1719b082d65aSAlexey Kardashevskiy     hwaddr node0_size = spapr_node0_size();
172053018216SPaolo Bonzini     uint32_t initrd_base = 0;
172153018216SPaolo Bonzini     long kernel_size = 0, initrd_size = 0;
1722b7d1f77aSBenjamin Herrenschmidt     long load_limit, fw_size;
172316457e7fSBenjamin Herrenschmidt     bool kernel_le = false;
172453018216SPaolo Bonzini     char *filename;
172594a94e4cSBharata B Rao     int smt = kvmppc_smt_threads();
172694a94e4cSBharata B Rao     int spapr_cores = smp_cpus / smp_threads;
172794a94e4cSBharata B Rao     int spapr_max_cores = max_cpus / smp_threads;
172894a94e4cSBharata B Rao 
172994a94e4cSBharata B Rao     if (smc->dr_cpu_enabled) {
173094a94e4cSBharata B Rao         if (smp_cpus % smp_threads) {
173194a94e4cSBharata B Rao             error_report("smp_cpus (%u) must be multiple of threads (%u)",
173294a94e4cSBharata B Rao                          smp_cpus, smp_threads);
173394a94e4cSBharata B Rao             exit(1);
173494a94e4cSBharata B Rao         }
173594a94e4cSBharata B Rao         if (max_cpus % smp_threads) {
173694a94e4cSBharata B Rao             error_report("max_cpus (%u) must be multiple of threads (%u)",
173794a94e4cSBharata B Rao                          max_cpus, smp_threads);
173894a94e4cSBharata B Rao             exit(1);
173994a94e4cSBharata B Rao         }
174094a94e4cSBharata B Rao     }
174153018216SPaolo Bonzini 
1742226419d6SMichael S. Tsirkin     msi_nonbroken = true;
174353018216SPaolo Bonzini 
174453018216SPaolo Bonzini     QLIST_INIT(&spapr->phbs);
174553018216SPaolo Bonzini 
174653018216SPaolo Bonzini     cpu_ppc_hypercall = emulate_spapr_hypercall;
174753018216SPaolo Bonzini 
174853018216SPaolo Bonzini     /* Allocate RMA if necessary */
1749658fa66bSAlexey Kardashevskiy     rma_alloc_size = kvmppc_alloc_rma(&rma);
175053018216SPaolo Bonzini 
175153018216SPaolo Bonzini     if (rma_alloc_size == -1) {
1752730fce59SThomas Huth         error_report("Unable to create RMA");
175353018216SPaolo Bonzini         exit(1);
175453018216SPaolo Bonzini     }
175553018216SPaolo Bonzini 
1756c4177479SAlexey Kardashevskiy     if (rma_alloc_size && (rma_alloc_size < node0_size)) {
175753018216SPaolo Bonzini         spapr->rma_size = rma_alloc_size;
175853018216SPaolo Bonzini     } else {
1759c4177479SAlexey Kardashevskiy         spapr->rma_size = node0_size;
176053018216SPaolo Bonzini 
176153018216SPaolo Bonzini         /* With KVM, we don't actually know whether KVM supports an
176253018216SPaolo Bonzini          * unbounded RMA (PR KVM) or is limited by the hash table size
176353018216SPaolo Bonzini          * (HV KVM using VRMA), so we always assume the latter
176453018216SPaolo Bonzini          *
176553018216SPaolo Bonzini          * In that case, we also limit the initial allocations for RTAS
176653018216SPaolo Bonzini          * etc... to 256M since we have no way to know what the VRMA size
176753018216SPaolo Bonzini          * is going to be as it depends on the size of the hash table
176853018216SPaolo Bonzini          * isn't determined yet.
176953018216SPaolo Bonzini          */
177053018216SPaolo Bonzini         if (kvm_enabled()) {
177153018216SPaolo Bonzini             spapr->vrma_adjust = 1;
177253018216SPaolo Bonzini             spapr->rma_size = MIN(spapr->rma_size, 0x10000000);
177353018216SPaolo Bonzini         }
177453018216SPaolo Bonzini     }
177553018216SPaolo Bonzini 
1776c4177479SAlexey Kardashevskiy     if (spapr->rma_size > node0_size) {
1777d54e4d76SDavid Gibson         error_report("Numa node 0 has to span the RMA (%#08"HWADDR_PRIx")",
1778c4177479SAlexey Kardashevskiy                      spapr->rma_size);
1779c4177479SAlexey Kardashevskiy         exit(1);
1780c4177479SAlexey Kardashevskiy     }
1781c4177479SAlexey Kardashevskiy 
1782b7d1f77aSBenjamin Herrenschmidt     /* Setup a load limit for the ramdisk leaving room for SLOF and FDT */
1783b7d1f77aSBenjamin Herrenschmidt     load_limit = MIN(spapr->rma_size, RTAS_MAX_ADDR) - FW_OVERHEAD;
178453018216SPaolo Bonzini 
17857b565160SDavid Gibson     /* Set up Interrupt Controller before we create the VCPUs */
178627f24582SBenjamin Herrenschmidt     spapr->xics = xics_system_init(machine,
178794a94e4cSBharata B Rao                                    DIV_ROUND_UP(max_cpus * smt, smp_threads),
1788161deaf2SBenjamin Herrenschmidt                                    XICS_IRQS_SPAPR, &error_fatal);
17897b565160SDavid Gibson 
1790224245bfSDavid Gibson     if (smc->dr_lmb_enabled) {
17917c150d6fSDavid Gibson         spapr_validate_node_memory(machine, &error_fatal);
1792224245bfSDavid Gibson     }
1793224245bfSDavid Gibson 
179453018216SPaolo Bonzini     /* init CPUs */
179519fb2c36SBharata B Rao     if (machine->cpu_model == NULL) {
179619fb2c36SBharata B Rao         machine->cpu_model = kvm_enabled() ? "host" : "POWER7";
179753018216SPaolo Bonzini     }
179894a94e4cSBharata B Rao 
179994a94e4cSBharata B Rao     if (smc->dr_cpu_enabled) {
180094a94e4cSBharata B Rao         char *type = spapr_get_cpu_core_type(machine->cpu_model);
180194a94e4cSBharata B Rao 
180294a94e4cSBharata B Rao         spapr->cores = g_new0(Object *, spapr_max_cores);
1803af81cf32SBharata B Rao         for (i = 0; i < spapr_max_cores; i++) {
180494a94e4cSBharata B Rao             int core_dt_id = i * smt;
1805af81cf32SBharata B Rao             sPAPRDRConnector *drc =
1806af81cf32SBharata B Rao                 spapr_dr_connector_new(OBJECT(spapr),
1807af81cf32SBharata B Rao                                        SPAPR_DR_CONNECTOR_TYPE_CPU, core_dt_id);
1808af81cf32SBharata B Rao 
1809af81cf32SBharata B Rao             qemu_register_reset(spapr_drc_reset, drc);
1810af81cf32SBharata B Rao 
1811af81cf32SBharata B Rao             if (i < spapr_cores) {
1812af81cf32SBharata B Rao                 char *type = spapr_get_cpu_core_type(machine->cpu_model);
181394a94e4cSBharata B Rao                 Object *core;
181494a94e4cSBharata B Rao 
181594a94e4cSBharata B Rao                 if (!object_class_by_name(type)) {
181694a94e4cSBharata B Rao                     error_report("Unable to find sPAPR CPU Core definition");
181794a94e4cSBharata B Rao                     exit(1);
181894a94e4cSBharata B Rao                 }
181994a94e4cSBharata B Rao 
182094a94e4cSBharata B Rao                 core  = object_new(type);
182194a94e4cSBharata B Rao                 object_property_set_int(core, smp_threads, "nr-threads",
182294a94e4cSBharata B Rao                                         &error_fatal);
182394a94e4cSBharata B Rao                 object_property_set_int(core, core_dt_id, CPU_CORE_PROP_CORE_ID,
182494a94e4cSBharata B Rao                                         &error_fatal);
182594a94e4cSBharata B Rao                 object_property_set_bool(core, true, "realized", &error_fatal);
182694a94e4cSBharata B Rao             }
1827af81cf32SBharata B Rao         }
182894a94e4cSBharata B Rao         g_free(type);
182994a94e4cSBharata B Rao     } else {
183053018216SPaolo Bonzini         for (i = 0; i < smp_cpus; i++) {
183194a94e4cSBharata B Rao             PowerPCCPU *cpu = cpu_ppc_init(machine->cpu_model);
183253018216SPaolo Bonzini             if (cpu == NULL) {
1833569f4967SDavid Gibson                 error_report("Unable to find PowerPC CPU definition");
183453018216SPaolo Bonzini                 exit(1);
183553018216SPaolo Bonzini             }
1836569f4967SDavid Gibson             spapr_cpu_init(spapr, cpu, &error_fatal);
183753018216SPaolo Bonzini        }
183894a94e4cSBharata B Rao     }
183953018216SPaolo Bonzini 
1840026bfd89SDavid Gibson     if (kvm_enabled()) {
1841026bfd89SDavid Gibson         /* Enable H_LOGICAL_CI_* so SLOF can talk to in-kernel devices */
1842026bfd89SDavid Gibson         kvmppc_enable_logical_ci_hcalls();
1843ef9971ddSAlexey Kardashevskiy         kvmppc_enable_set_mode_hcall();
1844026bfd89SDavid Gibson     }
1845026bfd89SDavid Gibson 
184653018216SPaolo Bonzini     /* allocate RAM */
1847f92f5da1SAlexey Kardashevskiy     memory_region_allocate_system_memory(ram, NULL, "ppc_spapr.ram",
1848fb164994SDavid Gibson                                          machine->ram_size);
1849f92f5da1SAlexey Kardashevskiy     memory_region_add_subregion(sysmem, 0, ram);
185053018216SPaolo Bonzini 
1851658fa66bSAlexey Kardashevskiy     if (rma_alloc_size && rma) {
1852658fa66bSAlexey Kardashevskiy         rma_region = g_new(MemoryRegion, 1);
1853658fa66bSAlexey Kardashevskiy         memory_region_init_ram_ptr(rma_region, NULL, "ppc_spapr.rma",
1854658fa66bSAlexey Kardashevskiy                                    rma_alloc_size, rma);
1855658fa66bSAlexey Kardashevskiy         vmstate_register_ram_global(rma_region);
1856658fa66bSAlexey Kardashevskiy         memory_region_add_subregion(sysmem, 0, rma_region);
1857658fa66bSAlexey Kardashevskiy     }
1858658fa66bSAlexey Kardashevskiy 
18594a1c9cf0SBharata B Rao     /* initialize hotplug memory address space */
18604a1c9cf0SBharata B Rao     if (machine->ram_size < machine->maxram_size) {
18614a1c9cf0SBharata B Rao         ram_addr_t hotplug_mem_size = machine->maxram_size - machine->ram_size;
186271c9a3ddSBharata B Rao         /*
186371c9a3ddSBharata B Rao          * Limit the number of hotpluggable memory slots to half the number
186471c9a3ddSBharata B Rao          * slots that KVM supports, leaving the other half for PCI and other
186571c9a3ddSBharata B Rao          * devices. However ensure that number of slots doesn't drop below 32.
186671c9a3ddSBharata B Rao          */
186771c9a3ddSBharata B Rao         int max_memslots = kvm_enabled() ? kvm_get_max_memslots() / 2 :
186871c9a3ddSBharata B Rao                            SPAPR_MAX_RAM_SLOTS;
18694a1c9cf0SBharata B Rao 
187071c9a3ddSBharata B Rao         if (max_memslots < SPAPR_MAX_RAM_SLOTS) {
187171c9a3ddSBharata B Rao             max_memslots = SPAPR_MAX_RAM_SLOTS;
187271c9a3ddSBharata B Rao         }
187371c9a3ddSBharata B Rao         if (machine->ram_slots > max_memslots) {
1874d54e4d76SDavid Gibson             error_report("Specified number of memory slots %"
1875d54e4d76SDavid Gibson                          PRIu64" exceeds max supported %d",
187671c9a3ddSBharata B Rao                          machine->ram_slots, max_memslots);
1877d54e4d76SDavid Gibson             exit(1);
18784a1c9cf0SBharata B Rao         }
18794a1c9cf0SBharata B Rao 
18804a1c9cf0SBharata B Rao         spapr->hotplug_memory.base = ROUND_UP(machine->ram_size,
18814a1c9cf0SBharata B Rao                                               SPAPR_HOTPLUG_MEM_ALIGN);
18824a1c9cf0SBharata B Rao         memory_region_init(&spapr->hotplug_memory.mr, OBJECT(spapr),
18834a1c9cf0SBharata B Rao                            "hotplug-memory", hotplug_mem_size);
18844a1c9cf0SBharata B Rao         memory_region_add_subregion(sysmem, spapr->hotplug_memory.base,
18854a1c9cf0SBharata B Rao                                     &spapr->hotplug_memory.mr);
18864a1c9cf0SBharata B Rao     }
18874a1c9cf0SBharata B Rao 
1888224245bfSDavid Gibson     if (smc->dr_lmb_enabled) {
1889224245bfSDavid Gibson         spapr_create_lmb_dr_connectors(spapr);
1890224245bfSDavid Gibson     }
1891224245bfSDavid Gibson 
189253018216SPaolo Bonzini     filename = qemu_find_file(QEMU_FILE_TYPE_BIOS, "spapr-rtas.bin");
18934c56440dSStefan Weil     if (!filename) {
1894730fce59SThomas Huth         error_report("Could not find LPAR rtas '%s'", "spapr-rtas.bin");
18954c56440dSStefan Weil         exit(1);
18964c56440dSStefan Weil     }
1897b7d1f77aSBenjamin Herrenschmidt     spapr->rtas_size = get_image_size(filename);
18988afc22a2SZhou Jie     if (spapr->rtas_size < 0) {
18998afc22a2SZhou Jie         error_report("Could not get size of LPAR rtas '%s'", filename);
19008afc22a2SZhou Jie         exit(1);
19018afc22a2SZhou Jie     }
1902b7d1f77aSBenjamin Herrenschmidt     spapr->rtas_blob = g_malloc(spapr->rtas_size);
1903b7d1f77aSBenjamin Herrenschmidt     if (load_image_size(filename, spapr->rtas_blob, spapr->rtas_size) < 0) {
1904730fce59SThomas Huth         error_report("Could not load LPAR rtas '%s'", filename);
190553018216SPaolo Bonzini         exit(1);
190653018216SPaolo Bonzini     }
190753018216SPaolo Bonzini     if (spapr->rtas_size > RTAS_MAX_SIZE) {
1908730fce59SThomas Huth         error_report("RTAS too big ! 0x%zx bytes (max is 0x%x)",
19092f285bddSPeter Maydell                      (size_t)spapr->rtas_size, RTAS_MAX_SIZE);
191053018216SPaolo Bonzini         exit(1);
191153018216SPaolo Bonzini     }
191253018216SPaolo Bonzini     g_free(filename);
191353018216SPaolo Bonzini 
191453018216SPaolo Bonzini     /* Set up EPOW events infrastructure */
191553018216SPaolo Bonzini     spapr_events_init(spapr);
191653018216SPaolo Bonzini 
191712f42174SDavid Gibson     /* Set up the RTC RTAS interfaces */
191828df36a1SDavid Gibson     spapr_rtc_create(spapr);
191912f42174SDavid Gibson 
192053018216SPaolo Bonzini     /* Set up VIO bus */
192153018216SPaolo Bonzini     spapr->vio_bus = spapr_vio_bus_init();
192253018216SPaolo Bonzini 
192353018216SPaolo Bonzini     for (i = 0; i < MAX_SERIAL_PORTS; i++) {
192453018216SPaolo Bonzini         if (serial_hds[i]) {
192553018216SPaolo Bonzini             spapr_vty_create(spapr->vio_bus, serial_hds[i]);
192653018216SPaolo Bonzini         }
192753018216SPaolo Bonzini     }
192853018216SPaolo Bonzini 
192953018216SPaolo Bonzini     /* We always have at least the nvram device on VIO */
193053018216SPaolo Bonzini     spapr_create_nvram(spapr);
193153018216SPaolo Bonzini 
193253018216SPaolo Bonzini     /* Set up PCI */
193353018216SPaolo Bonzini     spapr_pci_rtas_init();
193453018216SPaolo Bonzini 
193589dfd6e1SDavid Gibson     phb = spapr_create_phb(spapr, 0);
193653018216SPaolo Bonzini 
193753018216SPaolo Bonzini     for (i = 0; i < nb_nics; i++) {
193853018216SPaolo Bonzini         NICInfo *nd = &nd_table[i];
193953018216SPaolo Bonzini 
194053018216SPaolo Bonzini         if (!nd->model) {
194153018216SPaolo Bonzini             nd->model = g_strdup("ibmveth");
194253018216SPaolo Bonzini         }
194353018216SPaolo Bonzini 
194453018216SPaolo Bonzini         if (strcmp(nd->model, "ibmveth") == 0) {
194553018216SPaolo Bonzini             spapr_vlan_create(spapr->vio_bus, nd);
194653018216SPaolo Bonzini         } else {
194729b358f9SDavid Gibson             pci_nic_init_nofail(&nd_table[i], phb->bus, nd->model, NULL);
194853018216SPaolo Bonzini         }
194953018216SPaolo Bonzini     }
195053018216SPaolo Bonzini 
195153018216SPaolo Bonzini     for (i = 0; i <= drive_get_max_bus(IF_SCSI); i++) {
195253018216SPaolo Bonzini         spapr_vscsi_create(spapr->vio_bus);
195353018216SPaolo Bonzini     }
195453018216SPaolo Bonzini 
195553018216SPaolo Bonzini     /* Graphics */
195614c6a894SDavid Gibson     if (spapr_vga_init(phb->bus, &error_fatal)) {
195753018216SPaolo Bonzini         spapr->has_graphics = true;
1958c6e76503SPaolo Bonzini         machine->usb |= defaults_enabled() && !machine->usb_disabled;
195953018216SPaolo Bonzini     }
196053018216SPaolo Bonzini 
19614ee9ced9SMarcel Apfelbaum     if (machine->usb) {
196257040d45SThomas Huth         if (smc->use_ohci_by_default) {
196353018216SPaolo Bonzini             pci_create_simple(phb->bus, -1, "pci-ohci");
196457040d45SThomas Huth         } else {
196557040d45SThomas Huth             pci_create_simple(phb->bus, -1, "nec-usb-xhci");
196657040d45SThomas Huth         }
1967c86580b8SMarkus Armbruster 
196853018216SPaolo Bonzini         if (spapr->has_graphics) {
1969c86580b8SMarkus Armbruster             USBBus *usb_bus = usb_bus_find(-1);
1970c86580b8SMarkus Armbruster 
1971c86580b8SMarkus Armbruster             usb_create_simple(usb_bus, "usb-kbd");
1972c86580b8SMarkus Armbruster             usb_create_simple(usb_bus, "usb-mouse");
197353018216SPaolo Bonzini         }
197453018216SPaolo Bonzini     }
197553018216SPaolo Bonzini 
197653018216SPaolo Bonzini     if (spapr->rma_size < (MIN_RMA_SLOF << 20)) {
1977d54e4d76SDavid Gibson         error_report(
1978d54e4d76SDavid Gibson             "pSeries SLOF firmware requires >= %ldM guest RMA (Real Mode Area memory)",
1979d54e4d76SDavid Gibson             MIN_RMA_SLOF);
198053018216SPaolo Bonzini         exit(1);
198153018216SPaolo Bonzini     }
198253018216SPaolo Bonzini 
198353018216SPaolo Bonzini     if (kernel_filename) {
198453018216SPaolo Bonzini         uint64_t lowaddr = 0;
198553018216SPaolo Bonzini 
198653018216SPaolo Bonzini         kernel_size = load_elf(kernel_filename, translate_kernel_address, NULL,
19877ef295eaSPeter Crosthwaite                                NULL, &lowaddr, NULL, 1, PPC_ELF_MACHINE,
19887ef295eaSPeter Crosthwaite                                0, 0);
19893b66da82SAlexey Kardashevskiy         if (kernel_size == ELF_LOAD_WRONG_ENDIAN) {
199016457e7fSBenjamin Herrenschmidt             kernel_size = load_elf(kernel_filename,
199116457e7fSBenjamin Herrenschmidt                                    translate_kernel_address, NULL,
19927ef295eaSPeter Crosthwaite                                    NULL, &lowaddr, NULL, 0, PPC_ELF_MACHINE,
19937ef295eaSPeter Crosthwaite                                    0, 0);
199416457e7fSBenjamin Herrenschmidt             kernel_le = kernel_size > 0;
199516457e7fSBenjamin Herrenschmidt         }
199616457e7fSBenjamin Herrenschmidt         if (kernel_size < 0) {
1997d54e4d76SDavid Gibson             error_report("error loading %s: %s",
19983b66da82SAlexey Kardashevskiy                          kernel_filename, load_elf_strerror(kernel_size));
199953018216SPaolo Bonzini             exit(1);
200053018216SPaolo Bonzini         }
200153018216SPaolo Bonzini 
200253018216SPaolo Bonzini         /* load initrd */
200353018216SPaolo Bonzini         if (initrd_filename) {
200453018216SPaolo Bonzini             /* Try to locate the initrd in the gap between the kernel
200553018216SPaolo Bonzini              * and the firmware. Add a bit of space just in case
200653018216SPaolo Bonzini              */
200753018216SPaolo Bonzini             initrd_base = (KERNEL_LOAD_ADDR + kernel_size + 0x1ffff) & ~0xffff;
200853018216SPaolo Bonzini             initrd_size = load_image_targphys(initrd_filename, initrd_base,
200953018216SPaolo Bonzini                                               load_limit - initrd_base);
201053018216SPaolo Bonzini             if (initrd_size < 0) {
2011d54e4d76SDavid Gibson                 error_report("could not load initial ram disk '%s'",
201253018216SPaolo Bonzini                              initrd_filename);
201353018216SPaolo Bonzini                 exit(1);
201453018216SPaolo Bonzini             }
201553018216SPaolo Bonzini         } else {
201653018216SPaolo Bonzini             initrd_base = 0;
201753018216SPaolo Bonzini             initrd_size = 0;
201853018216SPaolo Bonzini         }
201953018216SPaolo Bonzini     }
202053018216SPaolo Bonzini 
20218e7ea787SAndreas Färber     if (bios_name == NULL) {
20228e7ea787SAndreas Färber         bios_name = FW_FILE_NAME;
20238e7ea787SAndreas Färber     }
20248e7ea787SAndreas Färber     filename = qemu_find_file(QEMU_FILE_TYPE_BIOS, bios_name);
20254c56440dSStefan Weil     if (!filename) {
202668fea5a0SThomas Huth         error_report("Could not find LPAR firmware '%s'", bios_name);
20274c56440dSStefan Weil         exit(1);
20284c56440dSStefan Weil     }
202953018216SPaolo Bonzini     fw_size = load_image_targphys(filename, 0, FW_MAX_SIZE);
203068fea5a0SThomas Huth     if (fw_size <= 0) {
203168fea5a0SThomas Huth         error_report("Could not load LPAR firmware '%s'", filename);
203253018216SPaolo Bonzini         exit(1);
203353018216SPaolo Bonzini     }
203453018216SPaolo Bonzini     g_free(filename);
203553018216SPaolo Bonzini 
203628e02042SDavid Gibson     /* FIXME: Should register things through the MachineState's qdev
203728e02042SDavid Gibson      * interface, this is a legacy from the sPAPREnvironment structure
203828e02042SDavid Gibson      * which predated MachineState but had a similar function */
20394be21d56SDavid Gibson     vmstate_register(NULL, 0, &vmstate_spapr, spapr);
20404be21d56SDavid Gibson     register_savevm_live(NULL, "spapr/htab", -1, 1,
20414be21d56SDavid Gibson                          &savevm_htab_handlers, spapr);
20424be21d56SDavid Gibson 
204353018216SPaolo Bonzini     /* Prepare the device tree */
20443bbf37f2SAndreas Färber     spapr->fdt_skel = spapr_create_fdt_skel(initrd_base, initrd_size,
204516457e7fSBenjamin Herrenschmidt                                             kernel_size, kernel_le,
204631fe14d1SNathan Fontenot                                             kernel_cmdline,
204731fe14d1SNathan Fontenot                                             spapr->check_exception_irq);
204853018216SPaolo Bonzini     assert(spapr->fdt_skel != NULL);
20495b2128d2SAlexander Graf 
205046503c2bSMichael Roth     /* used by RTAS */
205146503c2bSMichael Roth     QTAILQ_INIT(&spapr->ccs_list);
205246503c2bSMichael Roth     qemu_register_reset(spapr_ccs_reset_hook, spapr);
205346503c2bSMichael Roth 
20545b2128d2SAlexander Graf     qemu_register_boot_set(spapr_boot_set, spapr);
205553018216SPaolo Bonzini }
205653018216SPaolo Bonzini 
/*
 * Translate the "kvm-type" machine option into a numeric KVM VM type.
 *
 * Returns 0 when @vm_type is NULL, 1 for "HV" and 2 for "PR".  Any other
 * string is reported as an error and the process exits with status 1.
 */
static int spapr_kvm_type(const char *vm_type)
{
    if (vm_type == NULL) {
        return 0;
    }

    if (strcmp(vm_type, "HV") == 0) {
        return 1;
    } else if (strcmp(vm_type, "PR") == 0) {
        return 2;
    }

    error_report("Unknown kvm-type specified '%s'", vm_type);
    exit(1);
}
2074135a129aSAneesh Kumar K.V 
207571461b0fSAlexey Kardashevskiy /*
2076627b84f4SGonglei  * Implementation of an interface to adjust firmware path
207771461b0fSAlexey Kardashevskiy  * for the bootindex property handling.
207871461b0fSAlexey Kardashevskiy  */
207971461b0fSAlexey Kardashevskiy static char *spapr_get_fw_dev_path(FWPathProvider *p, BusState *bus,
208071461b0fSAlexey Kardashevskiy                                    DeviceState *dev)
208171461b0fSAlexey Kardashevskiy {
208271461b0fSAlexey Kardashevskiy #define CAST(type, obj, name) \
208371461b0fSAlexey Kardashevskiy     ((type *)object_dynamic_cast(OBJECT(obj), (name)))
208471461b0fSAlexey Kardashevskiy     SCSIDevice *d = CAST(SCSIDevice,  dev, TYPE_SCSI_DEVICE);
208571461b0fSAlexey Kardashevskiy     sPAPRPHBState *phb = CAST(sPAPRPHBState, dev, TYPE_SPAPR_PCI_HOST_BRIDGE);
208671461b0fSAlexey Kardashevskiy 
208771461b0fSAlexey Kardashevskiy     if (d) {
208871461b0fSAlexey Kardashevskiy         void *spapr = CAST(void, bus->parent, "spapr-vscsi");
208971461b0fSAlexey Kardashevskiy         VirtIOSCSI *virtio = CAST(VirtIOSCSI, bus->parent, TYPE_VIRTIO_SCSI);
209071461b0fSAlexey Kardashevskiy         USBDevice *usb = CAST(USBDevice, bus->parent, TYPE_USB_DEVICE);
209171461b0fSAlexey Kardashevskiy 
209271461b0fSAlexey Kardashevskiy         if (spapr) {
209371461b0fSAlexey Kardashevskiy             /*
209471461b0fSAlexey Kardashevskiy              * Replace "channel@0/disk@0,0" with "disk@8000000000000000":
209571461b0fSAlexey Kardashevskiy              * We use SRP luns of the form 8000 | (bus << 8) | (id << 5) | lun
209671461b0fSAlexey Kardashevskiy              * in the top 16 bits of the 64-bit LUN
209771461b0fSAlexey Kardashevskiy              */
209871461b0fSAlexey Kardashevskiy             unsigned id = 0x8000 | (d->id << 8) | d->lun;
209971461b0fSAlexey Kardashevskiy             return g_strdup_printf("%s@%"PRIX64, qdev_fw_name(dev),
210071461b0fSAlexey Kardashevskiy                                    (uint64_t)id << 48);
210171461b0fSAlexey Kardashevskiy         } else if (virtio) {
210271461b0fSAlexey Kardashevskiy             /*
210371461b0fSAlexey Kardashevskiy              * We use SRP luns of the form 01000000 | (target << 8) | lun
210471461b0fSAlexey Kardashevskiy              * in the top 32 bits of the 64-bit LUN
210571461b0fSAlexey Kardashevskiy              * Note: the quote above is from SLOF and it is wrong,
210671461b0fSAlexey Kardashevskiy              * the actual binding is:
210771461b0fSAlexey Kardashevskiy              * swap 0100 or 10 << or 20 << ( target lun-id -- srplun )
210871461b0fSAlexey Kardashevskiy              */
210971461b0fSAlexey Kardashevskiy             unsigned id = 0x1000000 | (d->id << 16) | d->lun;
211071461b0fSAlexey Kardashevskiy             return g_strdup_printf("%s@%"PRIX64, qdev_fw_name(dev),
211171461b0fSAlexey Kardashevskiy                                    (uint64_t)id << 32);
211271461b0fSAlexey Kardashevskiy         } else if (usb) {
211371461b0fSAlexey Kardashevskiy             /*
211471461b0fSAlexey Kardashevskiy              * We use SRP luns of the form 01000000 | (usb-port << 16) | lun
211571461b0fSAlexey Kardashevskiy              * in the top 32 bits of the 64-bit LUN
211671461b0fSAlexey Kardashevskiy              */
211771461b0fSAlexey Kardashevskiy             unsigned usb_port = atoi(usb->port->path);
211871461b0fSAlexey Kardashevskiy             unsigned id = 0x1000000 | (usb_port << 16) | d->lun;
211971461b0fSAlexey Kardashevskiy             return g_strdup_printf("%s@%"PRIX64, qdev_fw_name(dev),
212071461b0fSAlexey Kardashevskiy                                    (uint64_t)id << 32);
212171461b0fSAlexey Kardashevskiy         }
212271461b0fSAlexey Kardashevskiy     }
212371461b0fSAlexey Kardashevskiy 
212471461b0fSAlexey Kardashevskiy     if (phb) {
212571461b0fSAlexey Kardashevskiy         /* Replace "pci" with "pci@800000020000000" */
212671461b0fSAlexey Kardashevskiy         return g_strdup_printf("pci@%"PRIX64, phb->buid);
212771461b0fSAlexey Kardashevskiy     }
212871461b0fSAlexey Kardashevskiy 
212971461b0fSAlexey Kardashevskiy     return NULL;
213071461b0fSAlexey Kardashevskiy }
213171461b0fSAlexey Kardashevskiy 
213223825581SEduardo Habkost static char *spapr_get_kvm_type(Object *obj, Error **errp)
213323825581SEduardo Habkost {
213428e02042SDavid Gibson     sPAPRMachineState *spapr = SPAPR_MACHINE(obj);
213523825581SEduardo Habkost 
213628e02042SDavid Gibson     return g_strdup(spapr->kvm_type);
213723825581SEduardo Habkost }
213823825581SEduardo Habkost 
213923825581SEduardo Habkost static void spapr_set_kvm_type(Object *obj, const char *value, Error **errp)
214023825581SEduardo Habkost {
214128e02042SDavid Gibson     sPAPRMachineState *spapr = SPAPR_MACHINE(obj);
214223825581SEduardo Habkost 
214328e02042SDavid Gibson     g_free(spapr->kvm_type);
214428e02042SDavid Gibson     spapr->kvm_type = g_strdup(value);
214523825581SEduardo Habkost }
214623825581SEduardo Habkost 
214723825581SEduardo Habkost static void spapr_machine_initfn(Object *obj)
214823825581SEduardo Habkost {
2149715c5407SDavid Gibson     sPAPRMachineState *spapr = SPAPR_MACHINE(obj);
2150715c5407SDavid Gibson 
2151715c5407SDavid Gibson     spapr->htab_fd = -1;
215223825581SEduardo Habkost     object_property_add_str(obj, "kvm-type",
215323825581SEduardo Habkost                             spapr_get_kvm_type, spapr_set_kvm_type, NULL);
215449d2e648SMarcel Apfelbaum     object_property_set_description(obj, "kvm-type",
215549d2e648SMarcel Apfelbaum                                     "Specifies the KVM virtualization mode (HV, PR)",
215649d2e648SMarcel Apfelbaum                                     NULL);
215723825581SEduardo Habkost }
215823825581SEduardo Habkost 
215987bbdd9cSDavid Gibson static void spapr_machine_finalizefn(Object *obj)
216087bbdd9cSDavid Gibson {
216187bbdd9cSDavid Gibson     sPAPRMachineState *spapr = SPAPR_MACHINE(obj);
216287bbdd9cSDavid Gibson 
216387bbdd9cSDavid Gibson     g_free(spapr->kvm_type);
216487bbdd9cSDavid Gibson }
216587bbdd9cSDavid Gibson 
216634316482SAlexey Kardashevskiy static void ppc_cpu_do_nmi_on_cpu(void *arg)
216734316482SAlexey Kardashevskiy {
216834316482SAlexey Kardashevskiy     CPUState *cs = arg;
216934316482SAlexey Kardashevskiy 
217034316482SAlexey Kardashevskiy     cpu_synchronize_state(cs);
217134316482SAlexey Kardashevskiy     ppc_cpu_do_system_reset(cs);
217234316482SAlexey Kardashevskiy }
217334316482SAlexey Kardashevskiy 
217434316482SAlexey Kardashevskiy static void spapr_nmi(NMIState *n, int cpu_index, Error **errp)
217534316482SAlexey Kardashevskiy {
217634316482SAlexey Kardashevskiy     CPUState *cs;
217734316482SAlexey Kardashevskiy 
217834316482SAlexey Kardashevskiy     CPU_FOREACH(cs) {
217934316482SAlexey Kardashevskiy         async_run_on_cpu(cs, ppc_cpu_do_nmi_on_cpu, cs);
218034316482SAlexey Kardashevskiy     }
218134316482SAlexey Kardashevskiy }
218234316482SAlexey Kardashevskiy 
2183c20d332aSBharata B Rao static void spapr_add_lmbs(DeviceState *dev, uint64_t addr, uint64_t size,
2184c20d332aSBharata B Rao                            uint32_t node, Error **errp)
2185c20d332aSBharata B Rao {
2186c20d332aSBharata B Rao     sPAPRDRConnector *drc;
2187c20d332aSBharata B Rao     sPAPRDRConnectorClass *drck;
2188c20d332aSBharata B Rao     uint32_t nr_lmbs = size/SPAPR_MEMORY_BLOCK_SIZE;
2189c20d332aSBharata B Rao     int i, fdt_offset, fdt_size;
2190c20d332aSBharata B Rao     void *fdt;
2191c20d332aSBharata B Rao 
2192c20d332aSBharata B Rao     for (i = 0; i < nr_lmbs; i++) {
2193c20d332aSBharata B Rao         drc = spapr_dr_connector_by_id(SPAPR_DR_CONNECTOR_TYPE_LMB,
2194c20d332aSBharata B Rao                 addr/SPAPR_MEMORY_BLOCK_SIZE);
2195c20d332aSBharata B Rao         g_assert(drc);
2196c20d332aSBharata B Rao 
2197c20d332aSBharata B Rao         fdt = create_device_tree(&fdt_size);
2198c20d332aSBharata B Rao         fdt_offset = spapr_populate_memory_node(fdt, node, addr,
2199c20d332aSBharata B Rao                                                 SPAPR_MEMORY_BLOCK_SIZE);
2200c20d332aSBharata B Rao 
2201c20d332aSBharata B Rao         drck = SPAPR_DR_CONNECTOR_GET_CLASS(drc);
2202c20d332aSBharata B Rao         drck->attach(drc, dev, fdt, fdt_offset, !dev->hotplugged, errp);
2203c20d332aSBharata B Rao         addr += SPAPR_MEMORY_BLOCK_SIZE;
2204c20d332aSBharata B Rao     }
22055dd5238cSJianjun Duan     /* send hotplug notification to the
22065dd5238cSJianjun Duan      * guest only in case of hotplugged memory
22075dd5238cSJianjun Duan      */
22085dd5238cSJianjun Duan     if (dev->hotplugged) {
22090a417869SBharata B Rao        spapr_hotplug_req_add_by_count(SPAPR_DR_CONNECTOR_TYPE_LMB, nr_lmbs);
2210c20d332aSBharata B Rao     }
22115dd5238cSJianjun Duan }
2212c20d332aSBharata B Rao 
2213c20d332aSBharata B Rao static void spapr_memory_plug(HotplugHandler *hotplug_dev, DeviceState *dev,
2214c20d332aSBharata B Rao                               uint32_t node, Error **errp)
2215c20d332aSBharata B Rao {
2216c20d332aSBharata B Rao     Error *local_err = NULL;
2217c20d332aSBharata B Rao     sPAPRMachineState *ms = SPAPR_MACHINE(hotplug_dev);
2218c20d332aSBharata B Rao     PCDIMMDevice *dimm = PC_DIMM(dev);
2219c20d332aSBharata B Rao     PCDIMMDeviceClass *ddc = PC_DIMM_GET_CLASS(dimm);
2220c20d332aSBharata B Rao     MemoryRegion *mr = ddc->get_memory_region(dimm);
2221c20d332aSBharata B Rao     uint64_t align = memory_region_get_alignment(mr);
2222c20d332aSBharata B Rao     uint64_t size = memory_region_size(mr);
2223c20d332aSBharata B Rao     uint64_t addr;
2224c20d332aSBharata B Rao 
2225c20d332aSBharata B Rao     if (size % SPAPR_MEMORY_BLOCK_SIZE) {
2226c20d332aSBharata B Rao         error_setg(&local_err, "Hotplugged memory size must be a multiple of "
2227c20d332aSBharata B Rao                       "%lld MB", SPAPR_MEMORY_BLOCK_SIZE/M_BYTE);
2228c20d332aSBharata B Rao         goto out;
2229c20d332aSBharata B Rao     }
2230c20d332aSBharata B Rao 
2231d6a9b0b8SMichael S. Tsirkin     pc_dimm_memory_plug(dev, &ms->hotplug_memory, mr, align, &local_err);
2232c20d332aSBharata B Rao     if (local_err) {
2233c20d332aSBharata B Rao         goto out;
2234c20d332aSBharata B Rao     }
2235c20d332aSBharata B Rao 
2236c20d332aSBharata B Rao     addr = object_property_get_int(OBJECT(dimm), PC_DIMM_ADDR_PROP, &local_err);
2237c20d332aSBharata B Rao     if (local_err) {
2238c20d332aSBharata B Rao         pc_dimm_memory_unplug(dev, &ms->hotplug_memory, mr);
2239c20d332aSBharata B Rao         goto out;
2240c20d332aSBharata B Rao     }
2241c20d332aSBharata B Rao 
2242c20d332aSBharata B Rao     spapr_add_lmbs(dev, addr, size, node, &error_abort);
2243c20d332aSBharata B Rao 
2244c20d332aSBharata B Rao out:
2245c20d332aSBharata B Rao     error_propagate(errp, local_err);
2246c20d332aSBharata B Rao }
2247c20d332aSBharata B Rao 
2248af81cf32SBharata B Rao void *spapr_populate_hotplug_cpu_dt(CPUState *cs, int *fdt_offset,
2249af81cf32SBharata B Rao                                     sPAPRMachineState *spapr)
2250af81cf32SBharata B Rao {
2251af81cf32SBharata B Rao     PowerPCCPU *cpu = POWERPC_CPU(cs);
2252af81cf32SBharata B Rao     DeviceClass *dc = DEVICE_GET_CLASS(cs);
2253af81cf32SBharata B Rao     int id = ppc_get_vcpu_dt_id(cpu);
2254af81cf32SBharata B Rao     void *fdt;
2255af81cf32SBharata B Rao     int offset, fdt_size;
2256af81cf32SBharata B Rao     char *nodename;
2257af81cf32SBharata B Rao 
2258af81cf32SBharata B Rao     fdt = create_device_tree(&fdt_size);
2259af81cf32SBharata B Rao     nodename = g_strdup_printf("%s@%x", dc->fw_name, id);
2260af81cf32SBharata B Rao     offset = fdt_add_subnode(fdt, 0, nodename);
2261af81cf32SBharata B Rao 
2262af81cf32SBharata B Rao     spapr_populate_cpu_dt(cs, fdt, offset, spapr);
2263af81cf32SBharata B Rao     g_free(nodename);
2264af81cf32SBharata B Rao 
2265af81cf32SBharata B Rao     *fdt_offset = offset;
2266af81cf32SBharata B Rao     return fdt;
2267af81cf32SBharata B Rao }
2268af81cf32SBharata B Rao 
2269c20d332aSBharata B Rao static void spapr_machine_device_plug(HotplugHandler *hotplug_dev,
2270c20d332aSBharata B Rao                                       DeviceState *dev, Error **errp)
2271c20d332aSBharata B Rao {
2272c20d332aSBharata B Rao     sPAPRMachineClass *smc = SPAPR_MACHINE_GET_CLASS(qdev_get_machine());
2273c20d332aSBharata B Rao 
2274c20d332aSBharata B Rao     if (object_dynamic_cast(OBJECT(dev), TYPE_PC_DIMM)) {
2275b556854bSBharata B Rao         int node;
2276c20d332aSBharata B Rao 
2277c20d332aSBharata B Rao         if (!smc->dr_lmb_enabled) {
2278c20d332aSBharata B Rao             error_setg(errp, "Memory hotplug not supported for this machine");
2279c20d332aSBharata B Rao             return;
2280c20d332aSBharata B Rao         }
2281c20d332aSBharata B Rao         node = object_property_get_int(OBJECT(dev), PC_DIMM_NODE_PROP, errp);
2282c20d332aSBharata B Rao         if (*errp) {
2283c20d332aSBharata B Rao             return;
2284c20d332aSBharata B Rao         }
22851a5512bbSGonglei         if (node < 0 || node >= MAX_NODES) {
22861a5512bbSGonglei             error_setg(errp, "Invaild node %d", node);
22871a5512bbSGonglei             return;
22881a5512bbSGonglei         }
2289c20d332aSBharata B Rao 
2290b556854bSBharata B Rao         /*
2291b556854bSBharata B Rao          * Currently PowerPC kernel doesn't allow hot-adding memory to
2292b556854bSBharata B Rao          * memory-less node, but instead will silently add the memory
2293b556854bSBharata B Rao          * to the first node that has some memory. This causes two
2294b556854bSBharata B Rao          * unexpected behaviours for the user.
2295b556854bSBharata B Rao          *
2296b556854bSBharata B Rao          * - Memory gets hotplugged to a different node than what the user
2297b556854bSBharata B Rao          *   specified.
2298b556854bSBharata B Rao          * - Since pc-dimm subsystem in QEMU still thinks that memory belongs
2299b556854bSBharata B Rao          *   to memory-less node, a reboot will set things accordingly
2300b556854bSBharata B Rao          *   and the previously hotplugged memory now ends in the right node.
2301b556854bSBharata B Rao          *   This appears as if some memory moved from one node to another.
2302b556854bSBharata B Rao          *
2303b556854bSBharata B Rao          * So until kernel starts supporting memory hotplug to memory-less
2304b556854bSBharata B Rao          * nodes, just prevent such attempts upfront in QEMU.
2305b556854bSBharata B Rao          */
2306b556854bSBharata B Rao         if (nb_numa_nodes && !numa_info[node].node_mem) {
2307b556854bSBharata B Rao             error_setg(errp, "Can't hotplug memory to memory-less node %d",
2308b556854bSBharata B Rao                        node);
2309b556854bSBharata B Rao             return;
2310b556854bSBharata B Rao         }
2311b556854bSBharata B Rao 
2312c20d332aSBharata B Rao         spapr_memory_plug(hotplug_dev, dev, node, errp);
2313af81cf32SBharata B Rao     } else if (object_dynamic_cast(OBJECT(dev), TYPE_SPAPR_CPU_CORE)) {
2314af81cf32SBharata B Rao         spapr_core_plug(hotplug_dev, dev, errp);
2315c20d332aSBharata B Rao     }
2316c20d332aSBharata B Rao }
2317c20d332aSBharata B Rao 
2318c20d332aSBharata B Rao static void spapr_machine_device_unplug(HotplugHandler *hotplug_dev,
2319c20d332aSBharata B Rao                                       DeviceState *dev, Error **errp)
2320c20d332aSBharata B Rao {
23216f4b5c3eSBharata B Rao     sPAPRMachineClass *smc = SPAPR_MACHINE_GET_CLASS(qdev_get_machine());
23226f4b5c3eSBharata B Rao 
2323c20d332aSBharata B Rao     if (object_dynamic_cast(OBJECT(dev), TYPE_PC_DIMM)) {
2324c20d332aSBharata B Rao         error_setg(errp, "Memory hot unplug not supported by sPAPR");
23256f4b5c3eSBharata B Rao     } else if (object_dynamic_cast(OBJECT(dev), TYPE_SPAPR_CPU_CORE)) {
23266f4b5c3eSBharata B Rao         if (!smc->dr_cpu_enabled) {
23276f4b5c3eSBharata B Rao             error_setg(errp, "CPU hot unplug not supported on this machine");
23286f4b5c3eSBharata B Rao             return;
23296f4b5c3eSBharata B Rao         }
23306f4b5c3eSBharata B Rao         spapr_core_unplug(hotplug_dev, dev, errp);
2331c20d332aSBharata B Rao     }
2332c20d332aSBharata B Rao }
2333c20d332aSBharata B Rao 
233494a94e4cSBharata B Rao static void spapr_machine_device_pre_plug(HotplugHandler *hotplug_dev,
233594a94e4cSBharata B Rao                                           DeviceState *dev, Error **errp)
233694a94e4cSBharata B Rao {
233794a94e4cSBharata B Rao     if (object_dynamic_cast(OBJECT(dev), TYPE_SPAPR_CPU_CORE)) {
233894a94e4cSBharata B Rao         spapr_core_pre_plug(hotplug_dev, dev, errp);
233994a94e4cSBharata B Rao     }
234094a94e4cSBharata B Rao }
234194a94e4cSBharata B Rao 
2342c20d332aSBharata B Rao static HotplugHandler *spapr_get_hotpug_handler(MachineState *machine,
2343c20d332aSBharata B Rao                                              DeviceState *dev)
2344c20d332aSBharata B Rao {
234594a94e4cSBharata B Rao     if (object_dynamic_cast(OBJECT(dev), TYPE_PC_DIMM) ||
234694a94e4cSBharata B Rao         object_dynamic_cast(OBJECT(dev), TYPE_SPAPR_CPU_CORE)) {
2347c20d332aSBharata B Rao         return HOTPLUG_HANDLER(machine);
2348c20d332aSBharata B Rao     }
2349c20d332aSBharata B Rao     return NULL;
2350c20d332aSBharata B Rao }
2351c20d332aSBharata B Rao 
235220bb648dSDavid Gibson static unsigned spapr_cpu_index_to_socket_id(unsigned cpu_index)
235320bb648dSDavid Gibson {
235420bb648dSDavid Gibson     /* Allocate to NUMA nodes on a "socket" basis (not that concept of
235520bb648dSDavid Gibson      * socket means much for the paravirtualized PAPR platform) */
235620bb648dSDavid Gibson     return cpu_index / smp_threads / smp_cores;
235720bb648dSDavid Gibson }
235820bb648dSDavid Gibson 
23592474bfd4SIgor Mammedov static HotpluggableCPUList *spapr_query_hotpluggable_cpus(MachineState *machine)
23602474bfd4SIgor Mammedov {
23612474bfd4SIgor Mammedov     int i;
23622474bfd4SIgor Mammedov     HotpluggableCPUList *head = NULL;
23632474bfd4SIgor Mammedov     sPAPRMachineState *spapr = SPAPR_MACHINE(machine);
23642474bfd4SIgor Mammedov     int spapr_max_cores = max_cpus / smp_threads;
23652474bfd4SIgor Mammedov     int smt = kvmppc_smt_threads();
23662474bfd4SIgor Mammedov 
23672474bfd4SIgor Mammedov     for (i = 0; i < spapr_max_cores; i++) {
23682474bfd4SIgor Mammedov         HotpluggableCPUList *list_item = g_new0(typeof(*list_item), 1);
23692474bfd4SIgor Mammedov         HotpluggableCPU *cpu_item = g_new0(typeof(*cpu_item), 1);
23702474bfd4SIgor Mammedov         CpuInstanceProperties *cpu_props = g_new0(typeof(*cpu_props), 1);
23712474bfd4SIgor Mammedov 
23722474bfd4SIgor Mammedov         cpu_item->type = spapr_get_cpu_core_type(machine->cpu_model);
23732474bfd4SIgor Mammedov         cpu_item->vcpus_count = smp_threads;
237427393c33SPeter Krempa         cpu_props->has_core_id = true;
237527393c33SPeter Krempa         cpu_props->core_id = i * smt;
23762474bfd4SIgor Mammedov         /* TODO: add 'has_node/node' here to describe
23772474bfd4SIgor Mammedov            to which node core belongs */
23782474bfd4SIgor Mammedov 
23792474bfd4SIgor Mammedov         cpu_item->props = cpu_props;
23802474bfd4SIgor Mammedov         if (spapr->cores[i]) {
23812474bfd4SIgor Mammedov             cpu_item->has_qom_path = true;
23822474bfd4SIgor Mammedov             cpu_item->qom_path = object_get_canonical_path(spapr->cores[i]);
23832474bfd4SIgor Mammedov         }
23842474bfd4SIgor Mammedov         list_item->value = cpu_item;
23852474bfd4SIgor Mammedov         list_item->next = head;
23862474bfd4SIgor Mammedov         head = list_item;
23872474bfd4SIgor Mammedov     }
23882474bfd4SIgor Mammedov     return head;
23892474bfd4SIgor Mammedov }
23902474bfd4SIgor Mammedov 
239129ee3247SAlexey Kardashevskiy static void spapr_machine_class_init(ObjectClass *oc, void *data)
239253018216SPaolo Bonzini {
239329ee3247SAlexey Kardashevskiy     MachineClass *mc = MACHINE_CLASS(oc);
2394224245bfSDavid Gibson     sPAPRMachineClass *smc = SPAPR_MACHINE_CLASS(oc);
239571461b0fSAlexey Kardashevskiy     FWPathProviderClass *fwc = FW_PATH_PROVIDER_CLASS(oc);
239634316482SAlexey Kardashevskiy     NMIClass *nc = NMI_CLASS(oc);
2397c20d332aSBharata B Rao     HotplugHandlerClass *hc = HOTPLUG_HANDLER_CLASS(oc);
239829ee3247SAlexey Kardashevskiy 
23990eb9054cSDavid Gibson     mc->desc = "pSeries Logical Partition (PAPR compliant)";
2400fc9f38c3SDavid Gibson 
2401fc9f38c3SDavid Gibson     /*
2402fc9f38c3SDavid Gibson      * We set up the default / latest behaviour here.  The class_init
2403fc9f38c3SDavid Gibson      * functions for the specific versioned machine types can override
2404fc9f38c3SDavid Gibson      * these details for backwards compatibility
2405fc9f38c3SDavid Gibson      */
2406958db90cSMarcel Apfelbaum     mc->init = ppc_spapr_init;
2407958db90cSMarcel Apfelbaum     mc->reset = ppc_spapr_reset;
2408958db90cSMarcel Apfelbaum     mc->block_default_type = IF_SCSI;
240938b02bd8SAlexey Kardashevskiy     mc->max_cpus = MAX_CPUMASK_BITS;
2410958db90cSMarcel Apfelbaum     mc->no_parallel = 1;
24115b2128d2SAlexander Graf     mc->default_boot_order = "";
2412a34944feSNikunj A Dadhania     mc->default_ram_size = 512 * M_BYTE;
2413958db90cSMarcel Apfelbaum     mc->kvm_type = spapr_kvm_type;
24149e3f9733SAlexander Graf     mc->has_dynamic_sysbus = true;
2415e4024630SLaurent Vivier     mc->pci_allow_0_address = true;
2416c20d332aSBharata B Rao     mc->get_hotplug_handler = spapr_get_hotpug_handler;
241794a94e4cSBharata B Rao     hc->pre_plug = spapr_machine_device_pre_plug;
2418c20d332aSBharata B Rao     hc->plug = spapr_machine_device_plug;
2419c20d332aSBharata B Rao     hc->unplug = spapr_machine_device_unplug;
242020bb648dSDavid Gibson     mc->cpu_index_to_socket_id = spapr_cpu_index_to_socket_id;
24212474bfd4SIgor Mammedov     mc->query_hotpluggable_cpus = spapr_query_hotpluggable_cpus;
242200b4fbe2SMarcel Apfelbaum 
2423fc9f38c3SDavid Gibson     smc->dr_lmb_enabled = true;
242494a94e4cSBharata B Rao     smc->dr_cpu_enabled = true;
242571461b0fSAlexey Kardashevskiy     fwc->get_dev_path = spapr_get_fw_dev_path;
242634316482SAlexey Kardashevskiy     nc->nmi_monitor_handler = spapr_nmi;
242753018216SPaolo Bonzini }
242853018216SPaolo Bonzini 
242929ee3247SAlexey Kardashevskiy static const TypeInfo spapr_machine_info = {
243029ee3247SAlexey Kardashevskiy     .name          = TYPE_SPAPR_MACHINE,
243129ee3247SAlexey Kardashevskiy     .parent        = TYPE_MACHINE,
24324aee7362SDavid Gibson     .abstract      = true,
24336ca1502eSAlexey Kardashevskiy     .instance_size = sizeof(sPAPRMachineState),
243423825581SEduardo Habkost     .instance_init = spapr_machine_initfn,
243587bbdd9cSDavid Gibson     .instance_finalize = spapr_machine_finalizefn,
2436183930c0SDavid Gibson     .class_size    = sizeof(sPAPRMachineClass),
243729ee3247SAlexey Kardashevskiy     .class_init    = spapr_machine_class_init,
243871461b0fSAlexey Kardashevskiy     .interfaces = (InterfaceInfo[]) {
243971461b0fSAlexey Kardashevskiy         { TYPE_FW_PATH_PROVIDER },
244034316482SAlexey Kardashevskiy         { TYPE_NMI },
2441c20d332aSBharata B Rao         { TYPE_HOTPLUG_HANDLER },
244271461b0fSAlexey Kardashevskiy         { }
244371461b0fSAlexey Kardashevskiy     },
244429ee3247SAlexey Kardashevskiy };
244529ee3247SAlexey Kardashevskiy 
/*
 * Define and register the versioned machine type "pseries-<verstr>".
 *
 * The user must provide spapr_machine_<suffix>_class_options() and
 * spapr_machine_<suffix>_instance_options(); they are called from the
 * generated class_init and instance_init functions respectively.  When
 * @latest is true the type additionally gets the "pseries" alias and is
 * flagged as the default machine.
 */
#define DEFINE_SPAPR_MACHINE(suffix, verstr, latest)                     \
    static void spapr_machine_##suffix##_class_init(ObjectClass *oc,     \
                                                    void *data)          \
    {                                                                    \
        MachineClass *machine_class = MACHINE_CLASS(oc);                 \
                                                                         \
        spapr_machine_##suffix##_class_options(machine_class);           \
        if (latest) {                                                    \
            machine_class->alias = "pseries";                            \
            machine_class->is_default = 1;                               \
        }                                                                \
    }                                                                    \
                                                                         \
    static void spapr_machine_##suffix##_instance_init(Object *obj)      \
    {                                                                    \
        spapr_machine_##suffix##_instance_options(MACHINE(obj));         \
    }                                                                    \
                                                                         \
    static const TypeInfo spapr_machine_##suffix##_info = {              \
        .name          = MACHINE_TYPE_NAME("pseries-" verstr),           \
        .parent        = TYPE_SPAPR_MACHINE,                             \
        .class_init    = spapr_machine_##suffix##_class_init,            \
        .instance_init = spapr_machine_##suffix##_instance_init,         \
    };                                                                   \
                                                                         \
    static void spapr_machine_register_##suffix(void)                    \
    {                                                                    \
        type_register(&spapr_machine_##suffix##_info);                   \
    }                                                                    \
    type_init(spapr_machine_register_##suffix)
24735013c547SDavid Gibson 
24741c5f29bbSDavid Gibson /*
24751ea1eefcSBharata B Rao  * pseries-2.7
24761ea1eefcSBharata B Rao  */
24771ea1eefcSBharata B Rao static void spapr_machine_2_7_instance_options(MachineState *machine)
24781ea1eefcSBharata B Rao {
24791ea1eefcSBharata B Rao }
24801ea1eefcSBharata B Rao 
24811ea1eefcSBharata B Rao static void spapr_machine_2_7_class_options(MachineClass *mc)
24821ea1eefcSBharata B Rao {
24831ea1eefcSBharata B Rao     /* Defaults for the latest behaviour inherited from the base class */
24841ea1eefcSBharata B Rao }
24851ea1eefcSBharata B Rao 
24861ea1eefcSBharata B Rao DEFINE_SPAPR_MACHINE(2_7, "2.7", true);
24871ea1eefcSBharata B Rao 
24881ea1eefcSBharata B Rao /*
24894b23699cSDavid Gibson  * pseries-2.6
24904b23699cSDavid Gibson  */
24911ea1eefcSBharata B Rao #define SPAPR_COMPAT_2_6 \
2492*ae4de14cSAlexey Kardashevskiy     HW_COMPAT_2_6 \
2493*ae4de14cSAlexey Kardashevskiy     { \
2494*ae4de14cSAlexey Kardashevskiy         .driver   = TYPE_SPAPR_PCI_HOST_BRIDGE,\
2495*ae4de14cSAlexey Kardashevskiy         .property = "ddw",\
2496*ae4de14cSAlexey Kardashevskiy         .value    = stringify(off),\
2497*ae4de14cSAlexey Kardashevskiy     },
24981ea1eefcSBharata B Rao 
24994b23699cSDavid Gibson static void spapr_machine_2_6_instance_options(MachineState *machine)
25004b23699cSDavid Gibson {
25014b23699cSDavid Gibson }
25024b23699cSDavid Gibson 
25034b23699cSDavid Gibson static void spapr_machine_2_6_class_options(MachineClass *mc)
25044b23699cSDavid Gibson {
250594a94e4cSBharata B Rao     sPAPRMachineClass *smc = SPAPR_MACHINE_CLASS(mc);
250694a94e4cSBharata B Rao 
25071ea1eefcSBharata B Rao     spapr_machine_2_7_class_options(mc);
250894a94e4cSBharata B Rao     smc->dr_cpu_enabled = false;
25091ea1eefcSBharata B Rao     SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_6);
25104b23699cSDavid Gibson }
25114b23699cSDavid Gibson 
25121ea1eefcSBharata B Rao DEFINE_SPAPR_MACHINE(2_6, "2.6", false);
25134b23699cSDavid Gibson 
25144b23699cSDavid Gibson /*
25151c5f29bbSDavid Gibson  * pseries-2.5
25161c5f29bbSDavid Gibson  */
25174b23699cSDavid Gibson #define SPAPR_COMPAT_2_5 \
251857c522f4SThomas Huth     HW_COMPAT_2_5 \
251957c522f4SThomas Huth     { \
252057c522f4SThomas Huth         .driver   = "spapr-vlan", \
252157c522f4SThomas Huth         .property = "use-rx-buffer-pools", \
252257c522f4SThomas Huth         .value    = "off", \
252357c522f4SThomas Huth     },
25244b23699cSDavid Gibson 
25255013c547SDavid Gibson static void spapr_machine_2_5_instance_options(MachineState *machine)
25261c5f29bbSDavid Gibson {
25275013c547SDavid Gibson }
25285013c547SDavid Gibson 
25295013c547SDavid Gibson static void spapr_machine_2_5_class_options(MachineClass *mc)
25305013c547SDavid Gibson {
253157040d45SThomas Huth     sPAPRMachineClass *smc = SPAPR_MACHINE_CLASS(mc);
253257040d45SThomas Huth 
25334b23699cSDavid Gibson     spapr_machine_2_6_class_options(mc);
253457040d45SThomas Huth     smc->use_ohci_by_default = true;
25354b23699cSDavid Gibson     SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_5);
25361c5f29bbSDavid Gibson }
25371c5f29bbSDavid Gibson 
25384b23699cSDavid Gibson DEFINE_SPAPR_MACHINE(2_5, "2.5", false);
25391c5f29bbSDavid Gibson 
25401c5f29bbSDavid Gibson /*
25411c5f29bbSDavid Gibson  * pseries-2.4
25421c5f29bbSDavid Gibson  */
254380fd50f9SCornelia Huck #define SPAPR_COMPAT_2_4 \
254480fd50f9SCornelia Huck         HW_COMPAT_2_4
254580fd50f9SCornelia Huck 
25465013c547SDavid Gibson static void spapr_machine_2_4_instance_options(MachineState *machine)
25471c5f29bbSDavid Gibson {
25485013c547SDavid Gibson     spapr_machine_2_5_instance_options(machine);
25495013c547SDavid Gibson }
25501c5f29bbSDavid Gibson 
25515013c547SDavid Gibson static void spapr_machine_2_4_class_options(MachineClass *mc)
25525013c547SDavid Gibson {
2553fc9f38c3SDavid Gibson     sPAPRMachineClass *smc = SPAPR_MACHINE_CLASS(mc);
2554fc9f38c3SDavid Gibson 
2555fc9f38c3SDavid Gibson     spapr_machine_2_5_class_options(mc);
2556fc9f38c3SDavid Gibson     smc->dr_lmb_enabled = false;
2557f949b4e5SDavid Gibson     SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_4);
25581c5f29bbSDavid Gibson }
25591c5f29bbSDavid Gibson 
2560fccbc785SDavid Gibson DEFINE_SPAPR_MACHINE(2_4, "2.4", false);
25611c5f29bbSDavid Gibson 
25621c5f29bbSDavid Gibson /*
25631c5f29bbSDavid Gibson  * pseries-2.3
25641c5f29bbSDavid Gibson  */
256538ff32c6SEduardo Habkost #define SPAPR_COMPAT_2_3 \
25667619c7b0SMichael Roth         HW_COMPAT_2_3 \
25677619c7b0SMichael Roth         {\
25687619c7b0SMichael Roth             .driver   = "spapr-pci-host-bridge",\
25697619c7b0SMichael Roth             .property = "dynamic-reconfiguration",\
25707619c7b0SMichael Roth             .value    = "off",\
25717619c7b0SMichael Roth         },
257238ff32c6SEduardo Habkost 
25735013c547SDavid Gibson static void spapr_machine_2_3_instance_options(MachineState *machine)
25741c5f29bbSDavid Gibson {
25755013c547SDavid Gibson     spapr_machine_2_4_instance_options(machine);
25761c5f29bbSDavid Gibson     savevm_skip_section_footers();
25771c5f29bbSDavid Gibson     global_state_set_optional();
257809b5e30dSGreg Kurz     savevm_skip_configuration();
25791c5f29bbSDavid Gibson }
25801c5f29bbSDavid Gibson 
25815013c547SDavid Gibson static void spapr_machine_2_3_class_options(MachineClass *mc)
25821c5f29bbSDavid Gibson {
2583fc9f38c3SDavid Gibson     spapr_machine_2_4_class_options(mc);
2584f949b4e5SDavid Gibson     SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_3);
25851c5f29bbSDavid Gibson }
2586fccbc785SDavid Gibson DEFINE_SPAPR_MACHINE(2_3, "2.3", false);
25871c5f29bbSDavid Gibson 
25881c5f29bbSDavid Gibson /*
25891c5f29bbSDavid Gibson  * pseries-2.2
25901c5f29bbSDavid Gibson  */
25911c5f29bbSDavid Gibson 
2592b194df47SAlexey Kardashevskiy #define SPAPR_COMPAT_2_2 \
25934dfd8eaaSEduardo Habkost         HW_COMPAT_2_2 \
2594b194df47SAlexey Kardashevskiy         {\
2595b194df47SAlexey Kardashevskiy             .driver   = TYPE_SPAPR_PCI_HOST_BRIDGE,\
2596b194df47SAlexey Kardashevskiy             .property = "mem_win_size",\
2597b194df47SAlexey Kardashevskiy             .value    = "0x20000000",\
2598dd754bafSEduardo Habkost         },
2599b194df47SAlexey Kardashevskiy 
26005013c547SDavid Gibson static void spapr_machine_2_2_instance_options(MachineState *machine)
2601b0e966d0SJason Wang {
26025013c547SDavid Gibson     spapr_machine_2_3_instance_options(machine);
2603cba0e779SGreg Kurz     machine->suppress_vmdesc = true;
2604b0e966d0SJason Wang }
2605b0e966d0SJason Wang 
26065013c547SDavid Gibson static void spapr_machine_2_2_class_options(MachineClass *mc)
2607b0e966d0SJason Wang {
2608fc9f38c3SDavid Gibson     spapr_machine_2_3_class_options(mc);
2609f949b4e5SDavid Gibson     SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_2);
26101c5f29bbSDavid Gibson }
2611fccbc785SDavid Gibson DEFINE_SPAPR_MACHINE(2_2, "2.2", false);
26121c5f29bbSDavid Gibson 
26131c5f29bbSDavid Gibson /*
26141c5f29bbSDavid Gibson  * pseries-2.1
26151c5f29bbSDavid Gibson  */
26161c5f29bbSDavid Gibson #define SPAPR_COMPAT_2_1 \
26171c5f29bbSDavid Gibson         HW_COMPAT_2_1
26181c5f29bbSDavid Gibson 
26195013c547SDavid Gibson static void spapr_machine_2_1_instance_options(MachineState *machine)
26201c5f29bbSDavid Gibson {
26215013c547SDavid Gibson     spapr_machine_2_2_instance_options(machine);
26221c5f29bbSDavid Gibson }
26231c5f29bbSDavid Gibson 
26245013c547SDavid Gibson static void spapr_machine_2_1_class_options(MachineClass *mc)
2625b0e966d0SJason Wang {
2626fc9f38c3SDavid Gibson     spapr_machine_2_2_class_options(mc);
2627f949b4e5SDavid Gibson     SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_1);
26286026db45SAlexey Kardashevskiy }
2629fccbc785SDavid Gibson DEFINE_SPAPR_MACHINE(2_1, "2.1", false);
26306026db45SAlexey Kardashevskiy 
263129ee3247SAlexey Kardashevskiy static void spapr_machine_register_types(void)
263229ee3247SAlexey Kardashevskiy {
263329ee3247SAlexey Kardashevskiy     type_register_static(&spapr_machine_info);
263429ee3247SAlexey Kardashevskiy }
263529ee3247SAlexey Kardashevskiy 
263629ee3247SAlexey Kardashevskiy type_init(spapr_machine_register_types)
2637