xref: /openbmc/qemu/hw/ppc/spapr.c (revision 6cc09e26)
153018216SPaolo Bonzini /*
253018216SPaolo Bonzini  * QEMU PowerPC pSeries Logical Partition (aka sPAPR) hardware System Emulator
353018216SPaolo Bonzini  *
453018216SPaolo Bonzini  * Copyright (c) 2004-2007 Fabrice Bellard
553018216SPaolo Bonzini  * Copyright (c) 2007 Jocelyn Mayer
653018216SPaolo Bonzini  * Copyright (c) 2010 David Gibson, IBM Corporation.
753018216SPaolo Bonzini  *
853018216SPaolo Bonzini  * Permission is hereby granted, free of charge, to any person obtaining a copy
953018216SPaolo Bonzini  * of this software and associated documentation files (the "Software"), to deal
1053018216SPaolo Bonzini  * in the Software without restriction, including without limitation the rights
1153018216SPaolo Bonzini  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
1253018216SPaolo Bonzini  * copies of the Software, and to permit persons to whom the Software is
1353018216SPaolo Bonzini  * furnished to do so, subject to the following conditions:
1453018216SPaolo Bonzini  *
1553018216SPaolo Bonzini  * The above copyright notice and this permission notice shall be included in
1653018216SPaolo Bonzini  * all copies or substantial portions of the Software.
1753018216SPaolo Bonzini  *
1853018216SPaolo Bonzini  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
1953018216SPaolo Bonzini  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
2053018216SPaolo Bonzini  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
2153018216SPaolo Bonzini  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
2253018216SPaolo Bonzini  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
2353018216SPaolo Bonzini  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
2453018216SPaolo Bonzini  * THE SOFTWARE.
2553018216SPaolo Bonzini  *
2653018216SPaolo Bonzini  */
270d75590dSPeter Maydell #include "qemu/osdep.h"
28da34e65cSMarkus Armbruster #include "qapi/error.h"
2953018216SPaolo Bonzini #include "sysemu/sysemu.h"
30e35704baSEduardo Habkost #include "sysemu/numa.h"
3153018216SPaolo Bonzini #include "hw/hw.h"
3203dd024fSPaolo Bonzini #include "qemu/log.h"
3371461b0fSAlexey Kardashevskiy #include "hw/fw-path-provider.h"
3453018216SPaolo Bonzini #include "elf.h"
3553018216SPaolo Bonzini #include "net/net.h"
36ad440b4aSAndrew Jones #include "sysemu/device_tree.h"
37fa1d36dfSMarkus Armbruster #include "sysemu/block-backend.h"
3853018216SPaolo Bonzini #include "sysemu/cpus.h"
3953018216SPaolo Bonzini #include "sysemu/kvm.h"
40c20d332aSBharata B Rao #include "sysemu/device_tree.h"
4153018216SPaolo Bonzini #include "kvm_ppc.h"
42ff14e817SDr. David Alan Gilbert #include "migration/migration.h"
434be21d56SDavid Gibson #include "mmu-hash64.h"
443794d548SAlexey Kardashevskiy #include "qom/cpu.h"
4553018216SPaolo Bonzini 
4653018216SPaolo Bonzini #include "hw/boards.h"
470d09e41aSPaolo Bonzini #include "hw/ppc/ppc.h"
4853018216SPaolo Bonzini #include "hw/loader.h"
4953018216SPaolo Bonzini 
500d09e41aSPaolo Bonzini #include "hw/ppc/spapr.h"
510d09e41aSPaolo Bonzini #include "hw/ppc/spapr_vio.h"
520d09e41aSPaolo Bonzini #include "hw/pci-host/spapr.h"
530d09e41aSPaolo Bonzini #include "hw/ppc/xics.h"
5453018216SPaolo Bonzini #include "hw/pci/msi.h"
5553018216SPaolo Bonzini 
5653018216SPaolo Bonzini #include "hw/pci/pci.h"
5771461b0fSAlexey Kardashevskiy #include "hw/scsi/scsi.h"
5871461b0fSAlexey Kardashevskiy #include "hw/virtio/virtio-scsi.h"
5953018216SPaolo Bonzini 
6053018216SPaolo Bonzini #include "exec/address-spaces.h"
6153018216SPaolo Bonzini #include "hw/usb.h"
6253018216SPaolo Bonzini #include "qemu/config-file.h"
63135a129aSAneesh Kumar K.V #include "qemu/error-report.h"
642a6593cbSAlexey Kardashevskiy #include "trace.h"
6534316482SAlexey Kardashevskiy #include "hw/nmi.h"
6653018216SPaolo Bonzini 
6768a27b20SMichael S. Tsirkin #include "hw/compat.h"
68f348b6d1SVeronia Bahaa #include "qemu/cutils.h"
6994a94e4cSBharata B Rao #include "hw/ppc/spapr_cpu_core.h"
702474bfd4SIgor Mammedov #include "qmp-commands.h"
7168a27b20SMichael S. Tsirkin 
7253018216SPaolo Bonzini #include <libfdt.h>
7353018216SPaolo Bonzini 
/* SLOF memory layout:
 *
 * SLOF raw image loaded at 0, copies its romfs right below the flat
 * device-tree, then positions SLOF itself 31M below that
 *
 * So we set FW_OVERHEAD to 40MB which should account for all of that
 * and more
 *
 * We load our kernel at 4M, leaving space for SLOF initial image
 */
/* Size (1 MiB) of the buffer in which the flattened device tree is built */
#define FDT_MAX_SIZE            0x100000
/* 64 KiB; NOTE(review): presumably the upper bound for the RTAS blob */
#define RTAS_MAX_SIZE           0x10000
#define RTAS_MAX_ADDR           0x80000000 /* RTAS must stay below that */
/* 4 MiB reserved at address 0 for the SLOF initial image (see above) */
#define FW_MAX_SIZE             0x400000
#define FW_FILE_NAME            "slof.bin"
/* 40 MiB, see the layout description above */
#define FW_OVERHEAD             0x2800000
/* The kernel is loaded right after the space kept for the firmware image */
#define KERNEL_LOAD_ADDR        FW_MAX_SIZE

/* NOTE(review): unit is not visible here, presumably MiB -- confirm at users */
#define MIN_RMA_SLOF            128UL

/* phandle value given to the "interrupt-controller" device tree node */
#define PHANDLE_XICP            0x00001111

/* 2^htab_shift, computed in 64 bits so large shifts do not overflow int */
#define HTAB_SIZE(spapr)        (1ULL << ((spapr)->htab_shift))
9753018216SPaolo Bonzini 
98c04d6cfaSAnthony Liguori static XICSState *try_create_xics(const char *type, int nr_servers,
9934f2af3dSMarkus Armbruster                                   int nr_irqs, Error **errp)
100c04d6cfaSAnthony Liguori {
10134f2af3dSMarkus Armbruster     Error *err = NULL;
102c04d6cfaSAnthony Liguori     DeviceState *dev;
103c04d6cfaSAnthony Liguori 
104c04d6cfaSAnthony Liguori     dev = qdev_create(NULL, type);
105c04d6cfaSAnthony Liguori     qdev_prop_set_uint32(dev, "nr_servers", nr_servers);
106c04d6cfaSAnthony Liguori     qdev_prop_set_uint32(dev, "nr_irqs", nr_irqs);
10734f2af3dSMarkus Armbruster     object_property_set_bool(OBJECT(dev), true, "realized", &err);
10834f2af3dSMarkus Armbruster     if (err) {
10934f2af3dSMarkus Armbruster         error_propagate(errp, err);
11034f2af3dSMarkus Armbruster         object_unparent(OBJECT(dev));
111c04d6cfaSAnthony Liguori         return NULL;
112c04d6cfaSAnthony Liguori     }
1135a3d7b23SAlexey Kardashevskiy     return XICS_COMMON(dev);
114c04d6cfaSAnthony Liguori }
115c04d6cfaSAnthony Liguori 
116446f16a6SMarcel Apfelbaum static XICSState *xics_system_init(MachineState *machine,
1171e49182dSDavid Gibson                                    int nr_servers, int nr_irqs, Error **errp)
118c04d6cfaSAnthony Liguori {
119c04d6cfaSAnthony Liguori     XICSState *icp = NULL;
120c04d6cfaSAnthony Liguori 
12111ad93f6SDavid Gibson     if (kvm_enabled()) {
12234f2af3dSMarkus Armbruster         Error *err = NULL;
12334f2af3dSMarkus Armbruster 
124446f16a6SMarcel Apfelbaum         if (machine_kernel_irqchip_allowed(machine)) {
12534f2af3dSMarkus Armbruster             icp = try_create_xics(TYPE_KVM_XICS, nr_servers, nr_irqs, &err);
12611ad93f6SDavid Gibson         }
127446f16a6SMarcel Apfelbaum         if (machine_kernel_irqchip_required(machine) && !icp) {
128b83baa60SMarkus Armbruster             error_reportf_err(err,
129b83baa60SMarkus Armbruster                               "kernel_irqchip requested but unavailable: ");
130b83baa60SMarkus Armbruster         } else {
131903a41d3SStefano Dong (董兴水)             error_free(err);
13211ad93f6SDavid Gibson         }
133b83baa60SMarkus Armbruster     }
13411ad93f6SDavid Gibson 
13511ad93f6SDavid Gibson     if (!icp) {
1361e49182dSDavid Gibson         icp = try_create_xics(TYPE_XICS, nr_servers, nr_irqs, errp);
137c04d6cfaSAnthony Liguori     }
138c04d6cfaSAnthony Liguori 
139c04d6cfaSAnthony Liguori     return icp;
140c04d6cfaSAnthony Liguori }
141c04d6cfaSAnthony Liguori 
142833d4668SAlexey Kardashevskiy static int spapr_fixup_cpu_smt_dt(void *fdt, int offset, PowerPCCPU *cpu,
143833d4668SAlexey Kardashevskiy                                   int smt_threads)
144833d4668SAlexey Kardashevskiy {
145833d4668SAlexey Kardashevskiy     int i, ret = 0;
146833d4668SAlexey Kardashevskiy     uint32_t servers_prop[smt_threads];
147833d4668SAlexey Kardashevskiy     uint32_t gservers_prop[smt_threads * 2];
148833d4668SAlexey Kardashevskiy     int index = ppc_get_vcpu_dt_id(cpu);
149833d4668SAlexey Kardashevskiy 
1506d9412eaSAlexey Kardashevskiy     if (cpu->cpu_version) {
1514bce526eSLaurent Dufour         ret = fdt_setprop_cell(fdt, offset, "cpu-version", cpu->cpu_version);
1526d9412eaSAlexey Kardashevskiy         if (ret < 0) {
1536d9412eaSAlexey Kardashevskiy             return ret;
1546d9412eaSAlexey Kardashevskiy         }
1556d9412eaSAlexey Kardashevskiy     }
1566d9412eaSAlexey Kardashevskiy 
157833d4668SAlexey Kardashevskiy     /* Build interrupt servers and gservers properties */
158833d4668SAlexey Kardashevskiy     for (i = 0; i < smt_threads; i++) {
159833d4668SAlexey Kardashevskiy         servers_prop[i] = cpu_to_be32(index + i);
160833d4668SAlexey Kardashevskiy         /* Hack, direct the group queues back to cpu 0 */
161833d4668SAlexey Kardashevskiy         gservers_prop[i*2] = cpu_to_be32(index + i);
162833d4668SAlexey Kardashevskiy         gservers_prop[i*2 + 1] = 0;
163833d4668SAlexey Kardashevskiy     }
164833d4668SAlexey Kardashevskiy     ret = fdt_setprop(fdt, offset, "ibm,ppc-interrupt-server#s",
165833d4668SAlexey Kardashevskiy                       servers_prop, sizeof(servers_prop));
166833d4668SAlexey Kardashevskiy     if (ret < 0) {
167833d4668SAlexey Kardashevskiy         return ret;
168833d4668SAlexey Kardashevskiy     }
169833d4668SAlexey Kardashevskiy     ret = fdt_setprop(fdt, offset, "ibm,ppc-interrupt-gserver#s",
170833d4668SAlexey Kardashevskiy                       gservers_prop, sizeof(gservers_prop));
171833d4668SAlexey Kardashevskiy 
172833d4668SAlexey Kardashevskiy     return ret;
173833d4668SAlexey Kardashevskiy }
174833d4668SAlexey Kardashevskiy 
1750da6f3feSBharata B Rao static int spapr_fixup_cpu_numa_dt(void *fdt, int offset, CPUState *cs)
1760da6f3feSBharata B Rao {
1770da6f3feSBharata B Rao     int ret = 0;
1780da6f3feSBharata B Rao     PowerPCCPU *cpu = POWERPC_CPU(cs);
1790da6f3feSBharata B Rao     int index = ppc_get_vcpu_dt_id(cpu);
1800da6f3feSBharata B Rao     uint32_t associativity[] = {cpu_to_be32(0x5),
1810da6f3feSBharata B Rao                                 cpu_to_be32(0x0),
1820da6f3feSBharata B Rao                                 cpu_to_be32(0x0),
1830da6f3feSBharata B Rao                                 cpu_to_be32(0x0),
1840da6f3feSBharata B Rao                                 cpu_to_be32(cs->numa_node),
1850da6f3feSBharata B Rao                                 cpu_to_be32(index)};
1860da6f3feSBharata B Rao 
1870da6f3feSBharata B Rao     /* Advertise NUMA via ibm,associativity */
1880da6f3feSBharata B Rao     if (nb_numa_nodes > 1) {
1890da6f3feSBharata B Rao         ret = fdt_setprop(fdt, offset, "ibm,associativity", associativity,
1900da6f3feSBharata B Rao                           sizeof(associativity));
1910da6f3feSBharata B Rao     }
1920da6f3feSBharata B Rao 
1930da6f3feSBharata B Rao     return ret;
1940da6f3feSBharata B Rao }
1950da6f3feSBharata B Rao 
19628e02042SDavid Gibson static int spapr_fixup_cpu_dt(void *fdt, sPAPRMachineState *spapr)
19753018216SPaolo Bonzini {
19882677ed2SAlexey Kardashevskiy     int ret = 0, offset, cpus_offset;
19982677ed2SAlexey Kardashevskiy     CPUState *cs;
20053018216SPaolo Bonzini     char cpu_model[32];
20153018216SPaolo Bonzini     int smt = kvmppc_smt_threads();
20253018216SPaolo Bonzini     uint32_t pft_size_prop[] = {0, cpu_to_be32(spapr->htab_shift)};
20353018216SPaolo Bonzini 
20482677ed2SAlexey Kardashevskiy     CPU_FOREACH(cs) {
20582677ed2SAlexey Kardashevskiy         PowerPCCPU *cpu = POWERPC_CPU(cs);
20682677ed2SAlexey Kardashevskiy         DeviceClass *dc = DEVICE_GET_CLASS(cs);
20782677ed2SAlexey Kardashevskiy         int index = ppc_get_vcpu_dt_id(cpu);
20853018216SPaolo Bonzini 
2090f20ba62SAlexey Kardashevskiy         if ((index % smt) != 0) {
21053018216SPaolo Bonzini             continue;
21153018216SPaolo Bonzini         }
21253018216SPaolo Bonzini 
21382677ed2SAlexey Kardashevskiy         snprintf(cpu_model, 32, "%s@%x", dc->fw_name, index);
21453018216SPaolo Bonzini 
21582677ed2SAlexey Kardashevskiy         cpus_offset = fdt_path_offset(fdt, "/cpus");
21682677ed2SAlexey Kardashevskiy         if (cpus_offset < 0) {
21782677ed2SAlexey Kardashevskiy             cpus_offset = fdt_add_subnode(fdt, fdt_path_offset(fdt, "/"),
21882677ed2SAlexey Kardashevskiy                                           "cpus");
21982677ed2SAlexey Kardashevskiy             if (cpus_offset < 0) {
22082677ed2SAlexey Kardashevskiy                 return cpus_offset;
22182677ed2SAlexey Kardashevskiy             }
22282677ed2SAlexey Kardashevskiy         }
22382677ed2SAlexey Kardashevskiy         offset = fdt_subnode_offset(fdt, cpus_offset, cpu_model);
22482677ed2SAlexey Kardashevskiy         if (offset < 0) {
22582677ed2SAlexey Kardashevskiy             offset = fdt_add_subnode(fdt, cpus_offset, cpu_model);
22653018216SPaolo Bonzini             if (offset < 0) {
22753018216SPaolo Bonzini                 return offset;
22853018216SPaolo Bonzini             }
22982677ed2SAlexey Kardashevskiy         }
23053018216SPaolo Bonzini 
2310da6f3feSBharata B Rao         ret = fdt_setprop(fdt, offset, "ibm,pft-size",
2320da6f3feSBharata B Rao                           pft_size_prop, sizeof(pft_size_prop));
23353018216SPaolo Bonzini         if (ret < 0) {
23453018216SPaolo Bonzini             return ret;
23553018216SPaolo Bonzini         }
23653018216SPaolo Bonzini 
2370da6f3feSBharata B Rao         ret = spapr_fixup_cpu_numa_dt(fdt, offset, cs);
23853018216SPaolo Bonzini         if (ret < 0) {
23953018216SPaolo Bonzini             return ret;
24053018216SPaolo Bonzini         }
241833d4668SAlexey Kardashevskiy 
24282677ed2SAlexey Kardashevskiy         ret = spapr_fixup_cpu_smt_dt(fdt, offset, cpu,
2432a48d993SAlexey Kardashevskiy                                      ppc_get_compat_smt_threads(cpu));
244833d4668SAlexey Kardashevskiy         if (ret < 0) {
245833d4668SAlexey Kardashevskiy             return ret;
246833d4668SAlexey Kardashevskiy         }
24753018216SPaolo Bonzini     }
24853018216SPaolo Bonzini     return ret;
24953018216SPaolo Bonzini }
25053018216SPaolo Bonzini 
25153018216SPaolo Bonzini 
25253018216SPaolo Bonzini static size_t create_page_sizes_prop(CPUPPCState *env, uint32_t *prop,
25353018216SPaolo Bonzini                                      size_t maxsize)
25453018216SPaolo Bonzini {
25553018216SPaolo Bonzini     size_t maxcells = maxsize / sizeof(uint32_t);
25653018216SPaolo Bonzini     int i, j, count;
25753018216SPaolo Bonzini     uint32_t *p = prop;
25853018216SPaolo Bonzini 
25953018216SPaolo Bonzini     for (i = 0; i < PPC_PAGE_SIZES_MAX_SZ; i++) {
26053018216SPaolo Bonzini         struct ppc_one_seg_page_size *sps = &env->sps.sps[i];
26153018216SPaolo Bonzini 
26253018216SPaolo Bonzini         if (!sps->page_shift) {
26353018216SPaolo Bonzini             break;
26453018216SPaolo Bonzini         }
26553018216SPaolo Bonzini         for (count = 0; count < PPC_PAGE_SIZES_MAX_SZ; count++) {
26653018216SPaolo Bonzini             if (sps->enc[count].page_shift == 0) {
26753018216SPaolo Bonzini                 break;
26853018216SPaolo Bonzini             }
26953018216SPaolo Bonzini         }
27053018216SPaolo Bonzini         if ((p - prop) >= (maxcells - 3 - count * 2)) {
27153018216SPaolo Bonzini             break;
27253018216SPaolo Bonzini         }
27353018216SPaolo Bonzini         *(p++) = cpu_to_be32(sps->page_shift);
27453018216SPaolo Bonzini         *(p++) = cpu_to_be32(sps->slb_enc);
27553018216SPaolo Bonzini         *(p++) = cpu_to_be32(count);
27653018216SPaolo Bonzini         for (j = 0; j < count; j++) {
27753018216SPaolo Bonzini             *(p++) = cpu_to_be32(sps->enc[j].page_shift);
27853018216SPaolo Bonzini             *(p++) = cpu_to_be32(sps->enc[j].pte_enc);
27953018216SPaolo Bonzini         }
28053018216SPaolo Bonzini     }
28153018216SPaolo Bonzini 
28253018216SPaolo Bonzini     return (p - prop) * sizeof(uint32_t);
28353018216SPaolo Bonzini }
28453018216SPaolo Bonzini 
285b082d65aSAlexey Kardashevskiy static hwaddr spapr_node0_size(void)
286b082d65aSAlexey Kardashevskiy {
287fb164994SDavid Gibson     MachineState *machine = MACHINE(qdev_get_machine());
288fb164994SDavid Gibson 
289b082d65aSAlexey Kardashevskiy     if (nb_numa_nodes) {
290b082d65aSAlexey Kardashevskiy         int i;
291b082d65aSAlexey Kardashevskiy         for (i = 0; i < nb_numa_nodes; ++i) {
292b082d65aSAlexey Kardashevskiy             if (numa_info[i].node_mem) {
293fb164994SDavid Gibson                 return MIN(pow2floor(numa_info[i].node_mem),
294fb164994SDavid Gibson                            machine->ram_size);
295b082d65aSAlexey Kardashevskiy             }
296b082d65aSAlexey Kardashevskiy         }
297b082d65aSAlexey Kardashevskiy     }
298fb164994SDavid Gibson     return machine->ram_size;
299b082d65aSAlexey Kardashevskiy }
300b082d65aSAlexey Kardashevskiy 
/*
 * Evaluate the libfdt expression @exp exactly once; if it yields a negative
 * value, print the expression text and the libfdt error string to stderr
 * and terminate with exit status 1.
 *
 * The temporary has a deliberately unusual name so that an argument which
 * itself mentions a caller variable called "ret" is not captured by the
 * macro's own local.
 */
#define _FDT(exp) \
    do { \
        int fdt_ret_ = (exp);                                      \
        if (fdt_ret_ < 0) {                                        \
            fprintf(stderr, "qemu: error creating device tree: %s: %s\n", \
                    #exp, fdt_strerror(fdt_ret_));                 \
            exit(1);                                               \
        }                                                          \
    } while (0)
31053018216SPaolo Bonzini 
311a1d59c0fSAlexey Kardashevskiy static void add_str(GString *s, const gchar *s1)
312a1d59c0fSAlexey Kardashevskiy {
313a1d59c0fSAlexey Kardashevskiy     g_string_append_len(s, s1, strlen(s1) + 1);
314a1d59c0fSAlexey Kardashevskiy }
31553018216SPaolo Bonzini 
/*
 * Build the skeleton flattened device tree with libfdt's sequential-write
 * calls (fdt_create() ... fdt_finish()).  Nodes and properties are emitted
 * strictly in call order, so the statement order below is significant.
 *
 * @initrd_base, @initrd_size: initrd location; reserved in the memory
 *     reservation map when @initrd_size is non-zero, and always exported
 *     (as 32-bit cells) through linux,initrd-start / linux,initrd-end
 * @kernel_size: when non-zero, KERNEL_LOAD_ADDR..+@kernel_size is reserved
 *     and described by "qemu,boot-kernel"
 * @little_endian: adds "qemu,boot-kernel-le" (only when @kernel_size != 0)
 * @kernel_cmdline: stored as /chosen "bootargs"
 * @epow_irq: handed to spapr_events_fdt_skel()
 *
 * Returns a g_malloc0()ed buffer of FDT_MAX_SIZE bytes holding the finished
 * tree.  Any libfdt failure terminates the process through _FDT().
 */
static void *spapr_create_fdt_skel(hwaddr initrd_base,
                                   hwaddr initrd_size,
                                   hwaddr kernel_size,
                                   bool little_endian,
                                   const char *kernel_cmdline,
                                   uint32_t epow_irq)
{
    void *fdt;
    /* Note: hwaddr values are narrowed to 32 bits for these two cells */
    uint32_t start_prop = cpu_to_be32(initrd_base);
    uint32_t end_prop = cpu_to_be32(initrd_base + initrd_size);
    GString *hypertas = g_string_sized_new(256);
    GString *qemu_hypertas = g_string_sized_new(256);
    uint32_t refpoints[] = {cpu_to_be32(0x4), cpu_to_be32(0x4)};
    uint32_t interrupt_server_ranges_prop[] = {0, cpu_to_be32(max_cpus)};
    unsigned char vec5[] = {0x0, 0x0, 0x0, 0x0, 0x0, 0x80};
    char *buf;

    /*
     * Each add_str() appends the name plus its NUL terminator, producing
     * the string-list payload of the *hypertas-functions properties.
     */
    add_str(hypertas, "hcall-pft");
    add_str(hypertas, "hcall-term");
    add_str(hypertas, "hcall-dabr");
    add_str(hypertas, "hcall-interrupt");
    add_str(hypertas, "hcall-tce");
    add_str(hypertas, "hcall-vio");
    add_str(hypertas, "hcall-splpar");
    add_str(hypertas, "hcall-bulk");
    add_str(hypertas, "hcall-set-mode");
    add_str(hypertas, "hcall-sprg0");
    add_str(hypertas, "hcall-copy");
    add_str(hypertas, "hcall-debug");
    add_str(qemu_hypertas, "hcall-memop1");

    fdt = g_malloc0(FDT_MAX_SIZE);
    _FDT((fdt_create(fdt, FDT_MAX_SIZE)));

    /* Memory reservation map: keep the kernel and initrd images intact */
    if (kernel_size) {
        _FDT((fdt_add_reservemap_entry(fdt, KERNEL_LOAD_ADDR, kernel_size)));
    }
    if (initrd_size) {
        _FDT((fdt_add_reservemap_entry(fdt, initrd_base, initrd_size)));
    }
    _FDT((fdt_finish_reservemap(fdt)));

    /* Root node */
    _FDT((fdt_begin_node(fdt, "")));
    _FDT((fdt_property_string(fdt, "device_type", "chrp")));
    _FDT((fdt_property_string(fdt, "model", "IBM pSeries (emulated by qemu)")));
    _FDT((fdt_property_string(fdt, "compatible", "qemu,pseries")));

    /*
     * Add info to guest to identify which host it is being run on
     * and what the uuid of the guest is
     */
    if (kvmppc_get_host_model(&buf)) {
        _FDT((fdt_property_string(fdt, "host-model", buf)));
        g_free(buf);
    }
    if (kvmppc_get_host_serial(&buf)) {
        _FDT((fdt_property_string(fdt, "host-serial", buf)));
        g_free(buf);
    }

    buf = g_strdup_printf(UUID_FMT, qemu_uuid[0], qemu_uuid[1],
                          qemu_uuid[2], qemu_uuid[3], qemu_uuid[4],
                          qemu_uuid[5], qemu_uuid[6], qemu_uuid[7],
                          qemu_uuid[8], qemu_uuid[9], qemu_uuid[10],
                          qemu_uuid[11], qemu_uuid[12], qemu_uuid[13],
                          qemu_uuid[14], qemu_uuid[15]);

    /* "vm,uuid" is always present; "system-id" only if a UUID was set */
    _FDT((fdt_property_string(fdt, "vm,uuid", buf)));
    if (qemu_uuid_set) {
        _FDT((fdt_property_string(fdt, "system-id", buf)));
    }
    g_free(buf);

    if (qemu_get_vm_name()) {
        _FDT((fdt_property_string(fdt, "ibm,partition-name",
                                  qemu_get_vm_name())));
    }

    _FDT((fdt_property_cell(fdt, "#address-cells", 0x2)));
    _FDT((fdt_property_cell(fdt, "#size-cells", 0x2)));

    /* /chosen */
    _FDT((fdt_begin_node(fdt, "chosen")));

    /* Set Form1_affinity */
    _FDT((fdt_property(fdt, "ibm,architecture-vec-5", vec5, sizeof(vec5))));

    _FDT((fdt_property_string(fdt, "bootargs", kernel_cmdline)));
    /* The initrd bounds are written even when no initrd was supplied */
    _FDT((fdt_property(fdt, "linux,initrd-start",
                       &start_prop, sizeof(start_prop))));
    _FDT((fdt_property(fdt, "linux,initrd-end",
                       &end_prop, sizeof(end_prop))));
    if (kernel_size) {
        /* (load address, size) pair as two big-endian 64-bit values */
        uint64_t kprop[2] = { cpu_to_be64(KERNEL_LOAD_ADDR),
                              cpu_to_be64(kernel_size) };

        _FDT((fdt_property(fdt, "qemu,boot-kernel", &kprop, sizeof(kprop))));
        if (little_endian) {
            _FDT((fdt_property(fdt, "qemu,boot-kernel-le", NULL, 0)));
        }
    }
    if (boot_menu) {
        _FDT((fdt_property_cell(fdt, "qemu,boot-menu", boot_menu)));
    }
    _FDT((fdt_property_cell(fdt, "qemu,graphic-width", graphic_width)));
    _FDT((fdt_property_cell(fdt, "qemu,graphic-height", graphic_height)));
    _FDT((fdt_property_cell(fdt, "qemu,graphic-depth", graphic_depth)));

    _FDT((fdt_end_node(fdt)));

    /* RTAS */
    _FDT((fdt_begin_node(fdt, "rtas")));

    /* Multi-TCE is advertised without KVM, or when KVM reports support */
    if (!kvm_enabled() || kvmppc_spapr_use_multitce()) {
        add_str(hypertas, "hcall-multi-tce");
    }
    _FDT((fdt_property(fdt, "ibm,hypertas-functions", hypertas->str,
                       hypertas->len)));
    g_string_free(hypertas, TRUE);
    _FDT((fdt_property(fdt, "qemu,hypertas-functions", qemu_hypertas->str,
                       qemu_hypertas->len)));
    g_string_free(qemu_hypertas, TRUE);

    _FDT((fdt_property(fdt, "ibm,associativity-reference-points",
        refpoints, sizeof(refpoints))));

    _FDT((fdt_property_cell(fdt, "rtas-error-log-max", RTAS_ERROR_LOG_MAX)));
    _FDT((fdt_property_cell(fdt, "rtas-event-scan-rate",
                            RTAS_EVENT_SCAN_RATE)));

    if (msi_nonbroken) {
        _FDT((fdt_property(fdt, "ibm,change-msix-capable", NULL, 0)));
    }

    /*
     * According to PAPR, rtas ibm,os-term does not guarantee a return
     * back to the guest cpu.
     *
     * While an additional ibm,extended-os-term property indicates that
     * rtas call return will always occur. Set this property.
     */
    _FDT((fdt_property(fdt, "ibm,extended-os-term", NULL, 0)));

    _FDT((fdt_end_node(fdt)));

    /* interrupt controller */
    _FDT((fdt_begin_node(fdt, "interrupt-controller")));

    _FDT((fdt_property_string(fdt, "device_type",
                              "PowerPC-External-Interrupt-Presentation")));
    _FDT((fdt_property_string(fdt, "compatible", "IBM,ppc-xicp")));
    _FDT((fdt_property(fdt, "interrupt-controller", NULL, 0)));
    _FDT((fdt_property(fdt, "ibm,interrupt-server-ranges",
                       interrupt_server_ranges_prop,
                       sizeof(interrupt_server_ranges_prop))));
    _FDT((fdt_property_cell(fdt, "#interrupt-cells", 2)));
    _FDT((fdt_property_cell(fdt, "linux,phandle", PHANDLE_XICP)));
    _FDT((fdt_property_cell(fdt, "phandle", PHANDLE_XICP)));

    _FDT((fdt_end_node(fdt)));

    /* vdevice */
    _FDT((fdt_begin_node(fdt, "vdevice")));

    _FDT((fdt_property_string(fdt, "device_type", "vdevice")));
    _FDT((fdt_property_string(fdt, "compatible", "IBM,vdevice")));
    _FDT((fdt_property_cell(fdt, "#address-cells", 0x1)));
    _FDT((fdt_property_cell(fdt, "#size-cells", 0x0)));
    _FDT((fdt_property_cell(fdt, "#interrupt-cells", 0x2)));
    _FDT((fdt_property(fdt, "interrupt-controller", NULL, 0)));

    _FDT((fdt_end_node(fdt)));

    /* event-sources */
    spapr_events_fdt_skel(fdt, epow_irq);

    /* /hypervisor node */
    if (kvm_enabled()) {
        uint8_t hypercall[16];

        /* indicate KVM hypercall interface */
        _FDT((fdt_begin_node(fdt, "hypervisor")));
        _FDT((fdt_property_string(fdt, "compatible", "linux,kvm")));
        if (kvmppc_has_cap_fixup_hcalls()) {
            /*
             * Older KVM versions with older guest kernels were broken with the
             * magic page, don't allow the guest to map it.
             */
            /* Property is only added when the query returns zero */
            if (!kvmppc_get_hypercall(first_cpu->env_ptr, hypercall,
                                      sizeof(hypercall))) {
                _FDT((fdt_property(fdt, "hcall-instructions", hypercall,
                                   sizeof(hypercall))));
            }
        }
        _FDT((fdt_end_node(fdt)));
    }

    _FDT((fdt_end_node(fdt))); /* close root node */
    _FDT((fdt_finish(fdt)));

    return fdt;
}
51953018216SPaolo Bonzini 
52003d196b7SBharata B Rao static int spapr_populate_memory_node(void *fdt, int nodeid, hwaddr start,
52126a8c353SAlexey Kardashevskiy                                        hwaddr size)
52226a8c353SAlexey Kardashevskiy {
52326a8c353SAlexey Kardashevskiy     uint32_t associativity[] = {
52426a8c353SAlexey Kardashevskiy         cpu_to_be32(0x4), /* length */
52526a8c353SAlexey Kardashevskiy         cpu_to_be32(0x0), cpu_to_be32(0x0),
526c3b4f589SAlexey Kardashevskiy         cpu_to_be32(0x0), cpu_to_be32(nodeid)
52726a8c353SAlexey Kardashevskiy     };
52826a8c353SAlexey Kardashevskiy     char mem_name[32];
52926a8c353SAlexey Kardashevskiy     uint64_t mem_reg_property[2];
53026a8c353SAlexey Kardashevskiy     int off;
53126a8c353SAlexey Kardashevskiy 
53226a8c353SAlexey Kardashevskiy     mem_reg_property[0] = cpu_to_be64(start);
53326a8c353SAlexey Kardashevskiy     mem_reg_property[1] = cpu_to_be64(size);
53426a8c353SAlexey Kardashevskiy 
53526a8c353SAlexey Kardashevskiy     sprintf(mem_name, "memory@" TARGET_FMT_lx, start);
53626a8c353SAlexey Kardashevskiy     off = fdt_add_subnode(fdt, 0, mem_name);
53726a8c353SAlexey Kardashevskiy     _FDT(off);
53826a8c353SAlexey Kardashevskiy     _FDT((fdt_setprop_string(fdt, off, "device_type", "memory")));
53926a8c353SAlexey Kardashevskiy     _FDT((fdt_setprop(fdt, off, "reg", mem_reg_property,
54026a8c353SAlexey Kardashevskiy                       sizeof(mem_reg_property))));
54126a8c353SAlexey Kardashevskiy     _FDT((fdt_setprop(fdt, off, "ibm,associativity", associativity,
54226a8c353SAlexey Kardashevskiy                       sizeof(associativity))));
54303d196b7SBharata B Rao     return off;
54426a8c353SAlexey Kardashevskiy }
54526a8c353SAlexey Kardashevskiy 
54628e02042SDavid Gibson static int spapr_populate_memory(sPAPRMachineState *spapr, void *fdt)
54753018216SPaolo Bonzini {
548fb164994SDavid Gibson     MachineState *machine = MACHINE(spapr);
5497db8a127SAlexey Kardashevskiy     hwaddr mem_start, node_size;
5507db8a127SAlexey Kardashevskiy     int i, nb_nodes = nb_numa_nodes;
5517db8a127SAlexey Kardashevskiy     NodeInfo *nodes = numa_info;
5527db8a127SAlexey Kardashevskiy     NodeInfo ramnode;
55353018216SPaolo Bonzini 
5547db8a127SAlexey Kardashevskiy     /* No NUMA nodes, assume there is just one node with whole RAM */
5557db8a127SAlexey Kardashevskiy     if (!nb_numa_nodes) {
5567db8a127SAlexey Kardashevskiy         nb_nodes = 1;
557fb164994SDavid Gibson         ramnode.node_mem = machine->ram_size;
5587db8a127SAlexey Kardashevskiy         nodes = &ramnode;
5595fe269b1SPaul Mackerras     }
56053018216SPaolo Bonzini 
5617db8a127SAlexey Kardashevskiy     for (i = 0, mem_start = 0; i < nb_nodes; ++i) {
5627db8a127SAlexey Kardashevskiy         if (!nodes[i].node_mem) {
5637db8a127SAlexey Kardashevskiy             continue;
56453018216SPaolo Bonzini         }
565fb164994SDavid Gibson         if (mem_start >= machine->ram_size) {
5665fe269b1SPaul Mackerras             node_size = 0;
5675fe269b1SPaul Mackerras         } else {
5687db8a127SAlexey Kardashevskiy             node_size = nodes[i].node_mem;
569fb164994SDavid Gibson             if (node_size > machine->ram_size - mem_start) {
570fb164994SDavid Gibson                 node_size = machine->ram_size - mem_start;
5715fe269b1SPaul Mackerras             }
5725fe269b1SPaul Mackerras         }
5737db8a127SAlexey Kardashevskiy         if (!mem_start) {
5747db8a127SAlexey Kardashevskiy             /* ppc_spapr_init() checks for rma_size <= node0_size already */
575e8f986fcSBharata B Rao             spapr_populate_memory_node(fdt, i, 0, spapr->rma_size);
5767db8a127SAlexey Kardashevskiy             mem_start += spapr->rma_size;
5777db8a127SAlexey Kardashevskiy             node_size -= spapr->rma_size;
5787db8a127SAlexey Kardashevskiy         }
5796010818cSAlexey Kardashevskiy         for ( ; node_size; ) {
5806010818cSAlexey Kardashevskiy             hwaddr sizetmp = pow2floor(node_size);
5816010818cSAlexey Kardashevskiy 
5826010818cSAlexey Kardashevskiy             /* mem_start != 0 here */
5836010818cSAlexey Kardashevskiy             if (ctzl(mem_start) < ctzl(sizetmp)) {
5846010818cSAlexey Kardashevskiy                 sizetmp = 1ULL << ctzl(mem_start);
5856010818cSAlexey Kardashevskiy             }
5866010818cSAlexey Kardashevskiy 
5876010818cSAlexey Kardashevskiy             spapr_populate_memory_node(fdt, i, mem_start, sizetmp);
5886010818cSAlexey Kardashevskiy             node_size -= sizetmp;
5896010818cSAlexey Kardashevskiy             mem_start += sizetmp;
5906010818cSAlexey Kardashevskiy         }
59153018216SPaolo Bonzini     }
59253018216SPaolo Bonzini 
59353018216SPaolo Bonzini     return 0;
59453018216SPaolo Bonzini }
59553018216SPaolo Bonzini 
5960da6f3feSBharata B Rao static void spapr_populate_cpu_dt(CPUState *cs, void *fdt, int offset,
5970da6f3feSBharata B Rao                                   sPAPRMachineState *spapr)
5980da6f3feSBharata B Rao {
5990da6f3feSBharata B Rao     PowerPCCPU *cpu = POWERPC_CPU(cs);
6000da6f3feSBharata B Rao     CPUPPCState *env = &cpu->env;
6010da6f3feSBharata B Rao     PowerPCCPUClass *pcc = POWERPC_CPU_GET_CLASS(cs);
6020da6f3feSBharata B Rao     int index = ppc_get_vcpu_dt_id(cpu);
6030da6f3feSBharata B Rao     uint32_t segs[] = {cpu_to_be32(28), cpu_to_be32(40),
6040da6f3feSBharata B Rao                        0xffffffff, 0xffffffff};
605afd10a0fSBharata B Rao     uint32_t tbfreq = kvm_enabled() ? kvmppc_get_tbfreq()
606afd10a0fSBharata B Rao         : SPAPR_TIMEBASE_FREQ;
6070da6f3feSBharata B Rao     uint32_t cpufreq = kvm_enabled() ? kvmppc_get_clockfreq() : 1000000000;
6080da6f3feSBharata B Rao     uint32_t page_sizes_prop[64];
6090da6f3feSBharata B Rao     size_t page_sizes_prop_size;
61022419c2aSDavid Gibson     uint32_t vcpus_per_socket = smp_threads * smp_cores;
6110da6f3feSBharata B Rao     uint32_t pft_size_prop[] = {0, cpu_to_be32(spapr->htab_shift)};
612af81cf32SBharata B Rao     sPAPRDRConnector *drc;
613af81cf32SBharata B Rao     sPAPRDRConnectorClass *drck;
614af81cf32SBharata B Rao     int drc_index;
615af81cf32SBharata B Rao 
616af81cf32SBharata B Rao     drc = spapr_dr_connector_by_id(SPAPR_DR_CONNECTOR_TYPE_CPU, index);
617af81cf32SBharata B Rao     if (drc) {
618af81cf32SBharata B Rao         drck = SPAPR_DR_CONNECTOR_GET_CLASS(drc);
619af81cf32SBharata B Rao         drc_index = drck->get_index(drc);
620af81cf32SBharata B Rao         _FDT((fdt_setprop_cell(fdt, offset, "ibm,my-drc-index", drc_index)));
621af81cf32SBharata B Rao     }
6220da6f3feSBharata B Rao 
62390da0d5aSBenjamin Herrenschmidt     /* Note: we keep CI large pages off for now because a 64K capable guest
62490da0d5aSBenjamin Herrenschmidt      * provisioned with large pages might otherwise try to map a qemu
62590da0d5aSBenjamin Herrenschmidt      * framebuffer (or other kind of memory mapped PCI BAR) using 64K pages
62690da0d5aSBenjamin Herrenschmidt      * even if that qemu runs on a 4k host.
62790da0d5aSBenjamin Herrenschmidt      *
62890da0d5aSBenjamin Herrenschmidt      * We can later add this bit back when we are confident this is not
62990da0d5aSBenjamin Herrenschmidt      * an issue (!HV KVM or 64K host)
63090da0d5aSBenjamin Herrenschmidt      */
63190da0d5aSBenjamin Herrenschmidt     uint8_t pa_features_206[] = { 6, 0,
63290da0d5aSBenjamin Herrenschmidt         0xf6, 0x1f, 0xc7, 0x00, 0x80, 0xc0 };
63390da0d5aSBenjamin Herrenschmidt     uint8_t pa_features_207[] = { 24, 0,
63490da0d5aSBenjamin Herrenschmidt         0xf6, 0x1f, 0xc7, 0xc0, 0x80, 0xf0,
63590da0d5aSBenjamin Herrenschmidt         0x80, 0x00, 0x00, 0x00, 0x00, 0x00,
63690da0d5aSBenjamin Herrenschmidt         0x00, 0x00, 0x00, 0x00, 0x80, 0x00,
63790da0d5aSBenjamin Herrenschmidt         0x80, 0x00, 0x80, 0x00, 0x80, 0x00 };
63890da0d5aSBenjamin Herrenschmidt     uint8_t *pa_features;
63990da0d5aSBenjamin Herrenschmidt     size_t pa_size;
64090da0d5aSBenjamin Herrenschmidt 
6410da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "reg", index)));
6420da6f3feSBharata B Rao     _FDT((fdt_setprop_string(fdt, offset, "device_type", "cpu")));
6430da6f3feSBharata B Rao 
6440da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "cpu-version", env->spr[SPR_PVR])));
6450da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "d-cache-block-size",
6460da6f3feSBharata B Rao                            env->dcache_line_size)));
6470da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "d-cache-line-size",
6480da6f3feSBharata B Rao                            env->dcache_line_size)));
6490da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "i-cache-block-size",
6500da6f3feSBharata B Rao                            env->icache_line_size)));
6510da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "i-cache-line-size",
6520da6f3feSBharata B Rao                            env->icache_line_size)));
6530da6f3feSBharata B Rao 
6540da6f3feSBharata B Rao     if (pcc->l1_dcache_size) {
6550da6f3feSBharata B Rao         _FDT((fdt_setprop_cell(fdt, offset, "d-cache-size",
6560da6f3feSBharata B Rao                                pcc->l1_dcache_size)));
6570da6f3feSBharata B Rao     } else {
6580da6f3feSBharata B Rao         fprintf(stderr, "Warning: Unknown L1 dcache size for cpu\n");
6590da6f3feSBharata B Rao     }
6600da6f3feSBharata B Rao     if (pcc->l1_icache_size) {
6610da6f3feSBharata B Rao         _FDT((fdt_setprop_cell(fdt, offset, "i-cache-size",
6620da6f3feSBharata B Rao                                pcc->l1_icache_size)));
6630da6f3feSBharata B Rao     } else {
6640da6f3feSBharata B Rao         fprintf(stderr, "Warning: Unknown L1 icache size for cpu\n");
6650da6f3feSBharata B Rao     }
6660da6f3feSBharata B Rao 
6670da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "timebase-frequency", tbfreq)));
6680da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "clock-frequency", cpufreq)));
669fd5da5c4SThomas Huth     _FDT((fdt_setprop_cell(fdt, offset, "slb-size", env->slb_nr)));
6700da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "ibm,slb-size", env->slb_nr)));
6710da6f3feSBharata B Rao     _FDT((fdt_setprop_string(fdt, offset, "status", "okay")));
6720da6f3feSBharata B Rao     _FDT((fdt_setprop(fdt, offset, "64-bit", NULL, 0)));
6730da6f3feSBharata B Rao 
6740da6f3feSBharata B Rao     if (env->spr_cb[SPR_PURR].oea_read) {
6750da6f3feSBharata B Rao         _FDT((fdt_setprop(fdt, offset, "ibm,purr", NULL, 0)));
6760da6f3feSBharata B Rao     }
6770da6f3feSBharata B Rao 
6780da6f3feSBharata B Rao     if (env->mmu_model & POWERPC_MMU_1TSEG) {
6790da6f3feSBharata B Rao         _FDT((fdt_setprop(fdt, offset, "ibm,processor-segment-sizes",
6800da6f3feSBharata B Rao                           segs, sizeof(segs))));
6810da6f3feSBharata B Rao     }
6820da6f3feSBharata B Rao 
6830da6f3feSBharata B Rao     /* Advertise VMX/VSX (vector extensions) if available
6840da6f3feSBharata B Rao      *   0 / no property == no vector extensions
6850da6f3feSBharata B Rao      *   1               == VMX / Altivec available
6860da6f3feSBharata B Rao      *   2               == VSX available */
6870da6f3feSBharata B Rao     if (env->insns_flags & PPC_ALTIVEC) {
6880da6f3feSBharata B Rao         uint32_t vmx = (env->insns_flags2 & PPC2_VSX) ? 2 : 1;
6890da6f3feSBharata B Rao 
6900da6f3feSBharata B Rao         _FDT((fdt_setprop_cell(fdt, offset, "ibm,vmx", vmx)));
6910da6f3feSBharata B Rao     }
6920da6f3feSBharata B Rao 
6930da6f3feSBharata B Rao     /* Advertise DFP (Decimal Floating Point) if available
6940da6f3feSBharata B Rao      *   0 / no property == no DFP
6950da6f3feSBharata B Rao      *   1               == DFP available */
6960da6f3feSBharata B Rao     if (env->insns_flags2 & PPC2_DFP) {
6970da6f3feSBharata B Rao         _FDT((fdt_setprop_cell(fdt, offset, "ibm,dfp", 1)));
6980da6f3feSBharata B Rao     }
6990da6f3feSBharata B Rao 
7000da6f3feSBharata B Rao     page_sizes_prop_size = create_page_sizes_prop(env, page_sizes_prop,
7010da6f3feSBharata B Rao                                                   sizeof(page_sizes_prop));
7020da6f3feSBharata B Rao     if (page_sizes_prop_size) {
7030da6f3feSBharata B Rao         _FDT((fdt_setprop(fdt, offset, "ibm,segment-page-sizes",
7040da6f3feSBharata B Rao                           page_sizes_prop, page_sizes_prop_size)));
7050da6f3feSBharata B Rao     }
7060da6f3feSBharata B Rao 
70790da0d5aSBenjamin Herrenschmidt     /* Do the ibm,pa-features property, adjust it for ci-large-pages */
70890da0d5aSBenjamin Herrenschmidt     if (env->mmu_model == POWERPC_MMU_2_06) {
70990da0d5aSBenjamin Herrenschmidt         pa_features = pa_features_206;
71090da0d5aSBenjamin Herrenschmidt         pa_size = sizeof(pa_features_206);
71190da0d5aSBenjamin Herrenschmidt     } else /* env->mmu_model == POWERPC_MMU_2_07 */ {
71290da0d5aSBenjamin Herrenschmidt         pa_features = pa_features_207;
71390da0d5aSBenjamin Herrenschmidt         pa_size = sizeof(pa_features_207);
71490da0d5aSBenjamin Herrenschmidt     }
71590da0d5aSBenjamin Herrenschmidt     if (env->ci_large_pages) {
71690da0d5aSBenjamin Herrenschmidt         pa_features[3] |= 0x20;
71790da0d5aSBenjamin Herrenschmidt     }
71890da0d5aSBenjamin Herrenschmidt     _FDT((fdt_setprop(fdt, offset, "ibm,pa-features", pa_features, pa_size)));
71990da0d5aSBenjamin Herrenschmidt 
7200da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "ibm,chip-id",
72122419c2aSDavid Gibson                            cs->cpu_index / vcpus_per_socket)));
7220da6f3feSBharata B Rao 
7230da6f3feSBharata B Rao     _FDT((fdt_setprop(fdt, offset, "ibm,pft-size",
7240da6f3feSBharata B Rao                       pft_size_prop, sizeof(pft_size_prop))));
7250da6f3feSBharata B Rao 
7260da6f3feSBharata B Rao     _FDT(spapr_fixup_cpu_numa_dt(fdt, offset, cs));
7270da6f3feSBharata B Rao 
7280da6f3feSBharata B Rao     _FDT(spapr_fixup_cpu_smt_dt(fdt, offset, cpu,
7290da6f3feSBharata B Rao                                 ppc_get_compat_smt_threads(cpu)));
7300da6f3feSBharata B Rao }
7310da6f3feSBharata B Rao 
7320da6f3feSBharata B Rao static void spapr_populate_cpus_dt_node(void *fdt, sPAPRMachineState *spapr)
7330da6f3feSBharata B Rao {
7340da6f3feSBharata B Rao     CPUState *cs;
7350da6f3feSBharata B Rao     int cpus_offset;
7360da6f3feSBharata B Rao     char *nodename;
7370da6f3feSBharata B Rao     int smt = kvmppc_smt_threads();
7380da6f3feSBharata B Rao 
7390da6f3feSBharata B Rao     cpus_offset = fdt_add_subnode(fdt, 0, "cpus");
7400da6f3feSBharata B Rao     _FDT(cpus_offset);
7410da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, cpus_offset, "#address-cells", 0x1)));
7420da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, cpus_offset, "#size-cells", 0x0)));
7430da6f3feSBharata B Rao 
7440da6f3feSBharata B Rao     /*
7450da6f3feSBharata B Rao      * We walk the CPUs in reverse order to ensure that CPU DT nodes
7460da6f3feSBharata B Rao      * created by fdt_add_subnode() end up in the right order in FDT
7470da6f3feSBharata B Rao      * for the guest kernel the enumerate the CPUs correctly.
7480da6f3feSBharata B Rao      */
7490da6f3feSBharata B Rao     CPU_FOREACH_REVERSE(cs) {
7500da6f3feSBharata B Rao         PowerPCCPU *cpu = POWERPC_CPU(cs);
7510da6f3feSBharata B Rao         int index = ppc_get_vcpu_dt_id(cpu);
7520da6f3feSBharata B Rao         DeviceClass *dc = DEVICE_GET_CLASS(cs);
7530da6f3feSBharata B Rao         int offset;
7540da6f3feSBharata B Rao 
7550da6f3feSBharata B Rao         if ((index % smt) != 0) {
7560da6f3feSBharata B Rao             continue;
7570da6f3feSBharata B Rao         }
7580da6f3feSBharata B Rao 
7590da6f3feSBharata B Rao         nodename = g_strdup_printf("%s@%x", dc->fw_name, index);
7600da6f3feSBharata B Rao         offset = fdt_add_subnode(fdt, cpus_offset, nodename);
7610da6f3feSBharata B Rao         g_free(nodename);
7620da6f3feSBharata B Rao         _FDT(offset);
7630da6f3feSBharata B Rao         spapr_populate_cpu_dt(cs, fdt, offset, spapr);
7640da6f3feSBharata B Rao     }
7650da6f3feSBharata B Rao 
7660da6f3feSBharata B Rao }
7670da6f3feSBharata B Rao 
76803d196b7SBharata B Rao /*
76903d196b7SBharata B Rao  * Adds ibm,dynamic-reconfiguration-memory node.
77003d196b7SBharata B Rao  * Refer to docs/specs/ppc-spapr-hotplug.txt for the documentation
77103d196b7SBharata B Rao  * of this device tree node.
77203d196b7SBharata B Rao  */
77303d196b7SBharata B Rao static int spapr_populate_drconf_memory(sPAPRMachineState *spapr, void *fdt)
77403d196b7SBharata B Rao {
77503d196b7SBharata B Rao     MachineState *machine = MACHINE(spapr);
77603d196b7SBharata B Rao     int ret, i, offset;
77703d196b7SBharata B Rao     uint64_t lmb_size = SPAPR_MEMORY_BLOCK_SIZE;
77803d196b7SBharata B Rao     uint32_t prop_lmb_size[] = {0, cpu_to_be32(lmb_size)};
779d0e5a8f2SBharata B Rao     uint32_t hotplug_lmb_start = spapr->hotplug_memory.base / lmb_size;
780d0e5a8f2SBharata B Rao     uint32_t nr_lmbs = (spapr->hotplug_memory.base +
781d0e5a8f2SBharata B Rao                        memory_region_size(&spapr->hotplug_memory.mr)) /
782d0e5a8f2SBharata B Rao                        lmb_size;
78303d196b7SBharata B Rao     uint32_t *int_buf, *cur_index, buf_len;
7846663864eSBharata B Rao     int nr_nodes = nb_numa_nodes ? nb_numa_nodes : 1;
78503d196b7SBharata B Rao 
786ef001f06SThomas Huth     /*
787d0e5a8f2SBharata B Rao      * Don't create the node if there is no hotpluggable memory
78816c25aefSBharata B Rao      */
789d0e5a8f2SBharata B Rao     if (machine->ram_size == machine->maxram_size) {
79016c25aefSBharata B Rao         return 0;
79116c25aefSBharata B Rao     }
79216c25aefSBharata B Rao 
79316c25aefSBharata B Rao     /*
794ef001f06SThomas Huth      * Allocate enough buffer size to fit in ibm,dynamic-memory
795ef001f06SThomas Huth      * or ibm,associativity-lookup-arrays
796ef001f06SThomas Huth      */
797ef001f06SThomas Huth     buf_len = MAX(nr_lmbs * SPAPR_DR_LMB_LIST_ENTRY_SIZE + 1, nr_nodes * 4 + 2)
798ef001f06SThomas Huth               * sizeof(uint32_t);
79903d196b7SBharata B Rao     cur_index = int_buf = g_malloc0(buf_len);
80003d196b7SBharata B Rao 
80103d196b7SBharata B Rao     offset = fdt_add_subnode(fdt, 0, "ibm,dynamic-reconfiguration-memory");
80203d196b7SBharata B Rao 
80303d196b7SBharata B Rao     ret = fdt_setprop(fdt, offset, "ibm,lmb-size", prop_lmb_size,
80403d196b7SBharata B Rao                     sizeof(prop_lmb_size));
80503d196b7SBharata B Rao     if (ret < 0) {
80603d196b7SBharata B Rao         goto out;
80703d196b7SBharata B Rao     }
80803d196b7SBharata B Rao 
80903d196b7SBharata B Rao     ret = fdt_setprop_cell(fdt, offset, "ibm,memory-flags-mask", 0xff);
81003d196b7SBharata B Rao     if (ret < 0) {
81103d196b7SBharata B Rao         goto out;
81203d196b7SBharata B Rao     }
81303d196b7SBharata B Rao 
81403d196b7SBharata B Rao     ret = fdt_setprop_cell(fdt, offset, "ibm,memory-preservation-time", 0x0);
81503d196b7SBharata B Rao     if (ret < 0) {
81603d196b7SBharata B Rao         goto out;
81703d196b7SBharata B Rao     }
81803d196b7SBharata B Rao 
81903d196b7SBharata B Rao     /* ibm,dynamic-memory */
82003d196b7SBharata B Rao     int_buf[0] = cpu_to_be32(nr_lmbs);
82103d196b7SBharata B Rao     cur_index++;
82203d196b7SBharata B Rao     for (i = 0; i < nr_lmbs; i++) {
823d0e5a8f2SBharata B Rao         uint64_t addr = i * lmb_size;
82403d196b7SBharata B Rao         uint32_t *dynamic_memory = cur_index;
82503d196b7SBharata B Rao 
826d0e5a8f2SBharata B Rao         if (i >= hotplug_lmb_start) {
827d0e5a8f2SBharata B Rao             sPAPRDRConnector *drc;
828d0e5a8f2SBharata B Rao             sPAPRDRConnectorClass *drck;
829d0e5a8f2SBharata B Rao 
830d0e5a8f2SBharata B Rao             drc = spapr_dr_connector_by_id(SPAPR_DR_CONNECTOR_TYPE_LMB, i);
83103d196b7SBharata B Rao             g_assert(drc);
83203d196b7SBharata B Rao             drck = SPAPR_DR_CONNECTOR_GET_CLASS(drc);
83303d196b7SBharata B Rao 
83403d196b7SBharata B Rao             dynamic_memory[0] = cpu_to_be32(addr >> 32);
83503d196b7SBharata B Rao             dynamic_memory[1] = cpu_to_be32(addr & 0xffffffff);
83603d196b7SBharata B Rao             dynamic_memory[2] = cpu_to_be32(drck->get_index(drc));
83703d196b7SBharata B Rao             dynamic_memory[3] = cpu_to_be32(0); /* reserved */
83803d196b7SBharata B Rao             dynamic_memory[4] = cpu_to_be32(numa_get_node(addr, NULL));
839d0e5a8f2SBharata B Rao             if (memory_region_present(get_system_memory(), addr)) {
84003d196b7SBharata B Rao                 dynamic_memory[5] = cpu_to_be32(SPAPR_LMB_FLAGS_ASSIGNED);
84103d196b7SBharata B Rao             } else {
84203d196b7SBharata B Rao                 dynamic_memory[5] = cpu_to_be32(0);
84303d196b7SBharata B Rao             }
844d0e5a8f2SBharata B Rao         } else {
845d0e5a8f2SBharata B Rao             /*
846d0e5a8f2SBharata B Rao              * LMB information for RMA, boot time RAM and gap b/n RAM and
847d0e5a8f2SBharata B Rao              * hotplug memory region -- all these are marked as reserved
848d0e5a8f2SBharata B Rao              * and as having no valid DRC.
849d0e5a8f2SBharata B Rao              */
850d0e5a8f2SBharata B Rao             dynamic_memory[0] = cpu_to_be32(addr >> 32);
851d0e5a8f2SBharata B Rao             dynamic_memory[1] = cpu_to_be32(addr & 0xffffffff);
852d0e5a8f2SBharata B Rao             dynamic_memory[2] = cpu_to_be32(0);
853d0e5a8f2SBharata B Rao             dynamic_memory[3] = cpu_to_be32(0); /* reserved */
854d0e5a8f2SBharata B Rao             dynamic_memory[4] = cpu_to_be32(-1);
855d0e5a8f2SBharata B Rao             dynamic_memory[5] = cpu_to_be32(SPAPR_LMB_FLAGS_RESERVED |
856d0e5a8f2SBharata B Rao                                             SPAPR_LMB_FLAGS_DRC_INVALID);
857d0e5a8f2SBharata B Rao         }
85803d196b7SBharata B Rao 
85903d196b7SBharata B Rao         cur_index += SPAPR_DR_LMB_LIST_ENTRY_SIZE;
86003d196b7SBharata B Rao     }
86103d196b7SBharata B Rao     ret = fdt_setprop(fdt, offset, "ibm,dynamic-memory", int_buf, buf_len);
86203d196b7SBharata B Rao     if (ret < 0) {
86303d196b7SBharata B Rao         goto out;
86403d196b7SBharata B Rao     }
86503d196b7SBharata B Rao 
86603d196b7SBharata B Rao     /* ibm,associativity-lookup-arrays */
86703d196b7SBharata B Rao     cur_index = int_buf;
8686663864eSBharata B Rao     int_buf[0] = cpu_to_be32(nr_nodes);
86903d196b7SBharata B Rao     int_buf[1] = cpu_to_be32(4); /* Number of entries per associativity list */
87003d196b7SBharata B Rao     cur_index += 2;
8716663864eSBharata B Rao     for (i = 0; i < nr_nodes; i++) {
87203d196b7SBharata B Rao         uint32_t associativity[] = {
87303d196b7SBharata B Rao             cpu_to_be32(0x0),
87403d196b7SBharata B Rao             cpu_to_be32(0x0),
87503d196b7SBharata B Rao             cpu_to_be32(0x0),
87603d196b7SBharata B Rao             cpu_to_be32(i)
87703d196b7SBharata B Rao         };
87803d196b7SBharata B Rao         memcpy(cur_index, associativity, sizeof(associativity));
87903d196b7SBharata B Rao         cur_index += 4;
88003d196b7SBharata B Rao     }
88103d196b7SBharata B Rao     ret = fdt_setprop(fdt, offset, "ibm,associativity-lookup-arrays", int_buf,
88203d196b7SBharata B Rao             (cur_index - int_buf) * sizeof(uint32_t));
88303d196b7SBharata B Rao out:
88403d196b7SBharata B Rao     g_free(int_buf);
88503d196b7SBharata B Rao     return ret;
88603d196b7SBharata B Rao }
88703d196b7SBharata B Rao 
88803d196b7SBharata B Rao int spapr_h_cas_compose_response(sPAPRMachineState *spapr,
88903d196b7SBharata B Rao                                  target_ulong addr, target_ulong size,
89003d196b7SBharata B Rao                                  bool cpu_update, bool memory_update)
89103d196b7SBharata B Rao {
89203d196b7SBharata B Rao     void *fdt, *fdt_skel;
89303d196b7SBharata B Rao     sPAPRDeviceTreeUpdateHeader hdr = { .version_id = 1 };
89403d196b7SBharata B Rao     sPAPRMachineClass *smc = SPAPR_MACHINE_GET_CLASS(qdev_get_machine());
89503d196b7SBharata B Rao 
89603d196b7SBharata B Rao     size -= sizeof(hdr);
89703d196b7SBharata B Rao 
89803d196b7SBharata B Rao     /* Create sceleton */
89903d196b7SBharata B Rao     fdt_skel = g_malloc0(size);
90003d196b7SBharata B Rao     _FDT((fdt_create(fdt_skel, size)));
90103d196b7SBharata B Rao     _FDT((fdt_begin_node(fdt_skel, "")));
90203d196b7SBharata B Rao     _FDT((fdt_end_node(fdt_skel)));
90303d196b7SBharata B Rao     _FDT((fdt_finish(fdt_skel)));
90403d196b7SBharata B Rao     fdt = g_malloc0(size);
90503d196b7SBharata B Rao     _FDT((fdt_open_into(fdt_skel, fdt, size)));
90603d196b7SBharata B Rao     g_free(fdt_skel);
90703d196b7SBharata B Rao 
90803d196b7SBharata B Rao     /* Fixup cpu nodes */
90903d196b7SBharata B Rao     if (cpu_update) {
91003d196b7SBharata B Rao         _FDT((spapr_fixup_cpu_dt(fdt, spapr)));
91103d196b7SBharata B Rao     }
91203d196b7SBharata B Rao 
91316c25aefSBharata B Rao     /* Generate ibm,dynamic-reconfiguration-memory node if required */
91403d196b7SBharata B Rao     if (memory_update && smc->dr_lmb_enabled) {
91503d196b7SBharata B Rao         _FDT((spapr_populate_drconf_memory(spapr, fdt)));
91603d196b7SBharata B Rao     }
91703d196b7SBharata B Rao 
91803d196b7SBharata B Rao     /* Pack resulting tree */
91903d196b7SBharata B Rao     _FDT((fdt_pack(fdt)));
92003d196b7SBharata B Rao 
92103d196b7SBharata B Rao     if (fdt_totalsize(fdt) + sizeof(hdr) > size) {
92203d196b7SBharata B Rao         trace_spapr_cas_failed(size);
92303d196b7SBharata B Rao         return -1;
92403d196b7SBharata B Rao     }
92503d196b7SBharata B Rao 
92603d196b7SBharata B Rao     cpu_physical_memory_write(addr, &hdr, sizeof(hdr));
92703d196b7SBharata B Rao     cpu_physical_memory_write(addr + sizeof(hdr), fdt, fdt_totalsize(fdt));
92803d196b7SBharata B Rao     trace_spapr_cas_continue(fdt_totalsize(fdt) + sizeof(hdr));
92903d196b7SBharata B Rao     g_free(fdt);
93003d196b7SBharata B Rao 
93103d196b7SBharata B Rao     return 0;
93203d196b7SBharata B Rao }
93303d196b7SBharata B Rao 
93428e02042SDavid Gibson static void spapr_finalize_fdt(sPAPRMachineState *spapr,
93553018216SPaolo Bonzini                                hwaddr fdt_addr,
93653018216SPaolo Bonzini                                hwaddr rtas_addr,
93753018216SPaolo Bonzini                                hwaddr rtas_size)
93853018216SPaolo Bonzini {
9395b2128d2SAlexander Graf     MachineState *machine = MACHINE(qdev_get_machine());
940c20d332aSBharata B Rao     sPAPRMachineClass *smc = SPAPR_MACHINE_GET_CLASS(machine);
9415b2128d2SAlexander Graf     const char *boot_device = machine->boot_order;
94271461b0fSAlexey Kardashevskiy     int ret, i;
94371461b0fSAlexey Kardashevskiy     size_t cb = 0;
94471461b0fSAlexey Kardashevskiy     char *bootlist;
94553018216SPaolo Bonzini     void *fdt;
94653018216SPaolo Bonzini     sPAPRPHBState *phb;
94753018216SPaolo Bonzini 
94853018216SPaolo Bonzini     fdt = g_malloc(FDT_MAX_SIZE);
94953018216SPaolo Bonzini 
95053018216SPaolo Bonzini     /* open out the base tree into a temp buffer for the final tweaks */
95153018216SPaolo Bonzini     _FDT((fdt_open_into(spapr->fdt_skel, fdt, FDT_MAX_SIZE)));
95253018216SPaolo Bonzini 
953e8f986fcSBharata B Rao     ret = spapr_populate_memory(spapr, fdt);
954e8f986fcSBharata B Rao     if (ret < 0) {
955e8f986fcSBharata B Rao         fprintf(stderr, "couldn't setup memory nodes in fdt\n");
956e8f986fcSBharata B Rao         exit(1);
95753018216SPaolo Bonzini     }
95853018216SPaolo Bonzini 
95953018216SPaolo Bonzini     ret = spapr_populate_vdevice(spapr->vio_bus, fdt);
96053018216SPaolo Bonzini     if (ret < 0) {
96153018216SPaolo Bonzini         fprintf(stderr, "couldn't setup vio devices in fdt\n");
96253018216SPaolo Bonzini         exit(1);
96353018216SPaolo Bonzini     }
96453018216SPaolo Bonzini 
9654d9392beSThomas Huth     if (object_resolve_path_type("", TYPE_SPAPR_RNG, NULL)) {
9664d9392beSThomas Huth         ret = spapr_rng_populate_dt(fdt);
9674d9392beSThomas Huth         if (ret < 0) {
9684d9392beSThomas Huth             fprintf(stderr, "could not set up rng device in the fdt\n");
9694d9392beSThomas Huth             exit(1);
9704d9392beSThomas Huth         }
9714d9392beSThomas Huth     }
9724d9392beSThomas Huth 
97353018216SPaolo Bonzini     QLIST_FOREACH(phb, &spapr->phbs, list) {
97453018216SPaolo Bonzini         ret = spapr_populate_pci_dt(phb, PHANDLE_XICP, fdt);
97553018216SPaolo Bonzini         if (ret < 0) {
976da34fed7SThomas Huth             error_report("couldn't setup PCI devices in fdt");
97753018216SPaolo Bonzini             exit(1);
97853018216SPaolo Bonzini         }
979da34fed7SThomas Huth     }
98053018216SPaolo Bonzini 
98153018216SPaolo Bonzini     /* RTAS */
98253018216SPaolo Bonzini     ret = spapr_rtas_device_tree_setup(fdt, rtas_addr, rtas_size);
98353018216SPaolo Bonzini     if (ret < 0) {
98453018216SPaolo Bonzini         fprintf(stderr, "Couldn't set up RTAS device tree properties\n");
98553018216SPaolo Bonzini     }
98653018216SPaolo Bonzini 
9870da6f3feSBharata B Rao     /* cpus */
9880da6f3feSBharata B Rao     spapr_populate_cpus_dt_node(fdt, spapr);
98953018216SPaolo Bonzini 
99071461b0fSAlexey Kardashevskiy     bootlist = get_boot_devices_list(&cb, true);
99171461b0fSAlexey Kardashevskiy     if (cb && bootlist) {
99271461b0fSAlexey Kardashevskiy         int offset = fdt_path_offset(fdt, "/chosen");
99371461b0fSAlexey Kardashevskiy         if (offset < 0) {
99471461b0fSAlexey Kardashevskiy             exit(1);
99571461b0fSAlexey Kardashevskiy         }
99671461b0fSAlexey Kardashevskiy         for (i = 0; i < cb; i++) {
99771461b0fSAlexey Kardashevskiy             if (bootlist[i] == '\n') {
99871461b0fSAlexey Kardashevskiy                 bootlist[i] = ' ';
99971461b0fSAlexey Kardashevskiy             }
100071461b0fSAlexey Kardashevskiy 
100171461b0fSAlexey Kardashevskiy         }
100271461b0fSAlexey Kardashevskiy         ret = fdt_setprop_string(fdt, offset, "qemu,boot-list", bootlist);
100371461b0fSAlexey Kardashevskiy     }
100471461b0fSAlexey Kardashevskiy 
10055b2128d2SAlexander Graf     if (boot_device && strlen(boot_device)) {
10065b2128d2SAlexander Graf         int offset = fdt_path_offset(fdt, "/chosen");
10075b2128d2SAlexander Graf 
10085b2128d2SAlexander Graf         if (offset < 0) {
10095b2128d2SAlexander Graf             exit(1);
10105b2128d2SAlexander Graf         }
10115b2128d2SAlexander Graf         fdt_setprop_string(fdt, offset, "qemu,boot-device", boot_device);
10125b2128d2SAlexander Graf     }
10135b2128d2SAlexander Graf 
101453018216SPaolo Bonzini     if (!spapr->has_graphics) {
101553018216SPaolo Bonzini         spapr_populate_chosen_stdout(fdt, spapr->vio_bus);
101653018216SPaolo Bonzini     }
101753018216SPaolo Bonzini 
1018c20d332aSBharata B Rao     if (smc->dr_lmb_enabled) {
1019c20d332aSBharata B Rao         _FDT(spapr_drc_populate_dt(fdt, 0, NULL, SPAPR_DR_CONNECTOR_TYPE_LMB));
1020c20d332aSBharata B Rao     }
1021c20d332aSBharata B Rao 
1022af81cf32SBharata B Rao     if (smc->dr_cpu_enabled) {
1023af81cf32SBharata B Rao         int offset = fdt_path_offset(fdt, "/cpus");
1024af81cf32SBharata B Rao         ret = spapr_drc_populate_dt(fdt, offset, NULL,
1025af81cf32SBharata B Rao                                     SPAPR_DR_CONNECTOR_TYPE_CPU);
1026af81cf32SBharata B Rao         if (ret < 0) {
1027af81cf32SBharata B Rao             error_report("Couldn't set up CPU DR device tree properties");
1028af81cf32SBharata B Rao             exit(1);
1029af81cf32SBharata B Rao         }
1030af81cf32SBharata B Rao     }
1031af81cf32SBharata B Rao 
103253018216SPaolo Bonzini     _FDT((fdt_pack(fdt)));
103353018216SPaolo Bonzini 
103453018216SPaolo Bonzini     if (fdt_totalsize(fdt) > FDT_MAX_SIZE) {
1035730fce59SThomas Huth         error_report("FDT too big ! 0x%x bytes (max is 0x%x)",
103653018216SPaolo Bonzini                      fdt_totalsize(fdt), FDT_MAX_SIZE);
103753018216SPaolo Bonzini         exit(1);
103853018216SPaolo Bonzini     }
103953018216SPaolo Bonzini 
1040ad440b4aSAndrew Jones     qemu_fdt_dumpdtb(fdt, fdt_totalsize(fdt));
104153018216SPaolo Bonzini     cpu_physical_memory_write(fdt_addr, fdt, fdt_totalsize(fdt));
104253018216SPaolo Bonzini 
1043a21a7a70SGonglei     g_free(bootlist);
104453018216SPaolo Bonzini     g_free(fdt);
104553018216SPaolo Bonzini }
104653018216SPaolo Bonzini 
104753018216SPaolo Bonzini static uint64_t translate_kernel_address(void *opaque, uint64_t addr)
104853018216SPaolo Bonzini {
104953018216SPaolo Bonzini     return (addr & 0x0fffffff) + KERNEL_LOAD_ADDR;
105053018216SPaolo Bonzini }
105153018216SPaolo Bonzini 
105253018216SPaolo Bonzini static void emulate_spapr_hypercall(PowerPCCPU *cpu)
105353018216SPaolo Bonzini {
105453018216SPaolo Bonzini     CPUPPCState *env = &cpu->env;
105553018216SPaolo Bonzini 
105653018216SPaolo Bonzini     if (msr_pr) {
105753018216SPaolo Bonzini         hcall_dprintf("Hypercall made with MSR[PR]=1\n");
105853018216SPaolo Bonzini         env->gpr[3] = H_PRIVILEGE;
105953018216SPaolo Bonzini     } else {
106053018216SPaolo Bonzini         env->gpr[3] = spapr_hypercall(cpu, env->gpr[3], &env->gpr[4]);
106153018216SPaolo Bonzini     }
106253018216SPaolo Bonzini }
106353018216SPaolo Bonzini 
/*
 * Accessors for a hash page table held in QEMU memory.
 *
 * HPTE() yields a pointer to entry @_i of @_table, stepping two 64-bit
 * words per entry.  The remaining macros operate on the first 64-bit
 * word of an entry: the word is passed through tswap64() before the
 * VALID / DIRTY bits are tested, and the DIRTY mask is passed through
 * tswap64() before being cleared from / or-ed into the stored word.
 */
#define HPTE(_table, _i)   (void *)(&((uint64_t *)(_table))[(_i) * 2])
#define HPTE_VALID(_hpte)  (tswap64(*(uint64_t *)(_hpte)) & HPTE64_V_VALID)
#define HPTE_DIRTY(_hpte)  (tswap64(*(uint64_t *)(_hpte)) & HPTE64_V_HPTE_DIRTY)
#define CLEAN_HPTE(_hpte)  (*(uint64_t *)(_hpte) &= tswap64(~HPTE64_V_HPTE_DIRTY))
#define DIRTY_HPTE(_hpte)  (*(uint64_t *)(_hpte) |= tswap64(HPTE64_V_HPTE_DIRTY))
1069e6b8fd24SSamuel Mendoza-Jonas 
1070715c5407SDavid Gibson /*
1071715c5407SDavid Gibson  * Get the fd to access the kernel htab, re-opening it if necessary
1072715c5407SDavid Gibson  */
1073715c5407SDavid Gibson static int get_htab_fd(sPAPRMachineState *spapr)
1074715c5407SDavid Gibson {
1075715c5407SDavid Gibson     if (spapr->htab_fd >= 0) {
1076715c5407SDavid Gibson         return spapr->htab_fd;
1077715c5407SDavid Gibson     }
1078715c5407SDavid Gibson 
1079715c5407SDavid Gibson     spapr->htab_fd = kvmppc_get_htab_fd(false);
1080715c5407SDavid Gibson     if (spapr->htab_fd < 0) {
1081715c5407SDavid Gibson         error_report("Unable to open fd for reading hash table from KVM: %s",
1082715c5407SDavid Gibson                      strerror(errno));
1083715c5407SDavid Gibson     }
1084715c5407SDavid Gibson 
1085715c5407SDavid Gibson     return spapr->htab_fd;
1086715c5407SDavid Gibson }
1087715c5407SDavid Gibson 
1088715c5407SDavid Gibson static void close_htab_fd(sPAPRMachineState *spapr)
1089715c5407SDavid Gibson {
1090715c5407SDavid Gibson     if (spapr->htab_fd >= 0) {
1091715c5407SDavid Gibson         close(spapr->htab_fd);
1092715c5407SDavid Gibson     }
1093715c5407SDavid Gibson     spapr->htab_fd = -1;
1094715c5407SDavid Gibson }
1095715c5407SDavid Gibson 
/*
 * Pick the hash page table order (log2 of its size in bytes) for a
 * guest with @ramsize bytes of RAM.
 *
 * The target is 1/128 of RAM size, with RAM size rounded up to a power
 * of two.  PAPR actually recommends 1/64, but that is much more than
 * Linux guests need.  The result is clamped to the architected range
 * of 18..46.
 */
static int spapr_hpt_shift_for_ramsize(uint64_t ramsize)
{
    int shift = ctz64(pow2ceil(ramsize)) - 7;

    if (shift < 18) {
        /* Minimum architected size */
        shift = 18;
    }
    if (shift > 46) {
        /* Maximum architected size */
        shift = 46;
    }

    return shift;
}
11088dfe8e7fSDavid Gibson 
1109c5f54f3eSDavid Gibson static void spapr_reallocate_hpt(sPAPRMachineState *spapr, int shift,
1110c5f54f3eSDavid Gibson                                  Error **errp)
111153018216SPaolo Bonzini {
1112c5f54f3eSDavid Gibson     long rc;
111353018216SPaolo Bonzini 
1114c5f54f3eSDavid Gibson     /* Clean up any HPT info from a previous boot */
1115c5f54f3eSDavid Gibson     g_free(spapr->htab);
1116c5f54f3eSDavid Gibson     spapr->htab = NULL;
1117c5f54f3eSDavid Gibson     spapr->htab_shift = 0;
1118c5f54f3eSDavid Gibson     close_htab_fd(spapr);
111953018216SPaolo Bonzini 
1120c5f54f3eSDavid Gibson     rc = kvmppc_reset_htab(shift);
1121c5f54f3eSDavid Gibson     if (rc < 0) {
1122c5f54f3eSDavid Gibson         /* kernel-side HPT needed, but couldn't allocate one */
1123c5f54f3eSDavid Gibson         error_setg_errno(errp, errno,
1124c5f54f3eSDavid Gibson                          "Failed to allocate KVM HPT of order %d (try smaller maxmem?)",
1125c5f54f3eSDavid Gibson                          shift);
1126c5f54f3eSDavid Gibson         /* This is almost certainly fatal, but if the caller really
1127c5f54f3eSDavid Gibson          * wants to carry on with shift == 0, it's welcome to try */
1128c5f54f3eSDavid Gibson     } else if (rc > 0) {
1129c5f54f3eSDavid Gibson         /* kernel-side HPT allocated */
1130c5f54f3eSDavid Gibson         if (rc != shift) {
1131c5f54f3eSDavid Gibson             error_setg(errp,
1132c5f54f3eSDavid Gibson                        "Requested order %d HPT, but kernel allocated order %ld (try smaller maxmem?)",
1133c5f54f3eSDavid Gibson                        shift, rc);
11347735fedaSBharata B Rao         }
11357735fedaSBharata B Rao 
113653018216SPaolo Bonzini         spapr->htab_shift = shift;
1137c18ad9a5SDavid Gibson         spapr->htab = NULL;
1138b817772aSBharata B Rao     } else {
1139c5f54f3eSDavid Gibson         /* kernel-side HPT not needed, allocate in userspace instead */
1140c5f54f3eSDavid Gibson         size_t size = 1ULL << shift;
1141c5f54f3eSDavid Gibson         int i;
114201a57972SSamuel Mendoza-Jonas 
1143c5f54f3eSDavid Gibson         spapr->htab = qemu_memalign(size, size);
1144c5f54f3eSDavid Gibson         if (!spapr->htab) {
1145c5f54f3eSDavid Gibson             error_setg_errno(errp, errno,
1146c5f54f3eSDavid Gibson                              "Could not allocate HPT of order %d", shift);
1147c5f54f3eSDavid Gibson             return;
1148b817772aSBharata B Rao         }
1149b817772aSBharata B Rao 
1150c5f54f3eSDavid Gibson         memset(spapr->htab, 0, size);
1151c5f54f3eSDavid Gibson         spapr->htab_shift = shift;
1152b817772aSBharata B Rao 
1153c5f54f3eSDavid Gibson         for (i = 0; i < size / HASH_PTE_SIZE_64; i++) {
1154c5f54f3eSDavid Gibson             DIRTY_HPTE(HPTE(spapr->htab, i));
11557735fedaSBharata B Rao         }
115653018216SPaolo Bonzini     }
115753018216SPaolo Bonzini }
115853018216SPaolo Bonzini 
11599e3f9733SAlexander Graf static int find_unknown_sysbus_device(SysBusDevice *sbdev, void *opaque)
11609e3f9733SAlexander Graf {
11619e3f9733SAlexander Graf     bool matched = false;
11629e3f9733SAlexander Graf 
11639e3f9733SAlexander Graf     if (object_dynamic_cast(OBJECT(sbdev), TYPE_SPAPR_PCI_HOST_BRIDGE)) {
11649e3f9733SAlexander Graf         matched = true;
11659e3f9733SAlexander Graf     }
11669e3f9733SAlexander Graf 
11679e3f9733SAlexander Graf     if (!matched) {
11689e3f9733SAlexander Graf         error_report("Device %s is not supported by this machine yet.",
11699e3f9733SAlexander Graf                      qdev_fw_name(DEVICE(sbdev)));
11709e3f9733SAlexander Graf         exit(1);
11719e3f9733SAlexander Graf     }
11729e3f9733SAlexander Graf 
11739e3f9733SAlexander Graf     return 0;
11749e3f9733SAlexander Graf }
11759e3f9733SAlexander Graf 
117653018216SPaolo Bonzini static void ppc_spapr_reset(void)
117753018216SPaolo Bonzini {
1178c5f54f3eSDavid Gibson     MachineState *machine = MACHINE(qdev_get_machine());
1179c5f54f3eSDavid Gibson     sPAPRMachineState *spapr = SPAPR_MACHINE(machine);
1180182735efSAndreas Färber     PowerPCCPU *first_ppc_cpu;
1181b7d1f77aSBenjamin Herrenschmidt     uint32_t rtas_limit;
1182259186a7SAndreas Färber 
11839e3f9733SAlexander Graf     /* Check for unknown sysbus devices */
11849e3f9733SAlexander Graf     foreach_dynamic_sysbus_device(find_unknown_sysbus_device, NULL);
11859e3f9733SAlexander Graf 
1186c5f54f3eSDavid Gibson     /* Allocate and/or reset the hash page table */
1187c5f54f3eSDavid Gibson     spapr_reallocate_hpt(spapr,
1188c5f54f3eSDavid Gibson                          spapr_hpt_shift_for_ramsize(machine->maxram_size),
1189c5f54f3eSDavid Gibson                          &error_fatal);
1190c5f54f3eSDavid Gibson 
1191c5f54f3eSDavid Gibson     /* Update the RMA size if necessary */
1192c5f54f3eSDavid Gibson     if (spapr->vrma_adjust) {
1193c5f54f3eSDavid Gibson         spapr->rma_size = kvmppc_rma_size(spapr_node0_size(),
1194c5f54f3eSDavid Gibson                                           spapr->htab_shift);
1195c5f54f3eSDavid Gibson     }
119653018216SPaolo Bonzini 
119753018216SPaolo Bonzini     qemu_devices_reset();
119853018216SPaolo Bonzini 
1199b7d1f77aSBenjamin Herrenschmidt     /*
1200b7d1f77aSBenjamin Herrenschmidt      * We place the device tree and RTAS just below either the top of the RMA,
1201b7d1f77aSBenjamin Herrenschmidt      * or just below 2GB, whichever is lowere, so that it can be
1202b7d1f77aSBenjamin Herrenschmidt      * processed with 32-bit real mode code if necessary
1203b7d1f77aSBenjamin Herrenschmidt      */
1204b7d1f77aSBenjamin Herrenschmidt     rtas_limit = MIN(spapr->rma_size, RTAS_MAX_ADDR);
1205b7d1f77aSBenjamin Herrenschmidt     spapr->rtas_addr = rtas_limit - RTAS_MAX_SIZE;
1206b7d1f77aSBenjamin Herrenschmidt     spapr->fdt_addr = spapr->rtas_addr - FDT_MAX_SIZE;
1207b7d1f77aSBenjamin Herrenschmidt 
120853018216SPaolo Bonzini     /* Load the fdt */
120953018216SPaolo Bonzini     spapr_finalize_fdt(spapr, spapr->fdt_addr, spapr->rtas_addr,
121053018216SPaolo Bonzini                        spapr->rtas_size);
121153018216SPaolo Bonzini 
1212b7d1f77aSBenjamin Herrenschmidt     /* Copy RTAS over */
1213b7d1f77aSBenjamin Herrenschmidt     cpu_physical_memory_write(spapr->rtas_addr, spapr->rtas_blob,
1214b7d1f77aSBenjamin Herrenschmidt                               spapr->rtas_size);
1215b7d1f77aSBenjamin Herrenschmidt 
121653018216SPaolo Bonzini     /* Set up the entry state */
1217182735efSAndreas Färber     first_ppc_cpu = POWERPC_CPU(first_cpu);
1218182735efSAndreas Färber     first_ppc_cpu->env.gpr[3] = spapr->fdt_addr;
1219182735efSAndreas Färber     first_ppc_cpu->env.gpr[5] = 0;
1220182735efSAndreas Färber     first_cpu->halted = 0;
12211b718907SDavid Gibson     first_ppc_cpu->env.nip = SPAPR_ENTRY_POINT;
122253018216SPaolo Bonzini 
122353018216SPaolo Bonzini }
122453018216SPaolo Bonzini 
122528e02042SDavid Gibson static void spapr_create_nvram(sPAPRMachineState *spapr)
122653018216SPaolo Bonzini {
12272ff3de68SMarkus Armbruster     DeviceState *dev = qdev_create(&spapr->vio_bus->bus, "spapr-nvram");
12283978b863SPaolo Bonzini     DriveInfo *dinfo = drive_get(IF_PFLASH, 0, 0);
122953018216SPaolo Bonzini 
12303978b863SPaolo Bonzini     if (dinfo) {
12316231a6daSMarkus Armbruster         qdev_prop_set_drive(dev, "drive", blk_by_legacy_dinfo(dinfo),
12326231a6daSMarkus Armbruster                             &error_fatal);
123353018216SPaolo Bonzini     }
123453018216SPaolo Bonzini 
123553018216SPaolo Bonzini     qdev_init_nofail(dev);
123653018216SPaolo Bonzini 
123753018216SPaolo Bonzini     spapr->nvram = (struct sPAPRNVRAM *)dev;
123853018216SPaolo Bonzini }
123953018216SPaolo Bonzini 
124028e02042SDavid Gibson static void spapr_rtc_create(sPAPRMachineState *spapr)
124128df36a1SDavid Gibson {
124228df36a1SDavid Gibson     DeviceState *dev = qdev_create(NULL, TYPE_SPAPR_RTC);
124328df36a1SDavid Gibson 
124428df36a1SDavid Gibson     qdev_init_nofail(dev);
124528df36a1SDavid Gibson     spapr->rtc = dev;
124674e5ae28SDavid Gibson 
124774e5ae28SDavid Gibson     object_property_add_alias(qdev_get_machine(), "rtc-time",
124874e5ae28SDavid Gibson                               OBJECT(spapr->rtc), "date", NULL);
124928df36a1SDavid Gibson }
125028df36a1SDavid Gibson 
125153018216SPaolo Bonzini /* Returns whether we want to use VGA or not */
125214c6a894SDavid Gibson static bool spapr_vga_init(PCIBus *pci_bus, Error **errp)
125353018216SPaolo Bonzini {
125453018216SPaolo Bonzini     switch (vga_interface_type) {
125553018216SPaolo Bonzini     case VGA_NONE:
12567effdaa3SMark Wu         return false;
12577effdaa3SMark Wu     case VGA_DEVICE:
12587effdaa3SMark Wu         return true;
125953018216SPaolo Bonzini     case VGA_STD:
1260b798c190SBenjamin Herrenschmidt     case VGA_VIRTIO:
126153018216SPaolo Bonzini         return pci_vga_init(pci_bus) != NULL;
126253018216SPaolo Bonzini     default:
126314c6a894SDavid Gibson         error_setg(errp,
126414c6a894SDavid Gibson                    "Unsupported VGA mode, only -vga std or -vga virtio is supported");
126514c6a894SDavid Gibson         return false;
126653018216SPaolo Bonzini     }
126753018216SPaolo Bonzini }
126853018216SPaolo Bonzini 
1269880ae7deSDavid Gibson static int spapr_post_load(void *opaque, int version_id)
1270880ae7deSDavid Gibson {
127128e02042SDavid Gibson     sPAPRMachineState *spapr = (sPAPRMachineState *)opaque;
1272880ae7deSDavid Gibson     int err = 0;
1273880ae7deSDavid Gibson 
1274631b22eaSStefan Weil     /* In earlier versions, there was no separate qdev for the PAPR
1275880ae7deSDavid Gibson      * RTC, so the RTC offset was stored directly in sPAPREnvironment.
1276880ae7deSDavid Gibson      * So when migrating from those versions, poke the incoming offset
1277880ae7deSDavid Gibson      * value into the RTC device */
1278880ae7deSDavid Gibson     if (version_id < 3) {
1279880ae7deSDavid Gibson         err = spapr_rtc_import_offset(spapr->rtc, spapr->rtc_offset);
1280880ae7deSDavid Gibson     }
1281880ae7deSDavid Gibson 
1282880ae7deSDavid Gibson     return err;
1283880ae7deSDavid Gibson }
1284880ae7deSDavid Gibson 
/*
 * Field test for vmstate_spapr: true when the stream version is older
 * than 3.  @opaque is not used.
 */
static bool version_before_3(void *opaque, int version_id)
{
    const int first_version_without_field = 3;

    return version_id < first_version_without_field;
}
1289880ae7deSDavid Gibson 
12904be21d56SDavid Gibson static const VMStateDescription vmstate_spapr = {
12914be21d56SDavid Gibson     .name = "spapr",
1292880ae7deSDavid Gibson     .version_id = 3,
12934be21d56SDavid Gibson     .minimum_version_id = 1,
1294880ae7deSDavid Gibson     .post_load = spapr_post_load,
12954be21d56SDavid Gibson     .fields = (VMStateField[]) {
1296880ae7deSDavid Gibson         /* used to be @next_irq */
1297880ae7deSDavid Gibson         VMSTATE_UNUSED_BUFFER(version_before_3, 0, 4),
12984be21d56SDavid Gibson 
12994be21d56SDavid Gibson         /* RTC offset */
130028e02042SDavid Gibson         VMSTATE_UINT64_TEST(rtc_offset, sPAPRMachineState, version_before_3),
1301880ae7deSDavid Gibson 
130228e02042SDavid Gibson         VMSTATE_PPC_TIMEBASE_V(tb, sPAPRMachineState, 2),
13034be21d56SDavid Gibson         VMSTATE_END_OF_LIST()
13044be21d56SDavid Gibson     },
13054be21d56SDavid Gibson };
13064be21d56SDavid Gibson 
13074be21d56SDavid Gibson static int htab_save_setup(QEMUFile *f, void *opaque)
13084be21d56SDavid Gibson {
130928e02042SDavid Gibson     sPAPRMachineState *spapr = opaque;
13104be21d56SDavid Gibson 
13114be21d56SDavid Gibson     /* "Iteration" header */
13124be21d56SDavid Gibson     qemu_put_be32(f, spapr->htab_shift);
13134be21d56SDavid Gibson 
1314e68cb8b4SAlexey Kardashevskiy     if (spapr->htab) {
1315e68cb8b4SAlexey Kardashevskiy         spapr->htab_save_index = 0;
1316e68cb8b4SAlexey Kardashevskiy         spapr->htab_first_pass = true;
1317e68cb8b4SAlexey Kardashevskiy     } else {
1318e68cb8b4SAlexey Kardashevskiy         assert(kvm_enabled());
13194be21d56SDavid Gibson     }
13204be21d56SDavid Gibson 
1321e68cb8b4SAlexey Kardashevskiy 
1322e68cb8b4SAlexey Kardashevskiy     return 0;
1323e68cb8b4SAlexey Kardashevskiy }
13244be21d56SDavid Gibson 
132528e02042SDavid Gibson static void htab_save_first_pass(QEMUFile *f, sPAPRMachineState *spapr,
13264be21d56SDavid Gibson                                  int64_t max_ns)
13274be21d56SDavid Gibson {
1328378bc217SDavid Gibson     bool has_timeout = max_ns != -1;
13294be21d56SDavid Gibson     int htabslots = HTAB_SIZE(spapr) / HASH_PTE_SIZE_64;
13304be21d56SDavid Gibson     int index = spapr->htab_save_index;
1331bc72ad67SAlex Bligh     int64_t starttime = qemu_clock_get_ns(QEMU_CLOCK_REALTIME);
13324be21d56SDavid Gibson 
13334be21d56SDavid Gibson     assert(spapr->htab_first_pass);
13344be21d56SDavid Gibson 
13354be21d56SDavid Gibson     do {
13364be21d56SDavid Gibson         int chunkstart;
13374be21d56SDavid Gibson 
13384be21d56SDavid Gibson         /* Consume invalid HPTEs */
13394be21d56SDavid Gibson         while ((index < htabslots)
13404be21d56SDavid Gibson                && !HPTE_VALID(HPTE(spapr->htab, index))) {
13414be21d56SDavid Gibson             index++;
13424be21d56SDavid Gibson             CLEAN_HPTE(HPTE(spapr->htab, index));
13434be21d56SDavid Gibson         }
13444be21d56SDavid Gibson 
13454be21d56SDavid Gibson         /* Consume valid HPTEs */
13464be21d56SDavid Gibson         chunkstart = index;
1347338c25b6SSamuel Mendoza-Jonas         while ((index < htabslots) && (index - chunkstart < USHRT_MAX)
13484be21d56SDavid Gibson                && HPTE_VALID(HPTE(spapr->htab, index))) {
13494be21d56SDavid Gibson             index++;
13504be21d56SDavid Gibson             CLEAN_HPTE(HPTE(spapr->htab, index));
13514be21d56SDavid Gibson         }
13524be21d56SDavid Gibson 
13534be21d56SDavid Gibson         if (index > chunkstart) {
13544be21d56SDavid Gibson             int n_valid = index - chunkstart;
13554be21d56SDavid Gibson 
13564be21d56SDavid Gibson             qemu_put_be32(f, chunkstart);
13574be21d56SDavid Gibson             qemu_put_be16(f, n_valid);
13584be21d56SDavid Gibson             qemu_put_be16(f, 0);
13594be21d56SDavid Gibson             qemu_put_buffer(f, HPTE(spapr->htab, chunkstart),
13604be21d56SDavid Gibson                             HASH_PTE_SIZE_64 * n_valid);
13614be21d56SDavid Gibson 
1362378bc217SDavid Gibson             if (has_timeout &&
1363378bc217SDavid Gibson                 (qemu_clock_get_ns(QEMU_CLOCK_REALTIME) - starttime) > max_ns) {
13644be21d56SDavid Gibson                 break;
13654be21d56SDavid Gibson             }
13664be21d56SDavid Gibson         }
13674be21d56SDavid Gibson     } while ((index < htabslots) && !qemu_file_rate_limit(f));
13684be21d56SDavid Gibson 
13694be21d56SDavid Gibson     if (index >= htabslots) {
13704be21d56SDavid Gibson         assert(index == htabslots);
13714be21d56SDavid Gibson         index = 0;
13724be21d56SDavid Gibson         spapr->htab_first_pass = false;
13734be21d56SDavid Gibson     }
13744be21d56SDavid Gibson     spapr->htab_save_index = index;
13754be21d56SDavid Gibson }
13764be21d56SDavid Gibson 
137728e02042SDavid Gibson static int htab_save_later_pass(QEMUFile *f, sPAPRMachineState *spapr,
13784be21d56SDavid Gibson                                 int64_t max_ns)
13794be21d56SDavid Gibson {
13804be21d56SDavid Gibson     bool final = max_ns < 0;
13814be21d56SDavid Gibson     int htabslots = HTAB_SIZE(spapr) / HASH_PTE_SIZE_64;
13824be21d56SDavid Gibson     int examined = 0, sent = 0;
13834be21d56SDavid Gibson     int index = spapr->htab_save_index;
1384bc72ad67SAlex Bligh     int64_t starttime = qemu_clock_get_ns(QEMU_CLOCK_REALTIME);
13854be21d56SDavid Gibson 
13864be21d56SDavid Gibson     assert(!spapr->htab_first_pass);
13874be21d56SDavid Gibson 
13884be21d56SDavid Gibson     do {
13894be21d56SDavid Gibson         int chunkstart, invalidstart;
13904be21d56SDavid Gibson 
13914be21d56SDavid Gibson         /* Consume non-dirty HPTEs */
13924be21d56SDavid Gibson         while ((index < htabslots)
13934be21d56SDavid Gibson                && !HPTE_DIRTY(HPTE(spapr->htab, index))) {
13944be21d56SDavid Gibson             index++;
13954be21d56SDavid Gibson             examined++;
13964be21d56SDavid Gibson         }
13974be21d56SDavid Gibson 
13984be21d56SDavid Gibson         chunkstart = index;
13994be21d56SDavid Gibson         /* Consume valid dirty HPTEs */
1400338c25b6SSamuel Mendoza-Jonas         while ((index < htabslots) && (index - chunkstart < USHRT_MAX)
14014be21d56SDavid Gibson                && HPTE_DIRTY(HPTE(spapr->htab, index))
14024be21d56SDavid Gibson                && HPTE_VALID(HPTE(spapr->htab, index))) {
14034be21d56SDavid Gibson             CLEAN_HPTE(HPTE(spapr->htab, index));
14044be21d56SDavid Gibson             index++;
14054be21d56SDavid Gibson             examined++;
14064be21d56SDavid Gibson         }
14074be21d56SDavid Gibson 
14084be21d56SDavid Gibson         invalidstart = index;
14094be21d56SDavid Gibson         /* Consume invalid dirty HPTEs */
1410338c25b6SSamuel Mendoza-Jonas         while ((index < htabslots) && (index - invalidstart < USHRT_MAX)
14114be21d56SDavid Gibson                && HPTE_DIRTY(HPTE(spapr->htab, index))
14124be21d56SDavid Gibson                && !HPTE_VALID(HPTE(spapr->htab, index))) {
14134be21d56SDavid Gibson             CLEAN_HPTE(HPTE(spapr->htab, index));
14144be21d56SDavid Gibson             index++;
14154be21d56SDavid Gibson             examined++;
14164be21d56SDavid Gibson         }
14174be21d56SDavid Gibson 
14184be21d56SDavid Gibson         if (index > chunkstart) {
14194be21d56SDavid Gibson             int n_valid = invalidstart - chunkstart;
14204be21d56SDavid Gibson             int n_invalid = index - invalidstart;
14214be21d56SDavid Gibson 
14224be21d56SDavid Gibson             qemu_put_be32(f, chunkstart);
14234be21d56SDavid Gibson             qemu_put_be16(f, n_valid);
14244be21d56SDavid Gibson             qemu_put_be16(f, n_invalid);
14254be21d56SDavid Gibson             qemu_put_buffer(f, HPTE(spapr->htab, chunkstart),
14264be21d56SDavid Gibson                             HASH_PTE_SIZE_64 * n_valid);
14274be21d56SDavid Gibson             sent += index - chunkstart;
14284be21d56SDavid Gibson 
1429bc72ad67SAlex Bligh             if (!final && (qemu_clock_get_ns(QEMU_CLOCK_REALTIME) - starttime) > max_ns) {
14304be21d56SDavid Gibson                 break;
14314be21d56SDavid Gibson             }
14324be21d56SDavid Gibson         }
14334be21d56SDavid Gibson 
14344be21d56SDavid Gibson         if (examined >= htabslots) {
14354be21d56SDavid Gibson             break;
14364be21d56SDavid Gibson         }
14374be21d56SDavid Gibson 
14384be21d56SDavid Gibson         if (index >= htabslots) {
14394be21d56SDavid Gibson             assert(index == htabslots);
14404be21d56SDavid Gibson             index = 0;
14414be21d56SDavid Gibson         }
14424be21d56SDavid Gibson     } while ((examined < htabslots) && (!qemu_file_rate_limit(f) || final));
14434be21d56SDavid Gibson 
14444be21d56SDavid Gibson     if (index >= htabslots) {
14454be21d56SDavid Gibson         assert(index == htabslots);
14464be21d56SDavid Gibson         index = 0;
14474be21d56SDavid Gibson     }
14484be21d56SDavid Gibson 
14494be21d56SDavid Gibson     spapr->htab_save_index = index;
14504be21d56SDavid Gibson 
1451e68cb8b4SAlexey Kardashevskiy     return (examined >= htabslots) && (sent == 0) ? 1 : 0;
14524be21d56SDavid Gibson }
14534be21d56SDavid Gibson 
1454e68cb8b4SAlexey Kardashevskiy #define MAX_ITERATION_NS    5000000 /* 5 ms */
1455e68cb8b4SAlexey Kardashevskiy #define MAX_KVM_BUF_SIZE    2048
1456e68cb8b4SAlexey Kardashevskiy 
14574be21d56SDavid Gibson static int htab_save_iterate(QEMUFile *f, void *opaque)
14584be21d56SDavid Gibson {
145928e02042SDavid Gibson     sPAPRMachineState *spapr = opaque;
1460715c5407SDavid Gibson     int fd;
1461e68cb8b4SAlexey Kardashevskiy     int rc = 0;
14624be21d56SDavid Gibson 
14634be21d56SDavid Gibson     /* Iteration header */
14644be21d56SDavid Gibson     qemu_put_be32(f, 0);
14654be21d56SDavid Gibson 
1466e68cb8b4SAlexey Kardashevskiy     if (!spapr->htab) {
1467e68cb8b4SAlexey Kardashevskiy         assert(kvm_enabled());
1468e68cb8b4SAlexey Kardashevskiy 
1469715c5407SDavid Gibson         fd = get_htab_fd(spapr);
1470715c5407SDavid Gibson         if (fd < 0) {
1471715c5407SDavid Gibson             return fd;
147201a57972SSamuel Mendoza-Jonas         }
147301a57972SSamuel Mendoza-Jonas 
1474715c5407SDavid Gibson         rc = kvmppc_save_htab(f, fd, MAX_KVM_BUF_SIZE, MAX_ITERATION_NS);
1475e68cb8b4SAlexey Kardashevskiy         if (rc < 0) {
1476e68cb8b4SAlexey Kardashevskiy             return rc;
1477e68cb8b4SAlexey Kardashevskiy         }
1478e68cb8b4SAlexey Kardashevskiy     } else  if (spapr->htab_first_pass) {
14794be21d56SDavid Gibson         htab_save_first_pass(f, spapr, MAX_ITERATION_NS);
14804be21d56SDavid Gibson     } else {
1481e68cb8b4SAlexey Kardashevskiy         rc = htab_save_later_pass(f, spapr, MAX_ITERATION_NS);
14824be21d56SDavid Gibson     }
14834be21d56SDavid Gibson 
14844be21d56SDavid Gibson     /* End marker */
14854be21d56SDavid Gibson     qemu_put_be32(f, 0);
14864be21d56SDavid Gibson     qemu_put_be16(f, 0);
14874be21d56SDavid Gibson     qemu_put_be16(f, 0);
14884be21d56SDavid Gibson 
1489e68cb8b4SAlexey Kardashevskiy     return rc;
14904be21d56SDavid Gibson }
14914be21d56SDavid Gibson 
14924be21d56SDavid Gibson static int htab_save_complete(QEMUFile *f, void *opaque)
14934be21d56SDavid Gibson {
149428e02042SDavid Gibson     sPAPRMachineState *spapr = opaque;
1495715c5407SDavid Gibson     int fd;
14964be21d56SDavid Gibson 
14974be21d56SDavid Gibson     /* Iteration header */
14984be21d56SDavid Gibson     qemu_put_be32(f, 0);
14994be21d56SDavid Gibson 
1500e68cb8b4SAlexey Kardashevskiy     if (!spapr->htab) {
1501e68cb8b4SAlexey Kardashevskiy         int rc;
1502e68cb8b4SAlexey Kardashevskiy 
1503e68cb8b4SAlexey Kardashevskiy         assert(kvm_enabled());
1504e68cb8b4SAlexey Kardashevskiy 
1505715c5407SDavid Gibson         fd = get_htab_fd(spapr);
1506715c5407SDavid Gibson         if (fd < 0) {
1507715c5407SDavid Gibson             return fd;
150801a57972SSamuel Mendoza-Jonas         }
150901a57972SSamuel Mendoza-Jonas 
1510715c5407SDavid Gibson         rc = kvmppc_save_htab(f, fd, MAX_KVM_BUF_SIZE, -1);
1511e68cb8b4SAlexey Kardashevskiy         if (rc < 0) {
1512e68cb8b4SAlexey Kardashevskiy             return rc;
1513e68cb8b4SAlexey Kardashevskiy         }
1514715c5407SDavid Gibson         close_htab_fd(spapr);
1515e68cb8b4SAlexey Kardashevskiy     } else {
1516378bc217SDavid Gibson         if (spapr->htab_first_pass) {
1517378bc217SDavid Gibson             htab_save_first_pass(f, spapr, -1);
1518378bc217SDavid Gibson         }
15194be21d56SDavid Gibson         htab_save_later_pass(f, spapr, -1);
1520e68cb8b4SAlexey Kardashevskiy     }
15214be21d56SDavid Gibson 
15224be21d56SDavid Gibson     /* End marker */
15234be21d56SDavid Gibson     qemu_put_be32(f, 0);
15244be21d56SDavid Gibson     qemu_put_be16(f, 0);
15254be21d56SDavid Gibson     qemu_put_be16(f, 0);
15264be21d56SDavid Gibson 
15274be21d56SDavid Gibson     return 0;
15284be21d56SDavid Gibson }
15294be21d56SDavid Gibson 
15304be21d56SDavid Gibson static int htab_load(QEMUFile *f, void *opaque, int version_id)
15314be21d56SDavid Gibson {
153228e02042SDavid Gibson     sPAPRMachineState *spapr = opaque;
15334be21d56SDavid Gibson     uint32_t section_hdr;
1534e68cb8b4SAlexey Kardashevskiy     int fd = -1;
15354be21d56SDavid Gibson 
15364be21d56SDavid Gibson     if (version_id < 1 || version_id > 1) {
153798a5d100SDavid Gibson         error_report("htab_load() bad version");
15384be21d56SDavid Gibson         return -EINVAL;
15394be21d56SDavid Gibson     }
15404be21d56SDavid Gibson 
15414be21d56SDavid Gibson     section_hdr = qemu_get_be32(f);
15424be21d56SDavid Gibson 
15434be21d56SDavid Gibson     if (section_hdr) {
15449897e462SGreg Kurz         Error *local_err = NULL;
1545c5f54f3eSDavid Gibson 
1546c5f54f3eSDavid Gibson         /* First section gives the htab size */
1547c5f54f3eSDavid Gibson         spapr_reallocate_hpt(spapr, section_hdr, &local_err);
1548c5f54f3eSDavid Gibson         if (local_err) {
1549c5f54f3eSDavid Gibson             error_report_err(local_err);
15504be21d56SDavid Gibson             return -EINVAL;
15514be21d56SDavid Gibson         }
15524be21d56SDavid Gibson         return 0;
15534be21d56SDavid Gibson     }
15544be21d56SDavid Gibson 
1555e68cb8b4SAlexey Kardashevskiy     if (!spapr->htab) {
1556e68cb8b4SAlexey Kardashevskiy         assert(kvm_enabled());
1557e68cb8b4SAlexey Kardashevskiy 
1558e68cb8b4SAlexey Kardashevskiy         fd = kvmppc_get_htab_fd(true);
1559e68cb8b4SAlexey Kardashevskiy         if (fd < 0) {
156098a5d100SDavid Gibson             error_report("Unable to open fd to restore KVM hash table: %s",
1561e68cb8b4SAlexey Kardashevskiy                          strerror(errno));
1562e68cb8b4SAlexey Kardashevskiy         }
1563e68cb8b4SAlexey Kardashevskiy     }
1564e68cb8b4SAlexey Kardashevskiy 
15654be21d56SDavid Gibson     while (true) {
15664be21d56SDavid Gibson         uint32_t index;
15674be21d56SDavid Gibson         uint16_t n_valid, n_invalid;
15684be21d56SDavid Gibson 
15694be21d56SDavid Gibson         index = qemu_get_be32(f);
15704be21d56SDavid Gibson         n_valid = qemu_get_be16(f);
15714be21d56SDavid Gibson         n_invalid = qemu_get_be16(f);
15724be21d56SDavid Gibson 
15734be21d56SDavid Gibson         if ((index == 0) && (n_valid == 0) && (n_invalid == 0)) {
15744be21d56SDavid Gibson             /* End of Stream */
15754be21d56SDavid Gibson             break;
15764be21d56SDavid Gibson         }
15774be21d56SDavid Gibson 
1578e68cb8b4SAlexey Kardashevskiy         if ((index + n_valid + n_invalid) >
15794be21d56SDavid Gibson             (HTAB_SIZE(spapr) / HASH_PTE_SIZE_64)) {
15804be21d56SDavid Gibson             /* Bad index in stream */
158198a5d100SDavid Gibson             error_report(
158298a5d100SDavid Gibson                 "htab_load() bad index %d (%hd+%hd entries) in htab stream (htab_shift=%d)",
158398a5d100SDavid Gibson                 index, n_valid, n_invalid, spapr->htab_shift);
15844be21d56SDavid Gibson             return -EINVAL;
15854be21d56SDavid Gibson         }
15864be21d56SDavid Gibson 
1587e68cb8b4SAlexey Kardashevskiy         if (spapr->htab) {
15884be21d56SDavid Gibson             if (n_valid) {
15894be21d56SDavid Gibson                 qemu_get_buffer(f, HPTE(spapr->htab, index),
15904be21d56SDavid Gibson                                 HASH_PTE_SIZE_64 * n_valid);
15914be21d56SDavid Gibson             }
15924be21d56SDavid Gibson             if (n_invalid) {
15934be21d56SDavid Gibson                 memset(HPTE(spapr->htab, index + n_valid), 0,
15944be21d56SDavid Gibson                        HASH_PTE_SIZE_64 * n_invalid);
15954be21d56SDavid Gibson             }
1596e68cb8b4SAlexey Kardashevskiy         } else {
1597e68cb8b4SAlexey Kardashevskiy             int rc;
1598e68cb8b4SAlexey Kardashevskiy 
1599e68cb8b4SAlexey Kardashevskiy             assert(fd >= 0);
1600e68cb8b4SAlexey Kardashevskiy 
1601e68cb8b4SAlexey Kardashevskiy             rc = kvmppc_load_htab_chunk(f, fd, index, n_valid, n_invalid);
1602e68cb8b4SAlexey Kardashevskiy             if (rc < 0) {
1603e68cb8b4SAlexey Kardashevskiy                 return rc;
1604e68cb8b4SAlexey Kardashevskiy             }
1605e68cb8b4SAlexey Kardashevskiy         }
1606e68cb8b4SAlexey Kardashevskiy     }
1607e68cb8b4SAlexey Kardashevskiy 
1608e68cb8b4SAlexey Kardashevskiy     if (!spapr->htab) {
1609e68cb8b4SAlexey Kardashevskiy         assert(fd >= 0);
1610e68cb8b4SAlexey Kardashevskiy         close(fd);
16114be21d56SDavid Gibson     }
16124be21d56SDavid Gibson 
16134be21d56SDavid Gibson     return 0;
16144be21d56SDavid Gibson }
16154be21d56SDavid Gibson 
16164be21d56SDavid Gibson static SaveVMHandlers savevm_htab_handlers = {
16174be21d56SDavid Gibson     .save_live_setup = htab_save_setup,
16184be21d56SDavid Gibson     .save_live_iterate = htab_save_iterate,
1619a3e06c3dSDr. David Alan Gilbert     .save_live_complete_precopy = htab_save_complete,
16204be21d56SDavid Gibson     .load_state = htab_load,
16214be21d56SDavid Gibson };
16224be21d56SDavid Gibson 
16235b2128d2SAlexander Graf static void spapr_boot_set(void *opaque, const char *boot_device,
16245b2128d2SAlexander Graf                            Error **errp)
16255b2128d2SAlexander Graf {
16265b2128d2SAlexander Graf     MachineState *machine = MACHINE(qdev_get_machine());
16275b2128d2SAlexander Graf     machine->boot_order = g_strdup(boot_device);
16285b2128d2SAlexander Graf }
16295b2128d2SAlexander Graf 
1630224245bfSDavid Gibson /*
1631224245bfSDavid Gibson  * Reset routine for LMB DR devices.
1632224245bfSDavid Gibson  *
1633224245bfSDavid Gibson  * Unlike PCI DR devices, LMB DR devices explicitly register this reset
1634224245bfSDavid Gibson  * routine. Reset for PCI DR devices will be handled by PHB reset routine
1635224245bfSDavid Gibson  * when it walks all its children devices. LMB devices reset occurs
1636224245bfSDavid Gibson  * as part of spapr_ppc_reset().
1637224245bfSDavid Gibson  */
1638224245bfSDavid Gibson static void spapr_drc_reset(void *opaque)
1639224245bfSDavid Gibson {
1640224245bfSDavid Gibson     sPAPRDRConnector *drc = opaque;
1641224245bfSDavid Gibson     DeviceState *d = DEVICE(drc);
1642224245bfSDavid Gibson 
1643224245bfSDavid Gibson     if (d) {
1644224245bfSDavid Gibson         device_reset(d);
1645224245bfSDavid Gibson     }
1646224245bfSDavid Gibson }
1647224245bfSDavid Gibson 
1648224245bfSDavid Gibson static void spapr_create_lmb_dr_connectors(sPAPRMachineState *spapr)
1649224245bfSDavid Gibson {
1650224245bfSDavid Gibson     MachineState *machine = MACHINE(spapr);
1651224245bfSDavid Gibson     uint64_t lmb_size = SPAPR_MEMORY_BLOCK_SIZE;
1652e8f986fcSBharata B Rao     uint32_t nr_lmbs = (machine->maxram_size - machine->ram_size)/lmb_size;
1653224245bfSDavid Gibson     int i;
1654224245bfSDavid Gibson 
1655224245bfSDavid Gibson     for (i = 0; i < nr_lmbs; i++) {
1656224245bfSDavid Gibson         sPAPRDRConnector *drc;
1657224245bfSDavid Gibson         uint64_t addr;
1658224245bfSDavid Gibson 
1659e8f986fcSBharata B Rao         addr = i * lmb_size + spapr->hotplug_memory.base;
1660224245bfSDavid Gibson         drc = spapr_dr_connector_new(OBJECT(spapr), SPAPR_DR_CONNECTOR_TYPE_LMB,
1661224245bfSDavid Gibson                                      addr/lmb_size);
1662224245bfSDavid Gibson         qemu_register_reset(spapr_drc_reset, drc);
1663224245bfSDavid Gibson     }
1664224245bfSDavid Gibson }
1665224245bfSDavid Gibson 
1666224245bfSDavid Gibson /*
1667224245bfSDavid Gibson  * If RAM size, maxmem size and individual node mem sizes aren't aligned
1668224245bfSDavid Gibson  * to SPAPR_MEMORY_BLOCK_SIZE(256MB), then refuse to start the guest
1669224245bfSDavid Gibson  * since we can't support such unaligned sizes with DRCONF_MEMORY.
1670224245bfSDavid Gibson  */
16717c150d6fSDavid Gibson static void spapr_validate_node_memory(MachineState *machine, Error **errp)
1672224245bfSDavid Gibson {
1673224245bfSDavid Gibson     int i;
1674224245bfSDavid Gibson 
16757c150d6fSDavid Gibson     if (machine->ram_size % SPAPR_MEMORY_BLOCK_SIZE) {
16767c150d6fSDavid Gibson         error_setg(errp, "Memory size 0x" RAM_ADDR_FMT
16777c150d6fSDavid Gibson                    " is not aligned to %llu MiB",
16787c150d6fSDavid Gibson                    machine->ram_size,
1679224245bfSDavid Gibson                    SPAPR_MEMORY_BLOCK_SIZE / M_BYTE);
16807c150d6fSDavid Gibson         return;
16817c150d6fSDavid Gibson     }
16827c150d6fSDavid Gibson 
16837c150d6fSDavid Gibson     if (machine->maxram_size % SPAPR_MEMORY_BLOCK_SIZE) {
16847c150d6fSDavid Gibson         error_setg(errp, "Maximum memory size 0x" RAM_ADDR_FMT
16857c150d6fSDavid Gibson                    " is not aligned to %llu MiB",
16867c150d6fSDavid Gibson                    machine->ram_size,
16877c150d6fSDavid Gibson                    SPAPR_MEMORY_BLOCK_SIZE / M_BYTE);
16887c150d6fSDavid Gibson         return;
1689224245bfSDavid Gibson     }
1690224245bfSDavid Gibson 
1691224245bfSDavid Gibson     for (i = 0; i < nb_numa_nodes; i++) {
1692224245bfSDavid Gibson         if (numa_info[i].node_mem % SPAPR_MEMORY_BLOCK_SIZE) {
16937c150d6fSDavid Gibson             error_setg(errp,
16947c150d6fSDavid Gibson                        "Node %d memory size 0x%" PRIx64
16957c150d6fSDavid Gibson                        " is not aligned to %llu MiB",
16967c150d6fSDavid Gibson                        i, numa_info[i].node_mem,
1697224245bfSDavid Gibson                        SPAPR_MEMORY_BLOCK_SIZE / M_BYTE);
16987c150d6fSDavid Gibson             return;
1699224245bfSDavid Gibson         }
1700224245bfSDavid Gibson     }
1701224245bfSDavid Gibson }
1702224245bfSDavid Gibson 
170353018216SPaolo Bonzini /* pSeries LPAR / sPAPR hardware init */
17043ef96221SMarcel Apfelbaum static void ppc_spapr_init(MachineState *machine)
170553018216SPaolo Bonzini {
170628e02042SDavid Gibson     sPAPRMachineState *spapr = SPAPR_MACHINE(machine);
1707224245bfSDavid Gibson     sPAPRMachineClass *smc = SPAPR_MACHINE_GET_CLASS(machine);
17083ef96221SMarcel Apfelbaum     const char *kernel_filename = machine->kernel_filename;
17093ef96221SMarcel Apfelbaum     const char *kernel_cmdline = machine->kernel_cmdline;
17103ef96221SMarcel Apfelbaum     const char *initrd_filename = machine->initrd_filename;
171153018216SPaolo Bonzini     PCIHostState *phb;
171253018216SPaolo Bonzini     int i;
171353018216SPaolo Bonzini     MemoryRegion *sysmem = get_system_memory();
171453018216SPaolo Bonzini     MemoryRegion *ram = g_new(MemoryRegion, 1);
1715658fa66bSAlexey Kardashevskiy     MemoryRegion *rma_region;
1716658fa66bSAlexey Kardashevskiy     void *rma = NULL;
171753018216SPaolo Bonzini     hwaddr rma_alloc_size;
1718b082d65aSAlexey Kardashevskiy     hwaddr node0_size = spapr_node0_size();
171953018216SPaolo Bonzini     uint32_t initrd_base = 0;
172053018216SPaolo Bonzini     long kernel_size = 0, initrd_size = 0;
1721b7d1f77aSBenjamin Herrenschmidt     long load_limit, fw_size;
172216457e7fSBenjamin Herrenschmidt     bool kernel_le = false;
172353018216SPaolo Bonzini     char *filename;
172494a94e4cSBharata B Rao     int smt = kvmppc_smt_threads();
172594a94e4cSBharata B Rao     int spapr_cores = smp_cpus / smp_threads;
172694a94e4cSBharata B Rao     int spapr_max_cores = max_cpus / smp_threads;
172794a94e4cSBharata B Rao 
172894a94e4cSBharata B Rao     if (smc->dr_cpu_enabled) {
172994a94e4cSBharata B Rao         if (smp_cpus % smp_threads) {
173094a94e4cSBharata B Rao             error_report("smp_cpus (%u) must be multiple of threads (%u)",
173194a94e4cSBharata B Rao                          smp_cpus, smp_threads);
173294a94e4cSBharata B Rao             exit(1);
173394a94e4cSBharata B Rao         }
173494a94e4cSBharata B Rao         if (max_cpus % smp_threads) {
173594a94e4cSBharata B Rao             error_report("max_cpus (%u) must be multiple of threads (%u)",
173694a94e4cSBharata B Rao                          max_cpus, smp_threads);
173794a94e4cSBharata B Rao             exit(1);
173894a94e4cSBharata B Rao         }
173994a94e4cSBharata B Rao     }
174053018216SPaolo Bonzini 
1741226419d6SMichael S. Tsirkin     msi_nonbroken = true;
174253018216SPaolo Bonzini 
174353018216SPaolo Bonzini     QLIST_INIT(&spapr->phbs);
174453018216SPaolo Bonzini 
174553018216SPaolo Bonzini     cpu_ppc_hypercall = emulate_spapr_hypercall;
174653018216SPaolo Bonzini 
174753018216SPaolo Bonzini     /* Allocate RMA if necessary */
1748658fa66bSAlexey Kardashevskiy     rma_alloc_size = kvmppc_alloc_rma(&rma);
174953018216SPaolo Bonzini 
175053018216SPaolo Bonzini     if (rma_alloc_size == -1) {
1751730fce59SThomas Huth         error_report("Unable to create RMA");
175253018216SPaolo Bonzini         exit(1);
175353018216SPaolo Bonzini     }
175453018216SPaolo Bonzini 
1755c4177479SAlexey Kardashevskiy     if (rma_alloc_size && (rma_alloc_size < node0_size)) {
175653018216SPaolo Bonzini         spapr->rma_size = rma_alloc_size;
175753018216SPaolo Bonzini     } else {
1758c4177479SAlexey Kardashevskiy         spapr->rma_size = node0_size;
175953018216SPaolo Bonzini 
176053018216SPaolo Bonzini         /* With KVM, we don't actually know whether KVM supports an
176153018216SPaolo Bonzini          * unbounded RMA (PR KVM) or is limited by the hash table size
176253018216SPaolo Bonzini          * (HV KVM using VRMA), so we always assume the latter
176353018216SPaolo Bonzini          *
176453018216SPaolo Bonzini          * In that case, we also limit the initial allocations for RTAS
176553018216SPaolo Bonzini          * etc... to 256M since we have no way to know what the VRMA size
176653018216SPaolo Bonzini          * is going to be as it depends on the size of the hash table
176753018216SPaolo Bonzini          * isn't determined yet.
176853018216SPaolo Bonzini          */
176953018216SPaolo Bonzini         if (kvm_enabled()) {
177053018216SPaolo Bonzini             spapr->vrma_adjust = 1;
177153018216SPaolo Bonzini             spapr->rma_size = MIN(spapr->rma_size, 0x10000000);
177253018216SPaolo Bonzini         }
177353018216SPaolo Bonzini     }
177453018216SPaolo Bonzini 
1775c4177479SAlexey Kardashevskiy     if (spapr->rma_size > node0_size) {
1776d54e4d76SDavid Gibson         error_report("Numa node 0 has to span the RMA (%#08"HWADDR_PRIx")",
1777c4177479SAlexey Kardashevskiy                      spapr->rma_size);
1778c4177479SAlexey Kardashevskiy         exit(1);
1779c4177479SAlexey Kardashevskiy     }
1780c4177479SAlexey Kardashevskiy 
1781b7d1f77aSBenjamin Herrenschmidt     /* Setup a load limit for the ramdisk leaving room for SLOF and FDT */
1782b7d1f77aSBenjamin Herrenschmidt     load_limit = MIN(spapr->rma_size, RTAS_MAX_ADDR) - FW_OVERHEAD;
178353018216SPaolo Bonzini 
17847b565160SDavid Gibson     /* Set up Interrupt Controller before we create the VCPUs */
1785446f16a6SMarcel Apfelbaum     spapr->icp = xics_system_init(machine,
178694a94e4cSBharata B Rao                                   DIV_ROUND_UP(max_cpus * smt, smp_threads),
17871e49182dSDavid Gibson                                   XICS_IRQS, &error_fatal);
17887b565160SDavid Gibson 
1789224245bfSDavid Gibson     if (smc->dr_lmb_enabled) {
17907c150d6fSDavid Gibson         spapr_validate_node_memory(machine, &error_fatal);
1791224245bfSDavid Gibson     }
1792224245bfSDavid Gibson 
179353018216SPaolo Bonzini     /* init CPUs */
179419fb2c36SBharata B Rao     if (machine->cpu_model == NULL) {
179519fb2c36SBharata B Rao         machine->cpu_model = kvm_enabled() ? "host" : "POWER7";
179653018216SPaolo Bonzini     }
179794a94e4cSBharata B Rao 
179894a94e4cSBharata B Rao     if (smc->dr_cpu_enabled) {
179994a94e4cSBharata B Rao         char *type = spapr_get_cpu_core_type(machine->cpu_model);
180094a94e4cSBharata B Rao 
180194a94e4cSBharata B Rao         spapr->cores = g_new0(Object *, spapr_max_cores);
1802af81cf32SBharata B Rao         for (i = 0; i < spapr_max_cores; i++) {
180394a94e4cSBharata B Rao             int core_dt_id = i * smt;
1804af81cf32SBharata B Rao             sPAPRDRConnector *drc =
1805af81cf32SBharata B Rao                 spapr_dr_connector_new(OBJECT(spapr),
1806af81cf32SBharata B Rao                                        SPAPR_DR_CONNECTOR_TYPE_CPU, core_dt_id);
1807af81cf32SBharata B Rao 
1808af81cf32SBharata B Rao             qemu_register_reset(spapr_drc_reset, drc);
1809af81cf32SBharata B Rao 
1810af81cf32SBharata B Rao             if (i < spapr_cores) {
1811af81cf32SBharata B Rao                 char *type = spapr_get_cpu_core_type(machine->cpu_model);
181294a94e4cSBharata B Rao                 Object *core;
181394a94e4cSBharata B Rao 
181494a94e4cSBharata B Rao                 if (!object_class_by_name(type)) {
181594a94e4cSBharata B Rao                     error_report("Unable to find sPAPR CPU Core definition");
181694a94e4cSBharata B Rao                     exit(1);
181794a94e4cSBharata B Rao                 }
181894a94e4cSBharata B Rao 
181994a94e4cSBharata B Rao                 core  = object_new(type);
182094a94e4cSBharata B Rao                 object_property_set_int(core, smp_threads, "nr-threads",
182194a94e4cSBharata B Rao                                         &error_fatal);
182294a94e4cSBharata B Rao                 object_property_set_int(core, core_dt_id, CPU_CORE_PROP_CORE_ID,
182394a94e4cSBharata B Rao                                         &error_fatal);
182494a94e4cSBharata B Rao                 object_property_set_bool(core, true, "realized", &error_fatal);
182594a94e4cSBharata B Rao             }
1826af81cf32SBharata B Rao         }
182794a94e4cSBharata B Rao         g_free(type);
182894a94e4cSBharata B Rao     } else {
182953018216SPaolo Bonzini         for (i = 0; i < smp_cpus; i++) {
183094a94e4cSBharata B Rao             PowerPCCPU *cpu = cpu_ppc_init(machine->cpu_model);
183153018216SPaolo Bonzini             if (cpu == NULL) {
1832569f4967SDavid Gibson                 error_report("Unable to find PowerPC CPU definition");
183353018216SPaolo Bonzini                 exit(1);
183453018216SPaolo Bonzini             }
1835569f4967SDavid Gibson             spapr_cpu_init(spapr, cpu, &error_fatal);
183653018216SPaolo Bonzini        }
183794a94e4cSBharata B Rao     }
183853018216SPaolo Bonzini 
1839026bfd89SDavid Gibson     if (kvm_enabled()) {
1840026bfd89SDavid Gibson         /* Enable H_LOGICAL_CI_* so SLOF can talk to in-kernel devices */
1841026bfd89SDavid Gibson         kvmppc_enable_logical_ci_hcalls();
1842ef9971ddSAlexey Kardashevskiy         kvmppc_enable_set_mode_hcall();
1843026bfd89SDavid Gibson     }
1844026bfd89SDavid Gibson 
184553018216SPaolo Bonzini     /* allocate RAM */
1846f92f5da1SAlexey Kardashevskiy     memory_region_allocate_system_memory(ram, NULL, "ppc_spapr.ram",
1847fb164994SDavid Gibson                                          machine->ram_size);
1848f92f5da1SAlexey Kardashevskiy     memory_region_add_subregion(sysmem, 0, ram);
184953018216SPaolo Bonzini 
1850658fa66bSAlexey Kardashevskiy     if (rma_alloc_size && rma) {
1851658fa66bSAlexey Kardashevskiy         rma_region = g_new(MemoryRegion, 1);
1852658fa66bSAlexey Kardashevskiy         memory_region_init_ram_ptr(rma_region, NULL, "ppc_spapr.rma",
1853658fa66bSAlexey Kardashevskiy                                    rma_alloc_size, rma);
1854658fa66bSAlexey Kardashevskiy         vmstate_register_ram_global(rma_region);
1855658fa66bSAlexey Kardashevskiy         memory_region_add_subregion(sysmem, 0, rma_region);
1856658fa66bSAlexey Kardashevskiy     }
1857658fa66bSAlexey Kardashevskiy 
18584a1c9cf0SBharata B Rao     /* initialize hotplug memory address space */
18594a1c9cf0SBharata B Rao     if (machine->ram_size < machine->maxram_size) {
18604a1c9cf0SBharata B Rao         ram_addr_t hotplug_mem_size = machine->maxram_size - machine->ram_size;
186171c9a3ddSBharata B Rao         /*
186271c9a3ddSBharata B Rao          * Limit the number of hotpluggable memory slots to half the number
186371c9a3ddSBharata B Rao          * slots that KVM supports, leaving the other half for PCI and other
186471c9a3ddSBharata B Rao          * devices. However ensure that number of slots doesn't drop below 32.
186571c9a3ddSBharata B Rao          */
186671c9a3ddSBharata B Rao         int max_memslots = kvm_enabled() ? kvm_get_max_memslots() / 2 :
186771c9a3ddSBharata B Rao                            SPAPR_MAX_RAM_SLOTS;
18684a1c9cf0SBharata B Rao 
186971c9a3ddSBharata B Rao         if (max_memslots < SPAPR_MAX_RAM_SLOTS) {
187071c9a3ddSBharata B Rao             max_memslots = SPAPR_MAX_RAM_SLOTS;
187171c9a3ddSBharata B Rao         }
187271c9a3ddSBharata B Rao         if (machine->ram_slots > max_memslots) {
1873d54e4d76SDavid Gibson             error_report("Specified number of memory slots %"
1874d54e4d76SDavid Gibson                          PRIu64" exceeds max supported %d",
187571c9a3ddSBharata B Rao                          machine->ram_slots, max_memslots);
1876d54e4d76SDavid Gibson             exit(1);
18774a1c9cf0SBharata B Rao         }
18784a1c9cf0SBharata B Rao 
18794a1c9cf0SBharata B Rao         spapr->hotplug_memory.base = ROUND_UP(machine->ram_size,
18804a1c9cf0SBharata B Rao                                               SPAPR_HOTPLUG_MEM_ALIGN);
18814a1c9cf0SBharata B Rao         memory_region_init(&spapr->hotplug_memory.mr, OBJECT(spapr),
18824a1c9cf0SBharata B Rao                            "hotplug-memory", hotplug_mem_size);
18834a1c9cf0SBharata B Rao         memory_region_add_subregion(sysmem, spapr->hotplug_memory.base,
18844a1c9cf0SBharata B Rao                                     &spapr->hotplug_memory.mr);
18854a1c9cf0SBharata B Rao     }
18864a1c9cf0SBharata B Rao 
1887224245bfSDavid Gibson     if (smc->dr_lmb_enabled) {
1888224245bfSDavid Gibson         spapr_create_lmb_dr_connectors(spapr);
1889224245bfSDavid Gibson     }
1890224245bfSDavid Gibson 
189153018216SPaolo Bonzini     filename = qemu_find_file(QEMU_FILE_TYPE_BIOS, "spapr-rtas.bin");
18924c56440dSStefan Weil     if (!filename) {
1893730fce59SThomas Huth         error_report("Could not find LPAR rtas '%s'", "spapr-rtas.bin");
18944c56440dSStefan Weil         exit(1);
18954c56440dSStefan Weil     }
1896b7d1f77aSBenjamin Herrenschmidt     spapr->rtas_size = get_image_size(filename);
18978afc22a2SZhou Jie     if (spapr->rtas_size < 0) {
18988afc22a2SZhou Jie         error_report("Could not get size of LPAR rtas '%s'", filename);
18998afc22a2SZhou Jie         exit(1);
19008afc22a2SZhou Jie     }
1901b7d1f77aSBenjamin Herrenschmidt     spapr->rtas_blob = g_malloc(spapr->rtas_size);
1902b7d1f77aSBenjamin Herrenschmidt     if (load_image_size(filename, spapr->rtas_blob, spapr->rtas_size) < 0) {
1903730fce59SThomas Huth         error_report("Could not load LPAR rtas '%s'", filename);
190453018216SPaolo Bonzini         exit(1);
190553018216SPaolo Bonzini     }
190653018216SPaolo Bonzini     if (spapr->rtas_size > RTAS_MAX_SIZE) {
1907730fce59SThomas Huth         error_report("RTAS too big ! 0x%zx bytes (max is 0x%x)",
19082f285bddSPeter Maydell                      (size_t)spapr->rtas_size, RTAS_MAX_SIZE);
190953018216SPaolo Bonzini         exit(1);
191053018216SPaolo Bonzini     }
191153018216SPaolo Bonzini     g_free(filename);
191253018216SPaolo Bonzini 
191353018216SPaolo Bonzini     /* Set up EPOW events infrastructure */
191453018216SPaolo Bonzini     spapr_events_init(spapr);
191553018216SPaolo Bonzini 
191612f42174SDavid Gibson     /* Set up the RTC RTAS interfaces */
191728df36a1SDavid Gibson     spapr_rtc_create(spapr);
191812f42174SDavid Gibson 
191953018216SPaolo Bonzini     /* Set up VIO bus */
192053018216SPaolo Bonzini     spapr->vio_bus = spapr_vio_bus_init();
192153018216SPaolo Bonzini 
192253018216SPaolo Bonzini     for (i = 0; i < MAX_SERIAL_PORTS; i++) {
192353018216SPaolo Bonzini         if (serial_hds[i]) {
192453018216SPaolo Bonzini             spapr_vty_create(spapr->vio_bus, serial_hds[i]);
192553018216SPaolo Bonzini         }
192653018216SPaolo Bonzini     }
192753018216SPaolo Bonzini 
192853018216SPaolo Bonzini     /* We always have at least the nvram device on VIO */
192953018216SPaolo Bonzini     spapr_create_nvram(spapr);
193053018216SPaolo Bonzini 
193153018216SPaolo Bonzini     /* Set up PCI */
193253018216SPaolo Bonzini     spapr_pci_rtas_init();
193353018216SPaolo Bonzini 
193489dfd6e1SDavid Gibson     phb = spapr_create_phb(spapr, 0);
193553018216SPaolo Bonzini 
193653018216SPaolo Bonzini     for (i = 0; i < nb_nics; i++) {
193753018216SPaolo Bonzini         NICInfo *nd = &nd_table[i];
193853018216SPaolo Bonzini 
193953018216SPaolo Bonzini         if (!nd->model) {
194053018216SPaolo Bonzini             nd->model = g_strdup("ibmveth");
194153018216SPaolo Bonzini         }
194253018216SPaolo Bonzini 
194353018216SPaolo Bonzini         if (strcmp(nd->model, "ibmveth") == 0) {
194453018216SPaolo Bonzini             spapr_vlan_create(spapr->vio_bus, nd);
194553018216SPaolo Bonzini         } else {
194629b358f9SDavid Gibson             pci_nic_init_nofail(&nd_table[i], phb->bus, nd->model, NULL);
194753018216SPaolo Bonzini         }
194853018216SPaolo Bonzini     }
194953018216SPaolo Bonzini 
195053018216SPaolo Bonzini     for (i = 0; i <= drive_get_max_bus(IF_SCSI); i++) {
195153018216SPaolo Bonzini         spapr_vscsi_create(spapr->vio_bus);
195253018216SPaolo Bonzini     }
195353018216SPaolo Bonzini 
195453018216SPaolo Bonzini     /* Graphics */
195514c6a894SDavid Gibson     if (spapr_vga_init(phb->bus, &error_fatal)) {
195653018216SPaolo Bonzini         spapr->has_graphics = true;
1957c6e76503SPaolo Bonzini         machine->usb |= defaults_enabled() && !machine->usb_disabled;
195853018216SPaolo Bonzini     }
195953018216SPaolo Bonzini 
19604ee9ced9SMarcel Apfelbaum     if (machine->usb) {
196157040d45SThomas Huth         if (smc->use_ohci_by_default) {
196253018216SPaolo Bonzini             pci_create_simple(phb->bus, -1, "pci-ohci");
196357040d45SThomas Huth         } else {
196457040d45SThomas Huth             pci_create_simple(phb->bus, -1, "nec-usb-xhci");
196557040d45SThomas Huth         }
1966c86580b8SMarkus Armbruster 
196753018216SPaolo Bonzini         if (spapr->has_graphics) {
1968c86580b8SMarkus Armbruster             USBBus *usb_bus = usb_bus_find(-1);
1969c86580b8SMarkus Armbruster 
1970c86580b8SMarkus Armbruster             usb_create_simple(usb_bus, "usb-kbd");
1971c86580b8SMarkus Armbruster             usb_create_simple(usb_bus, "usb-mouse");
197253018216SPaolo Bonzini         }
197353018216SPaolo Bonzini     }
197453018216SPaolo Bonzini 
197553018216SPaolo Bonzini     if (spapr->rma_size < (MIN_RMA_SLOF << 20)) {
1976d54e4d76SDavid Gibson         error_report(
1977d54e4d76SDavid Gibson             "pSeries SLOF firmware requires >= %ldM guest RMA (Real Mode Area memory)",
1978d54e4d76SDavid Gibson             MIN_RMA_SLOF);
197953018216SPaolo Bonzini         exit(1);
198053018216SPaolo Bonzini     }
198153018216SPaolo Bonzini 
198253018216SPaolo Bonzini     if (kernel_filename) {
198353018216SPaolo Bonzini         uint64_t lowaddr = 0;
198453018216SPaolo Bonzini 
198553018216SPaolo Bonzini         kernel_size = load_elf(kernel_filename, translate_kernel_address, NULL,
19867ef295eaSPeter Crosthwaite                                NULL, &lowaddr, NULL, 1, PPC_ELF_MACHINE,
19877ef295eaSPeter Crosthwaite                                0, 0);
19883b66da82SAlexey Kardashevskiy         if (kernel_size == ELF_LOAD_WRONG_ENDIAN) {
198916457e7fSBenjamin Herrenschmidt             kernel_size = load_elf(kernel_filename,
199016457e7fSBenjamin Herrenschmidt                                    translate_kernel_address, NULL,
19917ef295eaSPeter Crosthwaite                                    NULL, &lowaddr, NULL, 0, PPC_ELF_MACHINE,
19927ef295eaSPeter Crosthwaite                                    0, 0);
199316457e7fSBenjamin Herrenschmidt             kernel_le = kernel_size > 0;
199416457e7fSBenjamin Herrenschmidt         }
199516457e7fSBenjamin Herrenschmidt         if (kernel_size < 0) {
1996d54e4d76SDavid Gibson             error_report("error loading %s: %s",
19973b66da82SAlexey Kardashevskiy                          kernel_filename, load_elf_strerror(kernel_size));
199853018216SPaolo Bonzini             exit(1);
199953018216SPaolo Bonzini         }
200053018216SPaolo Bonzini 
200153018216SPaolo Bonzini         /* load initrd */
200253018216SPaolo Bonzini         if (initrd_filename) {
200353018216SPaolo Bonzini             /* Try to locate the initrd in the gap between the kernel
200453018216SPaolo Bonzini              * and the firmware. Add a bit of space just in case
200553018216SPaolo Bonzini              */
200653018216SPaolo Bonzini             initrd_base = (KERNEL_LOAD_ADDR + kernel_size + 0x1ffff) & ~0xffff;
200753018216SPaolo Bonzini             initrd_size = load_image_targphys(initrd_filename, initrd_base,
200853018216SPaolo Bonzini                                               load_limit - initrd_base);
200953018216SPaolo Bonzini             if (initrd_size < 0) {
2010d54e4d76SDavid Gibson                 error_report("could not load initial ram disk '%s'",
201153018216SPaolo Bonzini                              initrd_filename);
201253018216SPaolo Bonzini                 exit(1);
201353018216SPaolo Bonzini             }
201453018216SPaolo Bonzini         } else {
201553018216SPaolo Bonzini             initrd_base = 0;
201653018216SPaolo Bonzini             initrd_size = 0;
201753018216SPaolo Bonzini         }
201853018216SPaolo Bonzini     }
201953018216SPaolo Bonzini 
20208e7ea787SAndreas Färber     if (bios_name == NULL) {
20218e7ea787SAndreas Färber         bios_name = FW_FILE_NAME;
20228e7ea787SAndreas Färber     }
20238e7ea787SAndreas Färber     filename = qemu_find_file(QEMU_FILE_TYPE_BIOS, bios_name);
20244c56440dSStefan Weil     if (!filename) {
202568fea5a0SThomas Huth         error_report("Could not find LPAR firmware '%s'", bios_name);
20264c56440dSStefan Weil         exit(1);
20274c56440dSStefan Weil     }
202853018216SPaolo Bonzini     fw_size = load_image_targphys(filename, 0, FW_MAX_SIZE);
202968fea5a0SThomas Huth     if (fw_size <= 0) {
203068fea5a0SThomas Huth         error_report("Could not load LPAR firmware '%s'", filename);
203153018216SPaolo Bonzini         exit(1);
203253018216SPaolo Bonzini     }
203353018216SPaolo Bonzini     g_free(filename);
203453018216SPaolo Bonzini 
203528e02042SDavid Gibson     /* FIXME: Should register things through the MachineState's qdev
203628e02042SDavid Gibson      * interface, this is a legacy from the sPAPREnvironment structure
203728e02042SDavid Gibson      * which predated MachineState but had a similar function */
20384be21d56SDavid Gibson     vmstate_register(NULL, 0, &vmstate_spapr, spapr);
20394be21d56SDavid Gibson     register_savevm_live(NULL, "spapr/htab", -1, 1,
20404be21d56SDavid Gibson                          &savevm_htab_handlers, spapr);
20414be21d56SDavid Gibson 
204253018216SPaolo Bonzini     /* Prepare the device tree */
20433bbf37f2SAndreas Färber     spapr->fdt_skel = spapr_create_fdt_skel(initrd_base, initrd_size,
204416457e7fSBenjamin Herrenschmidt                                             kernel_size, kernel_le,
204531fe14d1SNathan Fontenot                                             kernel_cmdline,
204631fe14d1SNathan Fontenot                                             spapr->check_exception_irq);
204753018216SPaolo Bonzini     assert(spapr->fdt_skel != NULL);
20485b2128d2SAlexander Graf 
204946503c2bSMichael Roth     /* used by RTAS */
205046503c2bSMichael Roth     QTAILQ_INIT(&spapr->ccs_list);
205146503c2bSMichael Roth     qemu_register_reset(spapr_ccs_reset_hook, spapr);
205246503c2bSMichael Roth 
20535b2128d2SAlexander Graf     qemu_register_boot_set(spapr_boot_set, spapr);
205453018216SPaolo Bonzini }
205553018216SPaolo Bonzini 
/*
 * Translate a KVM type string into its numeric code.
 *
 * Returns 0 when @vm_type is NULL, 1 for "HV" and 2 for "PR".  Any other
 * string is reported with error_report() and the process exits with
 * status 1.
 */
static int spapr_kvm_type(const char *vm_type)
{
    if (vm_type == NULL) {
        return 0;
    }
    if (strcmp(vm_type, "HV") == 0) {
        return 1;
    }
    if (strcmp(vm_type, "PR") == 0) {
        return 2;
    }

    error_report("Unknown kvm-type specified '%s'", vm_type);
    exit(1);
}
2073135a129aSAneesh Kumar K.V 
207471461b0fSAlexey Kardashevskiy /*
2075627b84f4SGonglei  * Implementation of an interface to adjust firmware path
207671461b0fSAlexey Kardashevskiy  * for the bootindex property handling.
207771461b0fSAlexey Kardashevskiy  */
207871461b0fSAlexey Kardashevskiy static char *spapr_get_fw_dev_path(FWPathProvider *p, BusState *bus,
207971461b0fSAlexey Kardashevskiy                                    DeviceState *dev)
208071461b0fSAlexey Kardashevskiy {
208171461b0fSAlexey Kardashevskiy #define CAST(type, obj, name) \
208271461b0fSAlexey Kardashevskiy     ((type *)object_dynamic_cast(OBJECT(obj), (name)))
208371461b0fSAlexey Kardashevskiy     SCSIDevice *d = CAST(SCSIDevice,  dev, TYPE_SCSI_DEVICE);
208471461b0fSAlexey Kardashevskiy     sPAPRPHBState *phb = CAST(sPAPRPHBState, dev, TYPE_SPAPR_PCI_HOST_BRIDGE);
208571461b0fSAlexey Kardashevskiy 
208671461b0fSAlexey Kardashevskiy     if (d) {
208771461b0fSAlexey Kardashevskiy         void *spapr = CAST(void, bus->parent, "spapr-vscsi");
208871461b0fSAlexey Kardashevskiy         VirtIOSCSI *virtio = CAST(VirtIOSCSI, bus->parent, TYPE_VIRTIO_SCSI);
208971461b0fSAlexey Kardashevskiy         USBDevice *usb = CAST(USBDevice, bus->parent, TYPE_USB_DEVICE);
209071461b0fSAlexey Kardashevskiy 
209171461b0fSAlexey Kardashevskiy         if (spapr) {
209271461b0fSAlexey Kardashevskiy             /*
209371461b0fSAlexey Kardashevskiy              * Replace "channel@0/disk@0,0" with "disk@8000000000000000":
209471461b0fSAlexey Kardashevskiy              * We use SRP luns of the form 8000 | (bus << 8) | (id << 5) | lun
209571461b0fSAlexey Kardashevskiy              * in the top 16 bits of the 64-bit LUN
209671461b0fSAlexey Kardashevskiy              */
209771461b0fSAlexey Kardashevskiy             unsigned id = 0x8000 | (d->id << 8) | d->lun;
209871461b0fSAlexey Kardashevskiy             return g_strdup_printf("%s@%"PRIX64, qdev_fw_name(dev),
209971461b0fSAlexey Kardashevskiy                                    (uint64_t)id << 48);
210071461b0fSAlexey Kardashevskiy         } else if (virtio) {
210171461b0fSAlexey Kardashevskiy             /*
210271461b0fSAlexey Kardashevskiy              * We use SRP luns of the form 01000000 | (target << 8) | lun
210371461b0fSAlexey Kardashevskiy              * in the top 32 bits of the 64-bit LUN
210471461b0fSAlexey Kardashevskiy              * Note: the quote above is from SLOF and it is wrong,
210571461b0fSAlexey Kardashevskiy              * the actual binding is:
210671461b0fSAlexey Kardashevskiy              * swap 0100 or 10 << or 20 << ( target lun-id -- srplun )
210771461b0fSAlexey Kardashevskiy              */
210871461b0fSAlexey Kardashevskiy             unsigned id = 0x1000000 | (d->id << 16) | d->lun;
210971461b0fSAlexey Kardashevskiy             return g_strdup_printf("%s@%"PRIX64, qdev_fw_name(dev),
211071461b0fSAlexey Kardashevskiy                                    (uint64_t)id << 32);
211171461b0fSAlexey Kardashevskiy         } else if (usb) {
211271461b0fSAlexey Kardashevskiy             /*
211371461b0fSAlexey Kardashevskiy              * We use SRP luns of the form 01000000 | (usb-port << 16) | lun
211471461b0fSAlexey Kardashevskiy              * in the top 32 bits of the 64-bit LUN
211571461b0fSAlexey Kardashevskiy              */
211671461b0fSAlexey Kardashevskiy             unsigned usb_port = atoi(usb->port->path);
211771461b0fSAlexey Kardashevskiy             unsigned id = 0x1000000 | (usb_port << 16) | d->lun;
211871461b0fSAlexey Kardashevskiy             return g_strdup_printf("%s@%"PRIX64, qdev_fw_name(dev),
211971461b0fSAlexey Kardashevskiy                                    (uint64_t)id << 32);
212071461b0fSAlexey Kardashevskiy         }
212171461b0fSAlexey Kardashevskiy     }
212271461b0fSAlexey Kardashevskiy 
212371461b0fSAlexey Kardashevskiy     if (phb) {
212471461b0fSAlexey Kardashevskiy         /* Replace "pci" with "pci@800000020000000" */
212571461b0fSAlexey Kardashevskiy         return g_strdup_printf("pci@%"PRIX64, phb->buid);
212671461b0fSAlexey Kardashevskiy     }
212771461b0fSAlexey Kardashevskiy 
212871461b0fSAlexey Kardashevskiy     return NULL;
212971461b0fSAlexey Kardashevskiy }
213071461b0fSAlexey Kardashevskiy 
213123825581SEduardo Habkost static char *spapr_get_kvm_type(Object *obj, Error **errp)
213223825581SEduardo Habkost {
213328e02042SDavid Gibson     sPAPRMachineState *spapr = SPAPR_MACHINE(obj);
213423825581SEduardo Habkost 
213528e02042SDavid Gibson     return g_strdup(spapr->kvm_type);
213623825581SEduardo Habkost }
213723825581SEduardo Habkost 
213823825581SEduardo Habkost static void spapr_set_kvm_type(Object *obj, const char *value, Error **errp)
213923825581SEduardo Habkost {
214028e02042SDavid Gibson     sPAPRMachineState *spapr = SPAPR_MACHINE(obj);
214123825581SEduardo Habkost 
214228e02042SDavid Gibson     g_free(spapr->kvm_type);
214328e02042SDavid Gibson     spapr->kvm_type = g_strdup(value);
214423825581SEduardo Habkost }
214523825581SEduardo Habkost 
214623825581SEduardo Habkost static void spapr_machine_initfn(Object *obj)
214723825581SEduardo Habkost {
2148715c5407SDavid Gibson     sPAPRMachineState *spapr = SPAPR_MACHINE(obj);
2149715c5407SDavid Gibson 
2150715c5407SDavid Gibson     spapr->htab_fd = -1;
215123825581SEduardo Habkost     object_property_add_str(obj, "kvm-type",
215223825581SEduardo Habkost                             spapr_get_kvm_type, spapr_set_kvm_type, NULL);
215349d2e648SMarcel Apfelbaum     object_property_set_description(obj, "kvm-type",
215449d2e648SMarcel Apfelbaum                                     "Specifies the KVM virtualization mode (HV, PR)",
215549d2e648SMarcel Apfelbaum                                     NULL);
215623825581SEduardo Habkost }
215723825581SEduardo Habkost 
215887bbdd9cSDavid Gibson static void spapr_machine_finalizefn(Object *obj)
215987bbdd9cSDavid Gibson {
216087bbdd9cSDavid Gibson     sPAPRMachineState *spapr = SPAPR_MACHINE(obj);
216187bbdd9cSDavid Gibson 
216287bbdd9cSDavid Gibson     g_free(spapr->kvm_type);
216387bbdd9cSDavid Gibson }
216487bbdd9cSDavid Gibson 
216534316482SAlexey Kardashevskiy static void ppc_cpu_do_nmi_on_cpu(void *arg)
216634316482SAlexey Kardashevskiy {
216734316482SAlexey Kardashevskiy     CPUState *cs = arg;
216834316482SAlexey Kardashevskiy 
216934316482SAlexey Kardashevskiy     cpu_synchronize_state(cs);
217034316482SAlexey Kardashevskiy     ppc_cpu_do_system_reset(cs);
217134316482SAlexey Kardashevskiy }
217234316482SAlexey Kardashevskiy 
217334316482SAlexey Kardashevskiy static void spapr_nmi(NMIState *n, int cpu_index, Error **errp)
217434316482SAlexey Kardashevskiy {
217534316482SAlexey Kardashevskiy     CPUState *cs;
217634316482SAlexey Kardashevskiy 
217734316482SAlexey Kardashevskiy     CPU_FOREACH(cs) {
217834316482SAlexey Kardashevskiy         async_run_on_cpu(cs, ppc_cpu_do_nmi_on_cpu, cs);
217934316482SAlexey Kardashevskiy     }
218034316482SAlexey Kardashevskiy }
218134316482SAlexey Kardashevskiy 
2182c20d332aSBharata B Rao static void spapr_add_lmbs(DeviceState *dev, uint64_t addr, uint64_t size,
2183c20d332aSBharata B Rao                            uint32_t node, Error **errp)
2184c20d332aSBharata B Rao {
2185c20d332aSBharata B Rao     sPAPRDRConnector *drc;
2186c20d332aSBharata B Rao     sPAPRDRConnectorClass *drck;
2187c20d332aSBharata B Rao     uint32_t nr_lmbs = size/SPAPR_MEMORY_BLOCK_SIZE;
2188c20d332aSBharata B Rao     int i, fdt_offset, fdt_size;
2189c20d332aSBharata B Rao     void *fdt;
2190c20d332aSBharata B Rao 
2191c20d332aSBharata B Rao     for (i = 0; i < nr_lmbs; i++) {
2192c20d332aSBharata B Rao         drc = spapr_dr_connector_by_id(SPAPR_DR_CONNECTOR_TYPE_LMB,
2193c20d332aSBharata B Rao                 addr/SPAPR_MEMORY_BLOCK_SIZE);
2194c20d332aSBharata B Rao         g_assert(drc);
2195c20d332aSBharata B Rao 
2196c20d332aSBharata B Rao         fdt = create_device_tree(&fdt_size);
2197c20d332aSBharata B Rao         fdt_offset = spapr_populate_memory_node(fdt, node, addr,
2198c20d332aSBharata B Rao                                                 SPAPR_MEMORY_BLOCK_SIZE);
2199c20d332aSBharata B Rao 
2200c20d332aSBharata B Rao         drck = SPAPR_DR_CONNECTOR_GET_CLASS(drc);
2201c20d332aSBharata B Rao         drck->attach(drc, dev, fdt, fdt_offset, !dev->hotplugged, errp);
2202c20d332aSBharata B Rao         addr += SPAPR_MEMORY_BLOCK_SIZE;
2203c20d332aSBharata B Rao     }
22045dd5238cSJianjun Duan     /* send hotplug notification to the
22055dd5238cSJianjun Duan      * guest only in case of hotplugged memory
22065dd5238cSJianjun Duan      */
22075dd5238cSJianjun Duan     if (dev->hotplugged) {
22080a417869SBharata B Rao        spapr_hotplug_req_add_by_count(SPAPR_DR_CONNECTOR_TYPE_LMB, nr_lmbs);
2209c20d332aSBharata B Rao     }
22105dd5238cSJianjun Duan }
2211c20d332aSBharata B Rao 
2212c20d332aSBharata B Rao static void spapr_memory_plug(HotplugHandler *hotplug_dev, DeviceState *dev,
2213c20d332aSBharata B Rao                               uint32_t node, Error **errp)
2214c20d332aSBharata B Rao {
2215c20d332aSBharata B Rao     Error *local_err = NULL;
2216c20d332aSBharata B Rao     sPAPRMachineState *ms = SPAPR_MACHINE(hotplug_dev);
2217c20d332aSBharata B Rao     PCDIMMDevice *dimm = PC_DIMM(dev);
2218c20d332aSBharata B Rao     PCDIMMDeviceClass *ddc = PC_DIMM_GET_CLASS(dimm);
2219c20d332aSBharata B Rao     MemoryRegion *mr = ddc->get_memory_region(dimm);
2220c20d332aSBharata B Rao     uint64_t align = memory_region_get_alignment(mr);
2221c20d332aSBharata B Rao     uint64_t size = memory_region_size(mr);
2222c20d332aSBharata B Rao     uint64_t addr;
2223c20d332aSBharata B Rao 
2224c20d332aSBharata B Rao     if (size % SPAPR_MEMORY_BLOCK_SIZE) {
2225c20d332aSBharata B Rao         error_setg(&local_err, "Hotplugged memory size must be a multiple of "
2226c20d332aSBharata B Rao                       "%lld MB", SPAPR_MEMORY_BLOCK_SIZE/M_BYTE);
2227c20d332aSBharata B Rao         goto out;
2228c20d332aSBharata B Rao     }
2229c20d332aSBharata B Rao 
2230d6a9b0b8SMichael S. Tsirkin     pc_dimm_memory_plug(dev, &ms->hotplug_memory, mr, align, &local_err);
2231c20d332aSBharata B Rao     if (local_err) {
2232c20d332aSBharata B Rao         goto out;
2233c20d332aSBharata B Rao     }
2234c20d332aSBharata B Rao 
2235c20d332aSBharata B Rao     addr = object_property_get_int(OBJECT(dimm), PC_DIMM_ADDR_PROP, &local_err);
2236c20d332aSBharata B Rao     if (local_err) {
2237c20d332aSBharata B Rao         pc_dimm_memory_unplug(dev, &ms->hotplug_memory, mr);
2238c20d332aSBharata B Rao         goto out;
2239c20d332aSBharata B Rao     }
2240c20d332aSBharata B Rao 
2241c20d332aSBharata B Rao     spapr_add_lmbs(dev, addr, size, node, &error_abort);
2242c20d332aSBharata B Rao 
2243c20d332aSBharata B Rao out:
2244c20d332aSBharata B Rao     error_propagate(errp, local_err);
2245c20d332aSBharata B Rao }
2246c20d332aSBharata B Rao 
2247af81cf32SBharata B Rao void *spapr_populate_hotplug_cpu_dt(CPUState *cs, int *fdt_offset,
2248af81cf32SBharata B Rao                                     sPAPRMachineState *spapr)
2249af81cf32SBharata B Rao {
2250af81cf32SBharata B Rao     PowerPCCPU *cpu = POWERPC_CPU(cs);
2251af81cf32SBharata B Rao     DeviceClass *dc = DEVICE_GET_CLASS(cs);
2252af81cf32SBharata B Rao     int id = ppc_get_vcpu_dt_id(cpu);
2253af81cf32SBharata B Rao     void *fdt;
2254af81cf32SBharata B Rao     int offset, fdt_size;
2255af81cf32SBharata B Rao     char *nodename;
2256af81cf32SBharata B Rao 
2257af81cf32SBharata B Rao     fdt = create_device_tree(&fdt_size);
2258af81cf32SBharata B Rao     nodename = g_strdup_printf("%s@%x", dc->fw_name, id);
2259af81cf32SBharata B Rao     offset = fdt_add_subnode(fdt, 0, nodename);
2260af81cf32SBharata B Rao 
2261af81cf32SBharata B Rao     spapr_populate_cpu_dt(cs, fdt, offset, spapr);
2262af81cf32SBharata B Rao     g_free(nodename);
2263af81cf32SBharata B Rao 
2264af81cf32SBharata B Rao     *fdt_offset = offset;
2265af81cf32SBharata B Rao     return fdt;
2266af81cf32SBharata B Rao }
2267af81cf32SBharata B Rao 
2268c20d332aSBharata B Rao static void spapr_machine_device_plug(HotplugHandler *hotplug_dev,
2269c20d332aSBharata B Rao                                       DeviceState *dev, Error **errp)
2270c20d332aSBharata B Rao {
2271c20d332aSBharata B Rao     sPAPRMachineClass *smc = SPAPR_MACHINE_GET_CLASS(qdev_get_machine());
2272c20d332aSBharata B Rao 
2273c20d332aSBharata B Rao     if (object_dynamic_cast(OBJECT(dev), TYPE_PC_DIMM)) {
2274b556854bSBharata B Rao         int node;
2275c20d332aSBharata B Rao 
2276c20d332aSBharata B Rao         if (!smc->dr_lmb_enabled) {
2277c20d332aSBharata B Rao             error_setg(errp, "Memory hotplug not supported for this machine");
2278c20d332aSBharata B Rao             return;
2279c20d332aSBharata B Rao         }
2280c20d332aSBharata B Rao         node = object_property_get_int(OBJECT(dev), PC_DIMM_NODE_PROP, errp);
2281c20d332aSBharata B Rao         if (*errp) {
2282c20d332aSBharata B Rao             return;
2283c20d332aSBharata B Rao         }
22841a5512bbSGonglei         if (node < 0 || node >= MAX_NODES) {
22851a5512bbSGonglei             error_setg(errp, "Invaild node %d", node);
22861a5512bbSGonglei             return;
22871a5512bbSGonglei         }
2288c20d332aSBharata B Rao 
2289b556854bSBharata B Rao         /*
2290b556854bSBharata B Rao          * Currently PowerPC kernel doesn't allow hot-adding memory to
2291b556854bSBharata B Rao          * memory-less node, but instead will silently add the memory
2292b556854bSBharata B Rao          * to the first node that has some memory. This causes two
2293b556854bSBharata B Rao          * unexpected behaviours for the user.
2294b556854bSBharata B Rao          *
2295b556854bSBharata B Rao          * - Memory gets hotplugged to a different node than what the user
2296b556854bSBharata B Rao          *   specified.
2297b556854bSBharata B Rao          * - Since pc-dimm subsystem in QEMU still thinks that memory belongs
2298b556854bSBharata B Rao          *   to memory-less node, a reboot will set things accordingly
2299b556854bSBharata B Rao          *   and the previously hotplugged memory now ends in the right node.
2300b556854bSBharata B Rao          *   This appears as if some memory moved from one node to another.
2301b556854bSBharata B Rao          *
2302b556854bSBharata B Rao          * So until kernel starts supporting memory hotplug to memory-less
2303b556854bSBharata B Rao          * nodes, just prevent such attempts upfront in QEMU.
2304b556854bSBharata B Rao          */
2305b556854bSBharata B Rao         if (nb_numa_nodes && !numa_info[node].node_mem) {
2306b556854bSBharata B Rao             error_setg(errp, "Can't hotplug memory to memory-less node %d",
2307b556854bSBharata B Rao                        node);
2308b556854bSBharata B Rao             return;
2309b556854bSBharata B Rao         }
2310b556854bSBharata B Rao 
2311c20d332aSBharata B Rao         spapr_memory_plug(hotplug_dev, dev, node, errp);
2312af81cf32SBharata B Rao     } else if (object_dynamic_cast(OBJECT(dev), TYPE_SPAPR_CPU_CORE)) {
2313af81cf32SBharata B Rao         spapr_core_plug(hotplug_dev, dev, errp);
2314c20d332aSBharata B Rao     }
2315c20d332aSBharata B Rao }
2316c20d332aSBharata B Rao 
2317c20d332aSBharata B Rao static void spapr_machine_device_unplug(HotplugHandler *hotplug_dev,
2318c20d332aSBharata B Rao                                       DeviceState *dev, Error **errp)
2319c20d332aSBharata B Rao {
23206f4b5c3eSBharata B Rao     sPAPRMachineClass *smc = SPAPR_MACHINE_GET_CLASS(qdev_get_machine());
23216f4b5c3eSBharata B Rao 
2322c20d332aSBharata B Rao     if (object_dynamic_cast(OBJECT(dev), TYPE_PC_DIMM)) {
2323c20d332aSBharata B Rao         error_setg(errp, "Memory hot unplug not supported by sPAPR");
23246f4b5c3eSBharata B Rao     } else if (object_dynamic_cast(OBJECT(dev), TYPE_SPAPR_CPU_CORE)) {
23256f4b5c3eSBharata B Rao         if (!smc->dr_cpu_enabled) {
23266f4b5c3eSBharata B Rao             error_setg(errp, "CPU hot unplug not supported on this machine");
23276f4b5c3eSBharata B Rao             return;
23286f4b5c3eSBharata B Rao         }
23296f4b5c3eSBharata B Rao         spapr_core_unplug(hotplug_dev, dev, errp);
2330c20d332aSBharata B Rao     }
2331c20d332aSBharata B Rao }
2332c20d332aSBharata B Rao 
233394a94e4cSBharata B Rao static void spapr_machine_device_pre_plug(HotplugHandler *hotplug_dev,
233494a94e4cSBharata B Rao                                           DeviceState *dev, Error **errp)
233594a94e4cSBharata B Rao {
233694a94e4cSBharata B Rao     if (object_dynamic_cast(OBJECT(dev), TYPE_SPAPR_CPU_CORE)) {
233794a94e4cSBharata B Rao         spapr_core_pre_plug(hotplug_dev, dev, errp);
233894a94e4cSBharata B Rao     }
233994a94e4cSBharata B Rao }
234094a94e4cSBharata B Rao 
2341c20d332aSBharata B Rao static HotplugHandler *spapr_get_hotpug_handler(MachineState *machine,
2342c20d332aSBharata B Rao                                              DeviceState *dev)
2343c20d332aSBharata B Rao {
234494a94e4cSBharata B Rao     if (object_dynamic_cast(OBJECT(dev), TYPE_PC_DIMM) ||
234594a94e4cSBharata B Rao         object_dynamic_cast(OBJECT(dev), TYPE_SPAPR_CPU_CORE)) {
2346c20d332aSBharata B Rao         return HOTPLUG_HANDLER(machine);
2347c20d332aSBharata B Rao     }
2348c20d332aSBharata B Rao     return NULL;
2349c20d332aSBharata B Rao }
2350c20d332aSBharata B Rao 
235120bb648dSDavid Gibson static unsigned spapr_cpu_index_to_socket_id(unsigned cpu_index)
235220bb648dSDavid Gibson {
235320bb648dSDavid Gibson     /* Allocate to NUMA nodes on a "socket" basis (not that concept of
235420bb648dSDavid Gibson      * socket means much for the paravirtualized PAPR platform) */
235520bb648dSDavid Gibson     return cpu_index / smp_threads / smp_cores;
235620bb648dSDavid Gibson }
235720bb648dSDavid Gibson 
23582474bfd4SIgor Mammedov static HotpluggableCPUList *spapr_query_hotpluggable_cpus(MachineState *machine)
23592474bfd4SIgor Mammedov {
23602474bfd4SIgor Mammedov     int i;
23612474bfd4SIgor Mammedov     HotpluggableCPUList *head = NULL;
23622474bfd4SIgor Mammedov     sPAPRMachineState *spapr = SPAPR_MACHINE(machine);
23632474bfd4SIgor Mammedov     int spapr_max_cores = max_cpus / smp_threads;
23642474bfd4SIgor Mammedov     int smt = kvmppc_smt_threads();
23652474bfd4SIgor Mammedov 
23662474bfd4SIgor Mammedov     for (i = 0; i < spapr_max_cores; i++) {
23672474bfd4SIgor Mammedov         HotpluggableCPUList *list_item = g_new0(typeof(*list_item), 1);
23682474bfd4SIgor Mammedov         HotpluggableCPU *cpu_item = g_new0(typeof(*cpu_item), 1);
23692474bfd4SIgor Mammedov         CpuInstanceProperties *cpu_props = g_new0(typeof(*cpu_props), 1);
23702474bfd4SIgor Mammedov 
23712474bfd4SIgor Mammedov         cpu_item->type = spapr_get_cpu_core_type(machine->cpu_model);
23722474bfd4SIgor Mammedov         cpu_item->vcpus_count = smp_threads;
237327393c33SPeter Krempa         cpu_props->has_core_id = true;
237427393c33SPeter Krempa         cpu_props->core_id = i * smt;
23752474bfd4SIgor Mammedov         /* TODO: add 'has_node/node' here to describe
23762474bfd4SIgor Mammedov            to which node core belongs */
23772474bfd4SIgor Mammedov 
23782474bfd4SIgor Mammedov         cpu_item->props = cpu_props;
23792474bfd4SIgor Mammedov         if (spapr->cores[i]) {
23802474bfd4SIgor Mammedov             cpu_item->has_qom_path = true;
23812474bfd4SIgor Mammedov             cpu_item->qom_path = object_get_canonical_path(spapr->cores[i]);
23822474bfd4SIgor Mammedov         }
23832474bfd4SIgor Mammedov         list_item->value = cpu_item;
23842474bfd4SIgor Mammedov         list_item->next = head;
23852474bfd4SIgor Mammedov         head = list_item;
23862474bfd4SIgor Mammedov     }
23872474bfd4SIgor Mammedov     return head;
23882474bfd4SIgor Mammedov }
23892474bfd4SIgor Mammedov 
239029ee3247SAlexey Kardashevskiy static void spapr_machine_class_init(ObjectClass *oc, void *data)
239153018216SPaolo Bonzini {
239229ee3247SAlexey Kardashevskiy     MachineClass *mc = MACHINE_CLASS(oc);
2393224245bfSDavid Gibson     sPAPRMachineClass *smc = SPAPR_MACHINE_CLASS(oc);
239471461b0fSAlexey Kardashevskiy     FWPathProviderClass *fwc = FW_PATH_PROVIDER_CLASS(oc);
239534316482SAlexey Kardashevskiy     NMIClass *nc = NMI_CLASS(oc);
2396c20d332aSBharata B Rao     HotplugHandlerClass *hc = HOTPLUG_HANDLER_CLASS(oc);
239729ee3247SAlexey Kardashevskiy 
23980eb9054cSDavid Gibson     mc->desc = "pSeries Logical Partition (PAPR compliant)";
2399fc9f38c3SDavid Gibson 
2400fc9f38c3SDavid Gibson     /*
2401fc9f38c3SDavid Gibson      * We set up the default / latest behaviour here.  The class_init
2402fc9f38c3SDavid Gibson      * functions for the specific versioned machine types can override
2403fc9f38c3SDavid Gibson      * these details for backwards compatibility
2404fc9f38c3SDavid Gibson      */
2405958db90cSMarcel Apfelbaum     mc->init = ppc_spapr_init;
2406958db90cSMarcel Apfelbaum     mc->reset = ppc_spapr_reset;
2407958db90cSMarcel Apfelbaum     mc->block_default_type = IF_SCSI;
240838b02bd8SAlexey Kardashevskiy     mc->max_cpus = MAX_CPUMASK_BITS;
2409958db90cSMarcel Apfelbaum     mc->no_parallel = 1;
24105b2128d2SAlexander Graf     mc->default_boot_order = "";
2411a34944feSNikunj A Dadhania     mc->default_ram_size = 512 * M_BYTE;
2412958db90cSMarcel Apfelbaum     mc->kvm_type = spapr_kvm_type;
24139e3f9733SAlexander Graf     mc->has_dynamic_sysbus = true;
2414e4024630SLaurent Vivier     mc->pci_allow_0_address = true;
2415c20d332aSBharata B Rao     mc->get_hotplug_handler = spapr_get_hotpug_handler;
241694a94e4cSBharata B Rao     hc->pre_plug = spapr_machine_device_pre_plug;
2417c20d332aSBharata B Rao     hc->plug = spapr_machine_device_plug;
2418c20d332aSBharata B Rao     hc->unplug = spapr_machine_device_unplug;
241920bb648dSDavid Gibson     mc->cpu_index_to_socket_id = spapr_cpu_index_to_socket_id;
24202474bfd4SIgor Mammedov     mc->query_hotpluggable_cpus = spapr_query_hotpluggable_cpus;
242100b4fbe2SMarcel Apfelbaum 
2422fc9f38c3SDavid Gibson     smc->dr_lmb_enabled = true;
242394a94e4cSBharata B Rao     smc->dr_cpu_enabled = true;
242471461b0fSAlexey Kardashevskiy     fwc->get_dev_path = spapr_get_fw_dev_path;
242534316482SAlexey Kardashevskiy     nc->nmi_monitor_handler = spapr_nmi;
242653018216SPaolo Bonzini }
242753018216SPaolo Bonzini 
242829ee3247SAlexey Kardashevskiy static const TypeInfo spapr_machine_info = {
242929ee3247SAlexey Kardashevskiy     .name          = TYPE_SPAPR_MACHINE,
243029ee3247SAlexey Kardashevskiy     .parent        = TYPE_MACHINE,
24314aee7362SDavid Gibson     .abstract      = true,
24326ca1502eSAlexey Kardashevskiy     .instance_size = sizeof(sPAPRMachineState),
243323825581SEduardo Habkost     .instance_init = spapr_machine_initfn,
243487bbdd9cSDavid Gibson     .instance_finalize = spapr_machine_finalizefn,
2435183930c0SDavid Gibson     .class_size    = sizeof(sPAPRMachineClass),
243629ee3247SAlexey Kardashevskiy     .class_init    = spapr_machine_class_init,
243771461b0fSAlexey Kardashevskiy     .interfaces = (InterfaceInfo[]) {
243871461b0fSAlexey Kardashevskiy         { TYPE_FW_PATH_PROVIDER },
243934316482SAlexey Kardashevskiy         { TYPE_NMI },
2440c20d332aSBharata B Rao         { TYPE_HOTPLUG_HANDLER },
244171461b0fSAlexey Kardashevskiy         { }
244271461b0fSAlexey Kardashevskiy     },
244329ee3247SAlexey Kardashevskiy };
244429ee3247SAlexey Kardashevskiy 
/*
 * DEFINE_SPAPR_MACHINE(suffix, verstr, latest)
 *
 * Defines and registers the versioned machine type "pseries-<verstr>" as
 * a child of TYPE_SPAPR_MACHINE. The user must provide
 * spapr_machine_<suffix>_class_options() and
 * spapr_machine_<suffix>_instance_options(); they are called from the
 * generated class and instance initializers. When @latest is true the
 * type also gets the "pseries" alias and becomes the default machine.
 *
 * The expansion ends without a semicolon, so the invocation supplies it.
 */
#define DEFINE_SPAPR_MACHINE(suffix, verstr, latest)                      \
    static void spapr_machine_##suffix##_class_init(ObjectClass *oc,      \
                                                    void *data)           \
    {                                                                     \
        MachineClass *machine_class = MACHINE_CLASS(oc);                  \
                                                                          \
        spapr_machine_##suffix##_class_options(machine_class);            \
        if (latest) {                                                     \
            machine_class->alias = "pseries";                             \
            machine_class->is_default = 1;                                \
        }                                                                 \
    }                                                                     \
                                                                          \
    static void spapr_machine_##suffix##_instance_init(Object *obj)       \
    {                                                                     \
        MachineState *machine_state = MACHINE(obj);                       \
                                                                          \
        spapr_machine_##suffix##_instance_options(machine_state);         \
    }                                                                     \
                                                                          \
    static const TypeInfo spapr_machine_##suffix##_info = {               \
        .name = MACHINE_TYPE_NAME("pseries-" verstr),                     \
        .parent = TYPE_SPAPR_MACHINE,                                     \
        .class_init = spapr_machine_##suffix##_class_init,                \
        .instance_init = spapr_machine_##suffix##_instance_init,          \
    };                                                                    \
                                                                          \
    static void spapr_machine_register_##suffix(void)                     \
    {                                                                     \
        type_register(&spapr_machine_##suffix##_info);                    \
    }                                                                     \
    type_init(spapr_machine_register_##suffix)
24725013c547SDavid Gibson 
24731c5f29bbSDavid Gibson /*
24741ea1eefcSBharata B Rao  * pseries-2.7
24751ea1eefcSBharata B Rao  */
24761ea1eefcSBharata B Rao static void spapr_machine_2_7_instance_options(MachineState *machine)
24771ea1eefcSBharata B Rao {
24781ea1eefcSBharata B Rao }
24791ea1eefcSBharata B Rao 
24801ea1eefcSBharata B Rao static void spapr_machine_2_7_class_options(MachineClass *mc)
24811ea1eefcSBharata B Rao {
24821ea1eefcSBharata B Rao     /* Defaults for the latest behaviour inherited from the base class */
24831ea1eefcSBharata B Rao }
24841ea1eefcSBharata B Rao 
24851ea1eefcSBharata B Rao DEFINE_SPAPR_MACHINE(2_7, "2.7", true);
24861ea1eefcSBharata B Rao 
24871ea1eefcSBharata B Rao /*
24884b23699cSDavid Gibson  * pseries-2.6
24894b23699cSDavid Gibson  */
24901ea1eefcSBharata B Rao #define SPAPR_COMPAT_2_6 \
24911ea1eefcSBharata B Rao     HW_COMPAT_2_6
24921ea1eefcSBharata B Rao 
24934b23699cSDavid Gibson static void spapr_machine_2_6_instance_options(MachineState *machine)
24944b23699cSDavid Gibson {
24954b23699cSDavid Gibson }
24964b23699cSDavid Gibson 
24974b23699cSDavid Gibson static void spapr_machine_2_6_class_options(MachineClass *mc)
24984b23699cSDavid Gibson {
249994a94e4cSBharata B Rao     sPAPRMachineClass *smc = SPAPR_MACHINE_CLASS(mc);
250094a94e4cSBharata B Rao 
25011ea1eefcSBharata B Rao     spapr_machine_2_7_class_options(mc);
250294a94e4cSBharata B Rao     smc->dr_cpu_enabled = false;
25031ea1eefcSBharata B Rao     SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_6);
25044b23699cSDavid Gibson }
25054b23699cSDavid Gibson 
25061ea1eefcSBharata B Rao DEFINE_SPAPR_MACHINE(2_6, "2.6", false);
25074b23699cSDavid Gibson 
25084b23699cSDavid Gibson /*
25091c5f29bbSDavid Gibson  * pseries-2.5
25101c5f29bbSDavid Gibson  */
25114b23699cSDavid Gibson #define SPAPR_COMPAT_2_5 \
251257c522f4SThomas Huth     HW_COMPAT_2_5 \
251357c522f4SThomas Huth     { \
251457c522f4SThomas Huth         .driver   = "spapr-vlan", \
251557c522f4SThomas Huth         .property = "use-rx-buffer-pools", \
251657c522f4SThomas Huth         .value    = "off", \
251757c522f4SThomas Huth     },
25184b23699cSDavid Gibson 
25195013c547SDavid Gibson static void spapr_machine_2_5_instance_options(MachineState *machine)
25201c5f29bbSDavid Gibson {
25215013c547SDavid Gibson }
25225013c547SDavid Gibson 
25235013c547SDavid Gibson static void spapr_machine_2_5_class_options(MachineClass *mc)
25245013c547SDavid Gibson {
252557040d45SThomas Huth     sPAPRMachineClass *smc = SPAPR_MACHINE_CLASS(mc);
252657040d45SThomas Huth 
25274b23699cSDavid Gibson     spapr_machine_2_6_class_options(mc);
252857040d45SThomas Huth     smc->use_ohci_by_default = true;
25294b23699cSDavid Gibson     SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_5);
25301c5f29bbSDavid Gibson }
25311c5f29bbSDavid Gibson 
25324b23699cSDavid Gibson DEFINE_SPAPR_MACHINE(2_5, "2.5", false);
25331c5f29bbSDavid Gibson 
25341c5f29bbSDavid Gibson /*
25351c5f29bbSDavid Gibson  * pseries-2.4
25361c5f29bbSDavid Gibson  */
253780fd50f9SCornelia Huck #define SPAPR_COMPAT_2_4 \
253880fd50f9SCornelia Huck         HW_COMPAT_2_4
253980fd50f9SCornelia Huck 
25405013c547SDavid Gibson static void spapr_machine_2_4_instance_options(MachineState *machine)
25411c5f29bbSDavid Gibson {
25425013c547SDavid Gibson     spapr_machine_2_5_instance_options(machine);
25435013c547SDavid Gibson }
25441c5f29bbSDavid Gibson 
25455013c547SDavid Gibson static void spapr_machine_2_4_class_options(MachineClass *mc)
25465013c547SDavid Gibson {
2547fc9f38c3SDavid Gibson     sPAPRMachineClass *smc = SPAPR_MACHINE_CLASS(mc);
2548fc9f38c3SDavid Gibson 
2549fc9f38c3SDavid Gibson     spapr_machine_2_5_class_options(mc);
2550fc9f38c3SDavid Gibson     smc->dr_lmb_enabled = false;
2551f949b4e5SDavid Gibson     SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_4);
25521c5f29bbSDavid Gibson }
25531c5f29bbSDavid Gibson 
2554fccbc785SDavid Gibson DEFINE_SPAPR_MACHINE(2_4, "2.4", false);
25551c5f29bbSDavid Gibson 
25561c5f29bbSDavid Gibson /*
25571c5f29bbSDavid Gibson  * pseries-2.3
25581c5f29bbSDavid Gibson  */
255938ff32c6SEduardo Habkost #define SPAPR_COMPAT_2_3 \
25607619c7b0SMichael Roth         HW_COMPAT_2_3 \
25617619c7b0SMichael Roth         {\
25627619c7b0SMichael Roth             .driver   = "spapr-pci-host-bridge",\
25637619c7b0SMichael Roth             .property = "dynamic-reconfiguration",\
25647619c7b0SMichael Roth             .value    = "off",\
25657619c7b0SMichael Roth         },
256638ff32c6SEduardo Habkost 
25675013c547SDavid Gibson static void spapr_machine_2_3_instance_options(MachineState *machine)
25681c5f29bbSDavid Gibson {
25695013c547SDavid Gibson     spapr_machine_2_4_instance_options(machine);
25701c5f29bbSDavid Gibson     savevm_skip_section_footers();
25711c5f29bbSDavid Gibson     global_state_set_optional();
257209b5e30dSGreg Kurz     savevm_skip_configuration();
25731c5f29bbSDavid Gibson }
25741c5f29bbSDavid Gibson 
25755013c547SDavid Gibson static void spapr_machine_2_3_class_options(MachineClass *mc)
25761c5f29bbSDavid Gibson {
2577fc9f38c3SDavid Gibson     spapr_machine_2_4_class_options(mc);
2578f949b4e5SDavid Gibson     SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_3);
25791c5f29bbSDavid Gibson }
2580fccbc785SDavid Gibson DEFINE_SPAPR_MACHINE(2_3, "2.3", false);
25811c5f29bbSDavid Gibson 
25821c5f29bbSDavid Gibson /*
25831c5f29bbSDavid Gibson  * pseries-2.2
25841c5f29bbSDavid Gibson  */
25851c5f29bbSDavid Gibson 
2586b194df47SAlexey Kardashevskiy #define SPAPR_COMPAT_2_2 \
25874dfd8eaaSEduardo Habkost         HW_COMPAT_2_2 \
2588b194df47SAlexey Kardashevskiy         {\
2589b194df47SAlexey Kardashevskiy             .driver   = TYPE_SPAPR_PCI_HOST_BRIDGE,\
2590b194df47SAlexey Kardashevskiy             .property = "mem_win_size",\
2591b194df47SAlexey Kardashevskiy             .value    = "0x20000000",\
2592dd754bafSEduardo Habkost         },
2593b194df47SAlexey Kardashevskiy 
25945013c547SDavid Gibson static void spapr_machine_2_2_instance_options(MachineState *machine)
2595b0e966d0SJason Wang {
25965013c547SDavid Gibson     spapr_machine_2_3_instance_options(machine);
2597cba0e779SGreg Kurz     machine->suppress_vmdesc = true;
2598b0e966d0SJason Wang }
2599b0e966d0SJason Wang 
26005013c547SDavid Gibson static void spapr_machine_2_2_class_options(MachineClass *mc)
2601b0e966d0SJason Wang {
2602fc9f38c3SDavid Gibson     spapr_machine_2_3_class_options(mc);
2603f949b4e5SDavid Gibson     SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_2);
26041c5f29bbSDavid Gibson }
2605fccbc785SDavid Gibson DEFINE_SPAPR_MACHINE(2_2, "2.2", false);
26061c5f29bbSDavid Gibson 
26071c5f29bbSDavid Gibson /*
26081c5f29bbSDavid Gibson  * pseries-2.1
26091c5f29bbSDavid Gibson  */
26101c5f29bbSDavid Gibson #define SPAPR_COMPAT_2_1 \
26111c5f29bbSDavid Gibson         HW_COMPAT_2_1
26121c5f29bbSDavid Gibson 
26135013c547SDavid Gibson static void spapr_machine_2_1_instance_options(MachineState *machine)
26141c5f29bbSDavid Gibson {
26155013c547SDavid Gibson     spapr_machine_2_2_instance_options(machine);
26161c5f29bbSDavid Gibson }
26171c5f29bbSDavid Gibson 
26185013c547SDavid Gibson static void spapr_machine_2_1_class_options(MachineClass *mc)
2619b0e966d0SJason Wang {
2620fc9f38c3SDavid Gibson     spapr_machine_2_2_class_options(mc);
2621f949b4e5SDavid Gibson     SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_1);
26226026db45SAlexey Kardashevskiy }
2623fccbc785SDavid Gibson DEFINE_SPAPR_MACHINE(2_1, "2.1", false);
26246026db45SAlexey Kardashevskiy 
262529ee3247SAlexey Kardashevskiy static void spapr_machine_register_types(void)
262629ee3247SAlexey Kardashevskiy {
262729ee3247SAlexey Kardashevskiy     type_register_static(&spapr_machine_info);
262829ee3247SAlexey Kardashevskiy }
262929ee3247SAlexey Kardashevskiy 
263029ee3247SAlexey Kardashevskiy type_init(spapr_machine_register_types)
2631