xref: /openbmc/qemu/hw/ppc/spapr.c (revision 569f4967)
/*
 * QEMU PowerPC pSeries Logical Partition (aka sPAPR) hardware System Emulator
 *
 * Copyright (c) 2004-2007 Fabrice Bellard
 * Copyright (c) 2007 Jocelyn Mayer
 * Copyright (c) 2010 David Gibson, IBM Corporation.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 *
 */
270d75590dSPeter Maydell #include "qemu/osdep.h"
2853018216SPaolo Bonzini #include "sysemu/sysemu.h"
29e35704baSEduardo Habkost #include "sysemu/numa.h"
3053018216SPaolo Bonzini #include "hw/hw.h"
3171461b0fSAlexey Kardashevskiy #include "hw/fw-path-provider.h"
3253018216SPaolo Bonzini #include "elf.h"
3353018216SPaolo Bonzini #include "net/net.h"
34ad440b4aSAndrew Jones #include "sysemu/device_tree.h"
35fa1d36dfSMarkus Armbruster #include "sysemu/block-backend.h"
3653018216SPaolo Bonzini #include "sysemu/cpus.h"
3753018216SPaolo Bonzini #include "sysemu/kvm.h"
38c20d332aSBharata B Rao #include "sysemu/device_tree.h"
3953018216SPaolo Bonzini #include "kvm_ppc.h"
40ff14e817SDr. David Alan Gilbert #include "migration/migration.h"
414be21d56SDavid Gibson #include "mmu-hash64.h"
423794d548SAlexey Kardashevskiy #include "qom/cpu.h"
4353018216SPaolo Bonzini 
4453018216SPaolo Bonzini #include "hw/boards.h"
450d09e41aSPaolo Bonzini #include "hw/ppc/ppc.h"
4653018216SPaolo Bonzini #include "hw/loader.h"
4753018216SPaolo Bonzini 
480d09e41aSPaolo Bonzini #include "hw/ppc/spapr.h"
490d09e41aSPaolo Bonzini #include "hw/ppc/spapr_vio.h"
500d09e41aSPaolo Bonzini #include "hw/pci-host/spapr.h"
510d09e41aSPaolo Bonzini #include "hw/ppc/xics.h"
5253018216SPaolo Bonzini #include "hw/pci/msi.h"
5353018216SPaolo Bonzini 
5453018216SPaolo Bonzini #include "hw/pci/pci.h"
5571461b0fSAlexey Kardashevskiy #include "hw/scsi/scsi.h"
5671461b0fSAlexey Kardashevskiy #include "hw/virtio/virtio-scsi.h"
5753018216SPaolo Bonzini 
5853018216SPaolo Bonzini #include "exec/address-spaces.h"
5953018216SPaolo Bonzini #include "hw/usb.h"
6053018216SPaolo Bonzini #include "qemu/config-file.h"
61135a129aSAneesh Kumar K.V #include "qemu/error-report.h"
622a6593cbSAlexey Kardashevskiy #include "trace.h"
6334316482SAlexey Kardashevskiy #include "hw/nmi.h"
6453018216SPaolo Bonzini 
6568a27b20SMichael S. Tsirkin #include "hw/compat.h"
66224245bfSDavid Gibson #include "qemu-common.h"
6768a27b20SMichael S. Tsirkin 
6853018216SPaolo Bonzini #include <libfdt.h>
6953018216SPaolo Bonzini 
/*
 * Firmware (SLOF) memory layout
 *
 * The raw SLOF image is loaded at address 0.  SLOF copies its romfs to
 * just below the flattened device tree and then positions itself 31M
 * below that.
 *
 * FW_OVERHEAD is therefore 40MB, which should account for all of the
 * above and more.
 *
 * The kernel is loaded at 4M (KERNEL_LOAD_ADDR is FW_MAX_SIZE), which
 * leaves room below it for the initial SLOF image.
 */
#define FDT_MAX_SIZE            0x100000    /* 1MB buffer for the flat DT */
#define RTAS_MAX_SIZE           0x10000     /* 64KB */
#define RTAS_MAX_ADDR           0x80000000  /* RTAS must stay below that */
#define FW_MAX_SIZE             0x400000    /* 4MB */
#define FW_FILE_NAME            "slof.bin"
#define FW_OVERHEAD             0x2800000   /* 40MB, see layout note above */
#define KERNEL_LOAD_ADDR        FW_MAX_SIZE

/* NOTE(review): unit is presumably MB - confirm at the point of use */
#define MIN_RMA_SLOF            128UL

/* NOTE(review): presumably in Hz (i.e. 512MHz) - confirm at the point of use */
#define TIMEBASE_FREQ           512000000ULL

/* phandle value given to the interrupt-controller node of the device tree */
#define PHANDLE_XICP            0x00001111

/* 2^htab_shift, computed as a 64-bit value */
#define HTAB_SIZE(spapr)        (1ULL << (spapr)->htab_shift)
9553018216SPaolo Bonzini 
96c04d6cfaSAnthony Liguori static XICSState *try_create_xics(const char *type, int nr_servers,
9734f2af3dSMarkus Armbruster                                   int nr_irqs, Error **errp)
98c04d6cfaSAnthony Liguori {
9934f2af3dSMarkus Armbruster     Error *err = NULL;
100c04d6cfaSAnthony Liguori     DeviceState *dev;
101c04d6cfaSAnthony Liguori 
102c04d6cfaSAnthony Liguori     dev = qdev_create(NULL, type);
103c04d6cfaSAnthony Liguori     qdev_prop_set_uint32(dev, "nr_servers", nr_servers);
104c04d6cfaSAnthony Liguori     qdev_prop_set_uint32(dev, "nr_irqs", nr_irqs);
10534f2af3dSMarkus Armbruster     object_property_set_bool(OBJECT(dev), true, "realized", &err);
10634f2af3dSMarkus Armbruster     if (err) {
10734f2af3dSMarkus Armbruster         error_propagate(errp, err);
10834f2af3dSMarkus Armbruster         object_unparent(OBJECT(dev));
109c04d6cfaSAnthony Liguori         return NULL;
110c04d6cfaSAnthony Liguori     }
1115a3d7b23SAlexey Kardashevskiy     return XICS_COMMON(dev);
112c04d6cfaSAnthony Liguori }
113c04d6cfaSAnthony Liguori 
114446f16a6SMarcel Apfelbaum static XICSState *xics_system_init(MachineState *machine,
115446f16a6SMarcel Apfelbaum                                    int nr_servers, int nr_irqs)
116c04d6cfaSAnthony Liguori {
117c04d6cfaSAnthony Liguori     XICSState *icp = NULL;
118c04d6cfaSAnthony Liguori 
11911ad93f6SDavid Gibson     if (kvm_enabled()) {
12034f2af3dSMarkus Armbruster         Error *err = NULL;
12134f2af3dSMarkus Armbruster 
122446f16a6SMarcel Apfelbaum         if (machine_kernel_irqchip_allowed(machine)) {
12334f2af3dSMarkus Armbruster             icp = try_create_xics(TYPE_KVM_XICS, nr_servers, nr_irqs, &err);
12411ad93f6SDavid Gibson         }
125446f16a6SMarcel Apfelbaum         if (machine_kernel_irqchip_required(machine) && !icp) {
126b83baa60SMarkus Armbruster             error_reportf_err(err,
127b83baa60SMarkus Armbruster                               "kernel_irqchip requested but unavailable: ");
128b83baa60SMarkus Armbruster         } else {
129903a41d3SStefano Dong (董兴水)             error_free(err);
13011ad93f6SDavid Gibson         }
131b83baa60SMarkus Armbruster     }
13211ad93f6SDavid Gibson 
13311ad93f6SDavid Gibson     if (!icp) {
13434f2af3dSMarkus Armbruster         icp = try_create_xics(TYPE_XICS, nr_servers, nr_irqs, &error_abort);
135c04d6cfaSAnthony Liguori     }
136c04d6cfaSAnthony Liguori 
137c04d6cfaSAnthony Liguori     return icp;
138c04d6cfaSAnthony Liguori }
139c04d6cfaSAnthony Liguori 
140833d4668SAlexey Kardashevskiy static int spapr_fixup_cpu_smt_dt(void *fdt, int offset, PowerPCCPU *cpu,
141833d4668SAlexey Kardashevskiy                                   int smt_threads)
142833d4668SAlexey Kardashevskiy {
143833d4668SAlexey Kardashevskiy     int i, ret = 0;
144833d4668SAlexey Kardashevskiy     uint32_t servers_prop[smt_threads];
145833d4668SAlexey Kardashevskiy     uint32_t gservers_prop[smt_threads * 2];
146833d4668SAlexey Kardashevskiy     int index = ppc_get_vcpu_dt_id(cpu);
147833d4668SAlexey Kardashevskiy 
1486d9412eaSAlexey Kardashevskiy     if (cpu->cpu_version) {
1494bce526eSLaurent Dufour         ret = fdt_setprop_cell(fdt, offset, "cpu-version", cpu->cpu_version);
1506d9412eaSAlexey Kardashevskiy         if (ret < 0) {
1516d9412eaSAlexey Kardashevskiy             return ret;
1526d9412eaSAlexey Kardashevskiy         }
1536d9412eaSAlexey Kardashevskiy     }
1546d9412eaSAlexey Kardashevskiy 
155833d4668SAlexey Kardashevskiy     /* Build interrupt servers and gservers properties */
156833d4668SAlexey Kardashevskiy     for (i = 0; i < smt_threads; i++) {
157833d4668SAlexey Kardashevskiy         servers_prop[i] = cpu_to_be32(index + i);
158833d4668SAlexey Kardashevskiy         /* Hack, direct the group queues back to cpu 0 */
159833d4668SAlexey Kardashevskiy         gservers_prop[i*2] = cpu_to_be32(index + i);
160833d4668SAlexey Kardashevskiy         gservers_prop[i*2 + 1] = 0;
161833d4668SAlexey Kardashevskiy     }
162833d4668SAlexey Kardashevskiy     ret = fdt_setprop(fdt, offset, "ibm,ppc-interrupt-server#s",
163833d4668SAlexey Kardashevskiy                       servers_prop, sizeof(servers_prop));
164833d4668SAlexey Kardashevskiy     if (ret < 0) {
165833d4668SAlexey Kardashevskiy         return ret;
166833d4668SAlexey Kardashevskiy     }
167833d4668SAlexey Kardashevskiy     ret = fdt_setprop(fdt, offset, "ibm,ppc-interrupt-gserver#s",
168833d4668SAlexey Kardashevskiy                       gservers_prop, sizeof(gservers_prop));
169833d4668SAlexey Kardashevskiy 
170833d4668SAlexey Kardashevskiy     return ret;
171833d4668SAlexey Kardashevskiy }
172833d4668SAlexey Kardashevskiy 
1730da6f3feSBharata B Rao static int spapr_fixup_cpu_numa_dt(void *fdt, int offset, CPUState *cs)
1740da6f3feSBharata B Rao {
1750da6f3feSBharata B Rao     int ret = 0;
1760da6f3feSBharata B Rao     PowerPCCPU *cpu = POWERPC_CPU(cs);
1770da6f3feSBharata B Rao     int index = ppc_get_vcpu_dt_id(cpu);
1780da6f3feSBharata B Rao     uint32_t associativity[] = {cpu_to_be32(0x5),
1790da6f3feSBharata B Rao                                 cpu_to_be32(0x0),
1800da6f3feSBharata B Rao                                 cpu_to_be32(0x0),
1810da6f3feSBharata B Rao                                 cpu_to_be32(0x0),
1820da6f3feSBharata B Rao                                 cpu_to_be32(cs->numa_node),
1830da6f3feSBharata B Rao                                 cpu_to_be32(index)};
1840da6f3feSBharata B Rao 
1850da6f3feSBharata B Rao     /* Advertise NUMA via ibm,associativity */
1860da6f3feSBharata B Rao     if (nb_numa_nodes > 1) {
1870da6f3feSBharata B Rao         ret = fdt_setprop(fdt, offset, "ibm,associativity", associativity,
1880da6f3feSBharata B Rao                           sizeof(associativity));
1890da6f3feSBharata B Rao     }
1900da6f3feSBharata B Rao 
1910da6f3feSBharata B Rao     return ret;
1920da6f3feSBharata B Rao }
1930da6f3feSBharata B Rao 
19428e02042SDavid Gibson static int spapr_fixup_cpu_dt(void *fdt, sPAPRMachineState *spapr)
19553018216SPaolo Bonzini {
19682677ed2SAlexey Kardashevskiy     int ret = 0, offset, cpus_offset;
19782677ed2SAlexey Kardashevskiy     CPUState *cs;
19853018216SPaolo Bonzini     char cpu_model[32];
19953018216SPaolo Bonzini     int smt = kvmppc_smt_threads();
20053018216SPaolo Bonzini     uint32_t pft_size_prop[] = {0, cpu_to_be32(spapr->htab_shift)};
20153018216SPaolo Bonzini 
20282677ed2SAlexey Kardashevskiy     CPU_FOREACH(cs) {
20382677ed2SAlexey Kardashevskiy         PowerPCCPU *cpu = POWERPC_CPU(cs);
20482677ed2SAlexey Kardashevskiy         DeviceClass *dc = DEVICE_GET_CLASS(cs);
20582677ed2SAlexey Kardashevskiy         int index = ppc_get_vcpu_dt_id(cpu);
20653018216SPaolo Bonzini 
2070f20ba62SAlexey Kardashevskiy         if ((index % smt) != 0) {
20853018216SPaolo Bonzini             continue;
20953018216SPaolo Bonzini         }
21053018216SPaolo Bonzini 
21182677ed2SAlexey Kardashevskiy         snprintf(cpu_model, 32, "%s@%x", dc->fw_name, index);
21253018216SPaolo Bonzini 
21382677ed2SAlexey Kardashevskiy         cpus_offset = fdt_path_offset(fdt, "/cpus");
21482677ed2SAlexey Kardashevskiy         if (cpus_offset < 0) {
21582677ed2SAlexey Kardashevskiy             cpus_offset = fdt_add_subnode(fdt, fdt_path_offset(fdt, "/"),
21682677ed2SAlexey Kardashevskiy                                           "cpus");
21782677ed2SAlexey Kardashevskiy             if (cpus_offset < 0) {
21882677ed2SAlexey Kardashevskiy                 return cpus_offset;
21982677ed2SAlexey Kardashevskiy             }
22082677ed2SAlexey Kardashevskiy         }
22182677ed2SAlexey Kardashevskiy         offset = fdt_subnode_offset(fdt, cpus_offset, cpu_model);
22282677ed2SAlexey Kardashevskiy         if (offset < 0) {
22382677ed2SAlexey Kardashevskiy             offset = fdt_add_subnode(fdt, cpus_offset, cpu_model);
22453018216SPaolo Bonzini             if (offset < 0) {
22553018216SPaolo Bonzini                 return offset;
22653018216SPaolo Bonzini             }
22782677ed2SAlexey Kardashevskiy         }
22853018216SPaolo Bonzini 
2290da6f3feSBharata B Rao         ret = fdt_setprop(fdt, offset, "ibm,pft-size",
2300da6f3feSBharata B Rao                           pft_size_prop, sizeof(pft_size_prop));
23153018216SPaolo Bonzini         if (ret < 0) {
23253018216SPaolo Bonzini             return ret;
23353018216SPaolo Bonzini         }
23453018216SPaolo Bonzini 
2350da6f3feSBharata B Rao         ret = spapr_fixup_cpu_numa_dt(fdt, offset, cs);
23653018216SPaolo Bonzini         if (ret < 0) {
23753018216SPaolo Bonzini             return ret;
23853018216SPaolo Bonzini         }
239833d4668SAlexey Kardashevskiy 
24082677ed2SAlexey Kardashevskiy         ret = spapr_fixup_cpu_smt_dt(fdt, offset, cpu,
2412a48d993SAlexey Kardashevskiy                                      ppc_get_compat_smt_threads(cpu));
242833d4668SAlexey Kardashevskiy         if (ret < 0) {
243833d4668SAlexey Kardashevskiy             return ret;
244833d4668SAlexey Kardashevskiy         }
24553018216SPaolo Bonzini     }
24653018216SPaolo Bonzini     return ret;
24753018216SPaolo Bonzini }
24853018216SPaolo Bonzini 
24953018216SPaolo Bonzini 
25053018216SPaolo Bonzini static size_t create_page_sizes_prop(CPUPPCState *env, uint32_t *prop,
25153018216SPaolo Bonzini                                      size_t maxsize)
25253018216SPaolo Bonzini {
25353018216SPaolo Bonzini     size_t maxcells = maxsize / sizeof(uint32_t);
25453018216SPaolo Bonzini     int i, j, count;
25553018216SPaolo Bonzini     uint32_t *p = prop;
25653018216SPaolo Bonzini 
25753018216SPaolo Bonzini     for (i = 0; i < PPC_PAGE_SIZES_MAX_SZ; i++) {
25853018216SPaolo Bonzini         struct ppc_one_seg_page_size *sps = &env->sps.sps[i];
25953018216SPaolo Bonzini 
26053018216SPaolo Bonzini         if (!sps->page_shift) {
26153018216SPaolo Bonzini             break;
26253018216SPaolo Bonzini         }
26353018216SPaolo Bonzini         for (count = 0; count < PPC_PAGE_SIZES_MAX_SZ; count++) {
26453018216SPaolo Bonzini             if (sps->enc[count].page_shift == 0) {
26553018216SPaolo Bonzini                 break;
26653018216SPaolo Bonzini             }
26753018216SPaolo Bonzini         }
26853018216SPaolo Bonzini         if ((p - prop) >= (maxcells - 3 - count * 2)) {
26953018216SPaolo Bonzini             break;
27053018216SPaolo Bonzini         }
27153018216SPaolo Bonzini         *(p++) = cpu_to_be32(sps->page_shift);
27253018216SPaolo Bonzini         *(p++) = cpu_to_be32(sps->slb_enc);
27353018216SPaolo Bonzini         *(p++) = cpu_to_be32(count);
27453018216SPaolo Bonzini         for (j = 0; j < count; j++) {
27553018216SPaolo Bonzini             *(p++) = cpu_to_be32(sps->enc[j].page_shift);
27653018216SPaolo Bonzini             *(p++) = cpu_to_be32(sps->enc[j].pte_enc);
27753018216SPaolo Bonzini         }
27853018216SPaolo Bonzini     }
27953018216SPaolo Bonzini 
28053018216SPaolo Bonzini     return (p - prop) * sizeof(uint32_t);
28153018216SPaolo Bonzini }
28253018216SPaolo Bonzini 
283b082d65aSAlexey Kardashevskiy static hwaddr spapr_node0_size(void)
284b082d65aSAlexey Kardashevskiy {
285fb164994SDavid Gibson     MachineState *machine = MACHINE(qdev_get_machine());
286fb164994SDavid Gibson 
287b082d65aSAlexey Kardashevskiy     if (nb_numa_nodes) {
288b082d65aSAlexey Kardashevskiy         int i;
289b082d65aSAlexey Kardashevskiy         for (i = 0; i < nb_numa_nodes; ++i) {
290b082d65aSAlexey Kardashevskiy             if (numa_info[i].node_mem) {
291fb164994SDavid Gibson                 return MIN(pow2floor(numa_info[i].node_mem),
292fb164994SDavid Gibson                            machine->ram_size);
293b082d65aSAlexey Kardashevskiy             }
294b082d65aSAlexey Kardashevskiy         }
295b082d65aSAlexey Kardashevskiy     }
296fb164994SDavid Gibson     return machine->ram_size;
297b082d65aSAlexey Kardashevskiy }
298b082d65aSAlexey Kardashevskiy 
/*
 * Evaluate the libfdt expression @exp exactly once.  A negative result is
 * treated as fatal: the failing expression and its fdt_strerror() text are
 * printed to stderr and the process exits with status 1.
 */
#define _FDT(exp) \
    do { \
        int ret = (exp); \
        if (ret < 0) { \
            fprintf(stderr, "qemu: error creating device tree: %s: %s\n", \
                    #exp, fdt_strerror(ret)); \
            exit(1); \
        } \
    } while (0)
30853018216SPaolo Bonzini 
309a1d59c0fSAlexey Kardashevskiy static void add_str(GString *s, const gchar *s1)
310a1d59c0fSAlexey Kardashevskiy {
311a1d59c0fSAlexey Kardashevskiy     g_string_append_len(s, s1, strlen(s1) + 1);
312a1d59c0fSAlexey Kardashevskiy }
31353018216SPaolo Bonzini 
3143bbf37f2SAndreas Färber static void *spapr_create_fdt_skel(hwaddr initrd_base,
31553018216SPaolo Bonzini                                    hwaddr initrd_size,
31653018216SPaolo Bonzini                                    hwaddr kernel_size,
31716457e7fSBenjamin Herrenschmidt                                    bool little_endian,
31853018216SPaolo Bonzini                                    const char *kernel_cmdline,
31953018216SPaolo Bonzini                                    uint32_t epow_irq)
32053018216SPaolo Bonzini {
32153018216SPaolo Bonzini     void *fdt;
32253018216SPaolo Bonzini     uint32_t start_prop = cpu_to_be32(initrd_base);
32353018216SPaolo Bonzini     uint32_t end_prop = cpu_to_be32(initrd_base + initrd_size);
324a1d59c0fSAlexey Kardashevskiy     GString *hypertas = g_string_sized_new(256);
325a1d59c0fSAlexey Kardashevskiy     GString *qemu_hypertas = g_string_sized_new(256);
32653018216SPaolo Bonzini     uint32_t refpoints[] = {cpu_to_be32(0x4), cpu_to_be32(0x4)};
3279e734e3dSBharata B Rao     uint32_t interrupt_server_ranges_prop[] = {0, cpu_to_be32(max_cpus)};
32853018216SPaolo Bonzini     unsigned char vec5[] = {0x0, 0x0, 0x0, 0x0, 0x0, 0x80};
329ef951443SNikunj A Dadhania     char *buf;
33053018216SPaolo Bonzini 
331a1d59c0fSAlexey Kardashevskiy     add_str(hypertas, "hcall-pft");
332a1d59c0fSAlexey Kardashevskiy     add_str(hypertas, "hcall-term");
333a1d59c0fSAlexey Kardashevskiy     add_str(hypertas, "hcall-dabr");
334a1d59c0fSAlexey Kardashevskiy     add_str(hypertas, "hcall-interrupt");
335a1d59c0fSAlexey Kardashevskiy     add_str(hypertas, "hcall-tce");
336a1d59c0fSAlexey Kardashevskiy     add_str(hypertas, "hcall-vio");
337a1d59c0fSAlexey Kardashevskiy     add_str(hypertas, "hcall-splpar");
338a1d59c0fSAlexey Kardashevskiy     add_str(hypertas, "hcall-bulk");
339a1d59c0fSAlexey Kardashevskiy     add_str(hypertas, "hcall-set-mode");
340a1d59c0fSAlexey Kardashevskiy     add_str(qemu_hypertas, "hcall-memop1");
341a1d59c0fSAlexey Kardashevskiy 
34253018216SPaolo Bonzini     fdt = g_malloc0(FDT_MAX_SIZE);
34353018216SPaolo Bonzini     _FDT((fdt_create(fdt, FDT_MAX_SIZE)));
34453018216SPaolo Bonzini 
34553018216SPaolo Bonzini     if (kernel_size) {
34653018216SPaolo Bonzini         _FDT((fdt_add_reservemap_entry(fdt, KERNEL_LOAD_ADDR, kernel_size)));
34753018216SPaolo Bonzini     }
34853018216SPaolo Bonzini     if (initrd_size) {
34953018216SPaolo Bonzini         _FDT((fdt_add_reservemap_entry(fdt, initrd_base, initrd_size)));
35053018216SPaolo Bonzini     }
35153018216SPaolo Bonzini     _FDT((fdt_finish_reservemap(fdt)));
35253018216SPaolo Bonzini 
35353018216SPaolo Bonzini     /* Root node */
35453018216SPaolo Bonzini     _FDT((fdt_begin_node(fdt, "")));
35553018216SPaolo Bonzini     _FDT((fdt_property_string(fdt, "device_type", "chrp")));
35653018216SPaolo Bonzini     _FDT((fdt_property_string(fdt, "model", "IBM pSeries (emulated by qemu)")));
357fa388916SAnthony Liguori     _FDT((fdt_property_string(fdt, "compatible", "qemu,pseries")));
35853018216SPaolo Bonzini 
359ef951443SNikunj A Dadhania     /*
360ef951443SNikunj A Dadhania      * Add info to guest to indentify which host is it being run on
361ef951443SNikunj A Dadhania      * and what is the uuid of the guest
362ef951443SNikunj A Dadhania      */
363ef951443SNikunj A Dadhania     if (kvmppc_get_host_model(&buf)) {
364ef951443SNikunj A Dadhania         _FDT((fdt_property_string(fdt, "host-model", buf)));
365ef951443SNikunj A Dadhania         g_free(buf);
366ef951443SNikunj A Dadhania     }
367ef951443SNikunj A Dadhania     if (kvmppc_get_host_serial(&buf)) {
368ef951443SNikunj A Dadhania         _FDT((fdt_property_string(fdt, "host-serial", buf)));
369ef951443SNikunj A Dadhania         g_free(buf);
370ef951443SNikunj A Dadhania     }
371ef951443SNikunj A Dadhania 
372ef951443SNikunj A Dadhania     buf = g_strdup_printf(UUID_FMT, qemu_uuid[0], qemu_uuid[1],
373ef951443SNikunj A Dadhania                           qemu_uuid[2], qemu_uuid[3], qemu_uuid[4],
374ef951443SNikunj A Dadhania                           qemu_uuid[5], qemu_uuid[6], qemu_uuid[7],
375ef951443SNikunj A Dadhania                           qemu_uuid[8], qemu_uuid[9], qemu_uuid[10],
376ef951443SNikunj A Dadhania                           qemu_uuid[11], qemu_uuid[12], qemu_uuid[13],
377ef951443SNikunj A Dadhania                           qemu_uuid[14], qemu_uuid[15]);
378ef951443SNikunj A Dadhania 
379ef951443SNikunj A Dadhania     _FDT((fdt_property_string(fdt, "vm,uuid", buf)));
3803dc0a66dSAlexey Kardashevskiy     if (qemu_uuid_set) {
3813dc0a66dSAlexey Kardashevskiy         _FDT((fdt_property_string(fdt, "system-id", buf)));
3823dc0a66dSAlexey Kardashevskiy     }
383ef951443SNikunj A Dadhania     g_free(buf);
384ef951443SNikunj A Dadhania 
3852c1aaa81SSam Bobroff     if (qemu_get_vm_name()) {
3862c1aaa81SSam Bobroff         _FDT((fdt_property_string(fdt, "ibm,partition-name",
3872c1aaa81SSam Bobroff                                   qemu_get_vm_name())));
3882c1aaa81SSam Bobroff     }
3892c1aaa81SSam Bobroff 
39053018216SPaolo Bonzini     _FDT((fdt_property_cell(fdt, "#address-cells", 0x2)));
39153018216SPaolo Bonzini     _FDT((fdt_property_cell(fdt, "#size-cells", 0x2)));
39253018216SPaolo Bonzini 
39353018216SPaolo Bonzini     /* /chosen */
39453018216SPaolo Bonzini     _FDT((fdt_begin_node(fdt, "chosen")));
39553018216SPaolo Bonzini 
39653018216SPaolo Bonzini     /* Set Form1_affinity */
39753018216SPaolo Bonzini     _FDT((fdt_property(fdt, "ibm,architecture-vec-5", vec5, sizeof(vec5))));
39853018216SPaolo Bonzini 
39953018216SPaolo Bonzini     _FDT((fdt_property_string(fdt, "bootargs", kernel_cmdline)));
40053018216SPaolo Bonzini     _FDT((fdt_property(fdt, "linux,initrd-start",
40153018216SPaolo Bonzini                        &start_prop, sizeof(start_prop))));
40253018216SPaolo Bonzini     _FDT((fdt_property(fdt, "linux,initrd-end",
40353018216SPaolo Bonzini                        &end_prop, sizeof(end_prop))));
40453018216SPaolo Bonzini     if (kernel_size) {
40553018216SPaolo Bonzini         uint64_t kprop[2] = { cpu_to_be64(KERNEL_LOAD_ADDR),
40653018216SPaolo Bonzini                               cpu_to_be64(kernel_size) };
40753018216SPaolo Bonzini 
40853018216SPaolo Bonzini         _FDT((fdt_property(fdt, "qemu,boot-kernel", &kprop, sizeof(kprop))));
40916457e7fSBenjamin Herrenschmidt         if (little_endian) {
41016457e7fSBenjamin Herrenschmidt             _FDT((fdt_property(fdt, "qemu,boot-kernel-le", NULL, 0)));
41116457e7fSBenjamin Herrenschmidt         }
41253018216SPaolo Bonzini     }
413cc84c0f3SAvik Sil     if (boot_menu) {
414cc84c0f3SAvik Sil         _FDT((fdt_property_cell(fdt, "qemu,boot-menu", boot_menu)));
415cc84c0f3SAvik Sil     }
41653018216SPaolo Bonzini     _FDT((fdt_property_cell(fdt, "qemu,graphic-width", graphic_width)));
41753018216SPaolo Bonzini     _FDT((fdt_property_cell(fdt, "qemu,graphic-height", graphic_height)));
41853018216SPaolo Bonzini     _FDT((fdt_property_cell(fdt, "qemu,graphic-depth", graphic_depth)));
41953018216SPaolo Bonzini 
42053018216SPaolo Bonzini     _FDT((fdt_end_node(fdt)));
42153018216SPaolo Bonzini 
42253018216SPaolo Bonzini     /* RTAS */
42353018216SPaolo Bonzini     _FDT((fdt_begin_node(fdt, "rtas")));
42453018216SPaolo Bonzini 
425da95324eSAlexey Kardashevskiy     if (!kvm_enabled() || kvmppc_spapr_use_multitce()) {
426da95324eSAlexey Kardashevskiy         add_str(hypertas, "hcall-multi-tce");
427da95324eSAlexey Kardashevskiy     }
428a1d59c0fSAlexey Kardashevskiy     _FDT((fdt_property(fdt, "ibm,hypertas-functions", hypertas->str,
429a1d59c0fSAlexey Kardashevskiy                        hypertas->len)));
430a1d59c0fSAlexey Kardashevskiy     g_string_free(hypertas, TRUE);
431a1d59c0fSAlexey Kardashevskiy     _FDT((fdt_property(fdt, "qemu,hypertas-functions", qemu_hypertas->str,
432a1d59c0fSAlexey Kardashevskiy                        qemu_hypertas->len)));
433a1d59c0fSAlexey Kardashevskiy     g_string_free(qemu_hypertas, TRUE);
43453018216SPaolo Bonzini 
43553018216SPaolo Bonzini     _FDT((fdt_property(fdt, "ibm,associativity-reference-points",
43653018216SPaolo Bonzini         refpoints, sizeof(refpoints))));
43753018216SPaolo Bonzini 
43853018216SPaolo Bonzini     _FDT((fdt_property_cell(fdt, "rtas-error-log-max", RTAS_ERROR_LOG_MAX)));
43979853e18STyrel Datwyler     _FDT((fdt_property_cell(fdt, "rtas-event-scan-rate",
44079853e18STyrel Datwyler                             RTAS_EVENT_SCAN_RATE)));
44153018216SPaolo Bonzini 
442a95f9922SSam Bobroff     if (msi_supported) {
443a95f9922SSam Bobroff         _FDT((fdt_property(fdt, "ibm,change-msix-capable", NULL, 0)));
444a95f9922SSam Bobroff     }
445a95f9922SSam Bobroff 
4462e14072fSNikunj A Dadhania     /*
4479d632f5fSzhanghailiang      * According to PAPR, rtas ibm,os-term does not guarantee a return
4482e14072fSNikunj A Dadhania      * back to the guest cpu.
4492e14072fSNikunj A Dadhania      *
4502e14072fSNikunj A Dadhania      * While an additional ibm,extended-os-term property indicates that
4512e14072fSNikunj A Dadhania      * rtas call return will always occur. Set this property.
4522e14072fSNikunj A Dadhania      */
4532e14072fSNikunj A Dadhania     _FDT((fdt_property(fdt, "ibm,extended-os-term", NULL, 0)));
4542e14072fSNikunj A Dadhania 
45553018216SPaolo Bonzini     _FDT((fdt_end_node(fdt)));
45653018216SPaolo Bonzini 
45753018216SPaolo Bonzini     /* interrupt controller */
45853018216SPaolo Bonzini     _FDT((fdt_begin_node(fdt, "interrupt-controller")));
45953018216SPaolo Bonzini 
46053018216SPaolo Bonzini     _FDT((fdt_property_string(fdt, "device_type",
46153018216SPaolo Bonzini                               "PowerPC-External-Interrupt-Presentation")));
46253018216SPaolo Bonzini     _FDT((fdt_property_string(fdt, "compatible", "IBM,ppc-xicp")));
46353018216SPaolo Bonzini     _FDT((fdt_property(fdt, "interrupt-controller", NULL, 0)));
46453018216SPaolo Bonzini     _FDT((fdt_property(fdt, "ibm,interrupt-server-ranges",
46553018216SPaolo Bonzini                        interrupt_server_ranges_prop,
46653018216SPaolo Bonzini                        sizeof(interrupt_server_ranges_prop))));
46753018216SPaolo Bonzini     _FDT((fdt_property_cell(fdt, "#interrupt-cells", 2)));
46853018216SPaolo Bonzini     _FDT((fdt_property_cell(fdt, "linux,phandle", PHANDLE_XICP)));
46953018216SPaolo Bonzini     _FDT((fdt_property_cell(fdt, "phandle", PHANDLE_XICP)));
47053018216SPaolo Bonzini 
47153018216SPaolo Bonzini     _FDT((fdt_end_node(fdt)));
47253018216SPaolo Bonzini 
47353018216SPaolo Bonzini     /* vdevice */
47453018216SPaolo Bonzini     _FDT((fdt_begin_node(fdt, "vdevice")));
47553018216SPaolo Bonzini 
47653018216SPaolo Bonzini     _FDT((fdt_property_string(fdt, "device_type", "vdevice")));
47753018216SPaolo Bonzini     _FDT((fdt_property_string(fdt, "compatible", "IBM,vdevice")));
47853018216SPaolo Bonzini     _FDT((fdt_property_cell(fdt, "#address-cells", 0x1)));
47953018216SPaolo Bonzini     _FDT((fdt_property_cell(fdt, "#size-cells", 0x0)));
48053018216SPaolo Bonzini     _FDT((fdt_property_cell(fdt, "#interrupt-cells", 0x2)));
48153018216SPaolo Bonzini     _FDT((fdt_property(fdt, "interrupt-controller", NULL, 0)));
48253018216SPaolo Bonzini 
48353018216SPaolo Bonzini     _FDT((fdt_end_node(fdt)));
48453018216SPaolo Bonzini 
48553018216SPaolo Bonzini     /* event-sources */
48653018216SPaolo Bonzini     spapr_events_fdt_skel(fdt, epow_irq);
48753018216SPaolo Bonzini 
488f7d69146SAlexander Graf     /* /hypervisor node */
489f7d69146SAlexander Graf     if (kvm_enabled()) {
490f7d69146SAlexander Graf         uint8_t hypercall[16];
491f7d69146SAlexander Graf 
492f7d69146SAlexander Graf         /* indicate KVM hypercall interface */
493f7d69146SAlexander Graf         _FDT((fdt_begin_node(fdt, "hypervisor")));
494f7d69146SAlexander Graf         _FDT((fdt_property_string(fdt, "compatible", "linux,kvm")));
495f7d69146SAlexander Graf         if (kvmppc_has_cap_fixup_hcalls()) {
496f7d69146SAlexander Graf             /*
497f7d69146SAlexander Graf              * Older KVM versions with older guest kernels were broken with the
498f7d69146SAlexander Graf              * magic page, don't allow the guest to map it.
499f7d69146SAlexander Graf              */
500f7d69146SAlexander Graf             kvmppc_get_hypercall(first_cpu->env_ptr, hypercall,
501f7d69146SAlexander Graf                                  sizeof(hypercall));
502f7d69146SAlexander Graf             _FDT((fdt_property(fdt, "hcall-instructions", hypercall,
503f7d69146SAlexander Graf                               sizeof(hypercall))));
504f7d69146SAlexander Graf         }
505f7d69146SAlexander Graf         _FDT((fdt_end_node(fdt)));
506f7d69146SAlexander Graf     }
507f7d69146SAlexander Graf 
50853018216SPaolo Bonzini     _FDT((fdt_end_node(fdt))); /* close root node */
50953018216SPaolo Bonzini     _FDT((fdt_finish(fdt)));
51053018216SPaolo Bonzini 
51153018216SPaolo Bonzini     return fdt;
51253018216SPaolo Bonzini }
51353018216SPaolo Bonzini 
51403d196b7SBharata B Rao static int spapr_populate_memory_node(void *fdt, int nodeid, hwaddr start,
51526a8c353SAlexey Kardashevskiy                                        hwaddr size)
51626a8c353SAlexey Kardashevskiy {
51726a8c353SAlexey Kardashevskiy     uint32_t associativity[] = {
51826a8c353SAlexey Kardashevskiy         cpu_to_be32(0x4), /* length */
51926a8c353SAlexey Kardashevskiy         cpu_to_be32(0x0), cpu_to_be32(0x0),
520c3b4f589SAlexey Kardashevskiy         cpu_to_be32(0x0), cpu_to_be32(nodeid)
52126a8c353SAlexey Kardashevskiy     };
52226a8c353SAlexey Kardashevskiy     char mem_name[32];
52326a8c353SAlexey Kardashevskiy     uint64_t mem_reg_property[2];
52426a8c353SAlexey Kardashevskiy     int off;
52526a8c353SAlexey Kardashevskiy 
52626a8c353SAlexey Kardashevskiy     mem_reg_property[0] = cpu_to_be64(start);
52726a8c353SAlexey Kardashevskiy     mem_reg_property[1] = cpu_to_be64(size);
52826a8c353SAlexey Kardashevskiy 
52926a8c353SAlexey Kardashevskiy     sprintf(mem_name, "memory@" TARGET_FMT_lx, start);
53026a8c353SAlexey Kardashevskiy     off = fdt_add_subnode(fdt, 0, mem_name);
53126a8c353SAlexey Kardashevskiy     _FDT(off);
53226a8c353SAlexey Kardashevskiy     _FDT((fdt_setprop_string(fdt, off, "device_type", "memory")));
53326a8c353SAlexey Kardashevskiy     _FDT((fdt_setprop(fdt, off, "reg", mem_reg_property,
53426a8c353SAlexey Kardashevskiy                       sizeof(mem_reg_property))));
53526a8c353SAlexey Kardashevskiy     _FDT((fdt_setprop(fdt, off, "ibm,associativity", associativity,
53626a8c353SAlexey Kardashevskiy                       sizeof(associativity))));
53703d196b7SBharata B Rao     return off;
53826a8c353SAlexey Kardashevskiy }
53926a8c353SAlexey Kardashevskiy 
54028e02042SDavid Gibson static int spapr_populate_memory(sPAPRMachineState *spapr, void *fdt)
54153018216SPaolo Bonzini {
542fb164994SDavid Gibson     MachineState *machine = MACHINE(spapr);
5437db8a127SAlexey Kardashevskiy     hwaddr mem_start, node_size;
5447db8a127SAlexey Kardashevskiy     int i, nb_nodes = nb_numa_nodes;
5457db8a127SAlexey Kardashevskiy     NodeInfo *nodes = numa_info;
5467db8a127SAlexey Kardashevskiy     NodeInfo ramnode;
54753018216SPaolo Bonzini 
5487db8a127SAlexey Kardashevskiy     /* No NUMA nodes, assume there is just one node with whole RAM */
5497db8a127SAlexey Kardashevskiy     if (!nb_numa_nodes) {
5507db8a127SAlexey Kardashevskiy         nb_nodes = 1;
551fb164994SDavid Gibson         ramnode.node_mem = machine->ram_size;
5527db8a127SAlexey Kardashevskiy         nodes = &ramnode;
5535fe269b1SPaul Mackerras     }
55453018216SPaolo Bonzini 
5557db8a127SAlexey Kardashevskiy     for (i = 0, mem_start = 0; i < nb_nodes; ++i) {
5567db8a127SAlexey Kardashevskiy         if (!nodes[i].node_mem) {
5577db8a127SAlexey Kardashevskiy             continue;
55853018216SPaolo Bonzini         }
559fb164994SDavid Gibson         if (mem_start >= machine->ram_size) {
5605fe269b1SPaul Mackerras             node_size = 0;
5615fe269b1SPaul Mackerras         } else {
5627db8a127SAlexey Kardashevskiy             node_size = nodes[i].node_mem;
563fb164994SDavid Gibson             if (node_size > machine->ram_size - mem_start) {
564fb164994SDavid Gibson                 node_size = machine->ram_size - mem_start;
5655fe269b1SPaul Mackerras             }
5665fe269b1SPaul Mackerras         }
5677db8a127SAlexey Kardashevskiy         if (!mem_start) {
5687db8a127SAlexey Kardashevskiy             /* ppc_spapr_init() checks for rma_size <= node0_size already */
569e8f986fcSBharata B Rao             spapr_populate_memory_node(fdt, i, 0, spapr->rma_size);
5707db8a127SAlexey Kardashevskiy             mem_start += spapr->rma_size;
5717db8a127SAlexey Kardashevskiy             node_size -= spapr->rma_size;
5727db8a127SAlexey Kardashevskiy         }
5736010818cSAlexey Kardashevskiy         for ( ; node_size; ) {
5746010818cSAlexey Kardashevskiy             hwaddr sizetmp = pow2floor(node_size);
5756010818cSAlexey Kardashevskiy 
5766010818cSAlexey Kardashevskiy             /* mem_start != 0 here */
5776010818cSAlexey Kardashevskiy             if (ctzl(mem_start) < ctzl(sizetmp)) {
5786010818cSAlexey Kardashevskiy                 sizetmp = 1ULL << ctzl(mem_start);
5796010818cSAlexey Kardashevskiy             }
5806010818cSAlexey Kardashevskiy 
5816010818cSAlexey Kardashevskiy             spapr_populate_memory_node(fdt, i, mem_start, sizetmp);
5826010818cSAlexey Kardashevskiy             node_size -= sizetmp;
5836010818cSAlexey Kardashevskiy             mem_start += sizetmp;
5846010818cSAlexey Kardashevskiy         }
58553018216SPaolo Bonzini     }
58653018216SPaolo Bonzini 
58753018216SPaolo Bonzini     return 0;
58853018216SPaolo Bonzini }
58953018216SPaolo Bonzini 
5900da6f3feSBharata B Rao static void spapr_populate_cpu_dt(CPUState *cs, void *fdt, int offset,
5910da6f3feSBharata B Rao                                   sPAPRMachineState *spapr)
5920da6f3feSBharata B Rao {
5930da6f3feSBharata B Rao     PowerPCCPU *cpu = POWERPC_CPU(cs);
5940da6f3feSBharata B Rao     CPUPPCState *env = &cpu->env;
5950da6f3feSBharata B Rao     PowerPCCPUClass *pcc = POWERPC_CPU_GET_CLASS(cs);
5960da6f3feSBharata B Rao     int index = ppc_get_vcpu_dt_id(cpu);
5970da6f3feSBharata B Rao     uint32_t segs[] = {cpu_to_be32(28), cpu_to_be32(40),
5980da6f3feSBharata B Rao                        0xffffffff, 0xffffffff};
5990da6f3feSBharata B Rao     uint32_t tbfreq = kvm_enabled() ? kvmppc_get_tbfreq() : TIMEBASE_FREQ;
6000da6f3feSBharata B Rao     uint32_t cpufreq = kvm_enabled() ? kvmppc_get_clockfreq() : 1000000000;
6010da6f3feSBharata B Rao     uint32_t page_sizes_prop[64];
6020da6f3feSBharata B Rao     size_t page_sizes_prop_size;
60322419c2aSDavid Gibson     uint32_t vcpus_per_socket = smp_threads * smp_cores;
6040da6f3feSBharata B Rao     uint32_t pft_size_prop[] = {0, cpu_to_be32(spapr->htab_shift)};
6050da6f3feSBharata B Rao 
60690da0d5aSBenjamin Herrenschmidt     /* Note: we keep CI large pages off for now because a 64K capable guest
60790da0d5aSBenjamin Herrenschmidt      * provisioned with large pages might otherwise try to map a qemu
60890da0d5aSBenjamin Herrenschmidt      * framebuffer (or other kind of memory mapped PCI BAR) using 64K pages
60990da0d5aSBenjamin Herrenschmidt      * even if that qemu runs on a 4k host.
61090da0d5aSBenjamin Herrenschmidt      *
61190da0d5aSBenjamin Herrenschmidt      * We can later add this bit back when we are confident this is not
61290da0d5aSBenjamin Herrenschmidt      * an issue (!HV KVM or 64K host)
61390da0d5aSBenjamin Herrenschmidt      */
61490da0d5aSBenjamin Herrenschmidt     uint8_t pa_features_206[] = { 6, 0,
61590da0d5aSBenjamin Herrenschmidt         0xf6, 0x1f, 0xc7, 0x00, 0x80, 0xc0 };
61690da0d5aSBenjamin Herrenschmidt     uint8_t pa_features_207[] = { 24, 0,
61790da0d5aSBenjamin Herrenschmidt         0xf6, 0x1f, 0xc7, 0xc0, 0x80, 0xf0,
61890da0d5aSBenjamin Herrenschmidt         0x80, 0x00, 0x00, 0x00, 0x00, 0x00,
61990da0d5aSBenjamin Herrenschmidt         0x00, 0x00, 0x00, 0x00, 0x80, 0x00,
62090da0d5aSBenjamin Herrenschmidt         0x80, 0x00, 0x80, 0x00, 0x80, 0x00 };
62190da0d5aSBenjamin Herrenschmidt     uint8_t *pa_features;
62290da0d5aSBenjamin Herrenschmidt     size_t pa_size;
62390da0d5aSBenjamin Herrenschmidt 
6240da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "reg", index)));
6250da6f3feSBharata B Rao     _FDT((fdt_setprop_string(fdt, offset, "device_type", "cpu")));
6260da6f3feSBharata B Rao 
6270da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "cpu-version", env->spr[SPR_PVR])));
6280da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "d-cache-block-size",
6290da6f3feSBharata B Rao                            env->dcache_line_size)));
6300da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "d-cache-line-size",
6310da6f3feSBharata B Rao                            env->dcache_line_size)));
6320da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "i-cache-block-size",
6330da6f3feSBharata B Rao                            env->icache_line_size)));
6340da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "i-cache-line-size",
6350da6f3feSBharata B Rao                            env->icache_line_size)));
6360da6f3feSBharata B Rao 
6370da6f3feSBharata B Rao     if (pcc->l1_dcache_size) {
6380da6f3feSBharata B Rao         _FDT((fdt_setprop_cell(fdt, offset, "d-cache-size",
6390da6f3feSBharata B Rao                                pcc->l1_dcache_size)));
6400da6f3feSBharata B Rao     } else {
6410da6f3feSBharata B Rao         fprintf(stderr, "Warning: Unknown L1 dcache size for cpu\n");
6420da6f3feSBharata B Rao     }
6430da6f3feSBharata B Rao     if (pcc->l1_icache_size) {
6440da6f3feSBharata B Rao         _FDT((fdt_setprop_cell(fdt, offset, "i-cache-size",
6450da6f3feSBharata B Rao                                pcc->l1_icache_size)));
6460da6f3feSBharata B Rao     } else {
6470da6f3feSBharata B Rao         fprintf(stderr, "Warning: Unknown L1 icache size for cpu\n");
6480da6f3feSBharata B Rao     }
6490da6f3feSBharata B Rao 
6500da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "timebase-frequency", tbfreq)));
6510da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "clock-frequency", cpufreq)));
652fd5da5c4SThomas Huth     _FDT((fdt_setprop_cell(fdt, offset, "slb-size", env->slb_nr)));
6530da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "ibm,slb-size", env->slb_nr)));
6540da6f3feSBharata B Rao     _FDT((fdt_setprop_string(fdt, offset, "status", "okay")));
6550da6f3feSBharata B Rao     _FDT((fdt_setprop(fdt, offset, "64-bit", NULL, 0)));
6560da6f3feSBharata B Rao 
6570da6f3feSBharata B Rao     if (env->spr_cb[SPR_PURR].oea_read) {
6580da6f3feSBharata B Rao         _FDT((fdt_setprop(fdt, offset, "ibm,purr", NULL, 0)));
6590da6f3feSBharata B Rao     }
6600da6f3feSBharata B Rao 
6610da6f3feSBharata B Rao     if (env->mmu_model & POWERPC_MMU_1TSEG) {
6620da6f3feSBharata B Rao         _FDT((fdt_setprop(fdt, offset, "ibm,processor-segment-sizes",
6630da6f3feSBharata B Rao                           segs, sizeof(segs))));
6640da6f3feSBharata B Rao     }
6650da6f3feSBharata B Rao 
6660da6f3feSBharata B Rao     /* Advertise VMX/VSX (vector extensions) if available
6670da6f3feSBharata B Rao      *   0 / no property == no vector extensions
6680da6f3feSBharata B Rao      *   1               == VMX / Altivec available
6690da6f3feSBharata B Rao      *   2               == VSX available */
6700da6f3feSBharata B Rao     if (env->insns_flags & PPC_ALTIVEC) {
6710da6f3feSBharata B Rao         uint32_t vmx = (env->insns_flags2 & PPC2_VSX) ? 2 : 1;
6720da6f3feSBharata B Rao 
6730da6f3feSBharata B Rao         _FDT((fdt_setprop_cell(fdt, offset, "ibm,vmx", vmx)));
6740da6f3feSBharata B Rao     }
6750da6f3feSBharata B Rao 
6760da6f3feSBharata B Rao     /* Advertise DFP (Decimal Floating Point) if available
6770da6f3feSBharata B Rao      *   0 / no property == no DFP
6780da6f3feSBharata B Rao      *   1               == DFP available */
6790da6f3feSBharata B Rao     if (env->insns_flags2 & PPC2_DFP) {
6800da6f3feSBharata B Rao         _FDT((fdt_setprop_cell(fdt, offset, "ibm,dfp", 1)));
6810da6f3feSBharata B Rao     }
6820da6f3feSBharata B Rao 
6830da6f3feSBharata B Rao     page_sizes_prop_size = create_page_sizes_prop(env, page_sizes_prop,
6840da6f3feSBharata B Rao                                                   sizeof(page_sizes_prop));
6850da6f3feSBharata B Rao     if (page_sizes_prop_size) {
6860da6f3feSBharata B Rao         _FDT((fdt_setprop(fdt, offset, "ibm,segment-page-sizes",
6870da6f3feSBharata B Rao                           page_sizes_prop, page_sizes_prop_size)));
6880da6f3feSBharata B Rao     }
6890da6f3feSBharata B Rao 
69090da0d5aSBenjamin Herrenschmidt     /* Do the ibm,pa-features property, adjust it for ci-large-pages */
69190da0d5aSBenjamin Herrenschmidt     if (env->mmu_model == POWERPC_MMU_2_06) {
69290da0d5aSBenjamin Herrenschmidt         pa_features = pa_features_206;
69390da0d5aSBenjamin Herrenschmidt         pa_size = sizeof(pa_features_206);
69490da0d5aSBenjamin Herrenschmidt     } else /* env->mmu_model == POWERPC_MMU_2_07 */ {
69590da0d5aSBenjamin Herrenschmidt         pa_features = pa_features_207;
69690da0d5aSBenjamin Herrenschmidt         pa_size = sizeof(pa_features_207);
69790da0d5aSBenjamin Herrenschmidt     }
69890da0d5aSBenjamin Herrenschmidt     if (env->ci_large_pages) {
69990da0d5aSBenjamin Herrenschmidt         pa_features[3] |= 0x20;
70090da0d5aSBenjamin Herrenschmidt     }
70190da0d5aSBenjamin Herrenschmidt     _FDT((fdt_setprop(fdt, offset, "ibm,pa-features", pa_features, pa_size)));
70290da0d5aSBenjamin Herrenschmidt 
7030da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, offset, "ibm,chip-id",
70422419c2aSDavid Gibson                            cs->cpu_index / vcpus_per_socket)));
7050da6f3feSBharata B Rao 
7060da6f3feSBharata B Rao     _FDT((fdt_setprop(fdt, offset, "ibm,pft-size",
7070da6f3feSBharata B Rao                       pft_size_prop, sizeof(pft_size_prop))));
7080da6f3feSBharata B Rao 
7090da6f3feSBharata B Rao     _FDT(spapr_fixup_cpu_numa_dt(fdt, offset, cs));
7100da6f3feSBharata B Rao 
7110da6f3feSBharata B Rao     _FDT(spapr_fixup_cpu_smt_dt(fdt, offset, cpu,
7120da6f3feSBharata B Rao                                 ppc_get_compat_smt_threads(cpu)));
7130da6f3feSBharata B Rao }
7140da6f3feSBharata B Rao 
7150da6f3feSBharata B Rao static void spapr_populate_cpus_dt_node(void *fdt, sPAPRMachineState *spapr)
7160da6f3feSBharata B Rao {
7170da6f3feSBharata B Rao     CPUState *cs;
7180da6f3feSBharata B Rao     int cpus_offset;
7190da6f3feSBharata B Rao     char *nodename;
7200da6f3feSBharata B Rao     int smt = kvmppc_smt_threads();
7210da6f3feSBharata B Rao 
7220da6f3feSBharata B Rao     cpus_offset = fdt_add_subnode(fdt, 0, "cpus");
7230da6f3feSBharata B Rao     _FDT(cpus_offset);
7240da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, cpus_offset, "#address-cells", 0x1)));
7250da6f3feSBharata B Rao     _FDT((fdt_setprop_cell(fdt, cpus_offset, "#size-cells", 0x0)));
7260da6f3feSBharata B Rao 
7270da6f3feSBharata B Rao     /*
7280da6f3feSBharata B Rao      * We walk the CPUs in reverse order to ensure that CPU DT nodes
7290da6f3feSBharata B Rao      * created by fdt_add_subnode() end up in the right order in FDT
7300da6f3feSBharata B Rao      * for the guest kernel the enumerate the CPUs correctly.
7310da6f3feSBharata B Rao      */
7320da6f3feSBharata B Rao     CPU_FOREACH_REVERSE(cs) {
7330da6f3feSBharata B Rao         PowerPCCPU *cpu = POWERPC_CPU(cs);
7340da6f3feSBharata B Rao         int index = ppc_get_vcpu_dt_id(cpu);
7350da6f3feSBharata B Rao         DeviceClass *dc = DEVICE_GET_CLASS(cs);
7360da6f3feSBharata B Rao         int offset;
7370da6f3feSBharata B Rao 
7380da6f3feSBharata B Rao         if ((index % smt) != 0) {
7390da6f3feSBharata B Rao             continue;
7400da6f3feSBharata B Rao         }
7410da6f3feSBharata B Rao 
7420da6f3feSBharata B Rao         nodename = g_strdup_printf("%s@%x", dc->fw_name, index);
7430da6f3feSBharata B Rao         offset = fdt_add_subnode(fdt, cpus_offset, nodename);
7440da6f3feSBharata B Rao         g_free(nodename);
7450da6f3feSBharata B Rao         _FDT(offset);
7460da6f3feSBharata B Rao         spapr_populate_cpu_dt(cs, fdt, offset, spapr);
7470da6f3feSBharata B Rao     }
7480da6f3feSBharata B Rao 
7490da6f3feSBharata B Rao }
7500da6f3feSBharata B Rao 
75103d196b7SBharata B Rao /*
75203d196b7SBharata B Rao  * Adds ibm,dynamic-reconfiguration-memory node.
75303d196b7SBharata B Rao  * Refer to docs/specs/ppc-spapr-hotplug.txt for the documentation
75403d196b7SBharata B Rao  * of this device tree node.
75503d196b7SBharata B Rao  */
75603d196b7SBharata B Rao static int spapr_populate_drconf_memory(sPAPRMachineState *spapr, void *fdt)
75703d196b7SBharata B Rao {
75803d196b7SBharata B Rao     MachineState *machine = MACHINE(spapr);
75903d196b7SBharata B Rao     int ret, i, offset;
76003d196b7SBharata B Rao     uint64_t lmb_size = SPAPR_MEMORY_BLOCK_SIZE;
76103d196b7SBharata B Rao     uint32_t prop_lmb_size[] = {0, cpu_to_be32(lmb_size)};
762e8f986fcSBharata B Rao     uint32_t nr_lmbs = (machine->maxram_size - machine->ram_size)/lmb_size;
76303d196b7SBharata B Rao     uint32_t *int_buf, *cur_index, buf_len;
7646663864eSBharata B Rao     int nr_nodes = nb_numa_nodes ? nb_numa_nodes : 1;
76503d196b7SBharata B Rao 
766ef001f06SThomas Huth     /*
76716c25aefSBharata B Rao      * Don't create the node if there are no DR LMBs.
76816c25aefSBharata B Rao      */
76916c25aefSBharata B Rao     if (!nr_lmbs) {
77016c25aefSBharata B Rao         return 0;
77116c25aefSBharata B Rao     }
77216c25aefSBharata B Rao 
77316c25aefSBharata B Rao     /*
774ef001f06SThomas Huth      * Allocate enough buffer size to fit in ibm,dynamic-memory
775ef001f06SThomas Huth      * or ibm,associativity-lookup-arrays
776ef001f06SThomas Huth      */
777ef001f06SThomas Huth     buf_len = MAX(nr_lmbs * SPAPR_DR_LMB_LIST_ENTRY_SIZE + 1, nr_nodes * 4 + 2)
778ef001f06SThomas Huth               * sizeof(uint32_t);
77903d196b7SBharata B Rao     cur_index = int_buf = g_malloc0(buf_len);
78003d196b7SBharata B Rao 
78103d196b7SBharata B Rao     offset = fdt_add_subnode(fdt, 0, "ibm,dynamic-reconfiguration-memory");
78203d196b7SBharata B Rao 
78303d196b7SBharata B Rao     ret = fdt_setprop(fdt, offset, "ibm,lmb-size", prop_lmb_size,
78403d196b7SBharata B Rao                     sizeof(prop_lmb_size));
78503d196b7SBharata B Rao     if (ret < 0) {
78603d196b7SBharata B Rao         goto out;
78703d196b7SBharata B Rao     }
78803d196b7SBharata B Rao 
78903d196b7SBharata B Rao     ret = fdt_setprop_cell(fdt, offset, "ibm,memory-flags-mask", 0xff);
79003d196b7SBharata B Rao     if (ret < 0) {
79103d196b7SBharata B Rao         goto out;
79203d196b7SBharata B Rao     }
79303d196b7SBharata B Rao 
79403d196b7SBharata B Rao     ret = fdt_setprop_cell(fdt, offset, "ibm,memory-preservation-time", 0x0);
79503d196b7SBharata B Rao     if (ret < 0) {
79603d196b7SBharata B Rao         goto out;
79703d196b7SBharata B Rao     }
79803d196b7SBharata B Rao 
79903d196b7SBharata B Rao     /* ibm,dynamic-memory */
80003d196b7SBharata B Rao     int_buf[0] = cpu_to_be32(nr_lmbs);
80103d196b7SBharata B Rao     cur_index++;
80203d196b7SBharata B Rao     for (i = 0; i < nr_lmbs; i++) {
80303d196b7SBharata B Rao         sPAPRDRConnector *drc;
80403d196b7SBharata B Rao         sPAPRDRConnectorClass *drck;
805e8f986fcSBharata B Rao         uint64_t addr = i * lmb_size + spapr->hotplug_memory.base;;
80603d196b7SBharata B Rao         uint32_t *dynamic_memory = cur_index;
80703d196b7SBharata B Rao 
80803d196b7SBharata B Rao         drc = spapr_dr_connector_by_id(SPAPR_DR_CONNECTOR_TYPE_LMB,
80903d196b7SBharata B Rao                                        addr/lmb_size);
81003d196b7SBharata B Rao         g_assert(drc);
81103d196b7SBharata B Rao         drck = SPAPR_DR_CONNECTOR_GET_CLASS(drc);
81203d196b7SBharata B Rao 
81303d196b7SBharata B Rao         dynamic_memory[0] = cpu_to_be32(addr >> 32);
81403d196b7SBharata B Rao         dynamic_memory[1] = cpu_to_be32(addr & 0xffffffff);
81503d196b7SBharata B Rao         dynamic_memory[2] = cpu_to_be32(drck->get_index(drc));
81603d196b7SBharata B Rao         dynamic_memory[3] = cpu_to_be32(0); /* reserved */
81703d196b7SBharata B Rao         dynamic_memory[4] = cpu_to_be32(numa_get_node(addr, NULL));
81803d196b7SBharata B Rao         if (addr < machine->ram_size ||
81903d196b7SBharata B Rao                     memory_region_present(get_system_memory(), addr)) {
82003d196b7SBharata B Rao             dynamic_memory[5] = cpu_to_be32(SPAPR_LMB_FLAGS_ASSIGNED);
82103d196b7SBharata B Rao         } else {
82203d196b7SBharata B Rao             dynamic_memory[5] = cpu_to_be32(0);
82303d196b7SBharata B Rao         }
82403d196b7SBharata B Rao 
82503d196b7SBharata B Rao         cur_index += SPAPR_DR_LMB_LIST_ENTRY_SIZE;
82603d196b7SBharata B Rao     }
82703d196b7SBharata B Rao     ret = fdt_setprop(fdt, offset, "ibm,dynamic-memory", int_buf, buf_len);
82803d196b7SBharata B Rao     if (ret < 0) {
82903d196b7SBharata B Rao         goto out;
83003d196b7SBharata B Rao     }
83103d196b7SBharata B Rao 
83203d196b7SBharata B Rao     /* ibm,associativity-lookup-arrays */
83303d196b7SBharata B Rao     cur_index = int_buf;
8346663864eSBharata B Rao     int_buf[0] = cpu_to_be32(nr_nodes);
83503d196b7SBharata B Rao     int_buf[1] = cpu_to_be32(4); /* Number of entries per associativity list */
83603d196b7SBharata B Rao     cur_index += 2;
8376663864eSBharata B Rao     for (i = 0; i < nr_nodes; i++) {
83803d196b7SBharata B Rao         uint32_t associativity[] = {
83903d196b7SBharata B Rao             cpu_to_be32(0x0),
84003d196b7SBharata B Rao             cpu_to_be32(0x0),
84103d196b7SBharata B Rao             cpu_to_be32(0x0),
84203d196b7SBharata B Rao             cpu_to_be32(i)
84303d196b7SBharata B Rao         };
84403d196b7SBharata B Rao         memcpy(cur_index, associativity, sizeof(associativity));
84503d196b7SBharata B Rao         cur_index += 4;
84603d196b7SBharata B Rao     }
84703d196b7SBharata B Rao     ret = fdt_setprop(fdt, offset, "ibm,associativity-lookup-arrays", int_buf,
84803d196b7SBharata B Rao             (cur_index - int_buf) * sizeof(uint32_t));
84903d196b7SBharata B Rao out:
85003d196b7SBharata B Rao     g_free(int_buf);
85103d196b7SBharata B Rao     return ret;
85203d196b7SBharata B Rao }
85303d196b7SBharata B Rao 
85403d196b7SBharata B Rao int spapr_h_cas_compose_response(sPAPRMachineState *spapr,
85503d196b7SBharata B Rao                                  target_ulong addr, target_ulong size,
85603d196b7SBharata B Rao                                  bool cpu_update, bool memory_update)
85703d196b7SBharata B Rao {
85803d196b7SBharata B Rao     void *fdt, *fdt_skel;
85903d196b7SBharata B Rao     sPAPRDeviceTreeUpdateHeader hdr = { .version_id = 1 };
86003d196b7SBharata B Rao     sPAPRMachineClass *smc = SPAPR_MACHINE_GET_CLASS(qdev_get_machine());
86103d196b7SBharata B Rao 
86203d196b7SBharata B Rao     size -= sizeof(hdr);
86303d196b7SBharata B Rao 
86403d196b7SBharata B Rao     /* Create sceleton */
86503d196b7SBharata B Rao     fdt_skel = g_malloc0(size);
86603d196b7SBharata B Rao     _FDT((fdt_create(fdt_skel, size)));
86703d196b7SBharata B Rao     _FDT((fdt_begin_node(fdt_skel, "")));
86803d196b7SBharata B Rao     _FDT((fdt_end_node(fdt_skel)));
86903d196b7SBharata B Rao     _FDT((fdt_finish(fdt_skel)));
87003d196b7SBharata B Rao     fdt = g_malloc0(size);
87103d196b7SBharata B Rao     _FDT((fdt_open_into(fdt_skel, fdt, size)));
87203d196b7SBharata B Rao     g_free(fdt_skel);
87303d196b7SBharata B Rao 
87403d196b7SBharata B Rao     /* Fixup cpu nodes */
87503d196b7SBharata B Rao     if (cpu_update) {
87603d196b7SBharata B Rao         _FDT((spapr_fixup_cpu_dt(fdt, spapr)));
87703d196b7SBharata B Rao     }
87803d196b7SBharata B Rao 
87916c25aefSBharata B Rao     /* Generate ibm,dynamic-reconfiguration-memory node if required */
88003d196b7SBharata B Rao     if (memory_update && smc->dr_lmb_enabled) {
88103d196b7SBharata B Rao         _FDT((spapr_populate_drconf_memory(spapr, fdt)));
88203d196b7SBharata B Rao     }
88303d196b7SBharata B Rao 
88403d196b7SBharata B Rao     /* Pack resulting tree */
88503d196b7SBharata B Rao     _FDT((fdt_pack(fdt)));
88603d196b7SBharata B Rao 
88703d196b7SBharata B Rao     if (fdt_totalsize(fdt) + sizeof(hdr) > size) {
88803d196b7SBharata B Rao         trace_spapr_cas_failed(size);
88903d196b7SBharata B Rao         return -1;
89003d196b7SBharata B Rao     }
89103d196b7SBharata B Rao 
89203d196b7SBharata B Rao     cpu_physical_memory_write(addr, &hdr, sizeof(hdr));
89303d196b7SBharata B Rao     cpu_physical_memory_write(addr + sizeof(hdr), fdt, fdt_totalsize(fdt));
89403d196b7SBharata B Rao     trace_spapr_cas_continue(fdt_totalsize(fdt) + sizeof(hdr));
89503d196b7SBharata B Rao     g_free(fdt);
89603d196b7SBharata B Rao 
89703d196b7SBharata B Rao     return 0;
89803d196b7SBharata B Rao }
89903d196b7SBharata B Rao 
90028e02042SDavid Gibson static void spapr_finalize_fdt(sPAPRMachineState *spapr,
90153018216SPaolo Bonzini                                hwaddr fdt_addr,
90253018216SPaolo Bonzini                                hwaddr rtas_addr,
90353018216SPaolo Bonzini                                hwaddr rtas_size)
90453018216SPaolo Bonzini {
9055b2128d2SAlexander Graf     MachineState *machine = MACHINE(qdev_get_machine());
906c20d332aSBharata B Rao     sPAPRMachineClass *smc = SPAPR_MACHINE_GET_CLASS(machine);
9075b2128d2SAlexander Graf     const char *boot_device = machine->boot_order;
90871461b0fSAlexey Kardashevskiy     int ret, i;
90971461b0fSAlexey Kardashevskiy     size_t cb = 0;
91071461b0fSAlexey Kardashevskiy     char *bootlist;
91153018216SPaolo Bonzini     void *fdt;
91253018216SPaolo Bonzini     sPAPRPHBState *phb;
91353018216SPaolo Bonzini 
91453018216SPaolo Bonzini     fdt = g_malloc(FDT_MAX_SIZE);
91553018216SPaolo Bonzini 
91653018216SPaolo Bonzini     /* open out the base tree into a temp buffer for the final tweaks */
91753018216SPaolo Bonzini     _FDT((fdt_open_into(spapr->fdt_skel, fdt, FDT_MAX_SIZE)));
91853018216SPaolo Bonzini 
919e8f986fcSBharata B Rao     ret = spapr_populate_memory(spapr, fdt);
920e8f986fcSBharata B Rao     if (ret < 0) {
921e8f986fcSBharata B Rao         fprintf(stderr, "couldn't setup memory nodes in fdt\n");
922e8f986fcSBharata B Rao         exit(1);
92353018216SPaolo Bonzini     }
92453018216SPaolo Bonzini 
92553018216SPaolo Bonzini     ret = spapr_populate_vdevice(spapr->vio_bus, fdt);
92653018216SPaolo Bonzini     if (ret < 0) {
92753018216SPaolo Bonzini         fprintf(stderr, "couldn't setup vio devices in fdt\n");
92853018216SPaolo Bonzini         exit(1);
92953018216SPaolo Bonzini     }
93053018216SPaolo Bonzini 
9314d9392beSThomas Huth     if (object_resolve_path_type("", TYPE_SPAPR_RNG, NULL)) {
9324d9392beSThomas Huth         ret = spapr_rng_populate_dt(fdt);
9334d9392beSThomas Huth         if (ret < 0) {
9344d9392beSThomas Huth             fprintf(stderr, "could not set up rng device in the fdt\n");
9354d9392beSThomas Huth             exit(1);
9364d9392beSThomas Huth         }
9374d9392beSThomas Huth     }
9384d9392beSThomas Huth 
93953018216SPaolo Bonzini     QLIST_FOREACH(phb, &spapr->phbs, list) {
94053018216SPaolo Bonzini         ret = spapr_populate_pci_dt(phb, PHANDLE_XICP, fdt);
94153018216SPaolo Bonzini     }
94253018216SPaolo Bonzini 
94353018216SPaolo Bonzini     if (ret < 0) {
94453018216SPaolo Bonzini         fprintf(stderr, "couldn't setup PCI devices in fdt\n");
94553018216SPaolo Bonzini         exit(1);
94653018216SPaolo Bonzini     }
94753018216SPaolo Bonzini 
94853018216SPaolo Bonzini     /* RTAS */
94953018216SPaolo Bonzini     ret = spapr_rtas_device_tree_setup(fdt, rtas_addr, rtas_size);
95053018216SPaolo Bonzini     if (ret < 0) {
95153018216SPaolo Bonzini         fprintf(stderr, "Couldn't set up RTAS device tree properties\n");
95253018216SPaolo Bonzini     }
95353018216SPaolo Bonzini 
9540da6f3feSBharata B Rao     /* cpus */
9550da6f3feSBharata B Rao     spapr_populate_cpus_dt_node(fdt, spapr);
95653018216SPaolo Bonzini 
95771461b0fSAlexey Kardashevskiy     bootlist = get_boot_devices_list(&cb, true);
95871461b0fSAlexey Kardashevskiy     if (cb && bootlist) {
95971461b0fSAlexey Kardashevskiy         int offset = fdt_path_offset(fdt, "/chosen");
96071461b0fSAlexey Kardashevskiy         if (offset < 0) {
96171461b0fSAlexey Kardashevskiy             exit(1);
96271461b0fSAlexey Kardashevskiy         }
96371461b0fSAlexey Kardashevskiy         for (i = 0; i < cb; i++) {
96471461b0fSAlexey Kardashevskiy             if (bootlist[i] == '\n') {
96571461b0fSAlexey Kardashevskiy                 bootlist[i] = ' ';
96671461b0fSAlexey Kardashevskiy             }
96771461b0fSAlexey Kardashevskiy 
96871461b0fSAlexey Kardashevskiy         }
96971461b0fSAlexey Kardashevskiy         ret = fdt_setprop_string(fdt, offset, "qemu,boot-list", bootlist);
97071461b0fSAlexey Kardashevskiy     }
97171461b0fSAlexey Kardashevskiy 
9725b2128d2SAlexander Graf     if (boot_device && strlen(boot_device)) {
9735b2128d2SAlexander Graf         int offset = fdt_path_offset(fdt, "/chosen");
9745b2128d2SAlexander Graf 
9755b2128d2SAlexander Graf         if (offset < 0) {
9765b2128d2SAlexander Graf             exit(1);
9775b2128d2SAlexander Graf         }
9785b2128d2SAlexander Graf         fdt_setprop_string(fdt, offset, "qemu,boot-device", boot_device);
9795b2128d2SAlexander Graf     }
9805b2128d2SAlexander Graf 
98153018216SPaolo Bonzini     if (!spapr->has_graphics) {
98253018216SPaolo Bonzini         spapr_populate_chosen_stdout(fdt, spapr->vio_bus);
98353018216SPaolo Bonzini     }
98453018216SPaolo Bonzini 
985c20d332aSBharata B Rao     if (smc->dr_lmb_enabled) {
986c20d332aSBharata B Rao         _FDT(spapr_drc_populate_dt(fdt, 0, NULL, SPAPR_DR_CONNECTOR_TYPE_LMB));
987c20d332aSBharata B Rao     }
988c20d332aSBharata B Rao 
98953018216SPaolo Bonzini     _FDT((fdt_pack(fdt)));
99053018216SPaolo Bonzini 
99153018216SPaolo Bonzini     if (fdt_totalsize(fdt) > FDT_MAX_SIZE) {
992730fce59SThomas Huth         error_report("FDT too big ! 0x%x bytes (max is 0x%x)",
99353018216SPaolo Bonzini                      fdt_totalsize(fdt), FDT_MAX_SIZE);
99453018216SPaolo Bonzini         exit(1);
99553018216SPaolo Bonzini     }
99653018216SPaolo Bonzini 
997ad440b4aSAndrew Jones     qemu_fdt_dumpdtb(fdt, fdt_totalsize(fdt));
99853018216SPaolo Bonzini     cpu_physical_memory_write(fdt_addr, fdt, fdt_totalsize(fdt));
99953018216SPaolo Bonzini 
1000a21a7a70SGonglei     g_free(bootlist);
100153018216SPaolo Bonzini     g_free(fdt);
100253018216SPaolo Bonzini }
100353018216SPaolo Bonzini 
100453018216SPaolo Bonzini static uint64_t translate_kernel_address(void *opaque, uint64_t addr)
100553018216SPaolo Bonzini {
100653018216SPaolo Bonzini     return (addr & 0x0fffffff) + KERNEL_LOAD_ADDR;
100753018216SPaolo Bonzini }
100853018216SPaolo Bonzini 
100953018216SPaolo Bonzini static void emulate_spapr_hypercall(PowerPCCPU *cpu)
101053018216SPaolo Bonzini {
101153018216SPaolo Bonzini     CPUPPCState *env = &cpu->env;
101253018216SPaolo Bonzini 
101353018216SPaolo Bonzini     if (msr_pr) {
101453018216SPaolo Bonzini         hcall_dprintf("Hypercall made with MSR[PR]=1\n");
101553018216SPaolo Bonzini         env->gpr[3] = H_PRIVILEGE;
101653018216SPaolo Bonzini     } else {
101753018216SPaolo Bonzini         env->gpr[3] = spapr_hypercall(cpu, env->gpr[3], &env->gpr[4]);
101853018216SPaolo Bonzini     }
101953018216SPaolo Bonzini }
102053018216SPaolo Bonzini 
/*
 * Helpers for walking a hash page table as an array of 64-bit words.
 *
 * HPTE(table, i) yields a pointer to entry i, each entry being two
 * 64-bit words.  The remaining macros test or update flag bits in the
 * first word of the entry they are given, converting with tswap64().
 */
#define HPTE(_table, _i)   ((void *)(((uint64_t *)(_table)) + ((_i) * 2)))
#define HPTE_VALID(_hpte)  (tswap64(*((uint64_t *)(_hpte))) & HPTE64_V_VALID)
#define HPTE_DIRTY(_hpte)  \
    (tswap64(*((uint64_t *)(_hpte))) & HPTE64_V_HPTE_DIRTY)
#define CLEAN_HPTE(_hpte)  \
    ((*(uint64_t *)(_hpte)) &= tswap64(~HPTE64_V_HPTE_DIRTY))
#define DIRTY_HPTE(_hpte)  \
    ((*(uint64_t *)(_hpte)) |= tswap64(HPTE64_V_HPTE_DIRTY))
1026e6b8fd24SSamuel Mendoza-Jonas 
1027b817772aSBharata B Rao static void spapr_alloc_htab(sPAPRMachineState *spapr)
102853018216SPaolo Bonzini {
102953018216SPaolo Bonzini     long shift;
1030e6b8fd24SSamuel Mendoza-Jonas     int index;
103153018216SPaolo Bonzini 
103253018216SPaolo Bonzini     /* allocate hash page table.  For now we always make this 16mb,
103353018216SPaolo Bonzini      * later we should probably make it scale to the size of guest
103453018216SPaolo Bonzini      * RAM */
103553018216SPaolo Bonzini 
103653018216SPaolo Bonzini     shift = kvmppc_reset_htab(spapr->htab_shift);
1037b41d320fSBharata B Rao     if (shift < 0) {
1038b41d320fSBharata B Rao         /*
1039b41d320fSBharata B Rao          * For HV KVM, host kernel will return -ENOMEM when requested
1040b41d320fSBharata B Rao          * HTAB size can't be allocated.
1041b41d320fSBharata B Rao          */
1042b41d320fSBharata B Rao         error_setg(&error_abort, "Failed to allocate HTAB of requested size, try with smaller maxmem");
1043b41d320fSBharata B Rao     } else if (shift > 0) {
1044b41d320fSBharata B Rao         /*
1045b41d320fSBharata B Rao          * Kernel handles htab, we don't need to allocate one
1046b41d320fSBharata B Rao          *
1047b41d320fSBharata B Rao          * Older kernels can fall back to lower HTAB shift values,
1048b41d320fSBharata B Rao          * but we don't allow booting of such guests.
1049b41d320fSBharata B Rao          */
10507735fedaSBharata B Rao         if (shift != spapr->htab_shift) {
10517735fedaSBharata B Rao             error_setg(&error_abort, "Failed to allocate HTAB of requested size, try with smaller maxmem");
10527735fedaSBharata B Rao         }
10537735fedaSBharata B Rao 
105453018216SPaolo Bonzini         spapr->htab_shift = shift;
10557c43bca0SAneesh Kumar K.V         kvmppc_kern_htab = true;
1056b817772aSBharata B Rao     } else {
1057b817772aSBharata B Rao         /* Allocate htab */
1058b817772aSBharata B Rao         spapr->htab = qemu_memalign(HTAB_SIZE(spapr), HTAB_SIZE(spapr));
105901a57972SSamuel Mendoza-Jonas 
1060b817772aSBharata B Rao         /* And clear it */
1061b817772aSBharata B Rao         memset(spapr->htab, 0, HTAB_SIZE(spapr));
1062b817772aSBharata B Rao 
1063b817772aSBharata B Rao         for (index = 0; index < HTAB_SIZE(spapr) / HASH_PTE_SIZE_64; index++) {
1064b817772aSBharata B Rao             DIRTY_HPTE(HPTE(spapr->htab, index));
1065b817772aSBharata B Rao         }
1066b817772aSBharata B Rao     }
1067b817772aSBharata B Rao }
1068b817772aSBharata B Rao 
1069b817772aSBharata B Rao /*
1070b817772aSBharata B Rao  * Clear HTAB entries during reset.
1071b817772aSBharata B Rao  *
1072b817772aSBharata B Rao  * If host kernel has allocated HTAB, KVM_PPC_ALLOCATE_HTAB ioctl is
1073b817772aSBharata B Rao  * used to clear HTAB. Otherwise QEMU-allocated HTAB is cleared manually.
1074b817772aSBharata B Rao  */
1075b817772aSBharata B Rao static void spapr_reset_htab(sPAPRMachineState *spapr)
1076b817772aSBharata B Rao {
1077b817772aSBharata B Rao     long shift;
1078b817772aSBharata B Rao     int index;
1079b817772aSBharata B Rao 
1080b817772aSBharata B Rao     shift = kvmppc_reset_htab(spapr->htab_shift);
1081b41d320fSBharata B Rao     if (shift < 0) {
1082b41d320fSBharata B Rao         error_setg(&error_abort, "Failed to reset HTAB");
1083b41d320fSBharata B Rao     } else if (shift > 0) {
10847735fedaSBharata B Rao         if (shift != spapr->htab_shift) {
10857735fedaSBharata B Rao             error_setg(&error_abort, "Requested HTAB allocation failed during reset");
10867735fedaSBharata B Rao         }
10877735fedaSBharata B Rao 
108801a57972SSamuel Mendoza-Jonas         /* Tell readers to update their file descriptor */
108901a57972SSamuel Mendoza-Jonas         if (spapr->htab_fd >= 0) {
109001a57972SSamuel Mendoza-Jonas             spapr->htab_fd_stale = true;
109101a57972SSamuel Mendoza-Jonas         }
109253018216SPaolo Bonzini     } else {
109353018216SPaolo Bonzini         memset(spapr->htab, 0, HTAB_SIZE(spapr));
1094e6b8fd24SSamuel Mendoza-Jonas 
1095e6b8fd24SSamuel Mendoza-Jonas         for (index = 0; index < HTAB_SIZE(spapr) / HASH_PTE_SIZE_64; index++) {
1096e6b8fd24SSamuel Mendoza-Jonas             DIRTY_HPTE(HPTE(spapr->htab, index));
1097e6b8fd24SSamuel Mendoza-Jonas         }
109853018216SPaolo Bonzini     }
109953018216SPaolo Bonzini 
110053018216SPaolo Bonzini     /* Update the RMA size if necessary */
110153018216SPaolo Bonzini     if (spapr->vrma_adjust) {
1102b082d65aSAlexey Kardashevskiy         spapr->rma_size = kvmppc_rma_size(spapr_node0_size(),
1103b082d65aSAlexey Kardashevskiy                                           spapr->htab_shift);
110453018216SPaolo Bonzini     }
110553018216SPaolo Bonzini }
110653018216SPaolo Bonzini 
11079e3f9733SAlexander Graf static int find_unknown_sysbus_device(SysBusDevice *sbdev, void *opaque)
11089e3f9733SAlexander Graf {
11099e3f9733SAlexander Graf     bool matched = false;
11109e3f9733SAlexander Graf 
11119e3f9733SAlexander Graf     if (object_dynamic_cast(OBJECT(sbdev), TYPE_SPAPR_PCI_HOST_BRIDGE)) {
11129e3f9733SAlexander Graf         matched = true;
11139e3f9733SAlexander Graf     }
11149e3f9733SAlexander Graf 
11159e3f9733SAlexander Graf     if (!matched) {
11169e3f9733SAlexander Graf         error_report("Device %s is not supported by this machine yet.",
11179e3f9733SAlexander Graf                      qdev_fw_name(DEVICE(sbdev)));
11189e3f9733SAlexander Graf         exit(1);
11199e3f9733SAlexander Graf     }
11209e3f9733SAlexander Graf 
11219e3f9733SAlexander Graf     return 0;
11229e3f9733SAlexander Graf }
11239e3f9733SAlexander Graf 
112401a57972SSamuel Mendoza-Jonas /*
112501a57972SSamuel Mendoza-Jonas  * A guest reset will cause spapr->htab_fd to become stale if being used.
112601a57972SSamuel Mendoza-Jonas  * Reopen the file descriptor to make sure the whole HTAB is properly read.
112701a57972SSamuel Mendoza-Jonas  */
112828e02042SDavid Gibson static int spapr_check_htab_fd(sPAPRMachineState *spapr)
112901a57972SSamuel Mendoza-Jonas {
113001a57972SSamuel Mendoza-Jonas     int rc = 0;
113101a57972SSamuel Mendoza-Jonas 
113201a57972SSamuel Mendoza-Jonas     if (spapr->htab_fd_stale) {
113301a57972SSamuel Mendoza-Jonas         close(spapr->htab_fd);
113401a57972SSamuel Mendoza-Jonas         spapr->htab_fd = kvmppc_get_htab_fd(false);
113501a57972SSamuel Mendoza-Jonas         if (spapr->htab_fd < 0) {
113601a57972SSamuel Mendoza-Jonas             error_report("Unable to open fd for reading hash table from KVM: "
113701a57972SSamuel Mendoza-Jonas                          "%s", strerror(errno));
113801a57972SSamuel Mendoza-Jonas             rc = -1;
113901a57972SSamuel Mendoza-Jonas         }
114001a57972SSamuel Mendoza-Jonas         spapr->htab_fd_stale = false;
114101a57972SSamuel Mendoza-Jonas     }
114201a57972SSamuel Mendoza-Jonas 
114301a57972SSamuel Mendoza-Jonas     return rc;
114401a57972SSamuel Mendoza-Jonas }
114501a57972SSamuel Mendoza-Jonas 
114653018216SPaolo Bonzini static void ppc_spapr_reset(void)
114753018216SPaolo Bonzini {
114828e02042SDavid Gibson     sPAPRMachineState *spapr = SPAPR_MACHINE(qdev_get_machine());
1149182735efSAndreas Färber     PowerPCCPU *first_ppc_cpu;
1150b7d1f77aSBenjamin Herrenschmidt     uint32_t rtas_limit;
1151259186a7SAndreas Färber 
11529e3f9733SAlexander Graf     /* Check for unknown sysbus devices */
11539e3f9733SAlexander Graf     foreach_dynamic_sysbus_device(find_unknown_sysbus_device, NULL);
11549e3f9733SAlexander Graf 
115553018216SPaolo Bonzini     /* Reset the hash table & recalc the RMA */
115653018216SPaolo Bonzini     spapr_reset_htab(spapr);
115753018216SPaolo Bonzini 
115853018216SPaolo Bonzini     qemu_devices_reset();
115953018216SPaolo Bonzini 
1160b7d1f77aSBenjamin Herrenschmidt     /*
1161b7d1f77aSBenjamin Herrenschmidt      * We place the device tree and RTAS just below either the top of the RMA,
1162b7d1f77aSBenjamin Herrenschmidt      * or just below 2GB, whichever is lowere, so that it can be
1163b7d1f77aSBenjamin Herrenschmidt      * processed with 32-bit real mode code if necessary
1164b7d1f77aSBenjamin Herrenschmidt      */
1165b7d1f77aSBenjamin Herrenschmidt     rtas_limit = MIN(spapr->rma_size, RTAS_MAX_ADDR);
1166b7d1f77aSBenjamin Herrenschmidt     spapr->rtas_addr = rtas_limit - RTAS_MAX_SIZE;
1167b7d1f77aSBenjamin Herrenschmidt     spapr->fdt_addr = spapr->rtas_addr - FDT_MAX_SIZE;
1168b7d1f77aSBenjamin Herrenschmidt 
116953018216SPaolo Bonzini     /* Load the fdt */
117053018216SPaolo Bonzini     spapr_finalize_fdt(spapr, spapr->fdt_addr, spapr->rtas_addr,
117153018216SPaolo Bonzini                        spapr->rtas_size);
117253018216SPaolo Bonzini 
1173b7d1f77aSBenjamin Herrenschmidt     /* Copy RTAS over */
1174b7d1f77aSBenjamin Herrenschmidt     cpu_physical_memory_write(spapr->rtas_addr, spapr->rtas_blob,
1175b7d1f77aSBenjamin Herrenschmidt                               spapr->rtas_size);
1176b7d1f77aSBenjamin Herrenschmidt 
117753018216SPaolo Bonzini     /* Set up the entry state */
1178182735efSAndreas Färber     first_ppc_cpu = POWERPC_CPU(first_cpu);
1179182735efSAndreas Färber     first_ppc_cpu->env.gpr[3] = spapr->fdt_addr;
1180182735efSAndreas Färber     first_ppc_cpu->env.gpr[5] = 0;
1181182735efSAndreas Färber     first_cpu->halted = 0;
11821b718907SDavid Gibson     first_ppc_cpu->env.nip = SPAPR_ENTRY_POINT;
118353018216SPaolo Bonzini 
118453018216SPaolo Bonzini }
118553018216SPaolo Bonzini 
118653018216SPaolo Bonzini static void spapr_cpu_reset(void *opaque)
118753018216SPaolo Bonzini {
118828e02042SDavid Gibson     sPAPRMachineState *spapr = SPAPR_MACHINE(qdev_get_machine());
118953018216SPaolo Bonzini     PowerPCCPU *cpu = opaque;
1190259186a7SAndreas Färber     CPUState *cs = CPU(cpu);
119153018216SPaolo Bonzini     CPUPPCState *env = &cpu->env;
119253018216SPaolo Bonzini 
1193259186a7SAndreas Färber     cpu_reset(cs);
119453018216SPaolo Bonzini 
119553018216SPaolo Bonzini     /* All CPUs start halted.  CPU0 is unhalted from the machine level
119653018216SPaolo Bonzini      * reset code and the rest are explicitly started up by the guest
119753018216SPaolo Bonzini      * using an RTAS call */
1198259186a7SAndreas Färber     cs->halted = 1;
119953018216SPaolo Bonzini 
120053018216SPaolo Bonzini     env->spr[SPR_HIOR] = 0;
120153018216SPaolo Bonzini 
12024be21d56SDavid Gibson     env->external_htab = (uint8_t *)spapr->htab;
12035736245cSAneesh Kumar K.V     if (kvm_enabled() && !env->external_htab) {
12045736245cSAneesh Kumar K.V         /*
12055736245cSAneesh Kumar K.V          * HV KVM, set external_htab to 1 so our ppc_hash64_load_hpte*
12065736245cSAneesh Kumar K.V          * functions do the right thing.
12075736245cSAneesh Kumar K.V          */
12085736245cSAneesh Kumar K.V         env->external_htab = (void *)1;
12095736245cSAneesh Kumar K.V     }
121053018216SPaolo Bonzini     env->htab_base = -1;
1211f3c75d42SAneesh Kumar K.V     /*
1212f3c75d42SAneesh Kumar K.V      * htab_mask is the mask used to normalize hash value to PTEG index.
1213f3c75d42SAneesh Kumar K.V      * htab_shift is log2 of hash table size.
1214f3c75d42SAneesh Kumar K.V      * We have 8 hpte per group, and each hpte is 16 bytes.
1215f3c75d42SAneesh Kumar K.V      * ie have 128 bytes per hpte entry.
1216f3c75d42SAneesh Kumar K.V      */
121728e02042SDavid Gibson     env->htab_mask = (1ULL << (spapr->htab_shift - 7)) - 1;
1218ec4936e1SStefan Weil     env->spr[SPR_SDR1] = (target_ulong)(uintptr_t)spapr->htab |
121953018216SPaolo Bonzini         (spapr->htab_shift - 18);
122053018216SPaolo Bonzini }
122153018216SPaolo Bonzini 
122228e02042SDavid Gibson static void spapr_create_nvram(sPAPRMachineState *spapr)
122353018216SPaolo Bonzini {
12242ff3de68SMarkus Armbruster     DeviceState *dev = qdev_create(&spapr->vio_bus->bus, "spapr-nvram");
12253978b863SPaolo Bonzini     DriveInfo *dinfo = drive_get(IF_PFLASH, 0, 0);
122653018216SPaolo Bonzini 
12273978b863SPaolo Bonzini     if (dinfo) {
12286231a6daSMarkus Armbruster         qdev_prop_set_drive(dev, "drive", blk_by_legacy_dinfo(dinfo),
12296231a6daSMarkus Armbruster                             &error_fatal);
123053018216SPaolo Bonzini     }
123153018216SPaolo Bonzini 
123253018216SPaolo Bonzini     qdev_init_nofail(dev);
123353018216SPaolo Bonzini 
123453018216SPaolo Bonzini     spapr->nvram = (struct sPAPRNVRAM *)dev;
123553018216SPaolo Bonzini }
123653018216SPaolo Bonzini 
123728e02042SDavid Gibson static void spapr_rtc_create(sPAPRMachineState *spapr)
123828df36a1SDavid Gibson {
123928df36a1SDavid Gibson     DeviceState *dev = qdev_create(NULL, TYPE_SPAPR_RTC);
124028df36a1SDavid Gibson 
124128df36a1SDavid Gibson     qdev_init_nofail(dev);
124228df36a1SDavid Gibson     spapr->rtc = dev;
124374e5ae28SDavid Gibson 
124474e5ae28SDavid Gibson     object_property_add_alias(qdev_get_machine(), "rtc-time",
124574e5ae28SDavid Gibson                               OBJECT(spapr->rtc), "date", NULL);
124628df36a1SDavid Gibson }
124728df36a1SDavid Gibson 
124853018216SPaolo Bonzini /* Returns whether we want to use VGA or not */
124953018216SPaolo Bonzini static int spapr_vga_init(PCIBus *pci_bus)
125053018216SPaolo Bonzini {
125153018216SPaolo Bonzini     switch (vga_interface_type) {
125253018216SPaolo Bonzini     case VGA_NONE:
12537effdaa3SMark Wu         return false;
12547effdaa3SMark Wu     case VGA_DEVICE:
12557effdaa3SMark Wu         return true;
125653018216SPaolo Bonzini     case VGA_STD:
1257b798c190SBenjamin Herrenschmidt     case VGA_VIRTIO:
125853018216SPaolo Bonzini         return pci_vga_init(pci_bus) != NULL;
125953018216SPaolo Bonzini     default:
126053018216SPaolo Bonzini         fprintf(stderr, "This vga model is not supported,"
126153018216SPaolo Bonzini                 "currently it only supports -vga std\n");
126253018216SPaolo Bonzini         exit(0);
126353018216SPaolo Bonzini     }
126453018216SPaolo Bonzini }
126553018216SPaolo Bonzini 
1266880ae7deSDavid Gibson static int spapr_post_load(void *opaque, int version_id)
1267880ae7deSDavid Gibson {
126828e02042SDavid Gibson     sPAPRMachineState *spapr = (sPAPRMachineState *)opaque;
1269880ae7deSDavid Gibson     int err = 0;
1270880ae7deSDavid Gibson 
1271631b22eaSStefan Weil     /* In earlier versions, there was no separate qdev for the PAPR
1272880ae7deSDavid Gibson      * RTC, so the RTC offset was stored directly in sPAPREnvironment.
1273880ae7deSDavid Gibson      * So when migrating from those versions, poke the incoming offset
1274880ae7deSDavid Gibson      * value into the RTC device */
1275880ae7deSDavid Gibson     if (version_id < 3) {
1276880ae7deSDavid Gibson         err = spapr_rtc_import_offset(spapr->rtc, spapr->rtc_offset);
1277880ae7deSDavid Gibson     }
1278880ae7deSDavid Gibson 
1279880ae7deSDavid Gibson     return err;
1280880ae7deSDavid Gibson }
1281880ae7deSDavid Gibson 
/* vmstate field test: true for streams with a version lower than 3 */
static bool version_before_3(void *opaque, int version_id)
{
    return version_id <= 2;
}
1286880ae7deSDavid Gibson 
12874be21d56SDavid Gibson static const VMStateDescription vmstate_spapr = {
12884be21d56SDavid Gibson     .name = "spapr",
1289880ae7deSDavid Gibson     .version_id = 3,
12904be21d56SDavid Gibson     .minimum_version_id = 1,
1291880ae7deSDavid Gibson     .post_load = spapr_post_load,
12924be21d56SDavid Gibson     .fields = (VMStateField[]) {
1293880ae7deSDavid Gibson         /* used to be @next_irq */
1294880ae7deSDavid Gibson         VMSTATE_UNUSED_BUFFER(version_before_3, 0, 4),
12954be21d56SDavid Gibson 
12964be21d56SDavid Gibson         /* RTC offset */
129728e02042SDavid Gibson         VMSTATE_UINT64_TEST(rtc_offset, sPAPRMachineState, version_before_3),
1298880ae7deSDavid Gibson 
129928e02042SDavid Gibson         VMSTATE_PPC_TIMEBASE_V(tb, sPAPRMachineState, 2),
13004be21d56SDavid Gibson         VMSTATE_END_OF_LIST()
13014be21d56SDavid Gibson     },
13024be21d56SDavid Gibson };
13034be21d56SDavid Gibson 
13044be21d56SDavid Gibson static int htab_save_setup(QEMUFile *f, void *opaque)
13054be21d56SDavid Gibson {
130628e02042SDavid Gibson     sPAPRMachineState *spapr = opaque;
13074be21d56SDavid Gibson 
13084be21d56SDavid Gibson     /* "Iteration" header */
13094be21d56SDavid Gibson     qemu_put_be32(f, spapr->htab_shift);
13104be21d56SDavid Gibson 
1311e68cb8b4SAlexey Kardashevskiy     if (spapr->htab) {
1312e68cb8b4SAlexey Kardashevskiy         spapr->htab_save_index = 0;
1313e68cb8b4SAlexey Kardashevskiy         spapr->htab_first_pass = true;
1314e68cb8b4SAlexey Kardashevskiy     } else {
1315e68cb8b4SAlexey Kardashevskiy         assert(kvm_enabled());
1316e68cb8b4SAlexey Kardashevskiy 
1317e68cb8b4SAlexey Kardashevskiy         spapr->htab_fd = kvmppc_get_htab_fd(false);
131801a57972SSamuel Mendoza-Jonas         spapr->htab_fd_stale = false;
1319e68cb8b4SAlexey Kardashevskiy         if (spapr->htab_fd < 0) {
1320e68cb8b4SAlexey Kardashevskiy             fprintf(stderr, "Unable to open fd for reading hash table from KVM: %s\n",
1321e68cb8b4SAlexey Kardashevskiy                     strerror(errno));
1322e68cb8b4SAlexey Kardashevskiy             return -1;
1323e68cb8b4SAlexey Kardashevskiy         }
13244be21d56SDavid Gibson     }
13254be21d56SDavid Gibson 
1326e68cb8b4SAlexey Kardashevskiy 
1327e68cb8b4SAlexey Kardashevskiy     return 0;
1328e68cb8b4SAlexey Kardashevskiy }
13294be21d56SDavid Gibson 
133028e02042SDavid Gibson static void htab_save_first_pass(QEMUFile *f, sPAPRMachineState *spapr,
13314be21d56SDavid Gibson                                  int64_t max_ns)
13324be21d56SDavid Gibson {
13334be21d56SDavid Gibson     int htabslots = HTAB_SIZE(spapr) / HASH_PTE_SIZE_64;
13344be21d56SDavid Gibson     int index = spapr->htab_save_index;
1335bc72ad67SAlex Bligh     int64_t starttime = qemu_clock_get_ns(QEMU_CLOCK_REALTIME);
13364be21d56SDavid Gibson 
13374be21d56SDavid Gibson     assert(spapr->htab_first_pass);
13384be21d56SDavid Gibson 
13394be21d56SDavid Gibson     do {
13404be21d56SDavid Gibson         int chunkstart;
13414be21d56SDavid Gibson 
13424be21d56SDavid Gibson         /* Consume invalid HPTEs */
13434be21d56SDavid Gibson         while ((index < htabslots)
13444be21d56SDavid Gibson                && !HPTE_VALID(HPTE(spapr->htab, index))) {
13454be21d56SDavid Gibson             index++;
13464be21d56SDavid Gibson             CLEAN_HPTE(HPTE(spapr->htab, index));
13474be21d56SDavid Gibson         }
13484be21d56SDavid Gibson 
13494be21d56SDavid Gibson         /* Consume valid HPTEs */
13504be21d56SDavid Gibson         chunkstart = index;
1351338c25b6SSamuel Mendoza-Jonas         while ((index < htabslots) && (index - chunkstart < USHRT_MAX)
13524be21d56SDavid Gibson                && HPTE_VALID(HPTE(spapr->htab, index))) {
13534be21d56SDavid Gibson             index++;
13544be21d56SDavid Gibson             CLEAN_HPTE(HPTE(spapr->htab, index));
13554be21d56SDavid Gibson         }
13564be21d56SDavid Gibson 
13574be21d56SDavid Gibson         if (index > chunkstart) {
13584be21d56SDavid Gibson             int n_valid = index - chunkstart;
13594be21d56SDavid Gibson 
13604be21d56SDavid Gibson             qemu_put_be32(f, chunkstart);
13614be21d56SDavid Gibson             qemu_put_be16(f, n_valid);
13624be21d56SDavid Gibson             qemu_put_be16(f, 0);
13634be21d56SDavid Gibson             qemu_put_buffer(f, HPTE(spapr->htab, chunkstart),
13644be21d56SDavid Gibson                             HASH_PTE_SIZE_64 * n_valid);
13654be21d56SDavid Gibson 
1366bc72ad67SAlex Bligh             if ((qemu_clock_get_ns(QEMU_CLOCK_REALTIME) - starttime) > max_ns) {
13674be21d56SDavid Gibson                 break;
13684be21d56SDavid Gibson             }
13694be21d56SDavid Gibson         }
13704be21d56SDavid Gibson     } while ((index < htabslots) && !qemu_file_rate_limit(f));
13714be21d56SDavid Gibson 
13724be21d56SDavid Gibson     if (index >= htabslots) {
13734be21d56SDavid Gibson         assert(index == htabslots);
13744be21d56SDavid Gibson         index = 0;
13754be21d56SDavid Gibson         spapr->htab_first_pass = false;
13764be21d56SDavid Gibson     }
13774be21d56SDavid Gibson     spapr->htab_save_index = index;
13784be21d56SDavid Gibson }
13794be21d56SDavid Gibson 
138028e02042SDavid Gibson static int htab_save_later_pass(QEMUFile *f, sPAPRMachineState *spapr,
13814be21d56SDavid Gibson                                 int64_t max_ns)
13824be21d56SDavid Gibson {
13834be21d56SDavid Gibson     bool final = max_ns < 0;
13844be21d56SDavid Gibson     int htabslots = HTAB_SIZE(spapr) / HASH_PTE_SIZE_64;
13854be21d56SDavid Gibson     int examined = 0, sent = 0;
13864be21d56SDavid Gibson     int index = spapr->htab_save_index;
1387bc72ad67SAlex Bligh     int64_t starttime = qemu_clock_get_ns(QEMU_CLOCK_REALTIME);
13884be21d56SDavid Gibson 
13894be21d56SDavid Gibson     assert(!spapr->htab_first_pass);
13904be21d56SDavid Gibson 
13914be21d56SDavid Gibson     do {
13924be21d56SDavid Gibson         int chunkstart, invalidstart;
13934be21d56SDavid Gibson 
13944be21d56SDavid Gibson         /* Consume non-dirty HPTEs */
13954be21d56SDavid Gibson         while ((index < htabslots)
13964be21d56SDavid Gibson                && !HPTE_DIRTY(HPTE(spapr->htab, index))) {
13974be21d56SDavid Gibson             index++;
13984be21d56SDavid Gibson             examined++;
13994be21d56SDavid Gibson         }
14004be21d56SDavid Gibson 
14014be21d56SDavid Gibson         chunkstart = index;
14024be21d56SDavid Gibson         /* Consume valid dirty HPTEs */
1403338c25b6SSamuel Mendoza-Jonas         while ((index < htabslots) && (index - chunkstart < USHRT_MAX)
14044be21d56SDavid Gibson                && HPTE_DIRTY(HPTE(spapr->htab, index))
14054be21d56SDavid Gibson                && HPTE_VALID(HPTE(spapr->htab, index))) {
14064be21d56SDavid Gibson             CLEAN_HPTE(HPTE(spapr->htab, index));
14074be21d56SDavid Gibson             index++;
14084be21d56SDavid Gibson             examined++;
14094be21d56SDavid Gibson         }
14104be21d56SDavid Gibson 
14114be21d56SDavid Gibson         invalidstart = index;
14124be21d56SDavid Gibson         /* Consume invalid dirty HPTEs */
1413338c25b6SSamuel Mendoza-Jonas         while ((index < htabslots) && (index - invalidstart < USHRT_MAX)
14144be21d56SDavid Gibson                && HPTE_DIRTY(HPTE(spapr->htab, index))
14154be21d56SDavid Gibson                && !HPTE_VALID(HPTE(spapr->htab, index))) {
14164be21d56SDavid Gibson             CLEAN_HPTE(HPTE(spapr->htab, index));
14174be21d56SDavid Gibson             index++;
14184be21d56SDavid Gibson             examined++;
14194be21d56SDavid Gibson         }
14204be21d56SDavid Gibson 
14214be21d56SDavid Gibson         if (index > chunkstart) {
14224be21d56SDavid Gibson             int n_valid = invalidstart - chunkstart;
14234be21d56SDavid Gibson             int n_invalid = index - invalidstart;
14244be21d56SDavid Gibson 
14254be21d56SDavid Gibson             qemu_put_be32(f, chunkstart);
14264be21d56SDavid Gibson             qemu_put_be16(f, n_valid);
14274be21d56SDavid Gibson             qemu_put_be16(f, n_invalid);
14284be21d56SDavid Gibson             qemu_put_buffer(f, HPTE(spapr->htab, chunkstart),
14294be21d56SDavid Gibson                             HASH_PTE_SIZE_64 * n_valid);
14304be21d56SDavid Gibson             sent += index - chunkstart;
14314be21d56SDavid Gibson 
1432bc72ad67SAlex Bligh             if (!final && (qemu_clock_get_ns(QEMU_CLOCK_REALTIME) - starttime) > max_ns) {
14334be21d56SDavid Gibson                 break;
14344be21d56SDavid Gibson             }
14354be21d56SDavid Gibson         }
14364be21d56SDavid Gibson 
14374be21d56SDavid Gibson         if (examined >= htabslots) {
14384be21d56SDavid Gibson             break;
14394be21d56SDavid Gibson         }
14404be21d56SDavid Gibson 
14414be21d56SDavid Gibson         if (index >= htabslots) {
14424be21d56SDavid Gibson             assert(index == htabslots);
14434be21d56SDavid Gibson             index = 0;
14444be21d56SDavid Gibson         }
14454be21d56SDavid Gibson     } while ((examined < htabslots) && (!qemu_file_rate_limit(f) || final));
14464be21d56SDavid Gibson 
14474be21d56SDavid Gibson     if (index >= htabslots) {
14484be21d56SDavid Gibson         assert(index == htabslots);
14494be21d56SDavid Gibson         index = 0;
14504be21d56SDavid Gibson     }
14514be21d56SDavid Gibson 
14524be21d56SDavid Gibson     spapr->htab_save_index = index;
14534be21d56SDavid Gibson 
1454e68cb8b4SAlexey Kardashevskiy     return (examined >= htabslots) && (sent == 0) ? 1 : 0;
14554be21d56SDavid Gibson }
14564be21d56SDavid Gibson 
1457e68cb8b4SAlexey Kardashevskiy #define MAX_ITERATION_NS    5000000 /* 5 ms */
1458e68cb8b4SAlexey Kardashevskiy #define MAX_KVM_BUF_SIZE    2048
1459e68cb8b4SAlexey Kardashevskiy 
14604be21d56SDavid Gibson static int htab_save_iterate(QEMUFile *f, void *opaque)
14614be21d56SDavid Gibson {
146228e02042SDavid Gibson     sPAPRMachineState *spapr = opaque;
1463e68cb8b4SAlexey Kardashevskiy     int rc = 0;
14644be21d56SDavid Gibson 
14654be21d56SDavid Gibson     /* Iteration header */
14664be21d56SDavid Gibson     qemu_put_be32(f, 0);
14674be21d56SDavid Gibson 
1468e68cb8b4SAlexey Kardashevskiy     if (!spapr->htab) {
1469e68cb8b4SAlexey Kardashevskiy         assert(kvm_enabled());
1470e68cb8b4SAlexey Kardashevskiy 
147101a57972SSamuel Mendoza-Jonas         rc = spapr_check_htab_fd(spapr);
147201a57972SSamuel Mendoza-Jonas         if (rc < 0) {
147301a57972SSamuel Mendoza-Jonas             return rc;
147401a57972SSamuel Mendoza-Jonas         }
147501a57972SSamuel Mendoza-Jonas 
1476e68cb8b4SAlexey Kardashevskiy         rc = kvmppc_save_htab(f, spapr->htab_fd,
1477e68cb8b4SAlexey Kardashevskiy                               MAX_KVM_BUF_SIZE, MAX_ITERATION_NS);
1478e68cb8b4SAlexey Kardashevskiy         if (rc < 0) {
1479e68cb8b4SAlexey Kardashevskiy             return rc;
1480e68cb8b4SAlexey Kardashevskiy         }
1481e68cb8b4SAlexey Kardashevskiy     } else  if (spapr->htab_first_pass) {
14824be21d56SDavid Gibson         htab_save_first_pass(f, spapr, MAX_ITERATION_NS);
14834be21d56SDavid Gibson     } else {
1484e68cb8b4SAlexey Kardashevskiy         rc = htab_save_later_pass(f, spapr, MAX_ITERATION_NS);
14854be21d56SDavid Gibson     }
14864be21d56SDavid Gibson 
14874be21d56SDavid Gibson     /* End marker */
14884be21d56SDavid Gibson     qemu_put_be32(f, 0);
14894be21d56SDavid Gibson     qemu_put_be16(f, 0);
14904be21d56SDavid Gibson     qemu_put_be16(f, 0);
14914be21d56SDavid Gibson 
1492e68cb8b4SAlexey Kardashevskiy     return rc;
14934be21d56SDavid Gibson }
14944be21d56SDavid Gibson 
14954be21d56SDavid Gibson static int htab_save_complete(QEMUFile *f, void *opaque)
14964be21d56SDavid Gibson {
149728e02042SDavid Gibson     sPAPRMachineState *spapr = opaque;
14984be21d56SDavid Gibson 
14994be21d56SDavid Gibson     /* Iteration header */
15004be21d56SDavid Gibson     qemu_put_be32(f, 0);
15014be21d56SDavid Gibson 
1502e68cb8b4SAlexey Kardashevskiy     if (!spapr->htab) {
1503e68cb8b4SAlexey Kardashevskiy         int rc;
1504e68cb8b4SAlexey Kardashevskiy 
1505e68cb8b4SAlexey Kardashevskiy         assert(kvm_enabled());
1506e68cb8b4SAlexey Kardashevskiy 
150701a57972SSamuel Mendoza-Jonas         rc = spapr_check_htab_fd(spapr);
150801a57972SSamuel Mendoza-Jonas         if (rc < 0) {
150901a57972SSamuel Mendoza-Jonas             return rc;
151001a57972SSamuel Mendoza-Jonas         }
151101a57972SSamuel Mendoza-Jonas 
1512e68cb8b4SAlexey Kardashevskiy         rc = kvmppc_save_htab(f, spapr->htab_fd, MAX_KVM_BUF_SIZE, -1);
1513e68cb8b4SAlexey Kardashevskiy         if (rc < 0) {
1514e68cb8b4SAlexey Kardashevskiy             return rc;
1515e68cb8b4SAlexey Kardashevskiy         }
1516e68cb8b4SAlexey Kardashevskiy         close(spapr->htab_fd);
1517e68cb8b4SAlexey Kardashevskiy         spapr->htab_fd = -1;
1518e68cb8b4SAlexey Kardashevskiy     } else {
15194be21d56SDavid Gibson         htab_save_later_pass(f, spapr, -1);
1520e68cb8b4SAlexey Kardashevskiy     }
15214be21d56SDavid Gibson 
15224be21d56SDavid Gibson     /* End marker */
15234be21d56SDavid Gibson     qemu_put_be32(f, 0);
15244be21d56SDavid Gibson     qemu_put_be16(f, 0);
15254be21d56SDavid Gibson     qemu_put_be16(f, 0);
15264be21d56SDavid Gibson 
15274be21d56SDavid Gibson     return 0;
15284be21d56SDavid Gibson }
15294be21d56SDavid Gibson 
15304be21d56SDavid Gibson static int htab_load(QEMUFile *f, void *opaque, int version_id)
15314be21d56SDavid Gibson {
153228e02042SDavid Gibson     sPAPRMachineState *spapr = opaque;
15334be21d56SDavid Gibson     uint32_t section_hdr;
1534e68cb8b4SAlexey Kardashevskiy     int fd = -1;
15354be21d56SDavid Gibson 
15364be21d56SDavid Gibson     if (version_id < 1 || version_id > 1) {
15374be21d56SDavid Gibson         fprintf(stderr, "htab_load() bad version\n");
15384be21d56SDavid Gibson         return -EINVAL;
15394be21d56SDavid Gibson     }
15404be21d56SDavid Gibson 
15414be21d56SDavid Gibson     section_hdr = qemu_get_be32(f);
15424be21d56SDavid Gibson 
15434be21d56SDavid Gibson     if (section_hdr) {
15444be21d56SDavid Gibson         /* First section, just the hash shift */
15454be21d56SDavid Gibson         if (spapr->htab_shift != section_hdr) {
1546613e7a76SBharata B Rao             error_report("htab_shift mismatch: source %d target %d",
1547613e7a76SBharata B Rao                          section_hdr, spapr->htab_shift);
15484be21d56SDavid Gibson             return -EINVAL;
15494be21d56SDavid Gibson         }
15504be21d56SDavid Gibson         return 0;
15514be21d56SDavid Gibson     }
15524be21d56SDavid Gibson 
1553e68cb8b4SAlexey Kardashevskiy     if (!spapr->htab) {
1554e68cb8b4SAlexey Kardashevskiy         assert(kvm_enabled());
1555e68cb8b4SAlexey Kardashevskiy 
1556e68cb8b4SAlexey Kardashevskiy         fd = kvmppc_get_htab_fd(true);
1557e68cb8b4SAlexey Kardashevskiy         if (fd < 0) {
1558e68cb8b4SAlexey Kardashevskiy             fprintf(stderr, "Unable to open fd to restore KVM hash table: %s\n",
1559e68cb8b4SAlexey Kardashevskiy                     strerror(errno));
1560e68cb8b4SAlexey Kardashevskiy         }
1561e68cb8b4SAlexey Kardashevskiy     }
1562e68cb8b4SAlexey Kardashevskiy 
15634be21d56SDavid Gibson     while (true) {
15644be21d56SDavid Gibson         uint32_t index;
15654be21d56SDavid Gibson         uint16_t n_valid, n_invalid;
15664be21d56SDavid Gibson 
15674be21d56SDavid Gibson         index = qemu_get_be32(f);
15684be21d56SDavid Gibson         n_valid = qemu_get_be16(f);
15694be21d56SDavid Gibson         n_invalid = qemu_get_be16(f);
15704be21d56SDavid Gibson 
15714be21d56SDavid Gibson         if ((index == 0) && (n_valid == 0) && (n_invalid == 0)) {
15724be21d56SDavid Gibson             /* End of Stream */
15734be21d56SDavid Gibson             break;
15744be21d56SDavid Gibson         }
15754be21d56SDavid Gibson 
1576e68cb8b4SAlexey Kardashevskiy         if ((index + n_valid + n_invalid) >
15774be21d56SDavid Gibson             (HTAB_SIZE(spapr) / HASH_PTE_SIZE_64)) {
15784be21d56SDavid Gibson             /* Bad index in stream */
15794be21d56SDavid Gibson             fprintf(stderr, "htab_load() bad index %d (%hd+%hd entries) "
1580e68cb8b4SAlexey Kardashevskiy                     "in htab stream (htab_shift=%d)\n", index, n_valid, n_invalid,
1581e68cb8b4SAlexey Kardashevskiy                     spapr->htab_shift);
15824be21d56SDavid Gibson             return -EINVAL;
15834be21d56SDavid Gibson         }
15844be21d56SDavid Gibson 
1585e68cb8b4SAlexey Kardashevskiy         if (spapr->htab) {
15864be21d56SDavid Gibson             if (n_valid) {
15874be21d56SDavid Gibson                 qemu_get_buffer(f, HPTE(spapr->htab, index),
15884be21d56SDavid Gibson                                 HASH_PTE_SIZE_64 * n_valid);
15894be21d56SDavid Gibson             }
15904be21d56SDavid Gibson             if (n_invalid) {
15914be21d56SDavid Gibson                 memset(HPTE(spapr->htab, index + n_valid), 0,
15924be21d56SDavid Gibson                        HASH_PTE_SIZE_64 * n_invalid);
15934be21d56SDavid Gibson             }
1594e68cb8b4SAlexey Kardashevskiy         } else {
1595e68cb8b4SAlexey Kardashevskiy             int rc;
1596e68cb8b4SAlexey Kardashevskiy 
1597e68cb8b4SAlexey Kardashevskiy             assert(fd >= 0);
1598e68cb8b4SAlexey Kardashevskiy 
1599e68cb8b4SAlexey Kardashevskiy             rc = kvmppc_load_htab_chunk(f, fd, index, n_valid, n_invalid);
1600e68cb8b4SAlexey Kardashevskiy             if (rc < 0) {
1601e68cb8b4SAlexey Kardashevskiy                 return rc;
1602e68cb8b4SAlexey Kardashevskiy             }
1603e68cb8b4SAlexey Kardashevskiy         }
1604e68cb8b4SAlexey Kardashevskiy     }
1605e68cb8b4SAlexey Kardashevskiy 
1606e68cb8b4SAlexey Kardashevskiy     if (!spapr->htab) {
1607e68cb8b4SAlexey Kardashevskiy         assert(fd >= 0);
1608e68cb8b4SAlexey Kardashevskiy         close(fd);
16094be21d56SDavid Gibson     }
16104be21d56SDavid Gibson 
16114be21d56SDavid Gibson     return 0;
16124be21d56SDavid Gibson }
16134be21d56SDavid Gibson 
16144be21d56SDavid Gibson static SaveVMHandlers savevm_htab_handlers = {
16154be21d56SDavid Gibson     .save_live_setup = htab_save_setup,
16164be21d56SDavid Gibson     .save_live_iterate = htab_save_iterate,
1617a3e06c3dSDr. David Alan Gilbert     .save_live_complete_precopy = htab_save_complete,
16184be21d56SDavid Gibson     .load_state = htab_load,
16194be21d56SDavid Gibson };
16204be21d56SDavid Gibson 
16215b2128d2SAlexander Graf static void spapr_boot_set(void *opaque, const char *boot_device,
16225b2128d2SAlexander Graf                            Error **errp)
16235b2128d2SAlexander Graf {
16245b2128d2SAlexander Graf     MachineState *machine = MACHINE(qdev_get_machine());
16255b2128d2SAlexander Graf     machine->boot_order = g_strdup(boot_device);
16265b2128d2SAlexander Graf }
16275b2128d2SAlexander Graf 
1628*569f4967SDavid Gibson static void spapr_cpu_init(sPAPRMachineState *spapr, PowerPCCPU *cpu,
1629*569f4967SDavid Gibson                            Error **errp)
1630bab99ea0SBharata B Rao {
1631bab99ea0SBharata B Rao     CPUPPCState *env = &cpu->env;
1632bab99ea0SBharata B Rao 
1633bab99ea0SBharata B Rao     /* Set time-base frequency to 512 MHz */
1634bab99ea0SBharata B Rao     cpu_ppc_tb_init(env, TIMEBASE_FREQ);
1635bab99ea0SBharata B Rao 
1636bab99ea0SBharata B Rao     /* PAPR always has exception vectors in RAM not ROM. To ensure this,
1637bab99ea0SBharata B Rao      * MSR[IP] should never be set.
1638bab99ea0SBharata B Rao      */
1639bab99ea0SBharata B Rao     env->msr_mask &= ~(1 << 6);
1640bab99ea0SBharata B Rao 
1641bab99ea0SBharata B Rao     /* Tell KVM that we're in PAPR mode */
1642bab99ea0SBharata B Rao     if (kvm_enabled()) {
1643bab99ea0SBharata B Rao         kvmppc_set_papr(cpu);
1644bab99ea0SBharata B Rao     }
1645bab99ea0SBharata B Rao 
1646bab99ea0SBharata B Rao     if (cpu->max_compat) {
1647*569f4967SDavid Gibson         Error *local_err = NULL;
1648*569f4967SDavid Gibson 
1649*569f4967SDavid Gibson         ppc_set_compat(cpu, cpu->max_compat, &local_err);
1650*569f4967SDavid Gibson         if (local_err) {
1651*569f4967SDavid Gibson             error_propagate(errp, local_err);
1652*569f4967SDavid Gibson             return;
1653*569f4967SDavid Gibson         }
1654bab99ea0SBharata B Rao     }
1655bab99ea0SBharata B Rao 
1656bab99ea0SBharata B Rao     xics_cpu_setup(spapr->icp, cpu);
1657bab99ea0SBharata B Rao 
1658bab99ea0SBharata B Rao     qemu_register_reset(spapr_cpu_reset, cpu);
1659bab99ea0SBharata B Rao }
1660bab99ea0SBharata B Rao 
1661224245bfSDavid Gibson /*
1662224245bfSDavid Gibson  * Reset routine for LMB DR devices.
1663224245bfSDavid Gibson  *
1664224245bfSDavid Gibson  * Unlike PCI DR devices, LMB DR devices explicitly register this reset
1665224245bfSDavid Gibson  * routine. Reset for PCI DR devices will be handled by PHB reset routine
1666224245bfSDavid Gibson  * when it walks all its children devices. LMB devices reset occurs
1667224245bfSDavid Gibson  * as part of spapr_ppc_reset().
1668224245bfSDavid Gibson  */
1669224245bfSDavid Gibson static void spapr_drc_reset(void *opaque)
1670224245bfSDavid Gibson {
1671224245bfSDavid Gibson     sPAPRDRConnector *drc = opaque;
1672224245bfSDavid Gibson     DeviceState *d = DEVICE(drc);
1673224245bfSDavid Gibson 
1674224245bfSDavid Gibson     if (d) {
1675224245bfSDavid Gibson         device_reset(d);
1676224245bfSDavid Gibson     }
1677224245bfSDavid Gibson }
1678224245bfSDavid Gibson 
1679224245bfSDavid Gibson static void spapr_create_lmb_dr_connectors(sPAPRMachineState *spapr)
1680224245bfSDavid Gibson {
1681224245bfSDavid Gibson     MachineState *machine = MACHINE(spapr);
1682224245bfSDavid Gibson     uint64_t lmb_size = SPAPR_MEMORY_BLOCK_SIZE;
1683e8f986fcSBharata B Rao     uint32_t nr_lmbs = (machine->maxram_size - machine->ram_size)/lmb_size;
1684224245bfSDavid Gibson     int i;
1685224245bfSDavid Gibson 
1686224245bfSDavid Gibson     for (i = 0; i < nr_lmbs; i++) {
1687224245bfSDavid Gibson         sPAPRDRConnector *drc;
1688224245bfSDavid Gibson         uint64_t addr;
1689224245bfSDavid Gibson 
1690e8f986fcSBharata B Rao         addr = i * lmb_size + spapr->hotplug_memory.base;
1691224245bfSDavid Gibson         drc = spapr_dr_connector_new(OBJECT(spapr), SPAPR_DR_CONNECTOR_TYPE_LMB,
1692224245bfSDavid Gibson                                      addr/lmb_size);
1693224245bfSDavid Gibson         qemu_register_reset(spapr_drc_reset, drc);
1694224245bfSDavid Gibson     }
1695224245bfSDavid Gibson }
1696224245bfSDavid Gibson 
1697224245bfSDavid Gibson /*
1698224245bfSDavid Gibson  * If RAM size, maxmem size and individual node mem sizes aren't aligned
1699224245bfSDavid Gibson  * to SPAPR_MEMORY_BLOCK_SIZE(256MB), then refuse to start the guest
1700224245bfSDavid Gibson  * since we can't support such unaligned sizes with DRCONF_MEMORY.
1701224245bfSDavid Gibson  */
1702224245bfSDavid Gibson static void spapr_validate_node_memory(MachineState *machine)
1703224245bfSDavid Gibson {
1704224245bfSDavid Gibson     int i;
1705224245bfSDavid Gibson 
1706224245bfSDavid Gibson     if (machine->maxram_size % SPAPR_MEMORY_BLOCK_SIZE ||
1707224245bfSDavid Gibson         machine->ram_size % SPAPR_MEMORY_BLOCK_SIZE) {
1708224245bfSDavid Gibson         error_report("Can't support memory configuration where RAM size "
1709224245bfSDavid Gibson                      "0x" RAM_ADDR_FMT " or maxmem size "
1710224245bfSDavid Gibson                      "0x" RAM_ADDR_FMT " isn't aligned to %llu MB",
1711224245bfSDavid Gibson                      machine->ram_size, machine->maxram_size,
1712224245bfSDavid Gibson                      SPAPR_MEMORY_BLOCK_SIZE/M_BYTE);
1713224245bfSDavid Gibson         exit(EXIT_FAILURE);
1714224245bfSDavid Gibson     }
1715224245bfSDavid Gibson 
1716224245bfSDavid Gibson     for (i = 0; i < nb_numa_nodes; i++) {
1717224245bfSDavid Gibson         if (numa_info[i].node_mem % SPAPR_MEMORY_BLOCK_SIZE) {
1718224245bfSDavid Gibson             error_report("Can't support memory configuration where memory size"
1719224245bfSDavid Gibson                          " %" PRIx64 " of node %d isn't aligned to %llu MB",
1720224245bfSDavid Gibson                          numa_info[i].node_mem, i,
1721224245bfSDavid Gibson                          SPAPR_MEMORY_BLOCK_SIZE/M_BYTE);
1722224245bfSDavid Gibson             exit(EXIT_FAILURE);
1723224245bfSDavid Gibson         }
1724224245bfSDavid Gibson     }
1725224245bfSDavid Gibson }
1726224245bfSDavid Gibson 
172753018216SPaolo Bonzini /* pSeries LPAR / sPAPR hardware init */
17283ef96221SMarcel Apfelbaum static void ppc_spapr_init(MachineState *machine)
172953018216SPaolo Bonzini {
173028e02042SDavid Gibson     sPAPRMachineState *spapr = SPAPR_MACHINE(machine);
1731224245bfSDavid Gibson     sPAPRMachineClass *smc = SPAPR_MACHINE_GET_CLASS(machine);
17323ef96221SMarcel Apfelbaum     const char *kernel_filename = machine->kernel_filename;
17333ef96221SMarcel Apfelbaum     const char *kernel_cmdline = machine->kernel_cmdline;
17343ef96221SMarcel Apfelbaum     const char *initrd_filename = machine->initrd_filename;
173553018216SPaolo Bonzini     PowerPCCPU *cpu;
173653018216SPaolo Bonzini     PCIHostState *phb;
173753018216SPaolo Bonzini     int i;
173853018216SPaolo Bonzini     MemoryRegion *sysmem = get_system_memory();
173953018216SPaolo Bonzini     MemoryRegion *ram = g_new(MemoryRegion, 1);
1740658fa66bSAlexey Kardashevskiy     MemoryRegion *rma_region;
1741658fa66bSAlexey Kardashevskiy     void *rma = NULL;
174253018216SPaolo Bonzini     hwaddr rma_alloc_size;
1743b082d65aSAlexey Kardashevskiy     hwaddr node0_size = spapr_node0_size();
174453018216SPaolo Bonzini     uint32_t initrd_base = 0;
174553018216SPaolo Bonzini     long kernel_size = 0, initrd_size = 0;
1746b7d1f77aSBenjamin Herrenschmidt     long load_limit, fw_size;
174716457e7fSBenjamin Herrenschmidt     bool kernel_le = false;
174853018216SPaolo Bonzini     char *filename;
174953018216SPaolo Bonzini 
175053018216SPaolo Bonzini     msi_supported = true;
175153018216SPaolo Bonzini 
175253018216SPaolo Bonzini     QLIST_INIT(&spapr->phbs);
175353018216SPaolo Bonzini 
175453018216SPaolo Bonzini     cpu_ppc_hypercall = emulate_spapr_hypercall;
175553018216SPaolo Bonzini 
175653018216SPaolo Bonzini     /* Allocate RMA if necessary */
1757658fa66bSAlexey Kardashevskiy     rma_alloc_size = kvmppc_alloc_rma(&rma);
175853018216SPaolo Bonzini 
175953018216SPaolo Bonzini     if (rma_alloc_size == -1) {
1760730fce59SThomas Huth         error_report("Unable to create RMA");
176153018216SPaolo Bonzini         exit(1);
176253018216SPaolo Bonzini     }
176353018216SPaolo Bonzini 
1764c4177479SAlexey Kardashevskiy     if (rma_alloc_size && (rma_alloc_size < node0_size)) {
176553018216SPaolo Bonzini         spapr->rma_size = rma_alloc_size;
176653018216SPaolo Bonzini     } else {
1767c4177479SAlexey Kardashevskiy         spapr->rma_size = node0_size;
176853018216SPaolo Bonzini 
176953018216SPaolo Bonzini         /* With KVM, we don't actually know whether KVM supports an
177053018216SPaolo Bonzini          * unbounded RMA (PR KVM) or is limited by the hash table size
177153018216SPaolo Bonzini          * (HV KVM using VRMA), so we always assume the latter
177253018216SPaolo Bonzini          *
177353018216SPaolo Bonzini          * In that case, we also limit the initial allocations for RTAS
177453018216SPaolo Bonzini          * etc... to 256M since we have no way to know what the VRMA size
177553018216SPaolo Bonzini          * is going to be as it depends on the size of the hash table
177653018216SPaolo Bonzini          * isn't determined yet.
177753018216SPaolo Bonzini          */
177853018216SPaolo Bonzini         if (kvm_enabled()) {
177953018216SPaolo Bonzini             spapr->vrma_adjust = 1;
178053018216SPaolo Bonzini             spapr->rma_size = MIN(spapr->rma_size, 0x10000000);
178153018216SPaolo Bonzini         }
178253018216SPaolo Bonzini     }
178353018216SPaolo Bonzini 
1784c4177479SAlexey Kardashevskiy     if (spapr->rma_size > node0_size) {
1785c4177479SAlexey Kardashevskiy         fprintf(stderr, "Error: Numa node 0 has to span the RMA (%#08"HWADDR_PRIx")\n",
1786c4177479SAlexey Kardashevskiy                 spapr->rma_size);
1787c4177479SAlexey Kardashevskiy         exit(1);
1788c4177479SAlexey Kardashevskiy     }
1789c4177479SAlexey Kardashevskiy 
1790b7d1f77aSBenjamin Herrenschmidt     /* Setup a load limit for the ramdisk leaving room for SLOF and FDT */
1791b7d1f77aSBenjamin Herrenschmidt     load_limit = MIN(spapr->rma_size, RTAS_MAX_ADDR) - FW_OVERHEAD;
179253018216SPaolo Bonzini 
179353018216SPaolo Bonzini     /* We aim for a hash table of size 1/128 the size of RAM.  The
179453018216SPaolo Bonzini      * normal rule of thumb is 1/64 the size of RAM, but that's much
179553018216SPaolo Bonzini      * more than needed for the Linux guests we support. */
179653018216SPaolo Bonzini     spapr->htab_shift = 18; /* Minimum architected size */
179753018216SPaolo Bonzini     while (spapr->htab_shift <= 46) {
1798ce881f77SBharata B Rao         if ((1ULL << (spapr->htab_shift + 7)) >= machine->maxram_size) {
179953018216SPaolo Bonzini             break;
180053018216SPaolo Bonzini         }
180153018216SPaolo Bonzini         spapr->htab_shift++;
180253018216SPaolo Bonzini     }
1803b817772aSBharata B Rao     spapr_alloc_htab(spapr);
180453018216SPaolo Bonzini 
18057b565160SDavid Gibson     /* Set up Interrupt Controller before we create the VCPUs */
1806446f16a6SMarcel Apfelbaum     spapr->icp = xics_system_init(machine,
18079e734e3dSBharata B Rao                                   DIV_ROUND_UP(max_cpus * kvmppc_smt_threads(),
1808f303f117SGreg Kurz                                                smp_threads),
18097b565160SDavid Gibson                                   XICS_IRQS);
18107b565160SDavid Gibson 
1811224245bfSDavid Gibson     if (smc->dr_lmb_enabled) {
1812224245bfSDavid Gibson         spapr_validate_node_memory(machine);
1813224245bfSDavid Gibson     }
1814224245bfSDavid Gibson 
181553018216SPaolo Bonzini     /* init CPUs */
181619fb2c36SBharata B Rao     if (machine->cpu_model == NULL) {
181719fb2c36SBharata B Rao         machine->cpu_model = kvm_enabled() ? "host" : "POWER7";
181853018216SPaolo Bonzini     }
181953018216SPaolo Bonzini     for (i = 0; i < smp_cpus; i++) {
182019fb2c36SBharata B Rao         cpu = cpu_ppc_init(machine->cpu_model);
182153018216SPaolo Bonzini         if (cpu == NULL) {
1822*569f4967SDavid Gibson             error_report("Unable to find PowerPC CPU definition");
182353018216SPaolo Bonzini             exit(1);
182453018216SPaolo Bonzini         }
1825*569f4967SDavid Gibson         spapr_cpu_init(spapr, cpu, &error_fatal);
182653018216SPaolo Bonzini     }
182753018216SPaolo Bonzini 
1828026bfd89SDavid Gibson     if (kvm_enabled()) {
1829026bfd89SDavid Gibson         /* Enable H_LOGICAL_CI_* so SLOF can talk to in-kernel devices */
1830026bfd89SDavid Gibson         kvmppc_enable_logical_ci_hcalls();
1831ef9971ddSAlexey Kardashevskiy         kvmppc_enable_set_mode_hcall();
1832026bfd89SDavid Gibson     }
1833026bfd89SDavid Gibson 
183453018216SPaolo Bonzini     /* allocate RAM */
1835f92f5da1SAlexey Kardashevskiy     memory_region_allocate_system_memory(ram, NULL, "ppc_spapr.ram",
1836fb164994SDavid Gibson                                          machine->ram_size);
1837f92f5da1SAlexey Kardashevskiy     memory_region_add_subregion(sysmem, 0, ram);
183853018216SPaolo Bonzini 
1839658fa66bSAlexey Kardashevskiy     if (rma_alloc_size && rma) {
1840658fa66bSAlexey Kardashevskiy         rma_region = g_new(MemoryRegion, 1);
1841658fa66bSAlexey Kardashevskiy         memory_region_init_ram_ptr(rma_region, NULL, "ppc_spapr.rma",
1842658fa66bSAlexey Kardashevskiy                                    rma_alloc_size, rma);
1843658fa66bSAlexey Kardashevskiy         vmstate_register_ram_global(rma_region);
1844658fa66bSAlexey Kardashevskiy         memory_region_add_subregion(sysmem, 0, rma_region);
1845658fa66bSAlexey Kardashevskiy     }
1846658fa66bSAlexey Kardashevskiy 
18474a1c9cf0SBharata B Rao     /* initialize hotplug memory address space */
18484a1c9cf0SBharata B Rao     if (machine->ram_size < machine->maxram_size) {
18494a1c9cf0SBharata B Rao         ram_addr_t hotplug_mem_size = machine->maxram_size - machine->ram_size;
18504a1c9cf0SBharata B Rao 
18514a1c9cf0SBharata B Rao         if (machine->ram_slots > SPAPR_MAX_RAM_SLOTS) {
18529af9e0feSMarkus Armbruster             error_report("Specified number of memory slots %" PRIu64
18539af9e0feSMarkus Armbruster                          " exceeds max supported %d",
185419a35c9eSBharata B Rao                          machine->ram_slots, SPAPR_MAX_RAM_SLOTS);
18554a1c9cf0SBharata B Rao             exit(EXIT_FAILURE);
18564a1c9cf0SBharata B Rao         }
18574a1c9cf0SBharata B Rao 
18584a1c9cf0SBharata B Rao         spapr->hotplug_memory.base = ROUND_UP(machine->ram_size,
18594a1c9cf0SBharata B Rao                                               SPAPR_HOTPLUG_MEM_ALIGN);
18604a1c9cf0SBharata B Rao         memory_region_init(&spapr->hotplug_memory.mr, OBJECT(spapr),
18614a1c9cf0SBharata B Rao                            "hotplug-memory", hotplug_mem_size);
18624a1c9cf0SBharata B Rao         memory_region_add_subregion(sysmem, spapr->hotplug_memory.base,
18634a1c9cf0SBharata B Rao                                     &spapr->hotplug_memory.mr);
18644a1c9cf0SBharata B Rao     }
18654a1c9cf0SBharata B Rao 
1866224245bfSDavid Gibson     if (smc->dr_lmb_enabled) {
1867224245bfSDavid Gibson         spapr_create_lmb_dr_connectors(spapr);
1868224245bfSDavid Gibson     }
1869224245bfSDavid Gibson 
187053018216SPaolo Bonzini     filename = qemu_find_file(QEMU_FILE_TYPE_BIOS, "spapr-rtas.bin");
18714c56440dSStefan Weil     if (!filename) {
1872730fce59SThomas Huth         error_report("Could not find LPAR rtas '%s'", "spapr-rtas.bin");
18734c56440dSStefan Weil         exit(1);
18744c56440dSStefan Weil     }
1875b7d1f77aSBenjamin Herrenschmidt     spapr->rtas_size = get_image_size(filename);
1876b7d1f77aSBenjamin Herrenschmidt     spapr->rtas_blob = g_malloc(spapr->rtas_size);
1877b7d1f77aSBenjamin Herrenschmidt     if (load_image_size(filename, spapr->rtas_blob, spapr->rtas_size) < 0) {
1878730fce59SThomas Huth         error_report("Could not load LPAR rtas '%s'", filename);
187953018216SPaolo Bonzini         exit(1);
188053018216SPaolo Bonzini     }
188153018216SPaolo Bonzini     if (spapr->rtas_size > RTAS_MAX_SIZE) {
1882730fce59SThomas Huth         error_report("RTAS too big ! 0x%zx bytes (max is 0x%x)",
18832f285bddSPeter Maydell                      (size_t)spapr->rtas_size, RTAS_MAX_SIZE);
188453018216SPaolo Bonzini         exit(1);
188553018216SPaolo Bonzini     }
188653018216SPaolo Bonzini     g_free(filename);
188753018216SPaolo Bonzini 
188853018216SPaolo Bonzini     /* Set up EPOW events infrastructure */
188953018216SPaolo Bonzini     spapr_events_init(spapr);
189053018216SPaolo Bonzini 
189112f42174SDavid Gibson     /* Set up the RTC RTAS interfaces */
189228df36a1SDavid Gibson     spapr_rtc_create(spapr);
189312f42174SDavid Gibson 
189453018216SPaolo Bonzini     /* Set up VIO bus */
189553018216SPaolo Bonzini     spapr->vio_bus = spapr_vio_bus_init();
189653018216SPaolo Bonzini 
189753018216SPaolo Bonzini     for (i = 0; i < MAX_SERIAL_PORTS; i++) {
189853018216SPaolo Bonzini         if (serial_hds[i]) {
189953018216SPaolo Bonzini             spapr_vty_create(spapr->vio_bus, serial_hds[i]);
190053018216SPaolo Bonzini         }
190153018216SPaolo Bonzini     }
190253018216SPaolo Bonzini 
190353018216SPaolo Bonzini     /* We always have at least the nvram device on VIO */
190453018216SPaolo Bonzini     spapr_create_nvram(spapr);
190553018216SPaolo Bonzini 
190653018216SPaolo Bonzini     /* Set up PCI */
190753018216SPaolo Bonzini     spapr_pci_rtas_init();
190853018216SPaolo Bonzini 
190989dfd6e1SDavid Gibson     phb = spapr_create_phb(spapr, 0);
191053018216SPaolo Bonzini 
191153018216SPaolo Bonzini     for (i = 0; i < nb_nics; i++) {
191253018216SPaolo Bonzini         NICInfo *nd = &nd_table[i];
191353018216SPaolo Bonzini 
191453018216SPaolo Bonzini         if (!nd->model) {
191553018216SPaolo Bonzini             nd->model = g_strdup("ibmveth");
191653018216SPaolo Bonzini         }
191753018216SPaolo Bonzini 
191853018216SPaolo Bonzini         if (strcmp(nd->model, "ibmveth") == 0) {
191953018216SPaolo Bonzini             spapr_vlan_create(spapr->vio_bus, nd);
192053018216SPaolo Bonzini         } else {
192129b358f9SDavid Gibson             pci_nic_init_nofail(&nd_table[i], phb->bus, nd->model, NULL);
192253018216SPaolo Bonzini         }
192353018216SPaolo Bonzini     }
192453018216SPaolo Bonzini 
192553018216SPaolo Bonzini     for (i = 0; i <= drive_get_max_bus(IF_SCSI); i++) {
192653018216SPaolo Bonzini         spapr_vscsi_create(spapr->vio_bus);
192753018216SPaolo Bonzini     }
192853018216SPaolo Bonzini 
192953018216SPaolo Bonzini     /* Graphics */
193053018216SPaolo Bonzini     if (spapr_vga_init(phb->bus)) {
193153018216SPaolo Bonzini         spapr->has_graphics = true;
1932c6e76503SPaolo Bonzini         machine->usb |= defaults_enabled() && !machine->usb_disabled;
193353018216SPaolo Bonzini     }
193453018216SPaolo Bonzini 
19354ee9ced9SMarcel Apfelbaum     if (machine->usb) {
193657040d45SThomas Huth         if (smc->use_ohci_by_default) {
193753018216SPaolo Bonzini             pci_create_simple(phb->bus, -1, "pci-ohci");
193857040d45SThomas Huth         } else {
193957040d45SThomas Huth             pci_create_simple(phb->bus, -1, "nec-usb-xhci");
194057040d45SThomas Huth         }
1941c86580b8SMarkus Armbruster 
194253018216SPaolo Bonzini         if (spapr->has_graphics) {
1943c86580b8SMarkus Armbruster             USBBus *usb_bus = usb_bus_find(-1);
1944c86580b8SMarkus Armbruster 
1945c86580b8SMarkus Armbruster             usb_create_simple(usb_bus, "usb-kbd");
1946c86580b8SMarkus Armbruster             usb_create_simple(usb_bus, "usb-mouse");
194753018216SPaolo Bonzini         }
194853018216SPaolo Bonzini     }
194953018216SPaolo Bonzini 
195053018216SPaolo Bonzini     if (spapr->rma_size < (MIN_RMA_SLOF << 20)) {
195153018216SPaolo Bonzini         fprintf(stderr, "qemu: pSeries SLOF firmware requires >= "
195253018216SPaolo Bonzini                 "%ldM guest RMA (Real Mode Area memory)\n", MIN_RMA_SLOF);
195353018216SPaolo Bonzini         exit(1);
195453018216SPaolo Bonzini     }
195553018216SPaolo Bonzini 
195653018216SPaolo Bonzini     if (kernel_filename) {
195753018216SPaolo Bonzini         uint64_t lowaddr = 0;
195853018216SPaolo Bonzini 
195953018216SPaolo Bonzini         kernel_size = load_elf(kernel_filename, translate_kernel_address, NULL,
19604ecd4d16SPeter Crosthwaite                                NULL, &lowaddr, NULL, 1, PPC_ELF_MACHINE, 0);
19613b66da82SAlexey Kardashevskiy         if (kernel_size == ELF_LOAD_WRONG_ENDIAN) {
196216457e7fSBenjamin Herrenschmidt             kernel_size = load_elf(kernel_filename,
196316457e7fSBenjamin Herrenschmidt                                    translate_kernel_address, NULL,
19644ecd4d16SPeter Crosthwaite                                    NULL, &lowaddr, NULL, 0, PPC_ELF_MACHINE, 0);
196516457e7fSBenjamin Herrenschmidt             kernel_le = kernel_size > 0;
196616457e7fSBenjamin Herrenschmidt         }
196716457e7fSBenjamin Herrenschmidt         if (kernel_size < 0) {
19683b66da82SAlexey Kardashevskiy             fprintf(stderr, "qemu: error loading %s: %s\n",
19693b66da82SAlexey Kardashevskiy                     kernel_filename, load_elf_strerror(kernel_size));
197053018216SPaolo Bonzini             exit(1);
197153018216SPaolo Bonzini         }
197253018216SPaolo Bonzini 
197353018216SPaolo Bonzini         /* load initrd */
197453018216SPaolo Bonzini         if (initrd_filename) {
197553018216SPaolo Bonzini             /* Try to locate the initrd in the gap between the kernel
197653018216SPaolo Bonzini              * and the firmware. Add a bit of space just in case
197753018216SPaolo Bonzini              */
197853018216SPaolo Bonzini             initrd_base = (KERNEL_LOAD_ADDR + kernel_size + 0x1ffff) & ~0xffff;
197953018216SPaolo Bonzini             initrd_size = load_image_targphys(initrd_filename, initrd_base,
198053018216SPaolo Bonzini                                               load_limit - initrd_base);
198153018216SPaolo Bonzini             if (initrd_size < 0) {
198253018216SPaolo Bonzini                 fprintf(stderr, "qemu: could not load initial ram disk '%s'\n",
198353018216SPaolo Bonzini                         initrd_filename);
198453018216SPaolo Bonzini                 exit(1);
198553018216SPaolo Bonzini             }
198653018216SPaolo Bonzini         } else {
198753018216SPaolo Bonzini             initrd_base = 0;
198853018216SPaolo Bonzini             initrd_size = 0;
198953018216SPaolo Bonzini         }
199053018216SPaolo Bonzini     }
199153018216SPaolo Bonzini 
19928e7ea787SAndreas Färber     if (bios_name == NULL) {
19938e7ea787SAndreas Färber         bios_name = FW_FILE_NAME;
19948e7ea787SAndreas Färber     }
19958e7ea787SAndreas Färber     filename = qemu_find_file(QEMU_FILE_TYPE_BIOS, bios_name);
19964c56440dSStefan Weil     if (!filename) {
199768fea5a0SThomas Huth         error_report("Could not find LPAR firmware '%s'", bios_name);
19984c56440dSStefan Weil         exit(1);
19994c56440dSStefan Weil     }
200053018216SPaolo Bonzini     fw_size = load_image_targphys(filename, 0, FW_MAX_SIZE);
200168fea5a0SThomas Huth     if (fw_size <= 0) {
200268fea5a0SThomas Huth         error_report("Could not load LPAR firmware '%s'", filename);
200353018216SPaolo Bonzini         exit(1);
200453018216SPaolo Bonzini     }
200553018216SPaolo Bonzini     g_free(filename);
200653018216SPaolo Bonzini 
200728e02042SDavid Gibson     /* FIXME: Should register things through the MachineState's qdev
200828e02042SDavid Gibson      * interface, this is a legacy from the sPAPREnvironment structure
200928e02042SDavid Gibson      * which predated MachineState but had a similar function */
20104be21d56SDavid Gibson     vmstate_register(NULL, 0, &vmstate_spapr, spapr);
20114be21d56SDavid Gibson     register_savevm_live(NULL, "spapr/htab", -1, 1,
20124be21d56SDavid Gibson                          &savevm_htab_handlers, spapr);
20134be21d56SDavid Gibson 
201453018216SPaolo Bonzini     /* Prepare the device tree */
20153bbf37f2SAndreas Färber     spapr->fdt_skel = spapr_create_fdt_skel(initrd_base, initrd_size,
201616457e7fSBenjamin Herrenschmidt                                             kernel_size, kernel_le,
201731fe14d1SNathan Fontenot                                             kernel_cmdline,
201831fe14d1SNathan Fontenot                                             spapr->check_exception_irq);
201953018216SPaolo Bonzini     assert(spapr->fdt_skel != NULL);
20205b2128d2SAlexander Graf 
202146503c2bSMichael Roth     /* used by RTAS */
202246503c2bSMichael Roth     QTAILQ_INIT(&spapr->ccs_list);
202346503c2bSMichael Roth     qemu_register_reset(spapr_ccs_reset_hook, spapr);
202446503c2bSMichael Roth 
20255b2128d2SAlexander Graf     qemu_register_boot_set(spapr_boot_set, spapr);
202653018216SPaolo Bonzini }
202753018216SPaolo Bonzini 
/*
 * Translate the "kvm-type" option string into its numeric code:
 * no string gives 0, "HV" gives 1, "PR" gives 2.  Any other string is
 * reported as an error and terminates the process.
 */
static int spapr_kvm_type(const char *vm_type)
{
    static const struct {
        const char *name;
        int code;
    } known_types[] = {
        { "HV", 1 },
        { "PR", 2 },
    };
    size_t idx;

    if (vm_type == NULL) {
        return 0;
    }

    for (idx = 0; idx < sizeof(known_types) / sizeof(known_types[0]); idx++) {
        if (strcmp(vm_type, known_types[idx].name) == 0) {
            return known_types[idx].code;
        }
    }

    error_report("Unknown kvm-type specified '%s'", vm_type);
    exit(1);
}
2045135a129aSAneesh Kumar K.V 
204671461b0fSAlexey Kardashevskiy /*
2047627b84f4SGonglei  * Implementation of an interface to adjust firmware path
204871461b0fSAlexey Kardashevskiy  * for the bootindex property handling.
204971461b0fSAlexey Kardashevskiy  */
205071461b0fSAlexey Kardashevskiy static char *spapr_get_fw_dev_path(FWPathProvider *p, BusState *bus,
205171461b0fSAlexey Kardashevskiy                                    DeviceState *dev)
205271461b0fSAlexey Kardashevskiy {
205371461b0fSAlexey Kardashevskiy #define CAST(type, obj, name) \
205471461b0fSAlexey Kardashevskiy     ((type *)object_dynamic_cast(OBJECT(obj), (name)))
205571461b0fSAlexey Kardashevskiy     SCSIDevice *d = CAST(SCSIDevice,  dev, TYPE_SCSI_DEVICE);
205671461b0fSAlexey Kardashevskiy     sPAPRPHBState *phb = CAST(sPAPRPHBState, dev, TYPE_SPAPR_PCI_HOST_BRIDGE);
205771461b0fSAlexey Kardashevskiy 
205871461b0fSAlexey Kardashevskiy     if (d) {
205971461b0fSAlexey Kardashevskiy         void *spapr = CAST(void, bus->parent, "spapr-vscsi");
206071461b0fSAlexey Kardashevskiy         VirtIOSCSI *virtio = CAST(VirtIOSCSI, bus->parent, TYPE_VIRTIO_SCSI);
206171461b0fSAlexey Kardashevskiy         USBDevice *usb = CAST(USBDevice, bus->parent, TYPE_USB_DEVICE);
206271461b0fSAlexey Kardashevskiy 
206371461b0fSAlexey Kardashevskiy         if (spapr) {
206471461b0fSAlexey Kardashevskiy             /*
206571461b0fSAlexey Kardashevskiy              * Replace "channel@0/disk@0,0" with "disk@8000000000000000":
206671461b0fSAlexey Kardashevskiy              * We use SRP luns of the form 8000 | (bus << 8) | (id << 5) | lun
206771461b0fSAlexey Kardashevskiy              * in the top 16 bits of the 64-bit LUN
206871461b0fSAlexey Kardashevskiy              */
206971461b0fSAlexey Kardashevskiy             unsigned id = 0x8000 | (d->id << 8) | d->lun;
207071461b0fSAlexey Kardashevskiy             return g_strdup_printf("%s@%"PRIX64, qdev_fw_name(dev),
207171461b0fSAlexey Kardashevskiy                                    (uint64_t)id << 48);
207271461b0fSAlexey Kardashevskiy         } else if (virtio) {
207371461b0fSAlexey Kardashevskiy             /*
207471461b0fSAlexey Kardashevskiy              * We use SRP luns of the form 01000000 | (target << 8) | lun
207571461b0fSAlexey Kardashevskiy              * in the top 32 bits of the 64-bit LUN
207671461b0fSAlexey Kardashevskiy              * Note: the quote above is from SLOF and it is wrong,
207771461b0fSAlexey Kardashevskiy              * the actual binding is:
207871461b0fSAlexey Kardashevskiy              * swap 0100 or 10 << or 20 << ( target lun-id -- srplun )
207971461b0fSAlexey Kardashevskiy              */
208071461b0fSAlexey Kardashevskiy             unsigned id = 0x1000000 | (d->id << 16) | d->lun;
208171461b0fSAlexey Kardashevskiy             return g_strdup_printf("%s@%"PRIX64, qdev_fw_name(dev),
208271461b0fSAlexey Kardashevskiy                                    (uint64_t)id << 32);
208371461b0fSAlexey Kardashevskiy         } else if (usb) {
208471461b0fSAlexey Kardashevskiy             /*
208571461b0fSAlexey Kardashevskiy              * We use SRP luns of the form 01000000 | (usb-port << 16) | lun
208671461b0fSAlexey Kardashevskiy              * in the top 32 bits of the 64-bit LUN
208771461b0fSAlexey Kardashevskiy              */
208871461b0fSAlexey Kardashevskiy             unsigned usb_port = atoi(usb->port->path);
208971461b0fSAlexey Kardashevskiy             unsigned id = 0x1000000 | (usb_port << 16) | d->lun;
209071461b0fSAlexey Kardashevskiy             return g_strdup_printf("%s@%"PRIX64, qdev_fw_name(dev),
209171461b0fSAlexey Kardashevskiy                                    (uint64_t)id << 32);
209271461b0fSAlexey Kardashevskiy         }
209371461b0fSAlexey Kardashevskiy     }
209471461b0fSAlexey Kardashevskiy 
209571461b0fSAlexey Kardashevskiy     if (phb) {
209671461b0fSAlexey Kardashevskiy         /* Replace "pci" with "pci@800000020000000" */
209771461b0fSAlexey Kardashevskiy         return g_strdup_printf("pci@%"PRIX64, phb->buid);
209871461b0fSAlexey Kardashevskiy     }
209971461b0fSAlexey Kardashevskiy 
210071461b0fSAlexey Kardashevskiy     return NULL;
210171461b0fSAlexey Kardashevskiy }
210271461b0fSAlexey Kardashevskiy 
210323825581SEduardo Habkost static char *spapr_get_kvm_type(Object *obj, Error **errp)
210423825581SEduardo Habkost {
210528e02042SDavid Gibson     sPAPRMachineState *spapr = SPAPR_MACHINE(obj);
210623825581SEduardo Habkost 
210728e02042SDavid Gibson     return g_strdup(spapr->kvm_type);
210823825581SEduardo Habkost }
210923825581SEduardo Habkost 
211023825581SEduardo Habkost static void spapr_set_kvm_type(Object *obj, const char *value, Error **errp)
211123825581SEduardo Habkost {
211228e02042SDavid Gibson     sPAPRMachineState *spapr = SPAPR_MACHINE(obj);
211323825581SEduardo Habkost 
211428e02042SDavid Gibson     g_free(spapr->kvm_type);
211528e02042SDavid Gibson     spapr->kvm_type = g_strdup(value);
211623825581SEduardo Habkost }
211723825581SEduardo Habkost 
211823825581SEduardo Habkost static void spapr_machine_initfn(Object *obj)
211923825581SEduardo Habkost {
212023825581SEduardo Habkost     object_property_add_str(obj, "kvm-type",
212123825581SEduardo Habkost                             spapr_get_kvm_type, spapr_set_kvm_type, NULL);
212249d2e648SMarcel Apfelbaum     object_property_set_description(obj, "kvm-type",
212349d2e648SMarcel Apfelbaum                                     "Specifies the KVM virtualization mode (HV, PR)",
212449d2e648SMarcel Apfelbaum                                     NULL);
212523825581SEduardo Habkost }
212623825581SEduardo Habkost 
212787bbdd9cSDavid Gibson static void spapr_machine_finalizefn(Object *obj)
212887bbdd9cSDavid Gibson {
212987bbdd9cSDavid Gibson     sPAPRMachineState *spapr = SPAPR_MACHINE(obj);
213087bbdd9cSDavid Gibson 
213187bbdd9cSDavid Gibson     g_free(spapr->kvm_type);
213287bbdd9cSDavid Gibson }
213387bbdd9cSDavid Gibson 
213434316482SAlexey Kardashevskiy static void ppc_cpu_do_nmi_on_cpu(void *arg)
213534316482SAlexey Kardashevskiy {
213634316482SAlexey Kardashevskiy     CPUState *cs = arg;
213734316482SAlexey Kardashevskiy 
213834316482SAlexey Kardashevskiy     cpu_synchronize_state(cs);
213934316482SAlexey Kardashevskiy     ppc_cpu_do_system_reset(cs);
214034316482SAlexey Kardashevskiy }
214134316482SAlexey Kardashevskiy 
214234316482SAlexey Kardashevskiy static void spapr_nmi(NMIState *n, int cpu_index, Error **errp)
214334316482SAlexey Kardashevskiy {
214434316482SAlexey Kardashevskiy     CPUState *cs;
214534316482SAlexey Kardashevskiy 
214634316482SAlexey Kardashevskiy     CPU_FOREACH(cs) {
214734316482SAlexey Kardashevskiy         async_run_on_cpu(cs, ppc_cpu_do_nmi_on_cpu, cs);
214834316482SAlexey Kardashevskiy     }
214934316482SAlexey Kardashevskiy }
215034316482SAlexey Kardashevskiy 
2151c20d332aSBharata B Rao static void spapr_add_lmbs(DeviceState *dev, uint64_t addr, uint64_t size,
2152c20d332aSBharata B Rao                            uint32_t node, Error **errp)
2153c20d332aSBharata B Rao {
2154c20d332aSBharata B Rao     sPAPRDRConnector *drc;
2155c20d332aSBharata B Rao     sPAPRDRConnectorClass *drck;
2156c20d332aSBharata B Rao     uint32_t nr_lmbs = size/SPAPR_MEMORY_BLOCK_SIZE;
2157c20d332aSBharata B Rao     int i, fdt_offset, fdt_size;
2158c20d332aSBharata B Rao     void *fdt;
2159c20d332aSBharata B Rao 
2160c20d332aSBharata B Rao     /*
2161c20d332aSBharata B Rao      * Check for DRC connectors and send hotplug notification to the
2162c20d332aSBharata B Rao      * guest only in case of hotplugged memory. This allows cold plugged
2163c20d332aSBharata B Rao      * memory to be specified at boot time.
2164c20d332aSBharata B Rao      */
2165c20d332aSBharata B Rao     if (!dev->hotplugged) {
2166c20d332aSBharata B Rao         return;
2167c20d332aSBharata B Rao     }
2168c20d332aSBharata B Rao 
2169c20d332aSBharata B Rao     for (i = 0; i < nr_lmbs; i++) {
2170c20d332aSBharata B Rao         drc = spapr_dr_connector_by_id(SPAPR_DR_CONNECTOR_TYPE_LMB,
2171c20d332aSBharata B Rao                 addr/SPAPR_MEMORY_BLOCK_SIZE);
2172c20d332aSBharata B Rao         g_assert(drc);
2173c20d332aSBharata B Rao 
2174c20d332aSBharata B Rao         fdt = create_device_tree(&fdt_size);
2175c20d332aSBharata B Rao         fdt_offset = spapr_populate_memory_node(fdt, node, addr,
2176c20d332aSBharata B Rao                                                 SPAPR_MEMORY_BLOCK_SIZE);
2177c20d332aSBharata B Rao 
2178c20d332aSBharata B Rao         drck = SPAPR_DR_CONNECTOR_GET_CLASS(drc);
2179c20d332aSBharata B Rao         drck->attach(drc, dev, fdt, fdt_offset, !dev->hotplugged, errp);
2180c20d332aSBharata B Rao         addr += SPAPR_MEMORY_BLOCK_SIZE;
2181c20d332aSBharata B Rao     }
21820a417869SBharata B Rao     spapr_hotplug_req_add_by_count(SPAPR_DR_CONNECTOR_TYPE_LMB, nr_lmbs);
2183c20d332aSBharata B Rao }
2184c20d332aSBharata B Rao 
2185c20d332aSBharata B Rao static void spapr_memory_plug(HotplugHandler *hotplug_dev, DeviceState *dev,
2186c20d332aSBharata B Rao                               uint32_t node, Error **errp)
2187c20d332aSBharata B Rao {
2188c20d332aSBharata B Rao     Error *local_err = NULL;
2189c20d332aSBharata B Rao     sPAPRMachineState *ms = SPAPR_MACHINE(hotplug_dev);
2190c20d332aSBharata B Rao     PCDIMMDevice *dimm = PC_DIMM(dev);
2191c20d332aSBharata B Rao     PCDIMMDeviceClass *ddc = PC_DIMM_GET_CLASS(dimm);
2192c20d332aSBharata B Rao     MemoryRegion *mr = ddc->get_memory_region(dimm);
2193c20d332aSBharata B Rao     uint64_t align = memory_region_get_alignment(mr);
2194c20d332aSBharata B Rao     uint64_t size = memory_region_size(mr);
2195c20d332aSBharata B Rao     uint64_t addr;
2196c20d332aSBharata B Rao 
2197c20d332aSBharata B Rao     if (size % SPAPR_MEMORY_BLOCK_SIZE) {
2198c20d332aSBharata B Rao         error_setg(&local_err, "Hotplugged memory size must be a multiple of "
2199c20d332aSBharata B Rao                       "%lld MB", SPAPR_MEMORY_BLOCK_SIZE/M_BYTE);
2200c20d332aSBharata B Rao         goto out;
2201c20d332aSBharata B Rao     }
2202c20d332aSBharata B Rao 
2203d6a9b0b8SMichael S. Tsirkin     pc_dimm_memory_plug(dev, &ms->hotplug_memory, mr, align, &local_err);
2204c20d332aSBharata B Rao     if (local_err) {
2205c20d332aSBharata B Rao         goto out;
2206c20d332aSBharata B Rao     }
2207c20d332aSBharata B Rao 
2208c20d332aSBharata B Rao     addr = object_property_get_int(OBJECT(dimm), PC_DIMM_ADDR_PROP, &local_err);
2209c20d332aSBharata B Rao     if (local_err) {
2210c20d332aSBharata B Rao         pc_dimm_memory_unplug(dev, &ms->hotplug_memory, mr);
2211c20d332aSBharata B Rao         goto out;
2212c20d332aSBharata B Rao     }
2213c20d332aSBharata B Rao 
2214c20d332aSBharata B Rao     spapr_add_lmbs(dev, addr, size, node, &error_abort);
2215c20d332aSBharata B Rao 
2216c20d332aSBharata B Rao out:
2217c20d332aSBharata B Rao     error_propagate(errp, local_err);
2218c20d332aSBharata B Rao }
2219c20d332aSBharata B Rao 
2220c20d332aSBharata B Rao static void spapr_machine_device_plug(HotplugHandler *hotplug_dev,
2221c20d332aSBharata B Rao                                       DeviceState *dev, Error **errp)
2222c20d332aSBharata B Rao {
2223c20d332aSBharata B Rao     sPAPRMachineClass *smc = SPAPR_MACHINE_GET_CLASS(qdev_get_machine());
2224c20d332aSBharata B Rao 
2225c20d332aSBharata B Rao     if (object_dynamic_cast(OBJECT(dev), TYPE_PC_DIMM)) {
2226b556854bSBharata B Rao         int node;
2227c20d332aSBharata B Rao 
2228c20d332aSBharata B Rao         if (!smc->dr_lmb_enabled) {
2229c20d332aSBharata B Rao             error_setg(errp, "Memory hotplug not supported for this machine");
2230c20d332aSBharata B Rao             return;
2231c20d332aSBharata B Rao         }
2232c20d332aSBharata B Rao         node = object_property_get_int(OBJECT(dev), PC_DIMM_NODE_PROP, errp);
2233c20d332aSBharata B Rao         if (*errp) {
2234c20d332aSBharata B Rao             return;
2235c20d332aSBharata B Rao         }
2236c20d332aSBharata B Rao 
2237b556854bSBharata B Rao         /*
2238b556854bSBharata B Rao          * Currently PowerPC kernel doesn't allow hot-adding memory to
2239b556854bSBharata B Rao          * memory-less node, but instead will silently add the memory
2240b556854bSBharata B Rao          * to the first node that has some memory. This causes two
2241b556854bSBharata B Rao          * unexpected behaviours for the user.
2242b556854bSBharata B Rao          *
2243b556854bSBharata B Rao          * - Memory gets hotplugged to a different node than what the user
2244b556854bSBharata B Rao          *   specified.
2245b556854bSBharata B Rao          * - Since pc-dimm subsystem in QEMU still thinks that memory belongs
2246b556854bSBharata B Rao          *   to memory-less node, a reboot will set things accordingly
2247b556854bSBharata B Rao          *   and the previously hotplugged memory now ends in the right node.
2248b556854bSBharata B Rao          *   This appears as if some memory moved from one node to another.
2249b556854bSBharata B Rao          *
2250b556854bSBharata B Rao          * So until kernel starts supporting memory hotplug to memory-less
2251b556854bSBharata B Rao          * nodes, just prevent such attempts upfront in QEMU.
2252b556854bSBharata B Rao          */
2253b556854bSBharata B Rao         if (nb_numa_nodes && !numa_info[node].node_mem) {
2254b556854bSBharata B Rao             error_setg(errp, "Can't hotplug memory to memory-less node %d",
2255b556854bSBharata B Rao                        node);
2256b556854bSBharata B Rao             return;
2257b556854bSBharata B Rao         }
2258b556854bSBharata B Rao 
2259c20d332aSBharata B Rao         spapr_memory_plug(hotplug_dev, dev, node, errp);
2260c20d332aSBharata B Rao     }
2261c20d332aSBharata B Rao }
2262c20d332aSBharata B Rao 
2263c20d332aSBharata B Rao static void spapr_machine_device_unplug(HotplugHandler *hotplug_dev,
2264c20d332aSBharata B Rao                                       DeviceState *dev, Error **errp)
2265c20d332aSBharata B Rao {
2266c20d332aSBharata B Rao     if (object_dynamic_cast(OBJECT(dev), TYPE_PC_DIMM)) {
2267c20d332aSBharata B Rao         error_setg(errp, "Memory hot unplug not supported by sPAPR");
2268c20d332aSBharata B Rao     }
2269c20d332aSBharata B Rao }
2270c20d332aSBharata B Rao 
2271c20d332aSBharata B Rao static HotplugHandler *spapr_get_hotpug_handler(MachineState *machine,
2272c20d332aSBharata B Rao                                              DeviceState *dev)
2273c20d332aSBharata B Rao {
2274c20d332aSBharata B Rao     if (object_dynamic_cast(OBJECT(dev), TYPE_PC_DIMM)) {
2275c20d332aSBharata B Rao         return HOTPLUG_HANDLER(machine);
2276c20d332aSBharata B Rao     }
2277c20d332aSBharata B Rao     return NULL;
2278c20d332aSBharata B Rao }
2279c20d332aSBharata B Rao 
228020bb648dSDavid Gibson static unsigned spapr_cpu_index_to_socket_id(unsigned cpu_index)
228120bb648dSDavid Gibson {
228220bb648dSDavid Gibson     /* Allocate to NUMA nodes on a "socket" basis (not that concept of
228320bb648dSDavid Gibson      * socket means much for the paravirtualized PAPR platform) */
228420bb648dSDavid Gibson     return cpu_index / smp_threads / smp_cores;
228520bb648dSDavid Gibson }
228620bb648dSDavid Gibson 
228729ee3247SAlexey Kardashevskiy static void spapr_machine_class_init(ObjectClass *oc, void *data)
228853018216SPaolo Bonzini {
228929ee3247SAlexey Kardashevskiy     MachineClass *mc = MACHINE_CLASS(oc);
2290224245bfSDavid Gibson     sPAPRMachineClass *smc = SPAPR_MACHINE_CLASS(oc);
229171461b0fSAlexey Kardashevskiy     FWPathProviderClass *fwc = FW_PATH_PROVIDER_CLASS(oc);
229234316482SAlexey Kardashevskiy     NMIClass *nc = NMI_CLASS(oc);
2293c20d332aSBharata B Rao     HotplugHandlerClass *hc = HOTPLUG_HANDLER_CLASS(oc);
229429ee3247SAlexey Kardashevskiy 
22950eb9054cSDavid Gibson     mc->desc = "pSeries Logical Partition (PAPR compliant)";
2296fc9f38c3SDavid Gibson 
2297fc9f38c3SDavid Gibson     /*
2298fc9f38c3SDavid Gibson      * We set up the default / latest behaviour here.  The class_init
2299fc9f38c3SDavid Gibson      * functions for the specific versioned machine types can override
2300fc9f38c3SDavid Gibson      * these details for backwards compatibility
2301fc9f38c3SDavid Gibson      */
2302958db90cSMarcel Apfelbaum     mc->init = ppc_spapr_init;
2303958db90cSMarcel Apfelbaum     mc->reset = ppc_spapr_reset;
2304958db90cSMarcel Apfelbaum     mc->block_default_type = IF_SCSI;
230538b02bd8SAlexey Kardashevskiy     mc->max_cpus = MAX_CPUMASK_BITS;
2306958db90cSMarcel Apfelbaum     mc->no_parallel = 1;
23075b2128d2SAlexander Graf     mc->default_boot_order = "";
2308a34944feSNikunj A Dadhania     mc->default_ram_size = 512 * M_BYTE;
2309958db90cSMarcel Apfelbaum     mc->kvm_type = spapr_kvm_type;
23109e3f9733SAlexander Graf     mc->has_dynamic_sysbus = true;
2311e4024630SLaurent Vivier     mc->pci_allow_0_address = true;
2312c20d332aSBharata B Rao     mc->get_hotplug_handler = spapr_get_hotpug_handler;
2313c20d332aSBharata B Rao     hc->plug = spapr_machine_device_plug;
2314c20d332aSBharata B Rao     hc->unplug = spapr_machine_device_unplug;
231520bb648dSDavid Gibson     mc->cpu_index_to_socket_id = spapr_cpu_index_to_socket_id;
231600b4fbe2SMarcel Apfelbaum 
2317fc9f38c3SDavid Gibson     smc->dr_lmb_enabled = true;
231871461b0fSAlexey Kardashevskiy     fwc->get_dev_path = spapr_get_fw_dev_path;
231934316482SAlexey Kardashevskiy     nc->nmi_monitor_handler = spapr_nmi;
232053018216SPaolo Bonzini }
232153018216SPaolo Bonzini 
232229ee3247SAlexey Kardashevskiy static const TypeInfo spapr_machine_info = {
232329ee3247SAlexey Kardashevskiy     .name          = TYPE_SPAPR_MACHINE,
232429ee3247SAlexey Kardashevskiy     .parent        = TYPE_MACHINE,
23254aee7362SDavid Gibson     .abstract      = true,
23266ca1502eSAlexey Kardashevskiy     .instance_size = sizeof(sPAPRMachineState),
232723825581SEduardo Habkost     .instance_init = spapr_machine_initfn,
232887bbdd9cSDavid Gibson     .instance_finalize = spapr_machine_finalizefn,
2329183930c0SDavid Gibson     .class_size    = sizeof(sPAPRMachineClass),
233029ee3247SAlexey Kardashevskiy     .class_init    = spapr_machine_class_init,
233171461b0fSAlexey Kardashevskiy     .interfaces = (InterfaceInfo[]) {
233271461b0fSAlexey Kardashevskiy         { TYPE_FW_PATH_PROVIDER },
233334316482SAlexey Kardashevskiy         { TYPE_NMI },
2334c20d332aSBharata B Rao         { TYPE_HOTPLUG_HANDLER },
233571461b0fSAlexey Kardashevskiy         { }
233671461b0fSAlexey Kardashevskiy     },
233729ee3247SAlexey Kardashevskiy };
233829ee3247SAlexey Kardashevskiy 
/*
 * Define and register one versioned pseries machine type.
 *
 * @suffix: identifier fragment used to build the generated symbol names;
 *          spapr_machine_<suffix>_class_options() and
 *          spapr_machine_<suffix>_instance_options() must already exist
 * @verstr: version string appended to "pseries-" to form the type name
 * @latest: when true, the type also gets the "pseries" alias and is
 *          marked as the default machine
 *
 * The expansion ends in a machine_init() invocation.
 */
#define DEFINE_SPAPR_MACHINE(suffix, verstr, latest)                       \
    static void spapr_machine_##suffix##_class_init(ObjectClass *oc,       \
                                                    void *data)            \
    {                                                                      \
        MachineClass *machine_class = MACHINE_CLASS(oc);                   \
                                                                           \
        spapr_machine_##suffix##_class_options(machine_class);             \
        if (latest) {                                                      \
            machine_class->alias = "pseries";                              \
            machine_class->is_default = 1;                                 \
        }                                                                  \
    }                                                                      \
    static void spapr_machine_##suffix##_instance_init(Object *obj)        \
    {                                                                      \
        spapr_machine_##suffix##_instance_options(MACHINE(obj));           \
    }                                                                      \
    static const TypeInfo spapr_machine_##suffix##_info = {                \
        .name          = MACHINE_TYPE_NAME("pseries-" verstr),             \
        .parent        = TYPE_SPAPR_MACHINE,                               \
        .class_init    = spapr_machine_##suffix##_class_init,              \
        .instance_init = spapr_machine_##suffix##_instance_init,           \
    };                                                                     \
    static void spapr_machine_register_##suffix(void)                      \
    {                                                                      \
        type_register(&spapr_machine_##suffix##_info);                     \
    }                                                                      \
    machine_init(spapr_machine_register_##suffix)
23665013c547SDavid Gibson 
23671c5f29bbSDavid Gibson /*
23684b23699cSDavid Gibson  * pseries-2.6
23694b23699cSDavid Gibson  */
23704b23699cSDavid Gibson static void spapr_machine_2_6_instance_options(MachineState *machine)
23714b23699cSDavid Gibson {
23724b23699cSDavid Gibson }
23734b23699cSDavid Gibson 
23744b23699cSDavid Gibson static void spapr_machine_2_6_class_options(MachineClass *mc)
23754b23699cSDavid Gibson {
23764b23699cSDavid Gibson     /* Defaults for the latest behaviour inherited from the base class */
23774b23699cSDavid Gibson }
23784b23699cSDavid Gibson 
23794b23699cSDavid Gibson DEFINE_SPAPR_MACHINE(2_6, "2.6", true);
23804b23699cSDavid Gibson 
23814b23699cSDavid Gibson /*
23821c5f29bbSDavid Gibson  * pseries-2.5
23831c5f29bbSDavid Gibson  */
23844b23699cSDavid Gibson #define SPAPR_COMPAT_2_5 \
23854b23699cSDavid Gibson         HW_COMPAT_2_5
23864b23699cSDavid Gibson 
23875013c547SDavid Gibson static void spapr_machine_2_5_instance_options(MachineState *machine)
23881c5f29bbSDavid Gibson {
23895013c547SDavid Gibson }
23905013c547SDavid Gibson 
23915013c547SDavid Gibson static void spapr_machine_2_5_class_options(MachineClass *mc)
23925013c547SDavid Gibson {
239357040d45SThomas Huth     sPAPRMachineClass *smc = SPAPR_MACHINE_CLASS(mc);
239457040d45SThomas Huth 
23954b23699cSDavid Gibson     spapr_machine_2_6_class_options(mc);
239657040d45SThomas Huth     smc->use_ohci_by_default = true;
23974b23699cSDavid Gibson     SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_5);
23981c5f29bbSDavid Gibson }
23991c5f29bbSDavid Gibson 
24004b23699cSDavid Gibson DEFINE_SPAPR_MACHINE(2_5, "2.5", false);
24011c5f29bbSDavid Gibson 
24021c5f29bbSDavid Gibson /*
24031c5f29bbSDavid Gibson  * pseries-2.4
24041c5f29bbSDavid Gibson  */
240580fd50f9SCornelia Huck #define SPAPR_COMPAT_2_4 \
240680fd50f9SCornelia Huck         HW_COMPAT_2_4
240780fd50f9SCornelia Huck 
24085013c547SDavid Gibson static void spapr_machine_2_4_instance_options(MachineState *machine)
24091c5f29bbSDavid Gibson {
24105013c547SDavid Gibson     spapr_machine_2_5_instance_options(machine);
24115013c547SDavid Gibson }
24121c5f29bbSDavid Gibson 
24135013c547SDavid Gibson static void spapr_machine_2_4_class_options(MachineClass *mc)
24145013c547SDavid Gibson {
2415fc9f38c3SDavid Gibson     sPAPRMachineClass *smc = SPAPR_MACHINE_CLASS(mc);
2416fc9f38c3SDavid Gibson 
2417fc9f38c3SDavid Gibson     spapr_machine_2_5_class_options(mc);
2418fc9f38c3SDavid Gibson     smc->dr_lmb_enabled = false;
2419f949b4e5SDavid Gibson     SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_4);
24201c5f29bbSDavid Gibson }
24211c5f29bbSDavid Gibson 
2422fccbc785SDavid Gibson DEFINE_SPAPR_MACHINE(2_4, "2.4", false);
24231c5f29bbSDavid Gibson 
24241c5f29bbSDavid Gibson /*
24251c5f29bbSDavid Gibson  * pseries-2.3
24261c5f29bbSDavid Gibson  */
242738ff32c6SEduardo Habkost #define SPAPR_COMPAT_2_3 \
242880fd50f9SCornelia Huck         SPAPR_COMPAT_2_4 \
24297619c7b0SMichael Roth         HW_COMPAT_2_3 \
24307619c7b0SMichael Roth         {\
24317619c7b0SMichael Roth             .driver   = "spapr-pci-host-bridge",\
24327619c7b0SMichael Roth             .property = "dynamic-reconfiguration",\
24337619c7b0SMichael Roth             .value    = "off",\
24347619c7b0SMichael Roth         },
243538ff32c6SEduardo Habkost 
24365013c547SDavid Gibson static void spapr_machine_2_3_instance_options(MachineState *machine)
24371c5f29bbSDavid Gibson {
24385013c547SDavid Gibson     spapr_machine_2_4_instance_options(machine);
24391c5f29bbSDavid Gibson     savevm_skip_section_footers();
24401c5f29bbSDavid Gibson     global_state_set_optional();
24411c5f29bbSDavid Gibson }
24421c5f29bbSDavid Gibson 
24435013c547SDavid Gibson static void spapr_machine_2_3_class_options(MachineClass *mc)
24441c5f29bbSDavid Gibson {
2445fc9f38c3SDavid Gibson     spapr_machine_2_4_class_options(mc);
2446f949b4e5SDavid Gibson     SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_3);
24471c5f29bbSDavid Gibson }
2448fccbc785SDavid Gibson DEFINE_SPAPR_MACHINE(2_3, "2.3", false);
24491c5f29bbSDavid Gibson 
24501c5f29bbSDavid Gibson /*
24511c5f29bbSDavid Gibson  * pseries-2.2
24521c5f29bbSDavid Gibson  */
24531c5f29bbSDavid Gibson 
2454b194df47SAlexey Kardashevskiy #define SPAPR_COMPAT_2_2 \
245538ff32c6SEduardo Habkost         SPAPR_COMPAT_2_3 \
24564dfd8eaaSEduardo Habkost         HW_COMPAT_2_2 \
2457b194df47SAlexey Kardashevskiy         {\
2458b194df47SAlexey Kardashevskiy             .driver   = TYPE_SPAPR_PCI_HOST_BRIDGE,\
2459b194df47SAlexey Kardashevskiy             .property = "mem_win_size",\
2460b194df47SAlexey Kardashevskiy             .value    = "0x20000000",\
2461dd754bafSEduardo Habkost         },
2462b194df47SAlexey Kardashevskiy 
24635013c547SDavid Gibson static void spapr_machine_2_2_instance_options(MachineState *machine)
2464b0e966d0SJason Wang {
24655013c547SDavid Gibson     spapr_machine_2_3_instance_options(machine);
2466b0e966d0SJason Wang }
2467b0e966d0SJason Wang 
24685013c547SDavid Gibson static void spapr_machine_2_2_class_options(MachineClass *mc)
2469b0e966d0SJason Wang {
2470fc9f38c3SDavid Gibson     spapr_machine_2_3_class_options(mc);
2471f949b4e5SDavid Gibson     SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_2);
24721c5f29bbSDavid Gibson }
2473fccbc785SDavid Gibson DEFINE_SPAPR_MACHINE(2_2, "2.2", false);
24741c5f29bbSDavid Gibson 
24751c5f29bbSDavid Gibson /*
24761c5f29bbSDavid Gibson  * pseries-2.1
24771c5f29bbSDavid Gibson  */
24781c5f29bbSDavid Gibson #define SPAPR_COMPAT_2_1 \
24791c5f29bbSDavid Gibson         SPAPR_COMPAT_2_2 \
24801c5f29bbSDavid Gibson         HW_COMPAT_2_1
24811c5f29bbSDavid Gibson 
24825013c547SDavid Gibson static void spapr_machine_2_1_instance_options(MachineState *machine)
24831c5f29bbSDavid Gibson {
24845013c547SDavid Gibson     spapr_machine_2_2_instance_options(machine);
24851c5f29bbSDavid Gibson }
24861c5f29bbSDavid Gibson 
24875013c547SDavid Gibson static void spapr_machine_2_1_class_options(MachineClass *mc)
2488b0e966d0SJason Wang {
2489fc9f38c3SDavid Gibson     spapr_machine_2_2_class_options(mc);
2490f949b4e5SDavid Gibson     SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_1);
24916026db45SAlexey Kardashevskiy }
2492fccbc785SDavid Gibson DEFINE_SPAPR_MACHINE(2_1, "2.1", false);
24936026db45SAlexey Kardashevskiy 
249429ee3247SAlexey Kardashevskiy static void spapr_machine_register_types(void)
249529ee3247SAlexey Kardashevskiy {
249629ee3247SAlexey Kardashevskiy     type_register_static(&spapr_machine_info);
249729ee3247SAlexey Kardashevskiy }
249829ee3247SAlexey Kardashevskiy 
249929ee3247SAlexey Kardashevskiy type_init(spapr_machine_register_types)
2500