]> git.proxmox.com Git - mirror_qemu.git/blame - hw/i386/pc.c
tests/.gitignore: add entry for generated file
[mirror_qemu.git] / hw / i386 / pc.c
CommitLineData
80cabfad
FB
1/*
2 * QEMU PC System Emulator
5fafdf24 3 *
80cabfad 4 * Copyright (c) 2003-2004 Fabrice Bellard
5fafdf24 5 *
80cabfad
FB
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
e688df6b 24
b6a0aa05 25#include "qemu/osdep.h"
83c9f4ca 26#include "hw/hw.h"
0d09e41a
PB
27#include "hw/i386/pc.h"
28#include "hw/char/serial.h"
bb3d5ea8 29#include "hw/char/parallel.h"
0d09e41a 30#include "hw/i386/apic.h"
54a40293
EH
31#include "hw/i386/topology.h"
32#include "sysemu/cpus.h"
0d09e41a 33#include "hw/block/fdc.h"
83c9f4ca
PB
34#include "hw/ide.h"
35#include "hw/pci/pci.h"
2118196b 36#include "hw/pci/pci_bus.h"
0d09e41a
PB
37#include "hw/nvram/fw_cfg.h"
38#include "hw/timer/hpet.h"
60d8f328 39#include "hw/smbios/smbios.h"
83c9f4ca 40#include "hw/loader.h"
ca20cf32 41#include "elf.h"
47b43a1f 42#include "multiboot.h"
0d09e41a 43#include "hw/timer/mc146818rtc.h"
55f613ac 44#include "hw/dma/i8257.h"
0d09e41a 45#include "hw/timer/i8254.h"
47973a2d 46#include "hw/input/i8042.h"
0d09e41a 47#include "hw/audio/pcspk.h"
83c9f4ca
PB
48#include "hw/pci/msi.h"
49#include "hw/sysbus.h"
9c17d615 50#include "sysemu/sysemu.h"
e35704ba 51#include "sysemu/numa.h"
9c17d615 52#include "sysemu/kvm.h"
b1c12027 53#include "sysemu/qtest.h"
1d31f66b 54#include "kvm_i386.h"
0d09e41a 55#include "hw/xen/xen.h"
a19cbfb3 56#include "ui/qemu-spice.h"
022c62cb
PB
57#include "exec/memory.h"
58#include "exec/address-spaces.h"
9c17d615 59#include "sysemu/arch_init.h"
1de7afc9 60#include "qemu/bitmap.h"
0c764a9d 61#include "qemu/config-file.h"
d49b6836 62#include "qemu/error-report.h"
922a01a0 63#include "qemu/option.h"
0445259b 64#include "hw/acpi/acpi.h"
5ff020b7 65#include "hw/acpi/cpu_hotplug.h"
c649983b 66#include "hw/boards.h"
39848901 67#include "hw/pci/pci_host.h"
72c194f7 68#include "acpi-build.h"
95bee274 69#include "hw/mem/pc-dimm.h"
e688df6b 70#include "qapi/error.h"
9af23989 71#include "qapi/qapi-visit-common.h"
bf1e8939 72#include "qapi/visitor.h"
15eafc2e 73#include "qom/cpu.h"
1255166b 74#include "hw/nmi.h"
60c5e104 75#include "hw/i386/intel_iommu.h"
489983d6 76#include "hw/net/ne2000-isa.h"
80cabfad 77
471fd342
BS
78/* debug PC/ISA interrupts */
79//#define DEBUG_IRQ
80
81#ifdef DEBUG_IRQ
82#define DPRINTF(fmt, ...) \
83 do { printf("CPUIRQ: " fmt , ## __VA_ARGS__); } while (0)
84#else
85#define DPRINTF(fmt, ...)
86#endif
87
8a92ea2f 88#define FW_CFG_ACPI_TABLES (FW_CFG_ARCH_LOCAL + 0)
b6f6e3d3 89#define FW_CFG_SMBIOS_ENTRIES (FW_CFG_ARCH_LOCAL + 1)
6b35e7bf 90#define FW_CFG_IRQ0_OVERRIDE (FW_CFG_ARCH_LOCAL + 2)
4c5b10b7 91#define FW_CFG_E820_TABLE (FW_CFG_ARCH_LOCAL + 3)
40ac17cd 92#define FW_CFG_HPET (FW_CFG_ARCH_LOCAL + 4)
80cabfad 93
4c5b10b7
JS
94#define E820_NR_ENTRIES 16
95
96struct e820_entry {
97 uint64_t address;
98 uint64_t length;
99 uint32_t type;
541dc0d4 100} QEMU_PACKED __attribute((__aligned__(4)));
4c5b10b7
JS
101
102struct e820_table {
103 uint32_t count;
104 struct e820_entry entry[E820_NR_ENTRIES];
541dc0d4 105} QEMU_PACKED __attribute((__aligned__(4)));
4c5b10b7 106
7d67110f
GH
107static struct e820_table e820_reserve;
108static struct e820_entry *e820_table;
109static unsigned e820_entries;
dd703b99 110struct hpet_fw_config hpet_cfg = {.count = UINT8_MAX};
4c5b10b7 111
b881fbe9 112void gsi_handler(void *opaque, int n, int level)
1452411b 113{
b881fbe9 114 GSIState *s = opaque;
1452411b 115
b881fbe9
JK
116 DPRINTF("pc: %s GSI %d\n", level ? "raising" : "lowering", n);
117 if (n < ISA_NUM_IRQS) {
118 qemu_set_irq(s->i8259_irq[n], level);
1632dc6a 119 }
b881fbe9 120 qemu_set_irq(s->ioapic_irq[n], level);
2e9947d2 121}
1452411b 122
258711c6
JG
123static void ioport80_write(void *opaque, hwaddr addr, uint64_t data,
124 unsigned size)
80cabfad
FB
125{
126}
127
c02e1eac
JG
128static uint64_t ioport80_read(void *opaque, hwaddr addr, unsigned size)
129{
a6fc23e5 130 return 0xffffffffffffffffULL;
c02e1eac
JG
131}
132
f929aad6 133/* MSDOS compatibility mode FPU exception support */
d537cf6c 134static qemu_irq ferr_irq;
8e78eb28
IY
135
136void pc_register_ferr_irq(qemu_irq irq)
137{
138 ferr_irq = irq;
139}
140
f929aad6
FB
141/* XXX: add IGNNE support */
142void cpu_set_ferr(CPUX86State *s)
143{
d537cf6c 144 qemu_irq_raise(ferr_irq);
f929aad6
FB
145}
146
258711c6
JG
147static void ioportF0_write(void *opaque, hwaddr addr, uint64_t data,
148 unsigned size)
f929aad6 149{
d537cf6c 150 qemu_irq_lower(ferr_irq);
f929aad6
FB
151}
152
c02e1eac
JG
153static uint64_t ioportF0_read(void *opaque, hwaddr addr, unsigned size)
154{
a6fc23e5 155 return 0xffffffffffffffffULL;
c02e1eac
JG
156}
157
28ab0e2e 158/* TSC handling */
28ab0e2e
FB
159uint64_t cpu_get_tsc(CPUX86State *env)
160{
4a1418e0 161 return cpu_get_ticks();
28ab0e2e
FB
162}
163
3de388f6 164/* IRQ handling */
4a8fa5dc 165int cpu_get_pic_interrupt(CPUX86State *env)
3de388f6 166{
02e51483 167 X86CPU *cpu = x86_env_get_cpu(env);
3de388f6
FB
168 int intno;
169
bb93e099
WL
170 if (!kvm_irqchip_in_kernel()) {
171 intno = apic_get_interrupt(cpu->apic_state);
172 if (intno >= 0) {
173 return intno;
174 }
175 /* read the irq from the PIC */
176 if (!apic_accept_pic_intr(cpu->apic_state)) {
177 return -1;
178 }
cf6d64bf 179 }
0e21e12b 180
3de388f6
FB
181 intno = pic_read_irq(isa_pic);
182 return intno;
183}
184
d537cf6c 185static void pic_irq_request(void *opaque, int irq, int level)
3de388f6 186{
182735ef
AF
187 CPUState *cs = first_cpu;
188 X86CPU *cpu = X86_CPU(cs);
a5b38b51 189
471fd342 190 DPRINTF("pic_irqs: %s irq %d\n", level? "raise" : "lower", irq);
bb93e099 191 if (cpu->apic_state && !kvm_irqchip_in_kernel()) {
bdc44640 192 CPU_FOREACH(cs) {
182735ef 193 cpu = X86_CPU(cs);
02e51483
CF
194 if (apic_accept_pic_intr(cpu->apic_state)) {
195 apic_deliver_pic_intr(cpu->apic_state, level);
cf6d64bf 196 }
d5529471
AJ
197 }
198 } else {
d8ed887b 199 if (level) {
c3affe56 200 cpu_interrupt(cs, CPU_INTERRUPT_HARD);
d8ed887b
AF
201 } else {
202 cpu_reset_interrupt(cs, CPU_INTERRUPT_HARD);
203 }
a5b38b51 204 }
3de388f6
FB
205}
206
b0a21b53
FB
207/* PC cmos mappings */
208
80cabfad
FB
209#define REG_EQUIPMENT_BYTE 0x14
210
bda05509 211int cmos_get_fd_drive_type(FloppyDriveType fd0)
777428f2
FB
212{
213 int val;
214
215 switch (fd0) {
2da44dd0 216 case FLOPPY_DRIVE_TYPE_144:
777428f2
FB
217 /* 1.44 Mb 3"5 drive */
218 val = 4;
219 break;
2da44dd0 220 case FLOPPY_DRIVE_TYPE_288:
777428f2
FB
221 /* 2.88 Mb 3"5 drive */
222 val = 5;
223 break;
2da44dd0 224 case FLOPPY_DRIVE_TYPE_120:
777428f2
FB
225 /* 1.2 Mb 5"5 drive */
226 val = 2;
227 break;
2da44dd0 228 case FLOPPY_DRIVE_TYPE_NONE:
777428f2
FB
229 default:
230 val = 0;
231 break;
232 }
233 return val;
234}
235
9139046c
MA
236static void cmos_init_hd(ISADevice *s, int type_ofs, int info_ofs,
237 int16_t cylinders, int8_t heads, int8_t sectors)
ba6c2377 238{
ba6c2377
FB
239 rtc_set_memory(s, type_ofs, 47);
240 rtc_set_memory(s, info_ofs, cylinders);
241 rtc_set_memory(s, info_ofs + 1, cylinders >> 8);
242 rtc_set_memory(s, info_ofs + 2, heads);
243 rtc_set_memory(s, info_ofs + 3, 0xff);
244 rtc_set_memory(s, info_ofs + 4, 0xff);
245 rtc_set_memory(s, info_ofs + 5, 0xc0 | ((heads > 8) << 3));
246 rtc_set_memory(s, info_ofs + 6, cylinders);
247 rtc_set_memory(s, info_ofs + 7, cylinders >> 8);
248 rtc_set_memory(s, info_ofs + 8, sectors);
249}
250
6ac0e82d
AZ
251/* convert boot_device letter to something recognizable by the bios */
252static int boot_device2nibble(char boot_device)
253{
254 switch(boot_device) {
255 case 'a':
256 case 'b':
257 return 0x01; /* floppy boot */
258 case 'c':
259 return 0x02; /* hard drive boot */
260 case 'd':
261 return 0x03; /* CD-ROM boot */
262 case 'n':
263 return 0x04; /* Network boot */
264 }
265 return 0;
266}
267
ddcd5531 268static void set_boot_dev(ISADevice *s, const char *boot_device, Error **errp)
0ecdffbb
AJ
269{
270#define PC_MAX_BOOT_DEVICES 3
0ecdffbb
AJ
271 int nbds, bds[3] = { 0, };
272 int i;
273
274 nbds = strlen(boot_device);
275 if (nbds > PC_MAX_BOOT_DEVICES) {
ddcd5531
GA
276 error_setg(errp, "Too many boot devices for PC");
277 return;
0ecdffbb
AJ
278 }
279 for (i = 0; i < nbds; i++) {
280 bds[i] = boot_device2nibble(boot_device[i]);
281 if (bds[i] == 0) {
ddcd5531
GA
282 error_setg(errp, "Invalid boot device for PC: '%c'",
283 boot_device[i]);
284 return;
0ecdffbb
AJ
285 }
286 }
287 rtc_set_memory(s, 0x3d, (bds[1] << 4) | bds[0]);
d9346e81 288 rtc_set_memory(s, 0x38, (bds[2] << 4) | (fd_bootchk ? 0x0 : 0x1));
0ecdffbb
AJ
289}
290
ddcd5531 291static void pc_boot_set(void *opaque, const char *boot_device, Error **errp)
d9346e81 292{
ddcd5531 293 set_boot_dev(opaque, boot_device, errp);
d9346e81
MA
294}
295
7444ca4e
LE
296static void pc_cmos_init_floppy(ISADevice *rtc_state, ISADevice *floppy)
297{
298 int val, nb, i;
2da44dd0
JS
299 FloppyDriveType fd_type[2] = { FLOPPY_DRIVE_TYPE_NONE,
300 FLOPPY_DRIVE_TYPE_NONE };
7444ca4e
LE
301
302 /* floppy type */
303 if (floppy) {
304 for (i = 0; i < 2; i++) {
305 fd_type[i] = isa_fdc_get_drive_type(floppy, i);
306 }
307 }
308 val = (cmos_get_fd_drive_type(fd_type[0]) << 4) |
309 cmos_get_fd_drive_type(fd_type[1]);
310 rtc_set_memory(rtc_state, 0x10, val);
311
312 val = rtc_get_memory(rtc_state, REG_EQUIPMENT_BYTE);
313 nb = 0;
2da44dd0 314 if (fd_type[0] != FLOPPY_DRIVE_TYPE_NONE) {
7444ca4e
LE
315 nb++;
316 }
2da44dd0 317 if (fd_type[1] != FLOPPY_DRIVE_TYPE_NONE) {
7444ca4e
LE
318 nb++;
319 }
320 switch (nb) {
321 case 0:
322 break;
323 case 1:
324 val |= 0x01; /* 1 drive, ready for boot */
325 break;
326 case 2:
327 val |= 0x41; /* 2 drives, ready for boot */
328 break;
329 }
330 rtc_set_memory(rtc_state, REG_EQUIPMENT_BYTE, val);
331}
332
c0897e0c
MA
333typedef struct pc_cmos_init_late_arg {
334 ISADevice *rtc_state;
9139046c 335 BusState *idebus[2];
c0897e0c
MA
336} pc_cmos_init_late_arg;
337
b86f4613
LE
338typedef struct check_fdc_state {
339 ISADevice *floppy;
340 bool multiple;
341} CheckFdcState;
342
343static int check_fdc(Object *obj, void *opaque)
344{
345 CheckFdcState *state = opaque;
346 Object *fdc;
347 uint32_t iobase;
348 Error *local_err = NULL;
349
350 fdc = object_dynamic_cast(obj, TYPE_ISA_FDC);
351 if (!fdc) {
352 return 0;
353 }
354
1ea1572a 355 iobase = object_property_get_uint(obj, "iobase", &local_err);
b86f4613
LE
356 if (local_err || iobase != 0x3f0) {
357 error_free(local_err);
358 return 0;
359 }
360
361 if (state->floppy) {
362 state->multiple = true;
363 } else {
364 state->floppy = ISA_DEVICE(obj);
365 }
366 return 0;
367}
368
369static const char * const fdc_container_path[] = {
370 "/unattached", "/peripheral", "/peripheral-anon"
371};
372
424e4a87
RK
373/*
374 * Locate the FDC at IO address 0x3f0, in order to configure the CMOS registers
375 * and ACPI objects.
376 */
377ISADevice *pc_find_fdc0(void)
378{
379 int i;
380 Object *container;
381 CheckFdcState state = { 0 };
382
383 for (i = 0; i < ARRAY_SIZE(fdc_container_path); i++) {
384 container = container_get(qdev_get_machine(), fdc_container_path[i]);
385 object_child_foreach(container, check_fdc, &state);
386 }
387
388 if (state.multiple) {
3dc6f869
AF
389 warn_report("multiple floppy disk controllers with "
390 "iobase=0x3f0 have been found");
433672b0 391 error_printf("the one being picked for CMOS setup might not reflect "
9e5d2c52 392 "your intent");
424e4a87
RK
393 }
394
395 return state.floppy;
396}
397
c0897e0c
MA
398static void pc_cmos_init_late(void *opaque)
399{
400 pc_cmos_init_late_arg *arg = opaque;
401 ISADevice *s = arg->rtc_state;
9139046c
MA
402 int16_t cylinders;
403 int8_t heads, sectors;
c0897e0c 404 int val;
2adc99b2 405 int i, trans;
c0897e0c 406
9139046c 407 val = 0;
272f0428
CP
408 if (arg->idebus[0] && ide_get_geometry(arg->idebus[0], 0,
409 &cylinders, &heads, &sectors) >= 0) {
9139046c
MA
410 cmos_init_hd(s, 0x19, 0x1b, cylinders, heads, sectors);
411 val |= 0xf0;
412 }
272f0428
CP
413 if (arg->idebus[0] && ide_get_geometry(arg->idebus[0], 1,
414 &cylinders, &heads, &sectors) >= 0) {
9139046c
MA
415 cmos_init_hd(s, 0x1a, 0x24, cylinders, heads, sectors);
416 val |= 0x0f;
417 }
418 rtc_set_memory(s, 0x12, val);
c0897e0c
MA
419
420 val = 0;
421 for (i = 0; i < 4; i++) {
9139046c
MA
422 /* NOTE: ide_get_geometry() returns the physical
423 geometry. It is always such that: 1 <= sects <= 63, 1
424 <= heads <= 16, 1 <= cylinders <= 16383. The BIOS
425 geometry can be different if a translation is done. */
272f0428
CP
426 if (arg->idebus[i / 2] &&
427 ide_get_geometry(arg->idebus[i / 2], i % 2,
9139046c 428 &cylinders, &heads, &sectors) >= 0) {
2adc99b2
MA
429 trans = ide_get_bios_chs_trans(arg->idebus[i / 2], i % 2) - 1;
430 assert((trans & ~3) == 0);
431 val |= trans << (i * 2);
c0897e0c
MA
432 }
433 }
434 rtc_set_memory(s, 0x39, val);
435
424e4a87 436 pc_cmos_init_floppy(s, pc_find_fdc0());
b86f4613 437
c0897e0c
MA
438 qemu_unregister_reset(pc_cmos_init_late, opaque);
439}
440
23d30407 441void pc_cmos_init(PCMachineState *pcms,
220a8846 442 BusState *idebus0, BusState *idebus1,
63ffb564 443 ISADevice *s)
80cabfad 444{
7444ca4e 445 int val;
c0897e0c 446 static pc_cmos_init_late_arg arg;
b0a21b53 447
b0a21b53 448 /* various important CMOS locations needed by PC/Bochs bios */
80cabfad
FB
449
450 /* memory size */
e89001f7 451 /* base memory (first MiB) */
88076854 452 val = MIN(pcms->below_4g_mem_size / 1024, 640);
333190eb
FB
453 rtc_set_memory(s, 0x15, val);
454 rtc_set_memory(s, 0x16, val >> 8);
e89001f7 455 /* extended memory (next 64MiB) */
88076854
EH
456 if (pcms->below_4g_mem_size > 1024 * 1024) {
457 val = (pcms->below_4g_mem_size - 1024 * 1024) / 1024;
e89001f7
MA
458 } else {
459 val = 0;
460 }
80cabfad
FB
461 if (val > 65535)
462 val = 65535;
b0a21b53
FB
463 rtc_set_memory(s, 0x17, val);
464 rtc_set_memory(s, 0x18, val >> 8);
465 rtc_set_memory(s, 0x30, val);
466 rtc_set_memory(s, 0x31, val >> 8);
e89001f7 467 /* memory between 16MiB and 4GiB */
88076854
EH
468 if (pcms->below_4g_mem_size > 16 * 1024 * 1024) {
469 val = (pcms->below_4g_mem_size - 16 * 1024 * 1024) / 65536;
e89001f7 470 } else {
9da98861 471 val = 0;
e89001f7 472 }
80cabfad
FB
473 if (val > 65535)
474 val = 65535;
b0a21b53
FB
475 rtc_set_memory(s, 0x34, val);
476 rtc_set_memory(s, 0x35, val >> 8);
e89001f7 477 /* memory above 4GiB */
88076854 478 val = pcms->above_4g_mem_size / 65536;
e89001f7
MA
479 rtc_set_memory(s, 0x5b, val);
480 rtc_set_memory(s, 0x5c, val >> 8);
481 rtc_set_memory(s, 0x5d, val >> 16);
3b46e624 482
23d30407 483 object_property_add_link(OBJECT(pcms), "rtc_state",
2d996150 484 TYPE_ISA_DEVICE,
ec68007a 485 (Object **)&pcms->rtc,
2d996150
GZ
486 object_property_allow_set_link,
487 OBJ_PROP_LINK_UNREF_ON_RELEASE, &error_abort);
23d30407 488 object_property_set_link(OBJECT(pcms), OBJECT(s),
2d996150 489 "rtc_state", &error_abort);
298e01b6 490
007b0657 491 set_boot_dev(s, MACHINE(pcms)->boot_order, &error_fatal);
80cabfad 492
b0a21b53 493 val = 0;
b0a21b53
FB
494 val |= 0x02; /* FPU is there */
495 val |= 0x04; /* PS/2 mouse installed */
496 rtc_set_memory(s, REG_EQUIPMENT_BYTE, val);
497
b86f4613 498 /* hard drives and FDC */
c0897e0c 499 arg.rtc_state = s;
9139046c
MA
500 arg.idebus[0] = idebus0;
501 arg.idebus[1] = idebus1;
c0897e0c 502 qemu_register_reset(pc_cmos_init_late, &arg);
80cabfad
FB
503}
504
a0881c64
AF
505#define TYPE_PORT92 "port92"
506#define PORT92(obj) OBJECT_CHECK(Port92State, (obj), TYPE_PORT92)
507
4b78a802
BS
508/* port 92 stuff: could be split off */
509typedef struct Port92State {
a0881c64
AF
510 ISADevice parent_obj;
511
23af670e 512 MemoryRegion io;
4b78a802 513 uint8_t outport;
d812b3d6 514 qemu_irq a20_out;
4b78a802
BS
515} Port92State;
516
93ef4192
AG
517static void port92_write(void *opaque, hwaddr addr, uint64_t val,
518 unsigned size)
4b78a802
BS
519{
520 Port92State *s = opaque;
4700a316 521 int oldval = s->outport;
4b78a802 522
c5539cb4 523 DPRINTF("port92: write 0x%02" PRIx64 "\n", val);
4b78a802 524 s->outport = val;
d812b3d6 525 qemu_set_irq(s->a20_out, (val >> 1) & 1);
4700a316 526 if ((val & 1) && !(oldval & 1)) {
cf83f140 527 qemu_system_reset_request(SHUTDOWN_CAUSE_GUEST_RESET);
4b78a802
BS
528 }
529}
530
93ef4192
AG
531static uint64_t port92_read(void *opaque, hwaddr addr,
532 unsigned size)
4b78a802
BS
533{
534 Port92State *s = opaque;
535 uint32_t ret;
536
537 ret = s->outport;
538 DPRINTF("port92: read 0x%02x\n", ret);
539 return ret;
540}
541
d80fe99d 542static void port92_init(ISADevice *dev, qemu_irq a20_out)
4b78a802 543{
d80fe99d 544 qdev_connect_gpio_out_named(DEVICE(dev), PORT92_A20_LINE, 0, a20_out);
4b78a802
BS
545}
546
547static const VMStateDescription vmstate_port92_isa = {
548 .name = "port92",
549 .version_id = 1,
550 .minimum_version_id = 1,
d49805ae 551 .fields = (VMStateField[]) {
4b78a802
BS
552 VMSTATE_UINT8(outport, Port92State),
553 VMSTATE_END_OF_LIST()
554 }
555};
556
557static void port92_reset(DeviceState *d)
558{
a0881c64 559 Port92State *s = PORT92(d);
4b78a802
BS
560
561 s->outport &= ~1;
562}
563
23af670e 564static const MemoryRegionOps port92_ops = {
93ef4192
AG
565 .read = port92_read,
566 .write = port92_write,
567 .impl = {
568 .min_access_size = 1,
569 .max_access_size = 1,
570 },
571 .endianness = DEVICE_LITTLE_ENDIAN,
23af670e
RH
572};
573
db895a1e 574static void port92_initfn(Object *obj)
4b78a802 575{
db895a1e 576 Port92State *s = PORT92(obj);
4b78a802 577
1437c94b 578 memory_region_init_io(&s->io, OBJECT(s), &port92_ops, s, "port92", 1);
23af670e 579
4b78a802 580 s->outport = 0;
d812b3d6
EV
581
582 qdev_init_gpio_out_named(DEVICE(obj), &s->a20_out, PORT92_A20_LINE, 1);
db895a1e
AF
583}
584
585static void port92_realizefn(DeviceState *dev, Error **errp)
586{
587 ISADevice *isadev = ISA_DEVICE(dev);
588 Port92State *s = PORT92(dev);
589
590 isa_register_ioport(isadev, &s->io, 0x92);
4b78a802
BS
591}
592
8f04ee08
AL
593static void port92_class_initfn(ObjectClass *klass, void *data)
594{
39bffca2 595 DeviceClass *dc = DEVICE_CLASS(klass);
db895a1e 596
db895a1e 597 dc->realize = port92_realizefn;
39bffca2
AL
598 dc->reset = port92_reset;
599 dc->vmsd = &vmstate_port92_isa;
f3b17640
MA
600 /*
601 * Reason: unlike ordinary ISA devices, this one needs additional
602 * wiring: its A20 output line needs to be wired up by
603 * port92_init().
604 */
e90f2a8c 605 dc->user_creatable = false;
8f04ee08
AL
606}
607
8c43a6f0 608static const TypeInfo port92_info = {
a0881c64 609 .name = TYPE_PORT92,
39bffca2
AL
610 .parent = TYPE_ISA_DEVICE,
611 .instance_size = sizeof(Port92State),
db895a1e 612 .instance_init = port92_initfn,
39bffca2 613 .class_init = port92_class_initfn,
4b78a802
BS
614};
615
83f7d43a 616static void port92_register_types(void)
4b78a802 617{
39bffca2 618 type_register_static(&port92_info);
4b78a802 619}
83f7d43a
AF
620
621type_init(port92_register_types)
4b78a802 622
956a3e6b 623static void handle_a20_line_change(void *opaque, int irq, int level)
59b8ad81 624{
cc36a7a2 625 X86CPU *cpu = opaque;
e1a23744 626
956a3e6b 627 /* XXX: send to all CPUs ? */
4b78a802 628 /* XXX: add logic to handle multiple A20 line sources */
cc36a7a2 629 x86_cpu_set_a20(cpu, level);
e1a23744
FB
630}
631
4c5b10b7
JS
632int e820_add_entry(uint64_t address, uint64_t length, uint32_t type)
633{
7d67110f 634 int index = le32_to_cpu(e820_reserve.count);
4c5b10b7
JS
635 struct e820_entry *entry;
636
7d67110f
GH
637 if (type != E820_RAM) {
638 /* old FW_CFG_E820_TABLE entry -- reservations only */
639 if (index >= E820_NR_ENTRIES) {
640 return -EBUSY;
641 }
642 entry = &e820_reserve.entry[index++];
643
644 entry->address = cpu_to_le64(address);
645 entry->length = cpu_to_le64(length);
646 entry->type = cpu_to_le32(type);
647
648 e820_reserve.count = cpu_to_le32(index);
649 }
4c5b10b7 650
7d67110f 651 /* new "etc/e820" file -- include ram too */
ab3ad07f 652 e820_table = g_renew(struct e820_entry, e820_table, e820_entries + 1);
7d67110f
GH
653 e820_table[e820_entries].address = cpu_to_le64(address);
654 e820_table[e820_entries].length = cpu_to_le64(length);
655 e820_table[e820_entries].type = cpu_to_le32(type);
656 e820_entries++;
4c5b10b7 657
7d67110f 658 return e820_entries;
4c5b10b7
JS
659}
660
7bf8ef19
GS
661int e820_get_num_entries(void)
662{
663 return e820_entries;
664}
665
666bool e820_get_entry(int idx, uint32_t type, uint64_t *address, uint64_t *length)
667{
668 if (idx < e820_entries && e820_table[idx].type == cpu_to_le32(type)) {
669 *address = le64_to_cpu(e820_table[idx].address);
670 *length = le64_to_cpu(e820_table[idx].length);
671 return true;
672 }
673 return false;
674}
675
54a40293
EH
676/* Enables contiguous-apic-ID mode, for compatibility */
677static bool compat_apic_id_mode;
678
679void enable_compat_apic_id_mode(void)
680{
681 compat_apic_id_mode = true;
682}
683
684/* Calculates initial APIC ID for a specific CPU index
685 *
686 * Currently we need to be able to calculate the APIC ID from the CPU index
687 * alone (without requiring a CPU object), as the QEMU<->Seabios interfaces have
688 * no concept of "CPU index", and the NUMA tables on fw_cfg need the APIC ID of
689 * all CPUs up to max_cpus.
690 */
691static uint32_t x86_cpu_apic_id_from_index(unsigned int cpu_index)
692{
693 uint32_t correct_id;
694 static bool warned;
695
696 correct_id = x86_apicid_from_cpu_idx(smp_cores, smp_threads, cpu_index);
697 if (compat_apic_id_mode) {
b1c12027 698 if (cpu_index != correct_id && !warned && !qtest_enabled()) {
54a40293
EH
699 error_report("APIC IDs set in compatibility mode, "
700 "CPU topology won't match the configuration");
701 warned = true;
702 }
703 return cpu_index;
704 } else {
705 return correct_id;
706 }
707}
708
f2098f48 709static void pc_build_smbios(PCMachineState *pcms)
80cabfad 710{
c97294ec
GS
711 uint8_t *smbios_tables, *smbios_anchor;
712 size_t smbios_tables_len, smbios_anchor_len;
89cc4a27
WH
713 struct smbios_phys_mem_area *mem_array;
714 unsigned i, array_count;
38690a1c
IM
715 MachineState *ms = MACHINE(pcms);
716 X86CPU *cpu = X86_CPU(ms->possible_cpus->cpus[0].cpu);
f2098f48
IM
717
718 /* tell smbios about cpuid version and features */
719 smbios_set_cpuid(cpu->env.cpuid_version, cpu->env.features[FEAT_1_EDX]);
5fd0a9d4
WH
720
721 smbios_tables = smbios_get_table_legacy(&smbios_tables_len);
722 if (smbios_tables) {
f2098f48 723 fw_cfg_add_bytes(pcms->fw_cfg, FW_CFG_SMBIOS_ENTRIES,
5fd0a9d4
WH
724 smbios_tables, smbios_tables_len);
725 }
726
89cc4a27
WH
727 /* build the array of physical mem area from e820 table */
728 mem_array = g_malloc0(sizeof(*mem_array) * e820_get_num_entries());
729 for (i = 0, array_count = 0; i < e820_get_num_entries(); i++) {
730 uint64_t addr, len;
731
732 if (e820_get_entry(i, E820_RAM, &addr, &len)) {
733 mem_array[array_count].address = addr;
734 mem_array[array_count].length = len;
735 array_count++;
736 }
737 }
738 smbios_get_tables(mem_array, array_count,
739 &smbios_tables, &smbios_tables_len,
5fd0a9d4 740 &smbios_anchor, &smbios_anchor_len);
89cc4a27
WH
741 g_free(mem_array);
742
5fd0a9d4 743 if (smbios_anchor) {
f2098f48 744 fw_cfg_add_file(pcms->fw_cfg, "etc/smbios/smbios-tables",
5fd0a9d4 745 smbios_tables, smbios_tables_len);
f2098f48 746 fw_cfg_add_file(pcms->fw_cfg, "etc/smbios/smbios-anchor",
5fd0a9d4
WH
747 smbios_anchor, smbios_anchor_len);
748 }
749}
750
ebde2465 751static FWCfgState *bochs_bios_init(AddressSpace *as, PCMachineState *pcms)
5fd0a9d4
WH
752{
753 FWCfgState *fw_cfg;
11c2fd3e 754 uint64_t *numa_fw_cfg;
ea265072
IM
755 int i;
756 const CPUArchIdList *cpus;
757 MachineClass *mc = MACHINE_GET_CLASS(pcms);
3cce6243 758
305ae888 759 fw_cfg = fw_cfg_init_io_dma(FW_CFG_IO_BASE, FW_CFG_IO_BASE + 4, as);
e3cadac0 760 fw_cfg_add_i16(fw_cfg, FW_CFG_NB_CPUS, pcms->boot_cpus);
c886fc4c 761
1d934e89
EH
762 /* FW_CFG_MAX_CPUS is a bit confusing/problematic on x86:
763 *
a3abd0f2
IM
764 * For machine types prior to 1.8, SeaBIOS needs FW_CFG_MAX_CPUS for
765 * building MPTable, ACPI MADT, ACPI CPU hotplug and ACPI SRAT table,
766 * that tables are based on xAPIC ID and QEMU<->SeaBIOS interface
767 * for CPU hotplug also uses APIC ID and not "CPU index".
768 * This means that FW_CFG_MAX_CPUS is not the "maximum number of CPUs",
769 * but the "limit to the APIC ID values SeaBIOS may see".
1d934e89 770 *
a3abd0f2
IM
771 * So for compatibility reasons with old BIOSes we are stuck with
772 * "etc/max-cpus" actually being apic_id_limit
1d934e89 773 */
ebde2465 774 fw_cfg_add_i16(fw_cfg, FW_CFG_MAX_CPUS, (uint16_t)pcms->apic_id_limit);
905fdcb5 775 fw_cfg_add_i64(fw_cfg, FW_CFG_RAM_SIZE, (uint64_t)ram_size);
089da572
MA
776 fw_cfg_add_bytes(fw_cfg, FW_CFG_ACPI_TABLES,
777 acpi_tables, acpi_tables_len);
9b5b76d4 778 fw_cfg_add_i32(fw_cfg, FW_CFG_IRQ0_OVERRIDE, kvm_allows_irq0_override());
b6f6e3d3 779
089da572 780 fw_cfg_add_bytes(fw_cfg, FW_CFG_E820_TABLE,
7d67110f
GH
781 &e820_reserve, sizeof(e820_reserve));
782 fw_cfg_add_file(fw_cfg, "etc/e820", e820_table,
783 sizeof(struct e820_entry) * e820_entries);
11c2fd3e 784
089da572 785 fw_cfg_add_bytes(fw_cfg, FW_CFG_HPET, &hpet_cfg, sizeof(hpet_cfg));
11c2fd3e
AL
786 /* allocate memory for the NUMA channel: one (64bit) word for the number
787 * of nodes, one word for each VCPU->node and one word for each node to
788 * hold the amount of memory.
789 */
ebde2465 790 numa_fw_cfg = g_new0(uint64_t, 1 + pcms->apic_id_limit + nb_numa_nodes);
11c2fd3e 791 numa_fw_cfg[0] = cpu_to_le64(nb_numa_nodes);
ea265072
IM
792 cpus = mc->possible_cpu_arch_ids(MACHINE(pcms));
793 for (i = 0; i < cpus->len; i++) {
794 unsigned int apic_id = cpus->cpus[i].arch_id;
ebde2465 795 assert(apic_id < pcms->apic_id_limit);
d41f3e75 796 numa_fw_cfg[apic_id + 1] = cpu_to_le64(cpus->cpus[i].props.node_id);
11c2fd3e
AL
797 }
798 for (i = 0; i < nb_numa_nodes; i++) {
ebde2465
IM
799 numa_fw_cfg[pcms->apic_id_limit + 1 + i] =
800 cpu_to_le64(numa_info[i].node_mem);
11c2fd3e 801 }
089da572 802 fw_cfg_add_bytes(fw_cfg, FW_CFG_NUMA, numa_fw_cfg,
ebde2465 803 (1 + pcms->apic_id_limit + nb_numa_nodes) *
1d934e89 804 sizeof(*numa_fw_cfg));
bf483392
AG
805
806 return fw_cfg;
80cabfad
FB
807}
808
642a4f96
TS
809static long get_file_size(FILE *f)
810{
811 long where, size;
812
813 /* XXX: on Unix systems, using fstat() probably makes more sense */
814
815 where = ftell(f);
816 fseek(f, 0, SEEK_END);
817 size = ftell(f);
818 fseek(f, where, SEEK_SET);
819
820 return size;
821}
822
3cbeb524
AB
823/* setup_data types */
824#define SETUP_NONE 0
825#define SETUP_E820_EXT 1
826#define SETUP_DTB 2
827#define SETUP_PCI 3
828#define SETUP_EFI 4
829
830struct setup_data {
831 uint64_t next;
832 uint32_t type;
833 uint32_t len;
834 uint8_t data[0];
835} __attribute__((packed));
836
df1f79fd
EH
837static void load_linux(PCMachineState *pcms,
838 FWCfgState *fw_cfg)
642a4f96
TS
839{
840 uint16_t protocol;
5cea8590 841 int setup_size, kernel_size, initrd_size = 0, cmdline_size;
3cbeb524 842 int dtb_size, setup_data_offset;
642a4f96 843 uint32_t initrd_max;
57a46d05 844 uint8_t header[8192], *setup, *kernel, *initrd_data;
a8170e5e 845 hwaddr real_addr, prot_addr, cmdline_addr, initrd_addr = 0;
45a50b16 846 FILE *f;
bf4e5d92 847 char *vmode;
df1f79fd 848 MachineState *machine = MACHINE(pcms);
cd4040ec 849 PCMachineClass *pcmc = PC_MACHINE_GET_CLASS(pcms);
3cbeb524 850 struct setup_data *setup_data;
df1f79fd
EH
851 const char *kernel_filename = machine->kernel_filename;
852 const char *initrd_filename = machine->initrd_filename;
3cbeb524 853 const char *dtb_filename = machine->dtb;
df1f79fd 854 const char *kernel_cmdline = machine->kernel_cmdline;
642a4f96
TS
855
856 /* Align to 16 bytes as a paranoia measure */
857 cmdline_size = (strlen(kernel_cmdline)+16) & ~15;
858
859 /* load the kernel header */
860 f = fopen(kernel_filename, "rb");
861 if (!f || !(kernel_size = get_file_size(f)) ||
0f9d76e5
LG
862 fread(header, 1, MIN(ARRAY_SIZE(header), kernel_size), f) !=
863 MIN(ARRAY_SIZE(header), kernel_size)) {
864 fprintf(stderr, "qemu: could not load kernel '%s': %s\n",
865 kernel_filename, strerror(errno));
866 exit(1);
642a4f96
TS
867 }
868
869 /* kernel protocol version */
bc4edd79 870#if 0
642a4f96 871 fprintf(stderr, "header magic: %#x\n", ldl_p(header+0x202));
bc4edd79 872#endif
0f9d76e5
LG
873 if (ldl_p(header+0x202) == 0x53726448) {
874 protocol = lduw_p(header+0x206);
875 } else {
876 /* This looks like a multiboot kernel. If it is, let's stop
877 treating it like a Linux kernel. */
52001445 878 if (load_multiboot(fw_cfg, f, kernel_filename, initrd_filename,
0f9d76e5 879 kernel_cmdline, kernel_size, header)) {
82663ee2 880 return;
0f9d76e5
LG
881 }
882 protocol = 0;
f16408df 883 }
642a4f96
TS
884
885 if (protocol < 0x200 || !(header[0x211] & 0x01)) {
0f9d76e5
LG
886 /* Low kernel */
887 real_addr = 0x90000;
888 cmdline_addr = 0x9a000 - cmdline_size;
889 prot_addr = 0x10000;
642a4f96 890 } else if (protocol < 0x202) {
0f9d76e5
LG
891 /* High but ancient kernel */
892 real_addr = 0x90000;
893 cmdline_addr = 0x9a000 - cmdline_size;
894 prot_addr = 0x100000;
642a4f96 895 } else {
0f9d76e5
LG
896 /* High and recent kernel */
897 real_addr = 0x10000;
898 cmdline_addr = 0x20000;
899 prot_addr = 0x100000;
642a4f96
TS
900 }
901
bc4edd79 902#if 0
642a4f96 903 fprintf(stderr,
0f9d76e5
LG
904 "qemu: real_addr = 0x" TARGET_FMT_plx "\n"
905 "qemu: cmdline_addr = 0x" TARGET_FMT_plx "\n"
906 "qemu: prot_addr = 0x" TARGET_FMT_plx "\n",
907 real_addr,
908 cmdline_addr,
909 prot_addr);
bc4edd79 910#endif
642a4f96
TS
911
912 /* highest address for loading the initrd */
0f9d76e5
LG
913 if (protocol >= 0x203) {
914 initrd_max = ldl_p(header+0x22c);
915 } else {
916 initrd_max = 0x37ffffff;
917 }
642a4f96 918
cd4040ec
EH
919 if (initrd_max >= pcms->below_4g_mem_size - pcmc->acpi_data_size) {
920 initrd_max = pcms->below_4g_mem_size - pcmc->acpi_data_size - 1;
927766c7 921 }
642a4f96 922
57a46d05
AG
923 fw_cfg_add_i32(fw_cfg, FW_CFG_CMDLINE_ADDR, cmdline_addr);
924 fw_cfg_add_i32(fw_cfg, FW_CFG_CMDLINE_SIZE, strlen(kernel_cmdline)+1);
96f80586 925 fw_cfg_add_string(fw_cfg, FW_CFG_CMDLINE_DATA, kernel_cmdline);
642a4f96
TS
926
927 if (protocol >= 0x202) {
0f9d76e5 928 stl_p(header+0x228, cmdline_addr);
642a4f96 929 } else {
0f9d76e5
LG
930 stw_p(header+0x20, 0xA33F);
931 stw_p(header+0x22, cmdline_addr-real_addr);
642a4f96
TS
932 }
933
bf4e5d92
PT
934 /* handle vga= parameter */
935 vmode = strstr(kernel_cmdline, "vga=");
936 if (vmode) {
937 unsigned int video_mode;
938 /* skip "vga=" */
939 vmode += 4;
940 if (!strncmp(vmode, "normal", 6)) {
941 video_mode = 0xffff;
942 } else if (!strncmp(vmode, "ext", 3)) {
943 video_mode = 0xfffe;
944 } else if (!strncmp(vmode, "ask", 3)) {
945 video_mode = 0xfffd;
946 } else {
947 video_mode = strtol(vmode, NULL, 0);
948 }
949 stw_p(header+0x1fa, video_mode);
950 }
951
642a4f96 952 /* loader type */
5cbdb3a3 953 /* High nybble = B reserved for QEMU; low nybble is revision number.
642a4f96
TS
954 If this code is substantially changed, you may want to consider
955 incrementing the revision. */
0f9d76e5
LG
956 if (protocol >= 0x200) {
957 header[0x210] = 0xB0;
958 }
642a4f96
TS
959 /* heap */
960 if (protocol >= 0x201) {
0f9d76e5
LG
961 header[0x211] |= 0x80; /* CAN_USE_HEAP */
962 stw_p(header+0x224, cmdline_addr-real_addr-0x200);
642a4f96
TS
963 }
964
965 /* load initrd */
966 if (initrd_filename) {
0f9d76e5
LG
967 if (protocol < 0x200) {
968 fprintf(stderr, "qemu: linux kernel too old to load a ram disk\n");
969 exit(1);
970 }
642a4f96 971
0f9d76e5 972 initrd_size = get_image_size(initrd_filename);
d6fa4b77 973 if (initrd_size < 0) {
7454e51d
MT
974 fprintf(stderr, "qemu: error reading initrd %s: %s\n",
975 initrd_filename, strerror(errno));
d6fa4b77
MK
976 exit(1);
977 }
978
45a50b16 979 initrd_addr = (initrd_max-initrd_size) & ~4095;
57a46d05 980
7267c094 981 initrd_data = g_malloc(initrd_size);
57a46d05
AG
982 load_image(initrd_filename, initrd_data);
983
984 fw_cfg_add_i32(fw_cfg, FW_CFG_INITRD_ADDR, initrd_addr);
985 fw_cfg_add_i32(fw_cfg, FW_CFG_INITRD_SIZE, initrd_size);
986 fw_cfg_add_bytes(fw_cfg, FW_CFG_INITRD_DATA, initrd_data, initrd_size);
642a4f96 987
0f9d76e5
LG
988 stl_p(header+0x218, initrd_addr);
989 stl_p(header+0x21c, initrd_size);
642a4f96
TS
990 }
991
45a50b16 992 /* load kernel and setup */
642a4f96 993 setup_size = header[0x1f1];
0f9d76e5
LG
994 if (setup_size == 0) {
995 setup_size = 4;
996 }
642a4f96 997 setup_size = (setup_size+1)*512;
ec5fd402
PB
998 if (setup_size > kernel_size) {
999 fprintf(stderr, "qemu: invalid kernel header\n");
1000 exit(1);
1001 }
45a50b16 1002 kernel_size -= setup_size;
642a4f96 1003
7267c094
AL
1004 setup = g_malloc(setup_size);
1005 kernel = g_malloc(kernel_size);
45a50b16 1006 fseek(f, 0, SEEK_SET);
5a41ecc5
KS
1007 if (fread(setup, 1, setup_size, f) != setup_size) {
1008 fprintf(stderr, "fread() failed\n");
1009 exit(1);
1010 }
1011 if (fread(kernel, 1, kernel_size, f) != kernel_size) {
1012 fprintf(stderr, "fread() failed\n");
1013 exit(1);
1014 }
642a4f96 1015 fclose(f);
3cbeb524
AB
1016
1017 /* append dtb to kernel */
1018 if (dtb_filename) {
1019 if (protocol < 0x209) {
1020 fprintf(stderr, "qemu: Linux kernel too old to load a dtb\n");
1021 exit(1);
1022 }
1023
1024 dtb_size = get_image_size(dtb_filename);
1025 if (dtb_size <= 0) {
1026 fprintf(stderr, "qemu: error reading dtb %s: %s\n",
1027 dtb_filename, strerror(errno));
1028 exit(1);
1029 }
1030
1031 setup_data_offset = QEMU_ALIGN_UP(kernel_size, 16);
1032 kernel_size = setup_data_offset + sizeof(struct setup_data) + dtb_size;
1033 kernel = g_realloc(kernel, kernel_size);
1034
1035 stq_p(header+0x250, prot_addr + setup_data_offset);
1036
1037 setup_data = (struct setup_data *)(kernel + setup_data_offset);
1038 setup_data->next = 0;
1039 setup_data->type = cpu_to_le32(SETUP_DTB);
1040 setup_data->len = cpu_to_le32(dtb_size);
1041
1042 load_image_size(dtb_filename, setup_data->data, dtb_size);
1043 }
1044
45a50b16 1045 memcpy(setup, header, MIN(sizeof(header), setup_size));
57a46d05
AG
1046
1047 fw_cfg_add_i32(fw_cfg, FW_CFG_KERNEL_ADDR, prot_addr);
1048 fw_cfg_add_i32(fw_cfg, FW_CFG_KERNEL_SIZE, kernel_size);
1049 fw_cfg_add_bytes(fw_cfg, FW_CFG_KERNEL_DATA, kernel, kernel_size);
1050
1051 fw_cfg_add_i32(fw_cfg, FW_CFG_SETUP_ADDR, real_addr);
1052 fw_cfg_add_i32(fw_cfg, FW_CFG_SETUP_SIZE, setup_size);
1053 fw_cfg_add_bytes(fw_cfg, FW_CFG_SETUP_DATA, setup, setup_size);
1054
98e753a6
IM
1055 option_rom[nb_option_roms].bootindex = 0;
1056 option_rom[nb_option_roms].name = "linuxboot.bin";
1057 if (pcmc->linuxboot_dma_enabled && fw_cfg_dma_enabled(fw_cfg)) {
b2a575a1 1058 option_rom[nb_option_roms].name = "linuxboot_dma.bin";
b2a575a1 1059 }
57a46d05 1060 nb_option_roms++;
642a4f96
TS
1061}
1062
b41a2cd1
FB
1063#define NE2000_NB_MAX 6
1064
675d6f82
BS
1065static const int ne2000_io[NE2000_NB_MAX] = { 0x300, 0x320, 0x340, 0x360,
1066 0x280, 0x380 };
1067static const int ne2000_irq[NE2000_NB_MAX] = { 9, 10, 11, 3, 4, 5 };
b41a2cd1 1068
48a18b3c 1069void pc_init_ne2k_isa(ISABus *bus, NICInfo *nd)
a41b2ff2
PB
1070{
1071 static int nb_ne2k = 0;
1072
1073 if (nb_ne2k == NE2000_NB_MAX)
1074 return;
48a18b3c 1075 isa_ne2000_init(bus, ne2000_io[nb_ne2k],
9453c5bc 1076 ne2000_irq[nb_ne2k], nd);
a41b2ff2
PB
1077 nb_ne2k++;
1078}
1079
92a16d7a 1080DeviceState *cpu_get_current_apic(void)
0e26b7b8 1081{
4917cf44
AF
1082 if (current_cpu) {
1083 X86CPU *cpu = X86_CPU(current_cpu);
02e51483 1084 return cpu->apic_state;
0e26b7b8
BS
1085 } else {
1086 return NULL;
1087 }
1088}
1089
845773ab 1090void pc_acpi_smi_interrupt(void *opaque, int irq, int level)
53b67b30 1091{
c3affe56 1092 X86CPU *cpu = opaque;
53b67b30
BS
1093
1094 if (level) {
c3affe56 1095 cpu_interrupt(CPU(cpu), CPU_INTERRUPT_SMI);
53b67b30
BS
1096 }
1097}
1098
074281d6 1099static void pc_new_cpu(const char *typename, int64_t apic_id, Error **errp)
31050930 1100{
074281d6 1101 Object *cpu = NULL;
31050930
IM
1102 Error *local_err = NULL;
1103
074281d6 1104 cpu = object_new(typename);
31050930 1105
c7b4efb4 1106 object_property_set_uint(cpu, apic_id, "apic-id", &local_err);
074281d6 1107 object_property_set_bool(cpu, true, "realized", &local_err);
31050930 1108
074281d6 1109 object_unref(cpu);
021c9d25 1110 error_propagate(errp, local_err);
31050930
IM
1111}
1112
c649983b
IM
1113void pc_hot_add_cpu(const int64_t id, Error **errp)
1114{
38690a1c 1115 MachineState *ms = MACHINE(qdev_get_machine());
c649983b 1116 int64_t apic_id = x86_cpu_apic_id_from_index(id);
0e3bd562 1117 Error *local_err = NULL;
c649983b 1118
8de433cb
IM
1119 if (id < 0) {
1120 error_setg(errp, "Invalid CPU id: %" PRIi64, id);
1121 return;
1122 }
1123
5ff020b7
EH
1124 if (apic_id >= ACPI_CPU_HOTPLUG_ID_LIMIT) {
1125 error_setg(errp, "Unable to add CPU: %" PRIi64
1126 ", resulting APIC ID (%" PRIi64 ") is too large",
1127 id, apic_id);
1128 return;
1129 }
1130
311ca98d 1131 pc_new_cpu(ms->cpu_type, apic_id, &local_err);
0e3bd562
AF
1132 if (local_err) {
1133 error_propagate(errp, local_err);
1134 return;
1135 }
c649983b
IM
1136}
1137
4884b7bf 1138void pc_cpus_init(PCMachineState *pcms)
70166477
IY
1139{
1140 int i;
c96a1c0b 1141 const CPUArchIdList *possible_cpus;
311ca98d 1142 MachineState *ms = MACHINE(pcms);
c96a1c0b 1143 MachineClass *mc = MACHINE_GET_CLASS(pcms);
70166477 1144
ebde2465
IM
1145 /* Calculates the limit to CPU APIC ID values
1146 *
1147 * Limit for the APIC ID value, so that all
1148 * CPU APIC IDs are < pcms->apic_id_limit.
1149 *
1150 * This is used for FW_CFG_MAX_CPUS. See comments on bochs_bios_init().
1151 */
1152 pcms->apic_id_limit = x86_cpu_apic_id_from_index(max_cpus - 1) + 1;
311ca98d 1153 possible_cpus = mc->possible_cpu_arch_ids(ms);
c96a1c0b 1154 for (i = 0; i < smp_cpus; i++) {
d342eb76
IM
1155 pc_new_cpu(possible_cpus->cpus[i].type, possible_cpus->cpus[i].arch_id,
1156 &error_fatal);
70166477
IY
1157 }
1158}
1159
217f1b4a
HZ
1160static void pc_build_feature_control_file(PCMachineState *pcms)
1161{
38690a1c
IM
1162 MachineState *ms = MACHINE(pcms);
1163 X86CPU *cpu = X86_CPU(ms->possible_cpus->cpus[0].cpu);
217f1b4a
HZ
1164 CPUX86State *env = &cpu->env;
1165 uint32_t unused, ecx, edx;
1166 uint64_t feature_control_bits = 0;
1167 uint64_t *val;
1168
1169 cpu_x86_cpuid(env, 1, 0, &unused, &unused, &ecx, &edx);
1170 if (ecx & CPUID_EXT_VMX) {
1171 feature_control_bits |= FEATURE_CONTROL_VMXON_ENABLED_OUTSIDE_SMX;
1172 }
1173
1174 if ((edx & (CPUID_EXT2_MCE | CPUID_EXT2_MCA)) ==
1175 (CPUID_EXT2_MCE | CPUID_EXT2_MCA) &&
1176 (env->mcg_cap & MCG_LMCE_P)) {
1177 feature_control_bits |= FEATURE_CONTROL_LMCE;
1178 }
1179
1180 if (!feature_control_bits) {
1181 return;
1182 }
1183
1184 val = g_malloc(sizeof(*val));
1185 *val = cpu_to_le64(feature_control_bits | FEATURE_CONTROL_LOCKED);
1186 fw_cfg_add_file(pcms->fw_cfg, "etc/msr_feature_control", val, sizeof(*val));
1187}
1188
e3cadac0
IM
1189static void rtc_set_cpus_count(ISADevice *rtc, uint16_t cpus_count)
1190{
1191 if (cpus_count > 0xff) {
1192 /* If the number of CPUs can't be represented in 8 bits, the
1193 * BIOS must use "FW_CFG_NB_CPUS". Set RTC field to 0 just
1194 * to make old BIOSes fail more predictably.
1195 */
1196 rtc_set_memory(rtc, 0x5f, 0);
1197 } else {
1198 rtc_set_memory(rtc, 0x5f, cpus_count - 1);
1199 }
1200}
1201
3459a625 1202static
9ebeed0c 1203void pc_machine_done(Notifier *notifier, void *data)
3459a625 1204{
9ebeed0c
EH
1205 PCMachineState *pcms = container_of(notifier,
1206 PCMachineState, machine_done);
1207 PCIBus *bus = pcms->bus;
2118196b 1208
ba157b69 1209 /* set the number of CPUs */
e3cadac0 1210 rtc_set_cpus_count(pcms->rtc, pcms->boot_cpus);
ba157b69 1211
2118196b
MA
1212 if (bus) {
1213 int extra_hosts = 0;
1214
1215 QLIST_FOREACH(bus, &bus->child, sibling) {
1216 /* look for expander root buses */
1217 if (pci_bus_is_root(bus)) {
1218 extra_hosts++;
1219 }
1220 }
f264d360 1221 if (extra_hosts && pcms->fw_cfg) {
2118196b
MA
1222 uint64_t *val = g_malloc(sizeof(*val));
1223 *val = cpu_to_le64(extra_hosts);
f264d360 1224 fw_cfg_add_file(pcms->fw_cfg,
2118196b
MA
1225 "etc/extra-pci-roots", val, sizeof(*val));
1226 }
1227 }
1228
bb292f5a 1229 acpi_setup();
6d42eefa 1230 if (pcms->fw_cfg) {
f2098f48 1231 pc_build_smbios(pcms);
217f1b4a 1232 pc_build_feature_control_file(pcms);
e3cadac0
IM
1233 /* update FW_CFG_NB_CPUS to account for -device added CPUs */
1234 fw_cfg_modify_i16(pcms->fw_cfg, FW_CFG_NB_CPUS, pcms->boot_cpus);
6d42eefa 1235 }
60c5e104 1236
1a26f466 1237 if (pcms->apic_id_limit > 255 && !xen_enabled()) {
60c5e104
IM
1238 IntelIOMMUState *iommu = INTEL_IOMMU_DEVICE(x86_iommu_get_default());
1239
1240 if (!iommu || !iommu->x86_iommu.intr_supported ||
1241 iommu->intr_eim != ON_OFF_AUTO_ON) {
1242 error_report("current -smp configuration requires "
1243 "Extended Interrupt Mode enabled. "
1244 "You can add an IOMMU using: "
1245 "-device intel-iommu,intremap=on,eim=on");
1246 exit(EXIT_FAILURE);
1247 }
1248 }
3459a625
MT
1249}
1250
e4e8ba04 1251void pc_guest_info_init(PCMachineState *pcms)
3459a625 1252{
1f3aba37 1253 int i;
b20c9bd5 1254
dd4c2f01
EH
1255 pcms->apic_xrupt_override = kvm_allows_irq0_override();
1256 pcms->numa_nodes = nb_numa_nodes;
1257 pcms->node_mem = g_malloc0(pcms->numa_nodes *
1258 sizeof *pcms->node_mem);
8c85901e 1259 for (i = 0; i < nb_numa_nodes; i++) {
dd4c2f01 1260 pcms->node_mem[i] = numa_info[i].node_mem;
8c85901e
WG
1261 }
1262
9ebeed0c
EH
1263 pcms->machine_done.notify = pc_machine_done;
1264 qemu_add_machine_init_done_notifier(&pcms->machine_done);
3459a625
MT
1265}
1266
83d08f26
MT
1267/* setup pci memory address space mapping into system address space */
1268void pc_pci_as_mapping_init(Object *owner, MemoryRegion *system_memory,
1269 MemoryRegion *pci_address_space)
39848901 1270{
83d08f26
MT
1271 /* Set to lower priority than RAM */
1272 memory_region_add_subregion_overlap(system_memory, 0x0,
1273 pci_address_space, -1);
39848901
IM
1274}
1275
f7e4dd6c
GH
1276void pc_acpi_init(const char *default_dsdt)
1277{
c5a98cf3 1278 char *filename;
f7e4dd6c
GH
1279
1280 if (acpi_tables != NULL) {
1281 /* manually set via -acpitable, leave it alone */
1282 return;
1283 }
1284
1285 filename = qemu_find_file(QEMU_FILE_TYPE_BIOS, default_dsdt);
1286 if (filename == NULL) {
2ab4b135 1287 warn_report("failed to find %s", default_dsdt);
c5a98cf3 1288 } else {
5bdb59a2
MA
1289 QemuOpts *opts = qemu_opts_create(qemu_find_opts("acpi"), NULL, 0,
1290 &error_abort);
c5a98cf3 1291 Error *err = NULL;
f7e4dd6c 1292
5bdb59a2 1293 qemu_opt_set(opts, "file", filename, &error_abort);
0c764a9d 1294
1a4b2666 1295 acpi_table_add_builtin(opts, &err);
c5a98cf3 1296 if (err) {
88f83f35 1297 warn_reportf_err(err, "failed to load %s: ", filename);
c5a98cf3 1298 }
c5a98cf3 1299 g_free(filename);
f7e4dd6c 1300 }
f7e4dd6c
GH
1301}
1302
7bc35e0f 1303void xen_load_linux(PCMachineState *pcms)
b33a5bbf
CL
1304{
1305 int i;
1306 FWCfgState *fw_cfg;
1307
df1f79fd 1308 assert(MACHINE(pcms)->kernel_filename != NULL);
b33a5bbf 1309
305ae888 1310 fw_cfg = fw_cfg_init_io(FW_CFG_IO_BASE);
e3cadac0 1311 fw_cfg_add_i16(fw_cfg, FW_CFG_NB_CPUS, pcms->boot_cpus);
b33a5bbf
CL
1312 rom_set_fw(fw_cfg);
1313
df1f79fd 1314 load_linux(pcms, fw_cfg);
b33a5bbf
CL
1315 for (i = 0; i < nb_option_roms; i++) {
1316 assert(!strcmp(option_rom[i].name, "linuxboot.bin") ||
b2a575a1 1317 !strcmp(option_rom[i].name, "linuxboot_dma.bin") ||
b33a5bbf
CL
1318 !strcmp(option_rom[i].name, "multiboot.bin"));
1319 rom_add_option(option_rom[i].name, option_rom[i].bootindex);
1320 }
f264d360 1321 pcms->fw_cfg = fw_cfg;
b33a5bbf
CL
1322}
1323
5934e216
EH
1324void pc_memory_init(PCMachineState *pcms,
1325 MemoryRegion *system_memory,
1326 MemoryRegion *rom_memory,
1327 MemoryRegion **ram_memory)
80cabfad 1328{
cbc5b5f3
JJ
1329 int linux_boot, i;
1330 MemoryRegion *ram, *option_rom_mr;
00cb2a99 1331 MemoryRegion *ram_below_4g, *ram_above_4g;
a88b362c 1332 FWCfgState *fw_cfg;
62b160c0 1333 MachineState *machine = MACHINE(pcms);
16a9e8a5 1334 PCMachineClass *pcmc = PC_MACHINE_GET_CLASS(pcms);
d592d303 1335
c8d163bc
EH
1336 assert(machine->ram_size == pcms->below_4g_mem_size +
1337 pcms->above_4g_mem_size);
9521d42b
PB
1338
1339 linux_boot = (machine->kernel_filename != NULL);
80cabfad 1340
00cb2a99 1341 /* Allocate RAM. We allocate it as a single memory region and use
66a0a2cb 1342 * aliases to address portions of it, mostly for backwards compatibility
00cb2a99
AK
1343 * with older qemus that used qemu_ram_alloc().
1344 */
7267c094 1345 ram = g_malloc(sizeof(*ram));
9521d42b
PB
1346 memory_region_allocate_system_memory(ram, NULL, "pc.ram",
1347 machine->ram_size);
ae0a5466 1348 *ram_memory = ram;
7267c094 1349 ram_below_4g = g_malloc(sizeof(*ram_below_4g));
2c9b15ca 1350 memory_region_init_alias(ram_below_4g, NULL, "ram-below-4g", ram,
c8d163bc 1351 0, pcms->below_4g_mem_size);
00cb2a99 1352 memory_region_add_subregion(system_memory, 0, ram_below_4g);
c8d163bc
EH
1353 e820_add_entry(0, pcms->below_4g_mem_size, E820_RAM);
1354 if (pcms->above_4g_mem_size > 0) {
7267c094 1355 ram_above_4g = g_malloc(sizeof(*ram_above_4g));
2c9b15ca 1356 memory_region_init_alias(ram_above_4g, NULL, "ram-above-4g", ram,
c8d163bc
EH
1357 pcms->below_4g_mem_size,
1358 pcms->above_4g_mem_size);
00cb2a99
AK
1359 memory_region_add_subregion(system_memory, 0x100000000ULL,
1360 ram_above_4g);
c8d163bc 1361 e820_add_entry(0x100000000ULL, pcms->above_4g_mem_size, E820_RAM);
bbe80adf 1362 }
82b36dc3 1363
bb292f5a 1364 if (!pcmc->has_reserved_memory &&
ca8336f3 1365 (machine->ram_slots ||
9521d42b 1366 (machine->maxram_size > machine->ram_size))) {
ca8336f3
IM
1367 MachineClass *mc = MACHINE_GET_CLASS(machine);
1368
1369 error_report("\"-memory 'slots|maxmem'\" is not supported by: %s",
1370 mc->name);
1371 exit(EXIT_FAILURE);
1372 }
1373
b0c14ec4
DH
1374 /* always allocate the device memory information */
1375 machine->device_memory = g_malloc0(sizeof(*machine->device_memory));
1376
f2ffbe2b 1377 /* initialize device memory address space */
bb292f5a 1378 if (pcmc->has_reserved_memory &&
9521d42b 1379 (machine->ram_size < machine->maxram_size)) {
f2ffbe2b 1380 ram_addr_t device_mem_size = machine->maxram_size - machine->ram_size;
619d11e4 1381
a0cc8856
IM
1382 if (machine->ram_slots > ACPI_MAX_RAM_SLOTS) {
1383 error_report("unsupported amount of memory slots: %"PRIu64,
1384 machine->ram_slots);
1385 exit(EXIT_FAILURE);
1386 }
1387
f2c38522
PK
1388 if (QEMU_ALIGN_UP(machine->maxram_size,
1389 TARGET_PAGE_SIZE) != machine->maxram_size) {
1390 error_report("maximum memory size must by aligned to multiple of "
1391 "%d bytes", TARGET_PAGE_SIZE);
1392 exit(EXIT_FAILURE);
1393 }
1394
b0c14ec4 1395 machine->device_memory->base =
c8d163bc 1396 ROUND_UP(0x100000000ULL + pcms->above_4g_mem_size, 1ULL << 30);
619d11e4 1397
16a9e8a5 1398 if (pcmc->enforce_aligned_dimm) {
f2ffbe2b
DH
1399 /* size device region assuming 1G page max alignment per slot */
1400 device_mem_size += (1ULL << 30) * machine->ram_slots;
085f8e88
IM
1401 }
1402
f2ffbe2b
DH
1403 if ((machine->device_memory->base + device_mem_size) <
1404 device_mem_size) {
619d11e4
IM
1405 error_report("unsupported amount of maximum memory: " RAM_ADDR_FMT,
1406 machine->maxram_size);
1407 exit(EXIT_FAILURE);
1408 }
1409
b0c14ec4 1410 memory_region_init(&machine->device_memory->mr, OBJECT(pcms),
f2ffbe2b 1411 "device-memory", device_mem_size);
b0c14ec4
DH
1412 memory_region_add_subregion(system_memory, machine->device_memory->base,
1413 &machine->device_memory->mr);
619d11e4 1414 }
cbc5b5f3
JJ
1415
1416 /* Initialize PC system firmware */
5db3f0de 1417 pc_system_firmware_init(rom_memory, !pcmc->pci_enabled);
00cb2a99 1418
7267c094 1419 option_rom_mr = g_malloc(sizeof(*option_rom_mr));
98a99ce0 1420 memory_region_init_ram(option_rom_mr, NULL, "pc.rom", PC_ROM_SIZE,
f8ed85ac 1421 &error_fatal);
208fa0e4
IM
1422 if (pcmc->pci_enabled) {
1423 memory_region_set_readonly(option_rom_mr, true);
1424 }
4463aee6 1425 memory_region_add_subregion_overlap(rom_memory,
00cb2a99
AK
1426 PC_ROM_MIN_VGA,
1427 option_rom_mr,
1428 1);
f753ff16 1429
ebde2465 1430 fw_cfg = bochs_bios_init(&address_space_memory, pcms);
c886fc4c 1431
8832cb80 1432 rom_set_fw(fw_cfg);
1d108d97 1433
b0c14ec4 1434 if (pcmc->has_reserved_memory && machine->device_memory->base) {
de268e13 1435 uint64_t *val = g_malloc(sizeof(*val));
2f8b5008 1436 PCMachineClass *pcmc = PC_MACHINE_GET_CLASS(pcms);
b0c14ec4 1437 uint64_t res_mem_end = machine->device_memory->base;
2f8b5008
IM
1438
1439 if (!pcmc->broken_reserved_end) {
b0c14ec4 1440 res_mem_end += memory_region_size(&machine->device_memory->mr);
2f8b5008 1441 }
3385e8e2 1442 *val = cpu_to_le64(ROUND_UP(res_mem_end, 0x1ULL << 30));
de268e13
IM
1443 fw_cfg_add_file(fw_cfg, "etc/reserved-memory-end", val, sizeof(*val));
1444 }
1445
f753ff16 1446 if (linux_boot) {
df1f79fd 1447 load_linux(pcms, fw_cfg);
f753ff16
PB
1448 }
1449
1450 for (i = 0; i < nb_option_roms; i++) {
2e55e842 1451 rom_add_option(option_rom[i].name, option_rom[i].bootindex);
406c8df3 1452 }
f264d360 1453 pcms->fw_cfg = fw_cfg;
cb135f59
PX
1454
1455 /* Init default IOAPIC address space */
1456 pcms->ioapic_as = &address_space_memory;
3d53f5c3
IY
1457}
1458
9fa99d25
MA
1459/*
1460 * The 64bit pci hole starts after "above 4G RAM" and
1461 * potentially the space reserved for memory hotplug.
1462 */
1463uint64_t pc_pci_hole64_start(void)
1464{
1465 PCMachineState *pcms = PC_MACHINE(qdev_get_machine());
1466 PCMachineClass *pcmc = PC_MACHINE_GET_CLASS(pcms);
b0c14ec4 1467 MachineState *ms = MACHINE(pcms);
9fa99d25
MA
1468 uint64_t hole64_start = 0;
1469
b0c14ec4
DH
1470 if (pcmc->has_reserved_memory && ms->device_memory->base) {
1471 hole64_start = ms->device_memory->base;
9fa99d25 1472 if (!pcmc->broken_reserved_end) {
b0c14ec4 1473 hole64_start += memory_region_size(&ms->device_memory->mr);
9fa99d25
MA
1474 }
1475 } else {
1476 hole64_start = 0x100000000ULL + pcms->above_4g_mem_size;
1477 }
1478
1479 return ROUND_UP(hole64_start, 1ULL << 30);
1480}
1481
0b0cc076 1482qemu_irq pc_allocate_cpu_irq(void)
845773ab 1483{
0b0cc076 1484 return qemu_allocate_irq(pic_irq_request, NULL, 0);
845773ab
IY
1485}
1486
48a18b3c 1487DeviceState *pc_vga_init(ISABus *isa_bus, PCIBus *pci_bus)
765d7908 1488{
ad6d45fa
AL
1489 DeviceState *dev = NULL;
1490
bab47d9a 1491 rom_set_order_override(FW_CFG_ORDER_OVERRIDE_VGA);
16094b75
AJ
1492 if (pci_bus) {
1493 PCIDevice *pcidev = pci_vga_init(pci_bus);
1494 dev = pcidev ? &pcidev->qdev : NULL;
1495 } else if (isa_bus) {
1496 ISADevice *isadev = isa_vga_init(isa_bus);
4a17cc4f 1497 dev = isadev ? DEVICE(isadev) : NULL;
765d7908 1498 }
bab47d9a 1499 rom_reset_order_override();
ad6d45fa 1500 return dev;
765d7908
IY
1501}
1502
258711c6
JG
1503static const MemoryRegionOps ioport80_io_ops = {
1504 .write = ioport80_write,
c02e1eac 1505 .read = ioport80_read,
258711c6
JG
1506 .endianness = DEVICE_NATIVE_ENDIAN,
1507 .impl = {
1508 .min_access_size = 1,
1509 .max_access_size = 1,
1510 },
1511};
1512
1513static const MemoryRegionOps ioportF0_io_ops = {
1514 .write = ioportF0_write,
c02e1eac 1515 .read = ioportF0_read,
258711c6
JG
1516 .endianness = DEVICE_NATIVE_ENDIAN,
1517 .impl = {
1518 .min_access_size = 1,
1519 .max_access_size = 1,
1520 },
1521};
1522
ac64273c
PMD
1523static void pc_superio_init(ISABus *isa_bus, bool create_fdctrl, bool no_vmport)
1524{
1525 int i;
1526 DriveInfo *fd[MAX_FD];
1527 qemu_irq *a20_line;
1528 ISADevice *i8042, *port92, *vmmouse;
1529
def337ff 1530 serial_hds_isa_init(isa_bus, 0, MAX_ISA_SERIAL_PORTS);
ac64273c
PMD
1531 parallel_hds_isa_init(isa_bus, MAX_PARALLEL_PORTS);
1532
1533 for (i = 0; i < MAX_FD; i++) {
1534 fd[i] = drive_get(IF_FLOPPY, 0, i);
1535 create_fdctrl |= !!fd[i];
1536 }
1537 if (create_fdctrl) {
1538 fdctrl_init_isa(isa_bus, fd);
1539 }
1540
1541 i8042 = isa_create_simple(isa_bus, "i8042");
1542 if (!no_vmport) {
1543 vmport_init(isa_bus);
1544 vmmouse = isa_try_create(isa_bus, "vmmouse");
1545 } else {
1546 vmmouse = NULL;
1547 }
1548 if (vmmouse) {
1549 DeviceState *dev = DEVICE(vmmouse);
1550 qdev_prop_set_ptr(dev, "ps2_mouse", i8042);
1551 qdev_init_nofail(dev);
1552 }
1553 port92 = isa_create_simple(isa_bus, "port92");
1554
1555 a20_line = qemu_allocate_irqs(handle_a20_line_change, first_cpu, 2);
1556 i8042_setup_a20_line(i8042, a20_line[0]);
1557 port92_init(port92, a20_line[1]);
1558 g_free(a20_line);
1559}
1560
48a18b3c 1561void pc_basic_device_init(ISABus *isa_bus, qemu_irq *gsi,
1611977c 1562 ISADevice **rtc_state,
fd53c87c 1563 bool create_fdctrl,
7a10ef51 1564 bool no_vmport,
feddd2fd 1565 bool has_pit,
3a87d009 1566 uint32_t hpet_irqs)
ffe513da
IY
1567{
1568 int i;
ce967e2f
JK
1569 DeviceState *hpet = NULL;
1570 int pit_isa_irq = 0;
1571 qemu_irq pit_alt_irq = NULL;
7d932dfd 1572 qemu_irq rtc_irq = NULL;
ac64273c 1573 ISADevice *pit = NULL;
258711c6
JG
1574 MemoryRegion *ioport80_io = g_new(MemoryRegion, 1);
1575 MemoryRegion *ioportF0_io = g_new(MemoryRegion, 1);
ffe513da 1576
2c9b15ca 1577 memory_region_init_io(ioport80_io, NULL, &ioport80_io_ops, NULL, "ioport80", 1);
258711c6 1578 memory_region_add_subregion(isa_bus->address_space_io, 0x80, ioport80_io);
ffe513da 1579
2c9b15ca 1580 memory_region_init_io(ioportF0_io, NULL, &ioportF0_io_ops, NULL, "ioportF0", 1);
258711c6 1581 memory_region_add_subregion(isa_bus->address_space_io, 0xf0, ioportF0_io);
ffe513da 1582
5d17c0d2
JK
1583 /*
1584 * Check if an HPET shall be created.
1585 *
1586 * Without KVM_CAP_PIT_STATE2, we cannot switch off the in-kernel PIT
1587 * when the HPET wants to take over. Thus we have to disable the latter.
1588 */
1589 if (!no_hpet && (!kvm_irqchip_in_kernel() || kvm_has_pit_state2())) {
7a10ef51 1590 /* In order to set property, here not using sysbus_try_create_simple */
51116102 1591 hpet = qdev_try_create(NULL, TYPE_HPET);
dd703b99 1592 if (hpet) {
7a10ef51
LPF
1593 /* For pc-piix-*, hpet's intcap is always IRQ2. For pc-q35-1.7
1594 * and earlier, use IRQ2 for compat. Otherwise, use IRQ16~23,
1595 * IRQ8 and IRQ2.
1596 */
5d7fb0f2 1597 uint8_t compat = object_property_get_uint(OBJECT(hpet),
7a10ef51
LPF
1598 HPET_INTCAP, NULL);
1599 if (!compat) {
1600 qdev_prop_set_uint32(hpet, HPET_INTCAP, hpet_irqs);
1601 }
1602 qdev_init_nofail(hpet);
1603 sysbus_mmio_map(SYS_BUS_DEVICE(hpet), 0, HPET_BASE);
1604
b881fbe9 1605 for (i = 0; i < GSI_NUM_PINS; i++) {
1356b98d 1606 sysbus_connect_irq(SYS_BUS_DEVICE(hpet), i, gsi[i]);
dd703b99 1607 }
ce967e2f
JK
1608 pit_isa_irq = -1;
1609 pit_alt_irq = qdev_get_gpio_in(hpet, HPET_LEGACY_PIT_INT);
1610 rtc_irq = qdev_get_gpio_in(hpet, HPET_LEGACY_RTC_INT);
822557eb 1611 }
ffe513da 1612 }
6c646a11 1613 *rtc_state = mc146818_rtc_init(isa_bus, 2000, rtc_irq);
7d932dfd
JK
1614
1615 qemu_register_boot_set(pc_boot_set, *rtc_state);
1616
feddd2fd 1617 if (!xen_enabled() && has_pit) {
15eafc2e 1618 if (kvm_pit_in_kernel()) {
c2d8d311
SS
1619 pit = kvm_pit_init(isa_bus, 0x40);
1620 } else {
acf695ec 1621 pit = i8254_pit_init(isa_bus, 0x40, pit_isa_irq, pit_alt_irq);
c2d8d311
SS
1622 }
1623 if (hpet) {
1624 /* connect PIT to output control line of the HPET */
4a17cc4f 1625 qdev_connect_gpio_out(hpet, 0, qdev_get_gpio_in(DEVICE(pit), 0));
c2d8d311
SS
1626 }
1627 pcspk_init(isa_bus, pit);
ce967e2f 1628 }
ffe513da 1629
55f613ac 1630 i8257_dma_init(isa_bus, 0);
ffe513da 1631
ac64273c
PMD
1632 /* Super I/O */
1633 pc_superio_init(isa_bus, create_fdctrl, no_vmport);
ffe513da
IY
1634}
1635
4b9c264b 1636void pc_nic_init(PCMachineClass *pcmc, ISABus *isa_bus, PCIBus *pci_bus)
9011a1a7
IY
1637{
1638 int i;
1639
bab47d9a 1640 rom_set_order_override(FW_CFG_ORDER_OVERRIDE_NIC);
9011a1a7
IY
1641 for (i = 0; i < nb_nics; i++) {
1642 NICInfo *nd = &nd_table[i];
4b9c264b 1643 const char *model = nd->model ? nd->model : pcmc->default_nic_model;
9011a1a7 1644
4b9c264b 1645 if (g_str_equal(model, "ne2k_isa")) {
9011a1a7
IY
1646 pc_init_ne2k_isa(isa_bus, nd);
1647 } else {
4b9c264b 1648 pci_nic_init_nofail(nd, pci_bus, model, NULL);
9011a1a7
IY
1649 }
1650 }
bab47d9a 1651 rom_reset_order_override();
9011a1a7
IY
1652}
1653
a39e3564
JB
1654void ioapic_init_gsi(GSIState *gsi_state, const char *parent_name)
1655{
1656 DeviceState *dev;
1657 SysBusDevice *d;
1658 unsigned int i;
1659
15eafc2e 1660 if (kvm_ioapic_in_kernel()) {
a39e3564
JB
1661 dev = qdev_create(NULL, "kvm-ioapic");
1662 } else {
1663 dev = qdev_create(NULL, "ioapic");
1664 }
1665 if (parent_name) {
1666 object_property_add_child(object_resolve_path(parent_name, NULL),
1667 "ioapic", OBJECT(dev), NULL);
1668 }
1669 qdev_init_nofail(dev);
1356b98d 1670 d = SYS_BUS_DEVICE(dev);
3a4a4697 1671 sysbus_mmio_map(d, 0, IO_APIC_DEFAULT_ADDRESS);
a39e3564
JB
1672
1673 for (i = 0; i < IOAPIC_NUM_PINS; i++) {
1674 gsi_state->ioapic_irq[i] = qdev_get_gpio_in(dev, i);
1675 }
1676}
d5747cac 1677
95bee274
IM
1678static void pc_dimm_plug(HotplugHandler *hotplug_dev,
1679 DeviceState *dev, Error **errp)
1680{
3fbcdc27 1681 HotplugHandlerClass *hhc;
95bee274
IM
1682 Error *local_err = NULL;
1683 PCMachineState *pcms = PC_MACHINE(hotplug_dev);
16a9e8a5 1684 PCMachineClass *pcmc = PC_MACHINE_GET_CLASS(pcms);
95bee274
IM
1685 PCDIMMDevice *dimm = PC_DIMM(dev);
1686 PCDIMMDeviceClass *ddc = PC_DIMM_GET_CLASS(dimm);
04790978 1687 MemoryRegion *mr;
92a37a04 1688 uint64_t align = TARGET_PAGE_SIZE;
7f3cf2d6 1689 bool is_nvdimm = object_dynamic_cast(OBJECT(dev), TYPE_NVDIMM);
95bee274 1690
04790978
TH
1691 mr = ddc->get_memory_region(dimm, &local_err);
1692 if (local_err) {
1693 goto out;
1694 }
1695
16a9e8a5 1696 if (memory_region_get_alignment(mr) && pcmc->enforce_aligned_dimm) {
91aa70ab
IM
1697 align = memory_region_get_alignment(mr);
1698 }
1699
8cd91ace
HZ
1700 /*
1701 * When -no-acpi is used with Q35 machine type, no ACPI is built,
1702 * but pcms->acpi_dev is still created. Check !acpi_enabled in
1703 * addition to cover this case.
1704 */
1705 if (!pcms->acpi_dev || !acpi_enabled) {
3fbcdc27 1706 error_setg(&local_err,
8cd91ace 1707 "memory hotplug is not enabled: missing acpi device or acpi disabled");
3fbcdc27
IM
1708 goto out;
1709 }
1710
7f3cf2d6
SH
1711 if (is_nvdimm && !pcms->acpi_nvdimm_state.is_enabled) {
1712 error_setg(&local_err,
1713 "nvdimm is not enabled: missing 'nvdimm' in '-M'");
1714 goto out;
1715 }
1716
bd6c3e4a 1717 pc_dimm_memory_plug(dev, MACHINE(pcms), align, &local_err);
43bbb49e 1718 if (local_err) {
b8865591
IM
1719 goto out;
1720 }
1721
7f3cf2d6 1722 if (is_nvdimm) {
284197e4 1723 nvdimm_plug(&pcms->acpi_nvdimm_state);
c7f8d0f3
XG
1724 }
1725
3fbcdc27 1726 hhc = HOTPLUG_HANDLER_GET_CLASS(pcms->acpi_dev);
8e23184b 1727 hhc->plug(HOTPLUG_HANDLER(pcms->acpi_dev), dev, &error_abort);
95bee274
IM
1728out:
1729 error_propagate(errp, local_err);
1730}
1731
64fec58e
TC
1732static void pc_dimm_unplug_request(HotplugHandler *hotplug_dev,
1733 DeviceState *dev, Error **errp)
1734{
1735 HotplugHandlerClass *hhc;
1736 Error *local_err = NULL;
1737 PCMachineState *pcms = PC_MACHINE(hotplug_dev);
1738
8cd91ace
HZ
1739 /*
1740 * When -no-acpi is used with Q35 machine type, no ACPI is built,
1741 * but pcms->acpi_dev is still created. Check !acpi_enabled in
1742 * addition to cover this case.
1743 */
1744 if (!pcms->acpi_dev || !acpi_enabled) {
64fec58e 1745 error_setg(&local_err,
8cd91ace 1746 "memory hotplug is not enabled: missing acpi device or acpi disabled");
64fec58e
TC
1747 goto out;
1748 }
1749
b097cc52
XG
1750 if (object_dynamic_cast(OBJECT(dev), TYPE_NVDIMM)) {
1751 error_setg(&local_err,
1752 "nvdimm device hot unplug is not supported yet.");
1753 goto out;
1754 }
1755
64fec58e
TC
1756 hhc = HOTPLUG_HANDLER_GET_CLASS(pcms->acpi_dev);
1757 hhc->unplug_request(HOTPLUG_HANDLER(pcms->acpi_dev), dev, &local_err);
1758
1759out:
1760 error_propagate(errp, local_err);
1761}
1762
f7d3e29d
TC
1763static void pc_dimm_unplug(HotplugHandler *hotplug_dev,
1764 DeviceState *dev, Error **errp)
1765{
1766 PCMachineState *pcms = PC_MACHINE(hotplug_dev);
f7d3e29d
TC
1767 HotplugHandlerClass *hhc;
1768 Error *local_err = NULL;
1769
1770 hhc = HOTPLUG_HANDLER_GET_CLASS(pcms->acpi_dev);
1771 hhc->unplug(HOTPLUG_HANDLER(pcms->acpi_dev), dev, &local_err);
1772
1773 if (local_err) {
1774 goto out;
1775 }
1776
bd6c3e4a 1777 pc_dimm_memory_unplug(dev, MACHINE(pcms));
f7d3e29d
TC
1778 object_unparent(OBJECT(dev));
1779
1780 out:
1781 error_propagate(errp, local_err);
1782}
1783
3811ef14
IM
1784static int pc_apic_cmp(const void *a, const void *b)
1785{
1786 CPUArchId *apic_a = (CPUArchId *)a;
1787 CPUArchId *apic_b = (CPUArchId *)b;
1788
1789 return apic_a->arch_id - apic_b->arch_id;
1790}
1791
7baef5cf 1792/* returns pointer to CPUArchId descriptor that matches CPU's apic_id
38690a1c 1793 * in ms->possible_cpus->cpus, if ms->possible_cpus->cpus has no
b12227af 1794 * entry corresponding to CPU's apic_id returns NULL.
7baef5cf 1795 */
1ea69c0e 1796static CPUArchId *pc_find_cpu_slot(MachineState *ms, uint32_t id, int *idx)
7baef5cf 1797{
7baef5cf
IM
1798 CPUArchId apic_id, *found_cpu;
1799
1ea69c0e 1800 apic_id.arch_id = id;
38690a1c
IM
1801 found_cpu = bsearch(&apic_id, ms->possible_cpus->cpus,
1802 ms->possible_cpus->len, sizeof(*ms->possible_cpus->cpus),
7baef5cf
IM
1803 pc_apic_cmp);
1804 if (found_cpu && idx) {
38690a1c 1805 *idx = found_cpu - ms->possible_cpus->cpus;
7baef5cf
IM
1806 }
1807 return found_cpu;
1808}
1809
5279569e
GZ
1810static void pc_cpu_plug(HotplugHandler *hotplug_dev,
1811 DeviceState *dev, Error **errp)
1812{
7baef5cf 1813 CPUArchId *found_cpu;
5279569e
GZ
1814 HotplugHandlerClass *hhc;
1815 Error *local_err = NULL;
1ea69c0e 1816 X86CPU *cpu = X86_CPU(dev);
5279569e
GZ
1817 PCMachineState *pcms = PC_MACHINE(hotplug_dev);
1818
a44a49db
IM
1819 if (pcms->acpi_dev) {
1820 hhc = HOTPLUG_HANDLER_GET_CLASS(pcms->acpi_dev);
1821 hhc->plug(HOTPLUG_HANDLER(pcms->acpi_dev), dev, &local_err);
1822 if (local_err) {
1823 goto out;
1824 }
5279569e
GZ
1825 }
1826
e3cadac0
IM
1827 /* increment the number of CPUs */
1828 pcms->boot_cpus++;
26ef65be 1829 if (pcms->rtc) {
e3cadac0 1830 rtc_set_cpus_count(pcms->rtc, pcms->boot_cpus);
26ef65be
IM
1831 }
1832 if (pcms->fw_cfg) {
e3cadac0 1833 fw_cfg_modify_i16(pcms->fw_cfg, FW_CFG_NB_CPUS, pcms->boot_cpus);
2d996150
GZ
1834 }
1835
1ea69c0e 1836 found_cpu = pc_find_cpu_slot(MACHINE(pcms), cpu->apic_id, NULL);
8aba3842 1837 found_cpu->cpu = OBJECT(dev);
5279569e
GZ
1838out:
1839 error_propagate(errp, local_err);
1840}
8872c25a
IM
1841static void pc_cpu_unplug_request_cb(HotplugHandler *hotplug_dev,
1842 DeviceState *dev, Error **errp)
1843{
73360e27 1844 int idx = -1;
8872c25a
IM
1845 HotplugHandlerClass *hhc;
1846 Error *local_err = NULL;
1ea69c0e 1847 X86CPU *cpu = X86_CPU(dev);
8872c25a
IM
1848 PCMachineState *pcms = PC_MACHINE(hotplug_dev);
1849
75ba2ddb
IM
1850 if (!pcms->acpi_dev) {
1851 error_setg(&local_err, "CPU hot unplug not supported without ACPI");
1852 goto out;
1853 }
1854
1ea69c0e 1855 pc_find_cpu_slot(MACHINE(pcms), cpu->apic_id, &idx);
73360e27
IM
1856 assert(idx != -1);
1857 if (idx == 0) {
1858 error_setg(&local_err, "Boot CPU is unpluggable");
1859 goto out;
1860 }
1861
8872c25a
IM
1862 hhc = HOTPLUG_HANDLER_GET_CLASS(pcms->acpi_dev);
1863 hhc->unplug_request(HOTPLUG_HANDLER(pcms->acpi_dev), dev, &local_err);
1864
1865 if (local_err) {
1866 goto out;
1867 }
1868
1869 out:
1870 error_propagate(errp, local_err);
1871
1872}
1873
1874static void pc_cpu_unplug_cb(HotplugHandler *hotplug_dev,
1875 DeviceState *dev, Error **errp)
1876{
8fe6374e 1877 CPUArchId *found_cpu;
8872c25a
IM
1878 HotplugHandlerClass *hhc;
1879 Error *local_err = NULL;
1ea69c0e 1880 X86CPU *cpu = X86_CPU(dev);
8872c25a
IM
1881 PCMachineState *pcms = PC_MACHINE(hotplug_dev);
1882
1883 hhc = HOTPLUG_HANDLER_GET_CLASS(pcms->acpi_dev);
1884 hhc->unplug(HOTPLUG_HANDLER(pcms->acpi_dev), dev, &local_err);
1885
1886 if (local_err) {
1887 goto out;
1888 }
1889
1ea69c0e 1890 found_cpu = pc_find_cpu_slot(MACHINE(pcms), cpu->apic_id, NULL);
8fe6374e
IM
1891 found_cpu->cpu = NULL;
1892 object_unparent(OBJECT(dev));
8872c25a 1893
e3cadac0
IM
1894 /* decrement the number of CPUs */
1895 pcms->boot_cpus--;
1896 /* Update the number of CPUs in CMOS */
1897 rtc_set_cpus_count(pcms->rtc, pcms->boot_cpus);
1898 fw_cfg_modify_i16(pcms->fw_cfg, FW_CFG_NB_CPUS, pcms->boot_cpus);
8872c25a
IM
1899 out:
1900 error_propagate(errp, local_err);
1901}
5279569e 1902
4ec60c76
IM
1903static void pc_cpu_pre_plug(HotplugHandler *hotplug_dev,
1904 DeviceState *dev, Error **errp)
1905{
1906 int idx;
a15d2728 1907 CPUState *cs;
e8f7b83e 1908 CPUArchId *cpu_slot;
d89c2b8b 1909 X86CPUTopoInfo topo;
4ec60c76 1910 X86CPU *cpu = X86_CPU(dev);
6970c5ff 1911 MachineState *ms = MACHINE(hotplug_dev);
4ec60c76 1912 PCMachineState *pcms = PC_MACHINE(hotplug_dev);
4ec60c76 1913
6970c5ff
IM
1914 if(!object_dynamic_cast(OBJECT(cpu), ms->cpu_type)) {
1915 error_setg(errp, "Invalid CPU type, expected cpu type: '%s'",
1916 ms->cpu_type);
1917 return;
1918 }
1919
e8f7b83e
IM
1920 /* if APIC ID is not set, set it based on socket/core/thread properties */
1921 if (cpu->apic_id == UNASSIGNED_APIC_ID) {
1922 int max_socket = (max_cpus - 1) / smp_threads / smp_cores;
1923
1924 if (cpu->socket_id < 0) {
1925 error_setg(errp, "CPU socket-id is not set");
1926 return;
1927 } else if (cpu->socket_id > max_socket) {
1928 error_setg(errp, "Invalid CPU socket-id: %u must be in range 0:%u",
1929 cpu->socket_id, max_socket);
1930 return;
1931 }
1932 if (cpu->core_id < 0) {
1933 error_setg(errp, "CPU core-id is not set");
1934 return;
1935 } else if (cpu->core_id > (smp_cores - 1)) {
1936 error_setg(errp, "Invalid CPU core-id: %u must be in range 0:%u",
1937 cpu->core_id, smp_cores - 1);
1938 return;
1939 }
1940 if (cpu->thread_id < 0) {
1941 error_setg(errp, "CPU thread-id is not set");
1942 return;
1943 } else if (cpu->thread_id > (smp_threads - 1)) {
1944 error_setg(errp, "Invalid CPU thread-id: %u must be in range 0:%u",
1945 cpu->thread_id, smp_threads - 1);
1946 return;
1947 }
1948
1949 topo.pkg_id = cpu->socket_id;
1950 topo.core_id = cpu->core_id;
1951 topo.smt_id = cpu->thread_id;
1952 cpu->apic_id = apicid_from_topo_ids(smp_cores, smp_threads, &topo);
1953 }
1954
1ea69c0e 1955 cpu_slot = pc_find_cpu_slot(MACHINE(pcms), cpu->apic_id, &idx);
4ec60c76 1956 if (!cpu_slot) {
38690a1c
IM
1957 MachineState *ms = MACHINE(pcms);
1958
e8f7b83e
IM
1959 x86_topo_ids_from_apicid(cpu->apic_id, smp_cores, smp_threads, &topo);
1960 error_setg(errp, "Invalid CPU [socket: %u, core: %u, thread: %u] with"
1961 " APIC ID %" PRIu32 ", valid index range 0:%d",
1962 topo.pkg_id, topo.core_id, topo.smt_id, cpu->apic_id,
38690a1c 1963 ms->possible_cpus->len - 1);
4ec60c76
IM
1964 return;
1965 }
1966
1967 if (cpu_slot->cpu) {
1968 error_setg(errp, "CPU[%d] with APIC ID %" PRIu32 " exists",
1969 idx, cpu->apic_id);
1970 return;
1971 }
d89c2b8b
IM
1972
1973 /* if 'address' properties socket-id/core-id/thread-id are not set, set them
c5514d0e 1974 * so that machine_query_hotpluggable_cpus would show correct values
d89c2b8b
IM
1975 */
1976 /* TODO: move socket_id/core_id/thread_id checks into x86_cpu_realizefn()
1977 * once -smp refactoring is complete and there will be CPU private
1978 * CPUState::nr_cores and CPUState::nr_threads fields instead of globals */
1979 x86_topo_ids_from_apicid(cpu->apic_id, smp_cores, smp_threads, &topo);
1980 if (cpu->socket_id != -1 && cpu->socket_id != topo.pkg_id) {
1981 error_setg(errp, "property socket-id: %u doesn't match set apic-id:"
1982 " 0x%x (socket-id: %u)", cpu->socket_id, cpu->apic_id, topo.pkg_id);
1983 return;
1984 }
1985 cpu->socket_id = topo.pkg_id;
1986
1987 if (cpu->core_id != -1 && cpu->core_id != topo.core_id) {
1988 error_setg(errp, "property core-id: %u doesn't match set apic-id:"
1989 " 0x%x (core-id: %u)", cpu->core_id, cpu->apic_id, topo.core_id);
1990 return;
1991 }
1992 cpu->core_id = topo.core_id;
1993
1994 if (cpu->thread_id != -1 && cpu->thread_id != topo.smt_id) {
1995 error_setg(errp, "property thread-id: %u doesn't match set apic-id:"
1996 " 0x%x (thread-id: %u)", cpu->thread_id, cpu->apic_id, topo.smt_id);
1997 return;
1998 }
1999 cpu->thread_id = topo.smt_id;
a15d2728
IM
2000
2001 cs = CPU(cpu);
2002 cs->cpu_index = idx;
93b2a8cb 2003
a0ceb640 2004 numa_cpu_pre_plug(cpu_slot, dev, errp);
4ec60c76
IM
2005}
2006
2007static void pc_machine_device_pre_plug_cb(HotplugHandler *hotplug_dev,
2008 DeviceState *dev, Error **errp)
2009{
2010 if (object_dynamic_cast(OBJECT(dev), TYPE_CPU)) {
2011 pc_cpu_pre_plug(hotplug_dev, dev, errp);
2012 }
2013}
2014
95bee274
IM
2015static void pc_machine_device_plug_cb(HotplugHandler *hotplug_dev,
2016 DeviceState *dev, Error **errp)
2017{
2018 if (object_dynamic_cast(OBJECT(dev), TYPE_PC_DIMM)) {
2019 pc_dimm_plug(hotplug_dev, dev, errp);
5279569e
GZ
2020 } else if (object_dynamic_cast(OBJECT(dev), TYPE_CPU)) {
2021 pc_cpu_plug(hotplug_dev, dev, errp);
95bee274
IM
2022 }
2023}
2024
d9c5c5b8
TC
2025static void pc_machine_device_unplug_request_cb(HotplugHandler *hotplug_dev,
2026 DeviceState *dev, Error **errp)
2027{
64fec58e
TC
2028 if (object_dynamic_cast(OBJECT(dev), TYPE_PC_DIMM)) {
2029 pc_dimm_unplug_request(hotplug_dev, dev, errp);
8872c25a
IM
2030 } else if (object_dynamic_cast(OBJECT(dev), TYPE_CPU)) {
2031 pc_cpu_unplug_request_cb(hotplug_dev, dev, errp);
64fec58e
TC
2032 } else {
2033 error_setg(errp, "acpi: device unplug request for not supported device"
2034 " type: %s", object_get_typename(OBJECT(dev)));
2035 }
d9c5c5b8
TC
2036}
2037
232391c1
TC
2038static void pc_machine_device_unplug_cb(HotplugHandler *hotplug_dev,
2039 DeviceState *dev, Error **errp)
2040{
f7d3e29d
TC
2041 if (object_dynamic_cast(OBJECT(dev), TYPE_PC_DIMM)) {
2042 pc_dimm_unplug(hotplug_dev, dev, errp);
8872c25a
IM
2043 } else if (object_dynamic_cast(OBJECT(dev), TYPE_CPU)) {
2044 pc_cpu_unplug_cb(hotplug_dev, dev, errp);
f7d3e29d
TC
2045 } else {
2046 error_setg(errp, "acpi: device unplug for not supported device"
2047 " type: %s", object_get_typename(OBJECT(dev)));
2048 }
232391c1
TC
2049}
2050
95bee274
IM
2051static HotplugHandler *pc_get_hotpug_handler(MachineState *machine,
2052 DeviceState *dev)
2053{
5279569e
GZ
2054 if (object_dynamic_cast(OBJECT(dev), TYPE_PC_DIMM) ||
2055 object_dynamic_cast(OBJECT(dev), TYPE_CPU)) {
95bee274
IM
2056 return HOTPLUG_HANDLER(machine);
2057 }
2058
38aefb57 2059 return NULL;
95bee274
IM
2060}
2061
bf1e8939 2062static void
f2ffbe2b
DH
2063pc_machine_get_device_memory_region_size(Object *obj, Visitor *v,
2064 const char *name, void *opaque,
2065 Error **errp)
bf1e8939 2066{
b0c14ec4
DH
2067 MachineState *ms = MACHINE(obj);
2068 int64_t value = memory_region_size(&ms->device_memory->mr);
bf1e8939 2069
51e72bc1 2070 visit_type_int(v, name, &value, errp);
bf1e8939
IM
2071}
2072
c87b1520 2073static void pc_machine_get_max_ram_below_4g(Object *obj, Visitor *v,
d7bce999
EB
2074 const char *name, void *opaque,
2075 Error **errp)
c87b1520
DS
2076{
2077 PCMachineState *pcms = PC_MACHINE(obj);
2078 uint64_t value = pcms->max_ram_below_4g;
2079
51e72bc1 2080 visit_type_size(v, name, &value, errp);
c87b1520
DS
2081}
2082
2083static void pc_machine_set_max_ram_below_4g(Object *obj, Visitor *v,
d7bce999
EB
2084 const char *name, void *opaque,
2085 Error **errp)
c87b1520
DS
2086{
2087 PCMachineState *pcms = PC_MACHINE(obj);
2088 Error *error = NULL;
2089 uint64_t value;
2090
51e72bc1 2091 visit_type_size(v, name, &value, &error);
c87b1520
DS
2092 if (error) {
2093 error_propagate(errp, error);
2094 return;
2095 }
2096 if (value > (1ULL << 32)) {
455b0fde
EB
2097 error_setg(&error,
2098 "Machine option 'max-ram-below-4g=%"PRIu64
2099 "' expects size less than or equal to 4G", value);
c87b1520
DS
2100 error_propagate(errp, error);
2101 return;
2102 }
2103
2104 if (value < (1ULL << 20)) {
9e5d2c52
AF
2105 warn_report("Only %" PRIu64 " bytes of RAM below the 4GiB boundary,"
2106 "BIOS may not work with less than 1MiB", value);
c87b1520
DS
2107 }
2108
2109 pcms->max_ram_below_4g = value;
2110}
2111
d7bce999
EB
2112static void pc_machine_get_vmport(Object *obj, Visitor *v, const char *name,
2113 void *opaque, Error **errp)
9b23cfb7
DDAG
2114{
2115 PCMachineState *pcms = PC_MACHINE(obj);
d1048bef 2116 OnOffAuto vmport = pcms->vmport;
9b23cfb7 2117
51e72bc1 2118 visit_type_OnOffAuto(v, name, &vmport, errp);
9b23cfb7
DDAG
2119}
2120
d7bce999
EB
2121static void pc_machine_set_vmport(Object *obj, Visitor *v, const char *name,
2122 void *opaque, Error **errp)
9b23cfb7
DDAG
2123{
2124 PCMachineState *pcms = PC_MACHINE(obj);
2125
51e72bc1 2126 visit_type_OnOffAuto(v, name, &pcms->vmport, errp);
9b23cfb7
DDAG
2127}
2128
355023f2
PB
2129bool pc_machine_is_smm_enabled(PCMachineState *pcms)
2130{
2131 bool smm_available = false;
2132
2133 if (pcms->smm == ON_OFF_AUTO_OFF) {
2134 return false;
2135 }
2136
2137 if (tcg_enabled() || qtest_enabled()) {
2138 smm_available = true;
2139 } else if (kvm_enabled()) {
2140 smm_available = kvm_has_smm();
2141 }
2142
2143 if (smm_available) {
2144 return true;
2145 }
2146
2147 if (pcms->smm == ON_OFF_AUTO_ON) {
2148 error_report("System Management Mode not supported by this hypervisor.");
2149 exit(1);
2150 }
2151 return false;
2152}
2153
d7bce999
EB
2154static void pc_machine_get_smm(Object *obj, Visitor *v, const char *name,
2155 void *opaque, Error **errp)
355023f2
PB
2156{
2157 PCMachineState *pcms = PC_MACHINE(obj);
2158 OnOffAuto smm = pcms->smm;
2159
51e72bc1 2160 visit_type_OnOffAuto(v, name, &smm, errp);
355023f2
PB
2161}
2162
d7bce999
EB
2163static void pc_machine_set_smm(Object *obj, Visitor *v, const char *name,
2164 void *opaque, Error **errp)
355023f2
PB
2165{
2166 PCMachineState *pcms = PC_MACHINE(obj);
2167
51e72bc1 2168 visit_type_OnOffAuto(v, name, &pcms->smm, errp);
355023f2
PB
2169}
2170
87252e1b
XG
2171static bool pc_machine_get_nvdimm(Object *obj, Error **errp)
2172{
2173 PCMachineState *pcms = PC_MACHINE(obj);
2174
5fe79386 2175 return pcms->acpi_nvdimm_state.is_enabled;
87252e1b
XG
2176}
2177
2178static void pc_machine_set_nvdimm(Object *obj, bool value, Error **errp)
2179{
2180 PCMachineState *pcms = PC_MACHINE(obj);
2181
5fe79386 2182 pcms->acpi_nvdimm_state.is_enabled = value;
87252e1b
XG
2183}
2184
be232eb0
CP
2185static bool pc_machine_get_smbus(Object *obj, Error **errp)
2186{
2187 PCMachineState *pcms = PC_MACHINE(obj);
2188
2189 return pcms->smbus;
2190}
2191
2192static void pc_machine_set_smbus(Object *obj, bool value, Error **errp)
2193{
2194 PCMachineState *pcms = PC_MACHINE(obj);
2195
2196 pcms->smbus = value;
2197}
2198
272f0428
CP
2199static bool pc_machine_get_sata(Object *obj, Error **errp)
2200{
2201 PCMachineState *pcms = PC_MACHINE(obj);
2202
2203 return pcms->sata;
2204}
2205
2206static void pc_machine_set_sata(Object *obj, bool value, Error **errp)
2207{
2208 PCMachineState *pcms = PC_MACHINE(obj);
2209
2210 pcms->sata = value;
2211}
2212
feddd2fd
CP
2213static bool pc_machine_get_pit(Object *obj, Error **errp)
2214{
2215 PCMachineState *pcms = PC_MACHINE(obj);
2216
2217 return pcms->pit;
2218}
2219
2220static void pc_machine_set_pit(Object *obj, bool value, Error **errp)
2221{
2222 PCMachineState *pcms = PC_MACHINE(obj);
2223
2224 pcms->pit = value;
2225}
2226
bf1e8939
IM
2227static void pc_machine_initfn(Object *obj)
2228{
c87b1520
DS
2229 PCMachineState *pcms = PC_MACHINE(obj);
2230
5ec7d098 2231 pcms->max_ram_below_4g = 0; /* use default */
355023f2 2232 pcms->smm = ON_OFF_AUTO_AUTO;
d1048bef 2233 pcms->vmport = ON_OFF_AUTO_AUTO;
87252e1b 2234 /* nvdimm is disabled on default. */
5fe79386 2235 pcms->acpi_nvdimm_state.is_enabled = false;
021746c1
WL
2236 /* acpi build is enabled by default if machine supports it */
2237 pcms->acpi_build_enabled = PC_MACHINE_GET_CLASS(pcms)->has_acpi_build;
be232eb0 2238 pcms->smbus = true;
272f0428 2239 pcms->sata = true;
feddd2fd 2240 pcms->pit = true;
bf1e8939
IM
2241}
2242
ae50c55a
ZG
2243static void pc_machine_reset(void)
2244{
2245 CPUState *cs;
2246 X86CPU *cpu;
2247
2248 qemu_devices_reset();
2249
2250 /* Reset APIC after devices have been reset to cancel
2251 * any changes that qemu_devices_reset() might have done.
2252 */
2253 CPU_FOREACH(cs) {
2254 cpu = X86_CPU(cs);
2255
2256 if (cpu->apic_state) {
2257 device_reset(cpu->apic_state);
2258 }
2259 }
2260}
2261
ea089eeb
IM
2262static CpuInstanceProperties
2263pc_cpu_index_to_props(MachineState *ms, unsigned cpu_index)
fb43b73b 2264{
ea089eeb
IM
2265 MachineClass *mc = MACHINE_GET_CLASS(ms);
2266 const CPUArchIdList *possible_cpus = mc->possible_cpu_arch_ids(ms);
2267
2268 assert(cpu_index < possible_cpus->len);
2269 return possible_cpus->cpus[cpu_index].props;
fb43b73b
IM
2270}
2271
79e07936
IM
2272static int64_t pc_get_default_cpu_node_id(const MachineState *ms, int idx)
2273{
2274 X86CPUTopoInfo topo;
2275
2276 assert(idx < ms->possible_cpus->len);
2277 x86_topo_ids_from_apicid(ms->possible_cpus->cpus[idx].arch_id,
2278 smp_cores, smp_threads, &topo);
2279 return topo.pkg_id % nb_numa_nodes;
2280}
2281
c96a1c0b 2282static const CPUArchIdList *pc_possible_cpu_arch_ids(MachineState *ms)
3811ef14 2283{
c96a1c0b
IM
2284 int i;
2285
2286 if (ms->possible_cpus) {
2287 /*
2288 * make sure that max_cpus hasn't changed since the first use, i.e.
2289 * -smp hasn't been parsed after it
2290 */
2291 assert(ms->possible_cpus->len == max_cpus);
2292 return ms->possible_cpus;
2293 }
2294
2295 ms->possible_cpus = g_malloc0(sizeof(CPUArchIdList) +
2296 sizeof(CPUArchId) * max_cpus);
2297 ms->possible_cpus->len = max_cpus;
2298 for (i = 0; i < ms->possible_cpus->len; i++) {
c67ae933
IM
2299 X86CPUTopoInfo topo;
2300
d342eb76 2301 ms->possible_cpus->cpus[i].type = ms->cpu_type;
f2d672c2 2302 ms->possible_cpus->cpus[i].vcpus_count = 1;
c96a1c0b 2303 ms->possible_cpus->cpus[i].arch_id = x86_cpu_apic_id_from_index(i);
c67ae933
IM
2304 x86_topo_ids_from_apicid(ms->possible_cpus->cpus[i].arch_id,
2305 smp_cores, smp_threads, &topo);
2306 ms->possible_cpus->cpus[i].props.has_socket_id = true;
2307 ms->possible_cpus->cpus[i].props.socket_id = topo.pkg_id;
2308 ms->possible_cpus->cpus[i].props.has_core_id = true;
2309 ms->possible_cpus->cpus[i].props.core_id = topo.core_id;
2310 ms->possible_cpus->cpus[i].props.has_thread_id = true;
2311 ms->possible_cpus->cpus[i].props.thread_id = topo.smt_id;
c96a1c0b
IM
2312 }
2313 return ms->possible_cpus;
3811ef14
IM
2314}
2315
1255166b
BD
2316static void x86_nmi(NMIState *n, int cpu_index, Error **errp)
2317{
2318 /* cpu index isn't used */
2319 CPUState *cs;
2320
2321 CPU_FOREACH(cs) {
2322 X86CPU *cpu = X86_CPU(cs);
2323
2324 if (!cpu->apic_state) {
2325 cpu_interrupt(cs, CPU_INTERRUPT_NMI);
2326 } else {
2327 apic_deliver_nmi(cpu->apic_state);
2328 }
2329 }
2330}
2331
95bee274
IM
2332static void pc_machine_class_init(ObjectClass *oc, void *data)
2333{
2334 MachineClass *mc = MACHINE_CLASS(oc);
2335 PCMachineClass *pcmc = PC_MACHINE_CLASS(oc);
2336 HotplugHandlerClass *hc = HOTPLUG_HANDLER_CLASS(oc);
1255166b 2337 NMIClass *nc = NMI_CLASS(oc);
95bee274 2338
7102fa70
EH
2339 pcmc->pci_enabled = true;
2340 pcmc->has_acpi_build = true;
2341 pcmc->rsdp_in_ram = true;
2342 pcmc->smbios_defaults = true;
2343 pcmc->smbios_uuid_encoded = true;
2344 pcmc->gigabyte_align = true;
2345 pcmc->has_reserved_memory = true;
2346 pcmc->kvmclock_enabled = true;
16a9e8a5 2347 pcmc->enforce_aligned_dimm = true;
cd4040ec
EH
2348 /* BIOS ACPI tables: 128K. Other BIOS datastructures: less than 4K reported
2349 * to be used at the moment, 32K should be enough for a while. */
2350 pcmc->acpi_data_size = 0x20000 + 0x8000;
36f96c4b 2351 pcmc->save_tsc_khz = true;
98e753a6 2352 pcmc->linuxboot_dma_enabled = true;
debbdc00 2353 assert(!mc->get_hotplug_handler);
95bee274 2354 mc->get_hotplug_handler = pc_get_hotpug_handler;
ea089eeb 2355 mc->cpu_index_to_instance_props = pc_cpu_index_to_props;
79e07936 2356 mc->get_default_cpu_node_id = pc_get_default_cpu_node_id;
3811ef14 2357 mc->possible_cpu_arch_ids = pc_possible_cpu_arch_ids;
7b8be49d 2358 mc->auto_enable_numa_with_memhp = true;
c5514d0e 2359 mc->has_hotpluggable_cpus = true;
41742767 2360 mc->default_boot_order = "cad";
4458fb3a 2361 mc->hot_add_cpu = pc_hot_add_cpu;
2059839b 2362 mc->block_default_type = IF_IDE;
4458fb3a 2363 mc->max_cpus = 255;
ae50c55a 2364 mc->reset = pc_machine_reset;
4ec60c76 2365 hc->pre_plug = pc_machine_device_pre_plug_cb;
95bee274 2366 hc->plug = pc_machine_device_plug_cb;
d9c5c5b8 2367 hc->unplug_request = pc_machine_device_unplug_request_cb;
232391c1 2368 hc->unplug = pc_machine_device_unplug_cb;
1255166b 2369 nc->nmi_monitor_handler = x86_nmi;
311ca98d 2370 mc->default_cpu_type = TARGET_DEFAULT_CPU_TYPE;
0efc257d 2371
f2ffbe2b
DH
2372 object_class_property_add(oc, PC_MACHINE_DEVMEM_REGION_SIZE, "int",
2373 pc_machine_get_device_memory_region_size, NULL,
0efc257d
EH
2374 NULL, NULL, &error_abort);
2375
2376 object_class_property_add(oc, PC_MACHINE_MAX_RAM_BELOW_4G, "size",
2377 pc_machine_get_max_ram_below_4g, pc_machine_set_max_ram_below_4g,
2378 NULL, NULL, &error_abort);
2379
2380 object_class_property_set_description(oc, PC_MACHINE_MAX_RAM_BELOW_4G,
2381 "Maximum ram below the 4G boundary (32bit boundary)", &error_abort);
2382
2383 object_class_property_add(oc, PC_MACHINE_SMM, "OnOffAuto",
2384 pc_machine_get_smm, pc_machine_set_smm,
2385 NULL, NULL, &error_abort);
2386 object_class_property_set_description(oc, PC_MACHINE_SMM,
2387 "Enable SMM (pc & q35)", &error_abort);
2388
2389 object_class_property_add(oc, PC_MACHINE_VMPORT, "OnOffAuto",
2390 pc_machine_get_vmport, pc_machine_set_vmport,
2391 NULL, NULL, &error_abort);
2392 object_class_property_set_description(oc, PC_MACHINE_VMPORT,
2393 "Enable vmport (pc & q35)", &error_abort);
2394
2395 object_class_property_add_bool(oc, PC_MACHINE_NVDIMM,
2396 pc_machine_get_nvdimm, pc_machine_set_nvdimm, &error_abort);
be232eb0
CP
2397
2398 object_class_property_add_bool(oc, PC_MACHINE_SMBUS,
2399 pc_machine_get_smbus, pc_machine_set_smbus, &error_abort);
272f0428
CP
2400
2401 object_class_property_add_bool(oc, PC_MACHINE_SATA,
2402 pc_machine_get_sata, pc_machine_set_sata, &error_abort);
feddd2fd
CP
2403
2404 object_class_property_add_bool(oc, PC_MACHINE_PIT,
2405 pc_machine_get_pit, pc_machine_set_pit, &error_abort);
95bee274
IM
2406}
2407
d5747cac
IM
2408static const TypeInfo pc_machine_info = {
2409 .name = TYPE_PC_MACHINE,
2410 .parent = TYPE_MACHINE,
2411 .abstract = true,
2412 .instance_size = sizeof(PCMachineState),
bf1e8939 2413 .instance_init = pc_machine_initfn,
d5747cac 2414 .class_size = sizeof(PCMachineClass),
95bee274
IM
2415 .class_init = pc_machine_class_init,
2416 .interfaces = (InterfaceInfo[]) {
2417 { TYPE_HOTPLUG_HANDLER },
1255166b 2418 { TYPE_NMI },
95bee274
IM
2419 { }
2420 },
d5747cac
IM
2421};
2422
2423static void pc_machine_register_types(void)
2424{
2425 type_register_static(&pc_machine_info);
2426}
2427
2428type_init(pc_machine_register_types)