]> git.proxmox.com Git - qemu-server.git/blame - PVE/QemuServer.pm
add support for proxmox backup
[qemu-server.git] / PVE / QemuServer.pm
CommitLineData
1e3baf05
DM
1package PVE::QemuServer;
2
3use strict;
990fc5e2 4use warnings;
3ff84d6f 5
5da072fb
TL
6use Cwd 'abs_path';
7use Digest::SHA;
8use Fcntl ':flock';
9use Fcntl;
1e3baf05 10use File::Basename;
5da072fb 11use File::Copy qw(copy);
1e3baf05
DM
12use File::Path;
13use File::stat;
14use Getopt::Long;
5da072fb
TL
15use IO::Dir;
16use IO::File;
17use IO::Handle;
18use IO::Select;
19use IO::Socket::UNIX;
1e3baf05 20use IPC::Open3;
c971c4f2 21use JSON;
1f30ac3a 22use MIME::Base64;
5da072fb
TL
23use POSIX;
24use Storable qw(dclone);
25use Time::HiRes qw(gettimeofday);
26use URI::Escape;
425441e6 27use UUID;
5da072fb 28
1e3baf05 29use PVE::Cluster qw(cfs_register_file cfs_read_file cfs_write_file cfs_lock_file);
48cf040f 30use PVE::DataCenterConfig;
5da072fb 31use PVE::Exception qw(raise raise_param_exc);
81d6e4e1 32use PVE::GuestHelpers qw(safe_string_ne safe_num_ne safe_boolean_ne);
1e3baf05 33use PVE::INotify;
5da072fb 34use PVE::JSONSchema qw(get_standard_option);
1e3baf05 35use PVE::ProcFSTools;
91bd6c90 36use PVE::RPCEnvironment;
5da072fb 37use PVE::Storage;
b71351a7 38use PVE::SysFSTools;
d04d6af1 39use PVE::Systemd;
05a4c550 40use PVE::Tools qw(run_command lock_file lock_file_full file_read_firstline file_get_contents dir_glob_foreach get_host_arch $IPV6RE);
5da072fb
TL
41
42use PVE::QMPClient;
43use PVE::QemuConfig;
2f18c84d 44use PVE::QemuServer::Helpers qw(min_version config_aware_timeout);
5da072fb 45use PVE::QemuServer::Cloudinit;
d786a274 46use PVE::QemuServer::CPUConfig qw(print_cpu_device get_cpu_options);
e0fd2b2f 47use PVE::QemuServer::Drive qw(is_valid_drivename drive_is_cloudinit drive_is_cdrom parse_drive print_drive foreach_drive foreach_volid);
2ea5fb7e 48use PVE::QemuServer::Machine;
5da072fb 49use PVE::QemuServer::Memory;
0a13e08e 50use PVE::QemuServer::Monitor qw(mon_cmd);
5da072fb
TL
51use PVE::QemuServer::PCI qw(print_pci_addr print_pcie_addr print_pcie_root_port);
52use PVE::QemuServer::USB qw(parse_usb_device);
1e3baf05 53
28e129cc
AD
54my $have_sdn;
55eval {
56 require PVE::Network::SDN::Zones;
57 $have_sdn = 1;
58};
59
102cf9d8 60my $EDK2_FW_BASE = '/usr/share/pve-edk2-firmware/';
96ed3574
WB
61my $OVMF = {
62 x86_64 => [
63 "$EDK2_FW_BASE/OVMF_CODE.fd",
64 "$EDK2_FW_BASE/OVMF_VARS.fd"
65 ],
66 aarch64 => [
67 "$EDK2_FW_BASE/AAVMF_CODE.fd",
68 "$EDK2_FW_BASE/AAVMF_VARS.fd"
69 ],
70};
2ddc0a5c 71
7f0b5beb 72my $cpuinfo = PVE::ProcFSTools::read_cpuinfo();
1e3baf05 73
19672434 74# Note about locking: we use flock on the config file to protect
1e3baf05
DM
75# against concurrent actions.
76# Additionally, we have a 'lock' setting in the config file. This
22c377f0 77# can be set to 'migrate', 'backup', 'snapshot' or 'rollback'. Most actions are not
1e3baf05
DM
78# allowed when such lock is set. But you can ignore this kind of
79# lock with the --skiplock flag.
80
97d62eb7 81cfs_register_file('/qemu-server/',
1858638f
DM
82 \&parse_vm_config,
83 \&write_vm_config);
1e3baf05 84
3ea94c60
DM
85PVE::JSONSchema::register_standard_option('pve-qm-stateuri', {
86 description => "Some command save/restore state from this location.",
87 type => 'string',
88 maxLength => 128,
89 optional => 1,
90});
91
c6737ef1
DC
92PVE::JSONSchema::register_standard_option('pve-qemu-machine', {
93 description => "Specifies the Qemu machine type.",
94 type => 'string',
9471e48b 95 pattern => '(pc|pc(-i440fx)?-\d+(\.\d+)+(\+pve\d+)?(\.pxe)?|q35|pc-q35-\d+(\.\d+)+(\+pve\d+)?(\.pxe)?|virt(?:-\d+(\.\d+)+)?(\+pve\d+)?)',
c6737ef1
DC
96 maxLength => 40,
97 optional => 1,
98});
99
1e3baf05
DM
100#no warnings 'redefine';
101
c8effec3
AD
# Write $value to the cgroup control file $option belonging to the scope of
# VM $vmid below the given cgroup $controller, i.e. to
#   /sys/fs/cgroup/<controller>/qemu.slice/<vmid>.scope/<option>
# The actual write is delegated to PVE::ProcFSTools::write_proc_entry(), whose
# result is passed through to the caller.
sub cgroups_write {
    my ($controller, $vmid, $option, $value) = @_;

    my $scope_dir = "/sys/fs/cgroup/$controller/qemu.slice/$vmid.scope";
    PVE::ProcFSTools::write_proc_entry("$scope_dir/$option", $value);
}
109
38277afc
TL
# File-scoped memo for nodename(); stays undef until the first lookup.
my $nodename_cache;

# Return the local node name as reported by PVE::INotify::nodename().
# PVE::INotify is only asked while no defined value has been cached yet.
sub nodename {
    if (!defined($nodename_cache)) {
        $nodename_cache = PVE::INotify::nodename();
    }
    return $nodename_cache;
}
1e3baf05 115
ec3582b5
WB
116my $watchdog_fmt = {
117 model => {
118 default_key => 1,
119 type => 'string',
120 enum => [qw(i6300esb ib700)],
121 description => "Watchdog type to emulate.",
122 default => 'i6300esb',
123 optional => 1,
124 },
125 action => {
126 type => 'string',
127 enum => [qw(reset shutdown poweroff pause debug none)],
128 description => "The action to perform if after activation the guest fails to poll the watchdog in time.",
129 optional => 1,
130 },
131};
132PVE::JSONSchema::register_format('pve-qm-watchdog', $watchdog_fmt);
133
9d66b397
SI
134my $agent_fmt = {
135 enabled => {
136 description => "Enable/disable Qemu GuestAgent.",
137 type => 'boolean',
138 default => 0,
139 default_key => 1,
140 },
141 fstrim_cloned_disks => {
142 description => "Run fstrim after cloning/moving a disk.",
143 type => 'boolean',
144 optional => 1,
145 default => 0
146 },
48657158
MD
147 type => {
148 description => "Select the agent type",
149 type => 'string',
150 default => 'virtio',
151 optional => 1,
152 enum => [qw(virtio isa)],
153 },
9d66b397
SI
154};
155
55655ebc
DC
156my $vga_fmt = {
157 type => {
158 description => "Select the VGA type.",
159 type => 'string',
160 default => 'std',
161 optional => 1,
162 default_key => 1,
7c954c42 163 enum => [qw(cirrus qxl qxl2 qxl3 qxl4 none serial0 serial1 serial2 serial3 std virtio vmware)],
55655ebc
DC
164 },
165 memory => {
166 description => "Sets the VGA memory (in MiB). Has no effect with serial display.",
167 type => 'integer',
168 optional => 1,
169 minimum => 4,
170 maximum => 512,
171 },
172};
173
6dbcb073
DC
174my $ivshmem_fmt = {
175 size => {
176 type => 'integer',
177 minimum => 1,
178 description => "The size of the file in MB.",
179 },
180 name => {
181 type => 'string',
182 pattern => '[a-zA-Z0-9\-]+',
183 optional => 1,
184 format_description => 'string',
185 description => "The name of the file. Will be prefixed with 'pve-shm-'. Default is the VMID. Will be deleted when the VM is stopped.",
186 },
187};
188
1448547f
AL
189my $audio_fmt = {
190 device => {
191 type => 'string',
192 enum => [qw(ich9-intel-hda intel-hda AC97)],
193 description => "Configure an audio device."
194 },
195 driver => {
196 type => 'string',
197 enum => ['spice'],
198 default => 'spice',
199 optional => 1,
200 description => "Driver backend for the audio device."
201 },
202};
203
c4df18db
AL
204my $spice_enhancements_fmt = {
205 foldersharing => {
206 type => 'boolean',
207 optional => 1,
d282a24d 208 default => '0',
c4df18db
AL
209 description => "Enable folder sharing via SPICE. Needs Spice-WebDAV daemon installed in the VM."
210 },
211 videostreaming => {
212 type => 'string',
213 enum => ['off', 'all', 'filter'],
d282a24d 214 default => 'off',
c4df18db
AL
215 optional => 1,
216 description => "Enable video streaming. Uses compression for detected video streams."
217 },
218};
219
2cf61f33
SR
220my $rng_fmt = {
221 source => {
222 type => 'string',
223 enum => ['/dev/urandom', '/dev/random', '/dev/hwrng'],
224 default_key => 1,
225 description => "The file on the host to gather entropy from. In most"
226 . " cases /dev/urandom should be preferred over /dev/random"
227 . " to avoid entropy-starvation issues on the host. Using"
228 . " urandom does *not* decrease security in any meaningful"
229 . " way, as it's still seeded from real entropy, and the"
230 . " bytes provided will most likely be mixed with real"
231 . " entropy on the guest as well. /dev/hwrng can be used"
232 . " to pass through a hardware RNG from the host.",
233 },
234 max_bytes => {
235 type => 'integer',
236 description => "Maximum bytes of entropy injected into the guest every"
237 . " 'period' milliseconds. Prefer a lower value when using"
238 . " /dev/random as source. Use 0 to disable limiting"
239 . " (potentially dangerous!).",
240 optional => 1,
241
242 # default is 1 KiB/s, provides enough entropy to the guest to avoid
243 # boot-starvation issues (e.g. systemd etc...) while allowing no chance
244 # of overwhelming the host, provided we're reading from /dev/urandom
245 default => 1024,
246 },
247 period => {
248 type => 'integer',
249 description => "Every 'period' milliseconds the entropy-injection quota"
250 . " is reset, allowing the guest to retrieve another"
251 . " 'max_bytes' of entropy.",
252 optional => 1,
253 default => 1000,
254 },
255};
256
1e3baf05
DM
257my $confdesc = {
258 onboot => {
259 optional => 1,
260 type => 'boolean',
261 description => "Specifies whether a VM will be started during system bootup.",
262 default => 0,
263 },
264 autostart => {
265 optional => 1,
266 type => 'boolean',
267 description => "Automatic restart after crash (currently ignored).",
268 default => 0,
269 },
2ff09f52
DA
270 hotplug => {
271 optional => 1,
b3c2bdd1
DM
272 type => 'string', format => 'pve-hotplug-features',
273 description => "Selectively enable hotplug features. This is a comma separated list of hotplug features: 'network', 'disk', 'cpu', 'memory' and 'usb'. Use '0' to disable hotplug completely. Value '1' is an alias for the default 'network,disk,usb'.",
274 default => 'network,disk,usb',
2ff09f52 275 },
1e3baf05
DM
276 reboot => {
277 optional => 1,
278 type => 'boolean',
279 description => "Allow reboot. If set to '0' the VM exit on reboot.",
280 default => 1,
281 },
282 lock => {
283 optional => 1,
284 type => 'string',
285 description => "Lock/unlock the VM.",
159719e5 286 enum => [qw(backup clone create migrate rollback snapshot snapshot-delete suspending suspended)],
1e3baf05
DM
287 },
288 cpulimit => {
289 optional => 1,
c6f773b8 290 type => 'number',
52261945
DM
291 description => "Limit of CPU usage.",
292 verbose_description => "Limit of CPU usage.\n\nNOTE: If the computer has 2 CPUs, it has total of '2' CPU time. Value '0' indicates no CPU limit.",
1e3baf05 293 minimum => 0,
c6f773b8 294 maximum => 128,
52261945 295 default => 0,
1e3baf05
DM
296 },
297 cpuunits => {
298 optional => 1,
299 type => 'integer',
52261945 300 description => "CPU weight for a VM.",
237239bf
PA
301 verbose_description => "CPU weight for a VM. Argument is used in the kernel fair scheduler. The larger the number is, the more CPU time this VM gets. Number is relative to weights of all the other running VMs.",
302 minimum => 2,
303 maximum => 262144,
613d76a1 304 default => 1024,
1e3baf05
DM
305 },
306 memory => {
307 optional => 1,
308 type => 'integer',
7878afeb 309 description => "Amount of RAM for the VM in MB. This is the maximum available memory when you use the balloon device.",
1e3baf05
DM
310 minimum => 16,
311 default => 512,
312 },
13a48620
DA
313 balloon => {
314 optional => 1,
315 type => 'integer',
8b1accf7
DM
316 description => "Amount of target RAM for the VM in MB. Using zero disables the ballon driver.",
317 minimum => 0,
318 },
319 shares => {
320 optional => 1,
321 type => 'integer',
82329cd5 322 description => "Amount of memory shares for auto-ballooning. The larger the number is, the more memory this VM gets. Number is relative to weights of all other running VMs. Using zero disables auto-ballooning. Auto-ballooning is done by pvestatd.",
8b1accf7
DM
323 minimum => 0,
324 maximum => 50000,
325 default => 1000,
13a48620 326 },
1e3baf05
DM
327 keyboard => {
328 optional => 1,
329 type => 'string',
f889aa0f 330 description => "Keybord layout for vnc server. Default is read from the '/etc/pve/datacenter.cfg' configuration file.".
aea47dd6 331 "It should not be necessary to set it.",
e95fe75f 332 enum => PVE::Tools::kvmkeymaplist(),
aea47dd6 333 default => undef,
1e3baf05
DM
334 },
335 name => {
336 optional => 1,
7fabe17d 337 type => 'string', format => 'dns-name',
1e3baf05
DM
338 description => "Set a name for the VM. Only used on the configuration web interface.",
339 },
cdd20088
AD
340 scsihw => {
341 optional => 1,
342 type => 'string',
52261945 343 description => "SCSI controller model",
6731a4cf 344 enum => [qw(lsi lsi53c810 virtio-scsi-pci virtio-scsi-single megasas pvscsi)],
cdd20088
AD
345 default => 'lsi',
346 },
1e3baf05
DM
347 description => {
348 optional => 1,
349 type => 'string',
0581fe4f 350 description => "Description for the VM. Only used on the configuration web interface. This is saved as comment inside the configuration file.",
1e3baf05
DM
351 },
352 ostype => {
353 optional => 1,
354 type => 'string',
0cb9971e 355 enum => [qw(other wxp w2k w2k3 w2k8 wvista win7 win8 win10 l24 l26 solaris)],
52261945
DM
356 description => "Specify guest operating system.",
357 verbose_description => <<EODESC,
358Specify guest operating system. This is used to enable special
359optimization/features for specific operating systems:
360
361[horizontal]
362other;; unspecified OS
363wxp;; Microsoft Windows XP
364w2k;; Microsoft Windows 2000
365w2k3;; Microsoft Windows 2003
366w2k8;; Microsoft Windows 2008
367wvista;; Microsoft Windows Vista
368win7;; Microsoft Windows 7
44c2a647
TL
369win8;; Microsoft Windows 8/2012/2012r2
370win10;; Microsoft Windows 10/2016
52261945 371l24;; Linux 2.4 Kernel
a5269260 372l26;; Linux 2.6 - 5.X Kernel
52261945 373solaris;; Solaris/OpenSolaris/OpenIndiania kernel
1e3baf05
DM
374EODESC
375 },
376 boot => {
377 optional => 1,
378 type => 'string',
379 description => "Boot on floppy (a), hard disk (c), CD-ROM (d), or network (n).",
380 pattern => '[acdn]{1,4}',
32baffb4 381 default => 'cdn',
1e3baf05
DM
382 },
383 bootdisk => {
384 optional => 1,
385 type => 'string', format => 'pve-qm-bootdisk',
386 description => "Enable booting from specified disk.",
03e480fc 387 pattern => '(ide|sata|scsi|virtio)\d+',
1e3baf05
DM
388 },
389 smp => {
390 optional => 1,
391 type => 'integer',
392 description => "The number of CPUs. Please use option -sockets instead.",
393 minimum => 1,
394 default => 1,
395 },
396 sockets => {
397 optional => 1,
398 type => 'integer',
399 description => "The number of CPU sockets.",
400 minimum => 1,
401 default => 1,
402 },
403 cores => {
404 optional => 1,
405 type => 'integer',
406 description => "The number of cores per socket.",
407 minimum => 1,
408 default => 1,
409 },
8a010eae
AD
410 numa => {
411 optional => 1,
412 type => 'boolean',
1917695c 413 description => "Enable/disable NUMA.",
8a010eae
AD
414 default => 0,
415 },
7023f3ea
AD
416 hugepages => {
417 optional => 1,
418 type => 'string',
419 description => "Enable/disable hugepages memory.",
420 enum => [qw(any 2 1024)],
421 },
de9d1e55 422 vcpus => {
3bd18e48
AD
423 optional => 1,
424 type => 'integer',
de9d1e55 425 description => "Number of hotplugged vcpus.",
3bd18e48 426 minimum => 1,
de9d1e55 427 default => 0,
3bd18e48 428 },
1e3baf05
DM
429 acpi => {
430 optional => 1,
431 type => 'boolean',
432 description => "Enable/disable ACPI.",
433 default => 1,
434 },
bc84dcca 435 agent => {
ab6a046f 436 optional => 1,
9d66b397
SI
437 description => "Enable/disable Qemu GuestAgent and its properties.",
438 type => 'string',
439 format => $agent_fmt,
ab6a046f 440 },
1e3baf05
DM
441 kvm => {
442 optional => 1,
443 type => 'boolean',
444 description => "Enable/disable KVM hardware virtualization.",
445 default => 1,
446 },
447 tdf => {
448 optional => 1,
449 type => 'boolean',
8c559505
DM
450 description => "Enable/disable time drift fix.",
451 default => 0,
1e3baf05 452 },
19672434 453 localtime => {
1e3baf05
DM
454 optional => 1,
455 type => 'boolean',
456 description => "Set the real time clock to local time. This is enabled by default if ostype indicates a Microsoft OS.",
457 },
458 freeze => {
459 optional => 1,
460 type => 'boolean',
461 description => "Freeze CPU at startup (use 'c' monitor command to start execution).",
462 },
463 vga => {
464 optional => 1,
55655ebc
DC
465 type => 'string', format => $vga_fmt,
466 description => "Configure the VGA hardware.",
467 verbose_description => "Configure the VGA Hardware. If you want to use ".
468 "high resolution modes (>= 1280x1024x16) you may need to increase " .
469 "the vga memory option. Since QEMU 2.9 the default VGA display type " .
470 "is 'std' for all OS types besides some Windows versions (XP and " .
471 "older) which use 'cirrus'. The 'qxl' option enables the SPICE " .
472 "display server. For win* OS you can select how many independent " .
473 "displays you want, Linux guests can add displays them self.\n".
474 "You can also run without any graphic card, using a serial device as terminal.",
1e3baf05 475 },
0ea9541d
DM
476 watchdog => {
477 optional => 1,
478 type => 'string', format => 'pve-qm-watchdog',
52261945
DM
479 description => "Create a virtual hardware watchdog device.",
480 verbose_description => "Create a virtual hardware watchdog device. Once enabled" .
1917695c
TL
481 " (by a guest action), the watchdog must be periodically polled " .
482 "by an agent inside the guest or else the watchdog will reset " .
483 "the guest (or execute the respective action specified)",
0ea9541d 484 },
1e3baf05
DM
485 startdate => {
486 optional => 1,
19672434 487 type => 'string',
1e3baf05
DM
488 typetext => "(now | YYYY-MM-DD | YYYY-MM-DDTHH:MM:SS)",
489 description => "Set the initial date of the real time clock. Valid format for date are: 'now' or '2006-06-17T16:01:21' or '2006-06-17'.",
490 pattern => '(now|\d{4}-\d{1,2}-\d{1,2}(T\d{1,2}:\d{1,2}:\d{1,2})?)',
491 default => 'now',
492 },
43574f73 493 startup => get_standard_option('pve-startup-order'),
68eda3ab
AD
494 template => {
495 optional => 1,
496 type => 'boolean',
497 description => "Enable/disable Template.",
498 default => 0,
499 },
1e3baf05
DM
500 args => {
501 optional => 1,
502 type => 'string',
52261945
DM
503 description => "Arbitrary arguments passed to kvm.",
504 verbose_description => <<EODESCR,
c7a8aad6 505Arbitrary arguments passed to kvm, for example:
1e3baf05
DM
506
507args: -no-reboot -no-hpet
c7a8aad6
FG
508
509NOTE: this option is for experts only.
1e3baf05
DM
510EODESCR
511 },
512 tablet => {
513 optional => 1,
514 type => 'boolean',
515 default => 1,
52261945
DM
516 description => "Enable/disable the USB tablet device.",
517 verbose_description => "Enable/disable the USB tablet device. This device is " .
1917695c
TL
518 "usually needed to allow absolute mouse positioning with VNC. " .
519 "Else the mouse runs out of sync with normal VNC clients. " .
520 "If you're running lots of console-only guests on one host, " .
521 "you may consider disabling this to save some context switches. " .
522 "This is turned off by default if you use spice (-vga=qxl).",
1e3baf05
DM
523 },
524 migrate_speed => {
525 optional => 1,
526 type => 'integer',
527 description => "Set maximum speed (in MB/s) for migrations. Value 0 is no limit.",
528 minimum => 0,
529 default => 0,
530 },
531 migrate_downtime => {
532 optional => 1,
04432191 533 type => 'number',
1e3baf05
DM
534 description => "Set maximum tolerated downtime (in seconds) for migrations.",
535 minimum => 0,
04432191 536 default => 0.1,
1e3baf05
DM
537 },
538 cdrom => {
539 optional => 1,
b799312f 540 type => 'string', format => 'pve-qm-ide',
8485b9ba 541 typetext => '<volume>',
1e3baf05
DM
542 description => "This is an alias for option -ide2",
543 },
544 cpu => {
545 optional => 1,
546 description => "Emulated CPU type.",
547 type => 'string',
d786a274 548 format => $PVE::QemuServer::CPUConfig::cpu_fmt,
1e3baf05 549 },
b7ba6b79
DM
550 parent => get_standard_option('pve-snapshot-name', {
551 optional => 1,
552 description => "Parent snapshot name. This is used internally, and should not be modified.",
553 }),
982c7f12
DM
554 snaptime => {
555 optional => 1,
556 description => "Timestamp for snapshots.",
557 type => 'integer',
558 minimum => 0,
559 },
18bfb361
DM
560 vmstate => {
561 optional => 1,
562 type => 'string', format => 'pve-volume-id',
563 description => "Reference to a volume which stores the VM state. This is used internally for snapshots.",
564 },
253624c7
FG
565 vmstatestorage => get_standard_option('pve-storage-id', {
566 description => "Default storage for VM state volumes/files.",
567 optional => 1,
568 }),
c6737ef1
DC
569 runningmachine => get_standard_option('pve-qemu-machine', {
570 description => "Specifies the Qemu machine type of the running vm. This is used internally for snapshots.",
571 }),
572 machine => get_standard_option('pve-qemu-machine'),
d731ecbe
WB
573 arch => {
574 description => "Virtual processor architecture. Defaults to the host.",
575 optional => 1,
576 type => 'string',
577 enum => [qw(x86_64 aarch64)],
578 },
2796e7d5
DM
579 smbios1 => {
580 description => "Specify SMBIOS type 1 fields.",
581 type => 'string', format => 'pve-qm-smbios1',
5d004b00 582 maxLength => 512,
2796e7d5
DM
583 optional => 1,
584 },
cb0e4540
AG
585 protection => {
586 optional => 1,
587 type => 'boolean',
52261945 588 description => "Sets the protection flag of the VM. This will disable the remove VM and remove disk operations.",
cb0e4540
AG
589 default => 0,
590 },
3edb45e7 591 bios => {
a783c78e 592 optional => 1,
3edb45e7
DM
593 type => 'string',
594 enum => [ qw(seabios ovmf) ],
595 description => "Select BIOS implementation.",
596 default => 'seabios',
a783c78e 597 },
6ee499ff
DC
598 vmgenid => {
599 type => 'string',
600 pattern => '(?:[a-fA-F0-9]{8}(?:-[a-fA-F0-9]{4}){3}-[a-fA-F0-9]{12}|[01])',
601 format_description => 'UUID',
f7ed64e7
TL
602 description => "Set VM Generation ID. Use '1' to autogenerate on create or update, pass '0' to disable explicitly.",
603 verbose_description => "The VM generation ID (vmgenid) device exposes a".
604 " 128-bit integer value identifier to the guest OS. This allows to".
605 " notify the guest operating system when the virtual machine is".
606 " executed with a different configuration (e.g. snapshot execution".
607 " or creation from a template). The guest operating system notices".
608 " the change, and is then able to react as appropriate by marking".
609 " its copies of distributed databases as dirty, re-initializing its".
610 " random number generator, etc.\n".
611 "Note that auto-creation only works when done throug API/CLI create".
612 " or update methods, but not when manually editing the config file.",
613 default => "1 (autogenerated)",
6ee499ff
DC
614 optional => 1,
615 },
9e784b11
DC
616 hookscript => {
617 type => 'string',
618 format => 'pve-volume-id',
619 optional => 1,
620 description => "Script that will be executed during various steps in the vms lifetime.",
621 },
6dbcb073
DC
622 ivshmem => {
623 type => 'string',
624 format => $ivshmem_fmt,
625 description => "Inter-VM shared memory. Useful for direct communication between VMs, or to the host.",
626 optional => 1,
2e7b5925
AL
627 },
628 audio0 => {
629 type => 'string',
1448547f 630 format => $audio_fmt,
194b65f1 631 description => "Configure a audio device, useful in combination with QXL/Spice.",
2e7b5925
AL
632 optional => 1
633 },
c4df18db
AL
634 spice_enhancements => {
635 type => 'string',
636 format => $spice_enhancements_fmt,
637 description => "Configure additional enhancements for SPICE.",
638 optional => 1
639 },
b8e7068a
DC
640 tags => {
641 type => 'string', format => 'pve-tag-list',
642 description => 'Tags of the VM. This is only meta information.',
643 optional => 1,
644 },
2cf61f33
SR
645 rng0 => {
646 type => 'string',
647 format => $rng_fmt,
648 description => "Configure a VirtIO-based Random Number Generator.",
649 optional => 1,
650 },
9ed7a77c
WB
651};
652
cb702ebe
DL
653my $cicustom_fmt = {
654 meta => {
655 type => 'string',
656 optional => 1,
657 description => 'Specify a custom file containing all meta data passed to the VM via cloud-init. This is provider specific meaning configdrive2 and nocloud differ.',
658 format => 'pve-volume-id',
659 format_description => 'volume',
660 },
661 network => {
662 type => 'string',
663 optional => 1,
664 description => 'Specify a custom file containing all network data passed to the VM via cloud-init.',
665 format => 'pve-volume-id',
666 format_description => 'volume',
667 },
668 user => {
669 type => 'string',
670 optional => 1,
671 description => 'Specify a custom file containing all user data passed to the VM via cloud-init.',
672 format => 'pve-volume-id',
673 format_description => 'volume',
674 },
675};
676PVE::JSONSchema::register_format('pve-qm-cicustom', $cicustom_fmt);
677
9ed7a77c 678my $confdesc_cloudinit = {
41cd94a0
WB
679 citype => {
680 optional => 1,
681 type => 'string',
498cdc36 682 description => 'Specifies the cloud-init configuration format. The default depends on the configured operating system type (`ostype`. We use the `nocloud` format for Linux, and `configdrive2` for windows.',
41cd94a0
WB
683 enum => ['configdrive2', 'nocloud'],
684 },
7b42f951
WB
685 ciuser => {
686 optional => 1,
687 type => 'string',
688 description => "cloud-init: User name to change ssh keys and password for instead of the image's configured default user.",
689 },
690 cipassword => {
691 optional => 1,
692 type => 'string',
1d1c4e1c 693 description => 'cloud-init: Password to assign the user. Using this is generally not recommended. Use ssh keys instead. Also note that older cloud-init versions do not support hashed passwords.',
7b42f951 694 },
cb702ebe
DL
695 cicustom => {
696 optional => 1,
697 type => 'string',
698 description => 'cloud-init: Specify custom files to replace the automatically generated ones at start.',
699 format => 'pve-qm-cicustom',
700 },
0c9a7596
AD
701 searchdomain => {
702 optional => 1,
703 type => 'string',
704 description => "cloud-init: Sets DNS search domains for a container. Create will automatically use the setting from the host if neither searchdomain nor nameserver are set.",
705 },
706 nameserver => {
707 optional => 1,
708 type => 'string', format => 'address-list',
709 description => "cloud-init: Sets DNS server IP address for a container. Create will automatically use the setting from the host if neither searchdomain nor nameserver are set.",
710 },
711 sshkeys => {
712 optional => 1,
713 type => 'string',
714 format => 'urlencoded',
1d1c4e1c 715 description => "cloud-init: Setup public SSH keys (one key per line, OpenSSH format).",
0c9a7596 716 },
1e3baf05
DM
717};
718
719# what about other qemu settings ?
720#cpu => 'string',
721#machine => 'string',
722#fda => 'file',
723#fdb => 'file',
724#mtdblock => 'file',
725#sd => 'file',
726#pflash => 'file',
727#snapshot => 'bool',
728#bootp => 'file',
729##tftp => 'dir',
730##smb => 'dir',
731#kernel => 'file',
732#append => 'string',
733#initrd => 'file',
734##soundhw => 'string',
735
# Publish every option that is in $confdesc at this point as a JSONSchema
# standard option named "pve-qm-<key>". Keys added to $confdesc further down
# in the file are not covered by this loop.
for my $opt (keys %$confdesc) {
    PVE::JSONSchema::register_standard_option("pve-qm-$opt", $confdesc->{$opt});
}
739
1e3baf05 740my $MAX_USB_DEVICES = 5;
5bdcf937 741my $MAX_NETS = 32;
c4e16381 742my $MAX_HOSTPCI_DEVICES = 16;
bae179aa 743my $MAX_SERIAL_PORTS = 4;
1989a89c 744my $MAX_PARALLEL_PORTS = 3;
2ed5d572
AD
745my $MAX_NUMA = 8;
746
ffc0d8c7
WB
747my $numa_fmt = {
748 cpus => {
749 type => "string",
750 pattern => qr/\d+(?:-\d+)?(?:;\d+(?:-\d+)?)*/,
52261945 751 description => "CPUs accessing this NUMA node.",
ffc0d8c7
WB
752 format_description => "id[-id];...",
753 },
754 memory => {
755 type => "number",
52261945 756 description => "Amount of memory this NUMA node provides.",
ffc0d8c7
WB
757 optional => 1,
758 },
759 hostnodes => {
760 type => "string",
761 pattern => qr/\d+(?:-\d+)?(?:;\d+(?:-\d+)?)*/,
52261945 762 description => "Host NUMA nodes to use.",
ffc0d8c7
WB
763 format_description => "id[-id];...",
764 optional => 1,
765 },
766 policy => {
767 type => 'string',
768 enum => [qw(preferred bind interleave)],
52261945 769 description => "NUMA allocation policy.",
ffc0d8c7
WB
770 optional => 1,
771 },
772};
773PVE::JSONSchema::register_format('pve-qm-numanode', $numa_fmt);
2ed5d572
AD
# Schema of a single numaN option: an optional property string that is
# validated against $numa_fmt.
my $numadesc = {
    description => "NUMA topology.",
    type => 'string',
    format => $numa_fmt,
    optional => 1,
};
PVE::JSONSchema::register_standard_option("pve-qm-numanode", $numadesc);

# numa0 .. numa<$MAX_NUMA - 1> all point at the very same schema hash.
$confdesc->{"numa$_"} = $numadesc for 0 .. $MAX_NUMA - 1;
1e3baf05
DM
784
785my $nic_model_list = ['rtl8139', 'ne2k_pci', 'e1000', 'pcnet', 'virtio',
55034103
KT
786 'ne2k_isa', 'i82551', 'i82557b', 'i82559er', 'vmxnet3',
787 'e1000-82540em', 'e1000-82544gc', 'e1000-82545em'];
6b64503e 788my $nic_model_list_txt = join(' ', sort @$nic_model_list);
1e3baf05 789
52261945
DM
790my $net_fmt_bridge_descr = <<__EOD__;
791Bridge to attach the network device to. The Proxmox VE standard bridge
792is called 'vmbr0'.
793
794If you do not specify a bridge, we create a kvm user (NATed) network
795device, which provides DHCP and DNS services. The following addresses
796are used:
797
798 10.0.2.2 Gateway
799 10.0.2.3 DNS Server
800 10.0.2.4 SMB Server
801
802The DHCP server assign addresses to the guest starting from 10.0.2.15.
803__EOD__
804
cd9c34d1 805my $net_fmt = {
399d96db 806 macaddr => get_standard_option('mac-addr', {
52261945 807 description => "MAC address. That address must be unique withing your network. This is automatically generated if not specified.",
399d96db 808 }),
7f694a71
DM
809 model => {
810 type => 'string',
52261945 811 description => "Network Card Model. The 'virtio' model provides the best performance with very low CPU overhead. If your guest does not support this driver, it is usually best to use 'e1000'.",
7f694a71
DM
812 enum => $nic_model_list,
813 default_key => 1,
814 },
815 (map { $_ => { keyAlias => 'model', alias => 'macaddr' }} @$nic_model_list),
cd9c34d1
WB
816 bridge => {
817 type => 'string',
52261945 818 description => $net_fmt_bridge_descr,
cd9c34d1
WB
819 format_description => 'bridge',
820 optional => 1,
821 },
822 queues => {
823 type => 'integer',
824 minimum => 0, maximum => 16,
825 description => 'Number of packet queues to be used on the device.',
cd9c34d1
WB
826 optional => 1,
827 },
828 rate => {
829 type => 'number',
830 minimum => 0,
52261945 831 description => "Rate limit in mbps (megabytes per second) as floating point number.",
cd9c34d1
WB
832 optional => 1,
833 },
834 tag => {
835 type => 'integer',
9f41a659 836 minimum => 1, maximum => 4094,
cd9c34d1 837 description => 'VLAN tag to apply to packets on this interface.',
cd9c34d1
WB
838 optional => 1,
839 },
840 trunks => {
841 type => 'string',
842 pattern => qr/\d+(?:-\d+)?(?:;\d+(?:-\d+)?)*/,
843 description => 'VLAN trunks to pass through this interface.',
7f694a71 844 format_description => 'vlanid[;vlanid...]',
cd9c34d1
WB
845 optional => 1,
846 },
847 firewall => {
848 type => 'boolean',
849 description => 'Whether this interface should be protected by the firewall.',
cd9c34d1
WB
850 optional => 1,
851 },
852 link_down => {
853 type => 'boolean',
52261945 854 description => 'Whether this interface should be disconnected (like pulling the plug).',
cd9c34d1
WB
855 optional => 1,
856 },
857};
52261945 858
1e3baf05
DM
859my $netdesc = {
860 optional => 1,
7f694a71 861 type => 'string', format => $net_fmt,
52261945 862 description => "Specify network devices.",
1e3baf05 863};
52261945 864
1e3baf05
DM
865PVE::JSONSchema::register_standard_option("pve-qm-net", $netdesc);
866
0c9a7596
AD
867my $ipconfig_fmt = {
868 ip => {
869 type => 'string',
870 format => 'pve-ipv4-config',
871 format_description => 'IPv4Format/CIDR',
872 description => 'IPv4 address in CIDR format.',
873 optional => 1,
874 default => 'dhcp',
875 },
876 gw => {
877 type => 'string',
878 format => 'ipv4',
879 format_description => 'GatewayIPv4',
880 description => 'Default gateway for IPv4 traffic.',
881 optional => 1,
882 requires => 'ip',
883 },
884 ip6 => {
885 type => 'string',
886 format => 'pve-ipv6-config',
887 format_description => 'IPv6Format/CIDR',
888 description => 'IPv6 address in CIDR format.',
889 optional => 1,
890 default => 'dhcp',
891 },
892 gw6 => {
893 type => 'string',
894 format => 'ipv6',
895 format_description => 'GatewayIPv6',
896 description => 'Default gateway for IPv6 traffic.',
897 optional => 1,
898 requires => 'ip6',
899 },
900};
901PVE::JSONSchema::register_format('pve-qm-ipconfig', $ipconfig_fmt);
# Schema entry shared by all 'ipconfig[n]' options; the value is a property
# string in the registered 'pve-qm-ipconfig' format.
my $ipconfigdesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-ipconfig',
    description => <<'EODESCR',
cloud-init: Specify IP addresses and gateways for the corresponding interface.

IP addresses use CIDR notation, gateways are optional but need an IP of the same type specified.

The special string 'dhcp' can be used for IP addresses to use DHCP, in which case no explicit gateway should be provided.
For IPv6 the special string 'auto' can be used to use stateless autoconfiguration.

If cloud-init is enabled and neither an IPv4 nor an IPv6 address is specified, it defaults to using dhcp on IPv4.
EODESCR
};
# Register the ipconfig description itself; previously the network device
# description was registered under this name by mistake.
PVE::JSONSchema::register_standard_option("pve-qm-ipconfig", $ipconfigdesc);
917
1e3baf05
DM
# Expose one 'net<N>' option and one cloud-init 'ipconfig<N>' option per
# possible network device.
foreach my $i (0 .. $MAX_NETS - 1) {
    $confdesc->{"net$i"} = $netdesc;
    $confdesc_cloudinit->{"ipconfig$i"} = $ipconfigdesc;
}

# Every cloud-init option is also a regular VM config option.
@{$confdesc}{keys %$confdesc_cloudinit} = values %$confdesc_cloudinit;
926
ffa42b86
DC
PVE::JSONSchema::register_format('pve-volume-id-or-qm-path', \&verify_volume_id_or_qm_path);

# Format verifier: accepts the literals 'none' and 'cdrom', any value starting
# with '/', or anything that passes the 'pve-volume-id' format check.
# Returns the accepted value. On failure it dies, or returns undef if $noerr
# is set.
sub verify_volume_id_or_qm_path {
    my ($volid, $noerr) = @_;

    return $volid if $volid =~ m/\A(?:none|cdrom)\z/;
    return $volid if $volid =~ m|^/|;

    # neither a keyword nor a path, so it has to be a volume id
    my $checked = eval { PVE::JSONSchema::check_format('pve-volume-id', $volid, '') };
    if (my $err = $@) {
        die $err if !$noerr;
        return undef;
    }
    return $checked;
}
943
# Property-string format of the 'usb[n]' options.
my $usb_fmt = {
    host => {
        default_key => 1,
        type => 'string', format => 'pve-qm-usb-device',
        format_description => 'HOSTUSBDEVICE|spice',
        description => <<EODESCR,
The Host USB device or port or the value 'spice'. HOSTUSBDEVICE syntax is:

 'bus-port(.port)*' (decimal numbers) or
 'vendor_id:product_id' (hexadecimal numbers) or
 'spice'

You can use the 'lsusb -t' command to list existing usb devices.

NOTE: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

The value 'spice' can be used to add a usb redirection device for spice.
EODESCR
    },
    usb3 => {
        optional => 1,
        type => 'boolean',
        description => "Specifies whether the given host option is a USB3 device or port.",
        default => 0,
    },
};

# Schema entry shared by all 'usb[n]' options.
my $usbdesc = {
    optional => 1,
    type => 'string', format => $usb_fmt,
    description => "Configure an USB device (n is 0 to 4).",
};
PVE::JSONSchema::register_standard_option("pve-qm-usb", $usbdesc);
977
# A single host PCI id: optional 4-hex-digit domain, bus, device and an
# optional function number.
my $PCIRE = qr/([a-f0-9]{4}:)?[a-f0-9]{2}:[a-f0-9]{2}(?:\.[a-f0-9])?/;

# Property-string format of the 'hostpci[n]' options.
my $hostpci_fmt = {
    host => {
        default_key => 1,
        type => 'string',
        pattern => qr/$PCIRE(;$PCIRE)*/,
        format_description => 'HOSTPCIID[;HOSTPCIID2...]',
        description => <<EODESCR,
Host PCI device pass through. The PCI ID of a host's PCI device or a list
of PCI virtual functions of the host. HOSTPCIID syntax is:

'bus:dev.func' (hexadecimal numbers)

You can use the 'lspci' command to list existing PCI devices.
EODESCR
    },
    rombar => {
        type => 'boolean',
        description => "Specify whether or not the device's ROM will be visible in the guest's memory map.",
        optional => 1,
        default => 1,
    },
    romfile => {
        type => 'string',
        pattern => '[^,;]+',
        format_description => 'string',
        description => "Custom pci device rom filename (must be located in /usr/share/kvm/).",
        optional => 1,
    },
    pcie => {
        type => 'boolean',
        description => "Choose the PCI-express bus (needs the 'q35' machine model).",
        optional => 1,
        default => 0,
    },
    'x-vga' => {
        type => 'boolean',
        description => "Enable vfio-vga device support.",
        optional => 1,
        default => 0,
    },
    'mdev' => {
        type => 'string',
        format_description => 'string',
        pattern => '[^/\.:]+',
        optional => 1,
        description => <<EODESCR
The type of mediated device to use.
An instance of this type will be created on startup of the VM and
will be cleaned up when the VM stops.
EODESCR
    }
};
PVE::JSONSchema::register_format('pve-qm-hostpci', $hostpci_fmt);
1032
040b06b7
DA
# Schema entry shared by all 'hostpci[n]' options.
my $hostpcidesc = {
    type => 'string',
    format => 'pve-qm-hostpci',
    optional => 1,
    description => "Map host PCI devices into guest.",
    verbose_description => <<EODESCR,
Map host PCI devices into guest.

NOTE: This option allows direct access to host hardware. So it is no longer
possible to migrate such machines - use with special care.

CAUTION: Experimental! User reported problems with this option.
EODESCR
};
PVE::JSONSchema::register_standard_option('pve-qm-hostpci', $hostpcidesc);
1047
bae179aa
DA
# Schema entry shared by all 'serial[n]' options: either a host device path
# below /dev/ or the keyword 'socket'.
my $serialdesc = {
    type => 'string',
    pattern => '(/dev/.+|socket)',
    optional => 1,
    description => "Create a serial device inside the VM (n is 0 to 3)",
    verbose_description => <<EODESCR,
Create a serial device inside the VM (n is 0 to 3), and pass through a
host serial device (i.e. /dev/ttyS0), or create a unix socket on the
host side (use 'qm terminal' to open a terminal connection).

NOTE: If you pass through a host serial device, it is no longer possible to migrate such machines - use with special care.

CAUTION: Experimental! User reported problems with this option.
EODESCR
};
bae179aa 1063
1989a89c
DA
# Schema entry shared by all 'parallel[n]' options: a host parallel port
# (/dev/parportN) or USB printer (/dev/usb/lpN) device.
my $paralleldesc = {
    type => 'string',
    pattern => '/dev/parport\d+|/dev/usb/lp\d+',
    optional => 1,
    description => "Map host parallel devices (n is 0 to 2).",
    verbose_description => <<EODESCR,
Map host parallel devices (n is 0 to 2).

NOTE: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

CAUTION: Experimental! User reported problems with this option.
EODESCR
};
1989a89c
DA
1077
# Populate $confdesc with the numbered device options.
foreach my $i (0 .. $MAX_PARALLEL_PORTS - 1) {
    $confdesc->{"parallel$i"} = $paralleldesc;
}

foreach my $i (0 .. $MAX_SERIAL_PORTS - 1) {
    $confdesc->{"serial$i"} = $serialdesc;
}

foreach my $i (0 .. $MAX_HOSTPCI_DEVICES - 1) {
    $confdesc->{"hostpci$i"} = $hostpcidesc;
}

# all drive options (keys and descriptions come from the Drive module)
@{$confdesc}{keys %{$PVE::QemuServer::Drive::drivedesc_hash}} =
    values %{$PVE::QemuServer::Drive::drivedesc_hash};

foreach my $i (0 .. $PVE::QemuServer::Drive::MAX_UNUSED_DISKS - 1) {
    $confdesc->{"unused$i"} = $PVE::QemuServer::Drive::unuseddesc;
}

foreach my $i (0 .. $MAX_USB_DEVICES - 1) {
    $confdesc->{"usb$i"} = $usbdesc;
}
1101
1e3baf05
DM
# cached result of kvm_version(); stays false until a query succeeded
my $kvm_api_version = 0;

# Returns the value of the KVM_GET_API_VERSION ioctl on /dev/kvm. A true
# result is cached for later calls. Returns undef if /dev/kvm cannot be
# opened.
sub kvm_version {
    if (!$kvm_api_version) {
        open(my $kvm_fh, '<', '/dev/kvm') or return undef;

        # 0xae00 => KVM_GET_API_VERSION
        $kvm_api_version = ioctl($kvm_fh, 0xae00, 0);
    }

    return $kvm_api_version;
}
1115
1476b99f
DC
# per-binary caches: last detected version string and the binary's mtime at
# the time of detection
my $kvm_user_version = {};
my $kvm_mtime = {};

# Returns the version reported by '$binary --version' (e.g. "4.1.1"), or
# 'unknown' if no version line could be matched. $binary defaults to the
# command for the host architecture. The result is cached per binary and
# re-detected whenever the binary's mtime changes.
# Dies if the binary cannot be stat()ed.
sub kvm_user_version {
    my ($binary) = @_;

    $binary //= get_command_for_arch(get_host_arch()); # get the native arch by default

    # fail with a clear message instead of calling ->mtime on undef below
    my $st = stat($binary)
        or die "unable to stat QEMU binary '$binary' - $!\n";

    my $cachedmtime = $kvm_mtime->{$binary} // -1;
    return $kvm_user_version->{$binary} if $kvm_user_version->{$binary} &&
        $cachedmtime == $st->mtime;

    $kvm_user_version->{$binary} = 'unknown';
    $kvm_mtime->{$binary} = $st->mtime;

    my $code = sub {
        my $line = shift;
        if ($line =~ m/^QEMU( PC)? emulator version (\d+\.\d+(\.\d+)?)(\.\d+)?[,\s]/) {
            $kvm_user_version->{$binary} = $2;
        }
    };

    # best effort: a failing command only warns and leaves 'unknown' cached
    eval { run_command([$binary, '--version'], outfunc => $code); };
    warn $@ if $@;

    return $kvm_user_version->{$binary};
}
1145
db70021b
TL
# True if /dev/vhost-net exists and is a character device.
sub kernel_has_vhost_net {
    my $is_chardev = -c '/dev/vhost-net';
    return $is_chardev;
}
1e3baf05 1149
1e3baf05
DM
# True if $key is a known VM config option, i.e. has an entry in $confdesc.
sub option_exists {
    my ($key) = @_;

    return defined($confdesc->{$key});
}
1e3baf05 1154
# cached result of get_cdrom_path()
my $cdrom_path;

# Returns the first of /dev/cdrom, /dev/cdrom1 and /dev/cdrom2 that is a
# symbolic link, caching a positive result. Returns undef if none of them
# is a symlink.
sub get_cdrom_path {
    return $cdrom_path if $cdrom_path;

    foreach my $candidate ('/dev/cdrom', '/dev/cdrom1', '/dev/cdrom2') {
        return $cdrom_path = $candidate if -l $candidate;
    }

    # be explicit instead of leaking the result of the last file test
    return undef;
}
1164
# Resolve the 'file' value of a CD-ROM drive to a path:
#  'cdrom'  - the host CD-ROM device as found by get_cdrom_path()
#  'none'   - empty string
#  '/...'   - returned unchanged
#  other    - treated as volume id and resolved through PVE::Storage::path
sub get_iso_path {
    my ($storecfg, $vmid, $cdrom) = @_;

    return get_cdrom_path() if $cdrom eq 'cdrom';
    return '' if $cdrom eq 'none';
    return $cdrom if $cdrom =~ m|^/|;

    return PVE::Storage::path($storecfg, $cdrom);
}
1178
# Try to convert old style file names to volume IDs.
#
# 'none', 'cdrom', /dev/ paths and anything of the form 'storage:volume' are
# returned unchanged. A bare file name is mapped to 'local:iso/<file>' for
# cdrom media and to 'local:<vmid>/<file>' otherwise. Any other value
# containing a '/' yields undef.
sub filename_to_volume_id {
    my ($vmid, $file, $media) = @_;

    my $keep_as_is = $file eq 'none'
        || $file eq 'cdrom'
        || $file =~ m|^/dev/.+|
        || $file =~ m/^([^:]+):(.+)$/;
    return $file if $keep_as_is;

    return undef if $file =~ m|/|;

    my $is_cdrom = $media && $media eq 'cdrom';
    return $is_cdrom ? "local:iso/$file" : "local:$vmid/$file";
}
1197
# Check that the storage content type $vtype matches what the drive's media
# type requires ('disk' => 'images', 'cdrom' => 'iso'). Does nothing when
# $media is not set. Raises a parameter exception for $opt on a mismatch and
# dies with "internal error" for any other media value.
sub verify_media_type {
    my ($opt, $vtype, $media) = @_;

    return if !$media;

    my %content_type_for = (
        disk => 'images',
        cdrom => 'iso',
    );
    my $etype = $content_type_for{$media};
    die "internal error" if !defined($etype);

    return if ($vtype eq $etype);

    raise_param_exc({ $opt => "unexpected media type ($vtype != $etype)" });
}
1216
# Normalize $drive->{file} and $drive->{media} in place.
#
# A file that is not 'cdrom'/'none', not a /dev/ path, not of the form
# 'storage:volume' and not purely numeric is looked up with
# PVE::Storage::path_to_volume_id and replaced by the resulting volume id;
# a parameter exception for $opt is raised if no storage matches.
# Drives without media whose file is an iso, 'cdrom' or 'none' get
# media 'cdrom'.
sub cleanup_drive_path {
    my ($opt, $storecfg, $drive) = @_;

    # try to convert filesystem paths to volume IDs
    my $file = $drive->{file};
    my $looks_like_fs_path = $file !~ m/^(cdrom|none)$/
        && $file !~ m|^/dev/.+|
        && $file !~ m/^([^:]+):(.+)$/
        && $file !~ m/^\d+$/;

    if ($looks_like_fs_path) {
        my ($vtype, $volid) = PVE::Storage::path_to_volume_id($storecfg, $drive->{file});
        raise_param_exc({ $opt => "unable to associate path '$drive->{file}' to any storage"}) if !$vtype;
        if (!$drive->{media} && $vtype eq 'iso') {
            $drive->{media} = 'cdrom';
        }
        verify_media_type($opt, $vtype, $drive->{media});
        $drive->{file} = $volid;
    }

    $drive->{media} = 'cdrom' if !$drive->{media} && $drive->{file} =~ m/^(cdrom|none)$/;
}
1235
b3c2bdd1
DM
# Parse the 'hotplug' option into a hash { feature => 1 }.
# '0' yields an empty hash and '1' is replaced by the schema default before
# parsing. Dies on any feature other than network, disk, cpu, memory or usb.
sub parse_hotplug_features {
    my ($data) = @_;

    my $res = {};

    return $res if $data eq '0';

    if ($data eq '1') {
        $data = $confdesc->{hotplug}->{default};
    }

    for my $feature (PVE::Tools::split_list($data)) {
        $feature =~ m/^(network|disk|cpu|memory|usb)$/
            or die "invalid hotplug feature '$feature'\n";
        $res->{$1} = 1;
    }

    return $res;
}
1254
PVE::JSONSchema::register_format('pve-hotplug-features', \&pve_verify_hotplug_features);

# Format verifier for the 'hotplug' option. Returns $value if it parses.
# On failure it dies, or returns undef if $noerr is set.
sub pve_verify_hotplug_features {
    my ($value, $noerr) = @_;

    # parse_hotplug_features() dies on invalid input; catch that so $noerr
    # is actually honoured
    my $features = eval { parse_hotplug_features($value) };
    if (my $err = $@) {
        return undef if $noerr;
        die $err;
    }

    return $value if $features;

    return undef if $noerr;

    die "unable to parse hotplug option\n";
}
1265
28ef82d3
DM
# Send a SCSI INQUIRY through the SG_IO ioctl on the open file handle $fh.
#
# Returns a hash with vendor, product, revision, removable (0/1) and type,
# all decoded from the 36 byte inquiry response.
# On any failure it dies, or returns undef if $noerr is set.
sub scsi_inquiry {
    my ($fh, $noerr) = @_;

    my $SG_IO = 0x2285;
    my $SG_GET_VERSION_NUM = 0x2282;

    my $versionbuf = "\x00" x 8;
    my $ret = ioctl($fh, $SG_GET_VERSION_NUM, $versionbuf);
    if (!$ret) {
        die "scsi ioctl SG_GET_VERSION_NUM failed - $!\n" if !$noerr;
        return undef;
    }
    my $version = unpack("I", $versionbuf);
    if ($version < 30000) {
        die "scsi generic interface too old\n" if !$noerr;
        return undef;
    }

    my $buf = "\x00" x 36;
    my $sensebuf = "\x00" x 8;
    # command block: opcode 0x12 with an allocation length of 36 bytes
    my $cmd = pack("C x3 C x1", 0x12, 36);

    # see /usr/include/scsi/sg.h
    my $sg_io_hdr_t = "i i C C s I P P P I I i P C C C C S S i I I";

    my $packet = pack($sg_io_hdr_t, ord('S'), -3, length($cmd),
                      length($sensebuf), 0, length($buf), $buf,
                      $cmd, $sensebuf, 6000);

    $ret = ioctl($fh, $SG_IO, $packet);
    if (!$ret) {
        die "scsi ioctl SG_IO failed - $!\n" if !$noerr;
        return undef;
    }

    my @res = unpack($sg_io_hdr_t, $packet);
    # fields 17 and 18 are the two 'S' (unsigned short) members of the
    # header - presumably host_status and driver_status, confirm with sg.h
    if ($res[17] || $res[18]) {
        die "scsi ioctl SG_IO status error - $!\n" if !$noerr;
        return undef;
    }

    my $res = {};
    (my $byte0, my $byte1, $res->{vendor},
     $res->{product}, $res->{revision}) = unpack("C C x6 A8 A16 A4", $buf);

    $res->{removable} = $byte1 & 128 ? 1 : 0; # top bit of byte 1
    $res->{type} = $byte0 & 31; # low 5 bits of byte 0

    return $res;
}
1316
# Open $path read-write and run a SCSI inquiry on it.
# Returns the inquiry result hash, or undef if the path cannot be opened or
# the inquiry fails.
sub path_is_scsi {
    my ($path) = @_;

    # pass the mode separately so that the path is never interpreted as part
    # of the open mode (and keeps any leading/trailing whitespace)
    my $fh = IO::File->new($path, '+<') || return undef;
    my $res = scsi_inquiry($fh, 1);
    close($fh);

    return $res;
}
1326
# Returns the QEMU device string for the USB tablet. The tablet sits on the
# 'ehci' bus for q35 machines and for aarch64, and on 'uhci' otherwise.
sub print_tabletdevice_full {
    my ($conf, $arch) = @_;

    my $q35 = PVE::QemuServer::Machine::machine_type_is_q35($conf);

    # we use uhci for old VMs because tablet driver was buggy in older qemu
    my $usbbus;
    if ($q35 || $arch eq 'aarch64') {
        $usbbus = 'ehci';
    } else {
        $usbbus = 'uhci';
    }

    return "usb-tablet,id=tablet,bus=$usbbus.0,port=1";
}
1342
d559309f
WB
# Returns the QEMU device string for a USB keyboard on aarch64, undef for
# every other architecture.
sub print_keyboarddevice_full {
    my ($conf, $arch, $machine) = @_;

    if ($arch eq 'aarch64') {
        return "usb-kbd,id=keyboard,bus=ehci.0,port=2";
    }

    return undef;
}
1350
# Build the '-device' argument string for a drive.
#
# $drive is a parsed drive hash; its interface (virtio, scsi, ide, sata)
# selects the device model. Dies for the 'usb' interface ("implement me") and
# for any unknown interface.
sub print_drivedevice_full {
    my ($storecfg, $conf, $vmid, $drive, $bridges, $arch, $machine_type) = @_;

    my $device = '';

    # e.g. "scsi0"; used for both the device id and the backing drive id
    my $drive_id = "$drive->{interface}$drive->{index}";

    if ($drive->{interface} eq 'virtio') {
        my $pciaddr = print_pci_addr($drive_id, $bridges, $arch, $machine_type);
        $device = "virtio-blk-pci,drive=drive-$drive_id,id=$drive_id$pciaddr";
        $device .= ",iothread=iothread-$drive_id" if $drive->{iothread};
    } elsif ($drive->{interface} eq 'scsi') {

        my ($maxdev, $controller, $controller_prefix) = scsihw_infos($conf, $drive);
        my $unit = $drive->{index} % $maxdev;
        my $devicetype = 'hd';
        my $path = '';
        if (drive_is_cdrom($drive)) {
            $devicetype = 'cd';
        } else {
            if ($drive->{file} =~ m|^/|) {
                $path = $drive->{file};
                if (my $info = path_is_scsi($path)) {
                    if ($info->{type} == 0 && $drive->{scsiblock}) {
                        $devicetype = 'block';
                    } elsif ($info->{type} == 1) { # tape
                        $devicetype = 'generic';
                    }
                }
            } else {
                $path = PVE::Storage::path($storecfg, $drive->{file});
            }

            # for compatibility only, we prefer scsi-hd (#2408, #2355, #2380)
            my $version = PVE::QemuServer::Machine::extract_version($machine_type, kvm_user_version());
            if ($path =~ m/^iscsi\:\/\// &&
                !min_version($version, 4, 1)) {
                $devicetype = 'generic';
            }
        }

        if (!$conf->{scsihw} || ($conf->{scsihw} =~ m/^lsi/)){
            $device = "scsi-$devicetype,bus=$controller_prefix$controller.0,scsi-id=$unit,drive=drive-$drive_id,id=$drive_id";
        } else {
            $device = "scsi-$devicetype,bus=$controller_prefix$controller.0,channel=0,scsi-id=0,lun=$drive->{index},drive=drive-$drive_id,id=$drive_id";
        }

        if ($drive->{ssd} && ($devicetype eq 'block' || $devicetype eq 'hd')) {
            $device .= ",rotation_rate=1";
        }
        $device .= ",wwn=$drive->{wwn}" if $drive->{wwn};

    } elsif ($drive->{interface} eq 'ide' || $drive->{interface} eq 'sata') {
        my $maxdev = ($drive->{interface} eq 'sata') ? $PVE::QemuServer::Drive::MAX_SATA_DISKS : 2;
        my $controller = int($drive->{index} / $maxdev);
        my $unit = $drive->{index} % $maxdev;
        my $devicetype = ($drive->{media} && $drive->{media} eq 'cdrom') ? "cd" : "hd";

        $device = "ide-$devicetype";
        if ($drive->{interface} eq 'ide') {
            $device .= ",bus=ide.$controller,unit=$unit";
        } else {
            $device .= ",bus=ahci$controller.$unit";
        }
        $device .= ",drive=drive-$drive_id,id=$drive_id";

        if ($devicetype eq 'hd') {
            if (my $model = $drive->{model}) {
                # the model is stored URI-escaped in the config
                $model = URI::Escape::uri_unescape($model);
                $device .= ",model=$model";
            }
            if ($drive->{ssd}) {
                $device .= ",rotation_rate=1";
            }
        }
        $device .= ",wwn=$drive->{wwn}" if $drive->{wwn};
    } elsif ($drive->{interface} eq 'usb') {
        die "implement me";
        # -device ide-drive,bus=ide.1,unit=0,drive=drive-ide0-1-0,id=ide0-1-0
    } else {
        die "unsupported interface type";
    }

    $device .= ",bootindex=$drive->{bootindex}" if $drive->{bootindex};

    if (my $serial = $drive->{serial}) {
        # the serial is stored URI-escaped in the config
        $serial = URI::Escape::uri_unescape($serial);
        $device .= ",serial=$serial";
    }

    return $device;
}
1443
# Returns the value of the first 'InitiatorName = ...' line found in
# /etc/iscsi/initiatorname.iscsi. Returns undef if the file cannot be opened
# or contains no such line.
sub get_initiator_name {
    my $fh = IO::File->new('/etc/iscsi/initiatorname.iscsi') || return undef;

    my $initiator;
    while (defined(my $line = <$fh>)) {
        if ($line =~ m/^\s*InitiatorName\s*=\s*([\.\-:\w]+)/) {
            $initiator = $1;
            last;
        }
    }
    $fh->close();

    return $initiator;
}
1457
# Build the '-drive' argument string for $drive.
#
# The backing path comes from get_iso_path() for CD-ROM drives and from the
# storage layer for volume ids; anything else is used as raw path. Options
# are appended in a fixed order: pass-through drive options, snapshot,
# throttling limits, format, cache, aio and detect-zeroes.
sub print_drive_commandline_full {
    my ($storecfg, $vmid, $drive) = @_;

    my $volid = $drive->{file};
    my ($path, $format);

    if (drive_is_cdrom($drive)) {
        $path = get_iso_path($storecfg, $vmid, $volid);
    } else {
        my ($storeid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        if ($storeid) {
            $path = PVE::Storage::path($storecfg, $volid);
            my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
            $format = qemu_img_format($scfg, $volname);
        } else {
            $path = $volid;
            $format = "raw";
        }
    }

    # collected as "key=value" strings, each one is prefixed with ',' below
    my @parts;

    # options handed to QEMU under their own name
    my @qemu_drive_options = qw(heads secs cyls trans media format cache rerror werror aio discard);
    push @parts, map { "$_=$drive->{$_}" } grep { defined($drive->{$_}) } @qemu_drive_options;

    # snapshot only accepts on|off
    if (defined($drive->{snapshot})) {
        push @parts, "snapshot=" . ($drive->{snapshot} ? 'on' : 'off');
    }

    # throttling: config key suffix => QEMU option suffix
    my @throttle_kinds = (['', '-total'], ['_rd', '-read'], ['_wr', '-write']);
    for my $kind (@throttle_kinds) {
        my ($suffix, $qmpname) = @$kind;

        # bandwidth limits are configured in MB/s but passed in bytes/s
        if (my $v = $drive->{"mbps$suffix"}) {
            push @parts, "throttling.bps$qmpname=" . int($v*1024*1024);
        }
        if (my $v = $drive->{"mbps${suffix}_max"}) {
            push @parts, "throttling.bps$qmpname-max=" . int($v*1024*1024);
        }
        if (my $v = $drive->{"bps${suffix}_max_length"}) {
            push @parts, "throttling.bps$qmpname-max-length=$v";
        }
        if (my $v = $drive->{"iops${suffix}"}) {
            push @parts, "throttling.iops$qmpname=$v";
        }
        if (my $v = $drive->{"iops${suffix}_max"}) {
            push @parts, "throttling.iops$qmpname-max=$v";
        }
        if (my $v = $drive->{"iops${suffix}_max_length"}) {
            push @parts, "throttling.iops$qmpname-max-length=$v";
        }
    }

    # only add the detected format if none was configured explicitly
    push @parts, "format=$format" if $format && !$drive->{format};

    my $cache_direct = 0;
    if (my $cache = $drive->{cache}) {
        $cache_direct = $cache =~ /^(?:off|none|directsync)$/;
    } elsif (!drive_is_cdrom($drive)) {
        push @parts, "cache=none";
        $cache_direct = 1;
    }

    # aio native works only with O_DIRECT
    if (!$drive->{aio}) {
        push @parts, $cache_direct ? "aio=native" : "aio=threads";
    }

    if (!drive_is_cdrom($drive)) {
        my $detectzeroes;
        if (defined($drive->{detect_zeroes}) && !$drive->{detect_zeroes}) {
            $detectzeroes = 'off';
        } elsif ($drive->{discard}) {
            $detectzeroes = $drive->{discard} eq 'on' ? 'unmap' : 'on';
        } else {
            # This used to be our default with discard not being specified:
            $detectzeroes = 'on';
        }
        push @parts, "detect-zeroes=$detectzeroes" if $detectzeroes;
    }

    my $opts = join('', map { ",$_" } @parts);
    my $pathinfo = $path ? "file=$path," : '';

    return "${pathinfo}if=none,id=drive-$drive->{interface}$drive->{index}$opts";
}
1550
# Build the '-device' argument string for network device $netid.
#
# The 'virtio' model is mapped to 'virtio-net-pci'; every other model name
# is used as device name directly. With $use_old_bios_files set, a matching
# PXE ROM file is appended for the device names listed below.
sub print_netdevice_full {
    my ($vmid, $conf, $net, $netid, $bridges, $use_old_bios_files, $arch, $machine_type) = @_;

    my $device = $net->{model};
    if ($net->{model} eq 'virtio') {
        $device = 'virtio-net-pci';
    }

    my $pciaddr = print_pci_addr("$netid", $bridges, $arch, $machine_type);
    my $tmpstr = "$device,mac=$net->{macaddr},netdev=$netid$pciaddr,id=$netid";
    if ($net->{queues} && $net->{queues} > 1 && $net->{model} eq 'virtio'){
        #Consider we have N queues, the number of vectors needed is 2*N + 2 (plus one config interrupt and control vq)
        my $vectors = $net->{queues} * 2 + 2;
        $tmpstr .= ",vectors=$vectors,mq=on";
    }
    $tmpstr .= ",bootindex=$net->{bootindex}" if $net->{bootindex} ;

    if ($use_old_bios_files) {
        my $romfile;
        if ($device eq 'virtio-net-pci') {
            $romfile = 'pxe-virtio.rom';
        } elsif ($device eq 'e1000') {
            $romfile = 'pxe-e1000.rom';
        } elsif ($device eq 'ne2k') {
            $romfile = 'pxe-ne2k_pci.rom';
        } elsif ($device eq 'pcnet') {
            $romfile = 'pxe-pcnet.rom';
        } elsif ($device eq 'rtl8139') {
            $romfile = 'pxe-rtl8139.rom';
        }
        $tmpstr .= ",romfile=$romfile" if $romfile;
    }

    return $tmpstr;
}
1588
# Build the '-netdev' argument string for network device $netid ('net<N>').
#
# Devices with a bridge get a tap backend named 'tap<vmid>i<N>' using the
# pve-bridge scripts (the hotplug variant if $hotplug is set); all others get
# a user mode backend. Dies if $netid is not of the form 'net<N>', if N is
# not below $MAX_NETS, or if the interface name gets too long.
sub print_netdev_full {
    my ($vmid, $conf, $arch, $net, $netid, $hotplug) = @_;

    # reject anything that is not net<N> instead of silently continuing with
    # an empty index
    my ($i) = $netid =~ m/^net(\d+)$/;
    die "got strange net id '$netid'\n" if !defined($i);
    $i = int($i);

    die "got strange net id '$i'\n" if $i >= ${MAX_NETS};

    my $ifname = "tap${vmid}i$i";

    # kvm uses TUNSETIFF ioctl, and that limits ifname length
    die "interface name '$ifname' is too long (max 15 character)\n"
        if length($ifname) >= 16;

    my $vhostparam = '';
    if (is_native($arch)) {
        $vhostparam = ',vhost=on' if kernel_has_vhost_net() && $net->{model} eq 'virtio';
    }

    my $vmname = $conf->{name} || "vm$vmid";

    my $netdev = "";
    my $script = $hotplug ? "pve-bridge-hotplug" : "pve-bridge";

    if ($net->{bridge}) {
        $netdev = "type=tap,id=$netid,ifname=${ifname},script=/var/lib/qemu-server/$script,downscript=/var/lib/qemu-server/pve-bridgedown$vhostparam";
    } else {
        $netdev = "type=user,id=$netid,hostname=$vmname";
    }

    $netdev .= ",queues=$net->{queues}" if ($net->{queues} && $net->{model} eq 'virtio');

    return $netdev;
}
1e3baf05 1625
55655ebc
DC
# configured vga type => QEMU device name
my $vga_map = {
    'cirrus' => 'cirrus-vga',
    'std' => 'VGA',
    'vmware' => 'vmware-svga',
    'virtio' => 'virtio-vga',
};

# Build the '-device' argument string for a display adapter.
#
# $vga is the parsed vga option (type, memory). A true $qxlnum selects a qxl
# device: 'qxl-vga' for the primary display (no $id) and 'qxl' otherwise.
# $id is appended to the device id 'vga'. Dies if no device type can be
# determined for $vga->{type}.
sub print_vga_device {
    my ($conf, $vga, $arch, $machine_version, $machine, $id, $qxlnum, $bridges) = @_;

    my $type = $vga_map->{$vga->{type}};
    if ($arch eq 'aarch64' && defined($type) && $type eq 'virtio-vga') {
        $type = 'virtio-gpu';
    }
    my $vgamem_mb = $vga->{memory};

    my $max_outputs = '';
    if ($qxlnum) {
        $type = $id ? 'qxl' : 'qxl-vga';

        # both alternatives have to be anchored, hence the single group
        if (!$conf->{ostype} || $conf->{ostype} =~ m/^(?:l\d\d|other)$/) {
            # set max outputs so linux can have up to 4 qxl displays with one device
            if (min_version($machine_version, 4, 1)) {
                $max_outputs = ",max_outputs=4";
            }
        }
    }

    die "no devicetype for $vga->{type}\n" if !$type;

    my $memory = "";
    if ($vgamem_mb) {
        if ($vga->{type} eq 'virtio') {
            my $bytes = PVE::Tools::convert_size($vgamem_mb, "mb" => "b");
            $memory = ",max_hostmem=$bytes";
        } elsif ($qxlnum) {
            # from https://www.spice-space.org/multiple-monitors.html
            $memory = ",vgamem_mb=$vga->{memory}";
            my $ram = $vgamem_mb * 4;
            my $vram = $vgamem_mb * 2;
            $memory .= ",ram_size_mb=$ram,vram_size_mb=$vram";
        } else {
            $memory = ",vgamem_mb=$vga->{memory}";
        }
    } elsif ($qxlnum && $id) {
        $memory = ",ram_size=67108864,vram_size=33554432";
    }

    my $q35 = PVE::QemuServer::Machine::machine_type_is_q35($conf);
    my $vgaid = "vga" . ($id // '');
    my $pciaddr;

    if ($q35 && $vgaid eq 'vga') {
        # the first display uses pcie.0 bus on q35 machines
        $pciaddr = print_pcie_addr($vgaid, $bridges, $arch, $machine);
    } else {
        $pciaddr = print_pci_addr($vgaid, $bridges, $arch, $machine);
    }

    return "$type,id=${vgaid}${memory}${max_outputs}${pciaddr}";
}
1687
ffc0d8c7
WB
# Parse a ';' separated list of numbers and ranges ("0-3;5") into an array
# of [ first, last ] pairs; 'last' is undef for a single number.
# Dies on malformed parts and on ranges whose end is below their start.
sub parse_number_sets {
    my ($set) = @_;

    my @ranges;
    for my $part (split(/;/, $set)) {
        my ($first, $last) = $part =~ /^\s*(\d+)(?:-(\d+))?\s*$/
            or die "invalid range: $part\n";

        die "invalid range: $part ($last < $first)\n"
            if defined($last) && $last < $first;

        push @ranges, [ $first, $last ];
    }

    return \@ranges;
}
2ed5d572 1701
ffc0d8c7
WB
# Parse a 'numa[n]' property string. The 'cpus' and 'hostnodes' values, if
# present, are replaced by their parse_number_sets() representation.
sub parse_numa {
    my ($data) = @_;

    my $res = PVE::JSONSchema::parse_property_string($numa_fmt, $data);

    for my $key (qw(cpus hostnodes)) {
        next if !defined($res->{$key});
        $res->{$key} = parse_number_sets($res->{$key});
    }

    return $res;
}
1710
040b06b7
DA
# Parse a 'hostpci[n]' property string. The ';' separated 'host' ids are
# resolved through PVE::SysFSTools::lspci and collected in $res->{pciid};
# the 'host' key itself is removed. Returns undef for an empty value and
# dies if an id matches no PCI device.
sub parse_hostpci {
    my ($value) = @_;

    return undef if !$value;

    my $res = PVE::JSONSchema::parse_property_string($hostpci_fmt, $value);

    my $host_ids = delete $res->{host};
    for my $id (split(/;/, $host_ids)) {
        my $devs = PVE::SysFSTools::lspci($id);
        die "no PCI device found for '$id'\n" if !scalar(@$devs);
        push @{$res->{pciid}}, @$devs;
    }

    return $res;
}
1727
1e3baf05
DM
# netX: e1000=XX:XX:XX:XX:XX:XX,bridge=vmbr0,rate=<mbps>
#
# Parse a 'net[n]' property string. On a parse error the error is emitted as
# a warning and undef is returned. A missing MAC address is filled in with a
# random one using the mac_prefix from datacenter.cfg.
sub parse_net {
    my ($data) = @_;

    my $res = eval { PVE::JSONSchema::parse_property_string($net_fmt, $data) };
    if (my $err = $@) {
        warn $err;
        return undef;
    }

    $res->{macaddr} //= do {
        my $dc = PVE::Cluster::cfs_read_file('datacenter.cfg');
        PVE::Tools::random_ether_addr($dc->{mac_prefix});
    };

    return $res;
}
1743
# ipconfigX ip=cidr,gw=ip,ip6=cidr,gw6=ip
#
# Parse an 'ipconfig[n]' property string. Parse errors and inconsistent
# gateway settings are emitted as warnings and yield undef. If neither an
# IPv4 nor an IPv6 address is given, { ip => 'dhcp', ip6 => 'dhcp' } is
# returned.
sub parse_ipconfig {
    my ($data) = @_;

    my $res = eval { PVE::JSONSchema::parse_property_string($ipconfig_fmt, $data) };
    if ($@) {
        warn $@;
        return undef;
    }

    # the first inconsistency found is reported
    my $problem;
    if ($res->{gw} && !$res->{ip}) {
        $problem = 'gateway specified without specifying an IP address';
    } elsif ($res->{gw6} && !$res->{ip6}) {
        $problem = 'IPv6 gateway specified without specifying an IPv6 address';
    } elsif ($res->{gw} && $res->{ip} eq 'dhcp') {
        $problem = 'gateway specified together with DHCP';
    } elsif ($res->{gw6} && $res->{ip6} !~ /^$IPV6RE/) {
        # gw6 + auto/dhcp
        $problem = "IPv6 gateway specified together with $res->{ip6} address";
    }
    if (defined($problem)) {
        warn $problem;
        return undef;
    }

    if (!$res->{ip} && !$res->{ip6}) {
        return { ip => 'dhcp', ip6 => 'dhcp' };
    }

    return $res;
}
1778
# Serialize a parsed network device hash back into its property string.
sub print_net {
    my ($net) = @_;

    return PVE::JSONSchema::print_property_string($net, $net_fmt);
}
1784
# Re-serialize every parseable 'net<N>' entry of $settings in place, so that
# entries without a MAC address get the random one assigned by parse_net().
# Entries that fail to parse are left untouched.
sub add_random_macs {
    my ($settings) = @_;

    for my $opt (grep { m/^net(\d+)$/ } keys %$settings) {
        my $net = parse_net($settings->{$opt}) or next;
        $settings->{$opt} = print_net($net);
    }
}
1795
055d554d
DM
# Returns 1 if the storage layer reports $vmid as owner of volume $volid,
# undef otherwise. Values starting with '/' are never owned, and errors from
# the storage lookup are ignored.
sub vm_is_volid_owner {
    my ($storecfg, $vmid, $volid) = @_;

    return undef if $volid =~ m|^/|;

    my ($path, $owner);
    eval { ($path, $owner) = PVE::Storage::path($storecfg, $volid); };

    return 1 if $owner && ($owner == $vmid);

    return undef;
}
1809
055d554d
DM
# Called for a drive that is no longer referenced by the VM config:
# cloud-init drives are freed right away (failures only warn), CD-ROM drives
# are ignored and any other volume owned by the VM is added to $conf as
# unused volume.
sub vmconfig_register_unused_drive {
    my ($storecfg, $vmid, $conf, $drive) = @_;

    if (drive_is_cloudinit($drive)) {
        eval { PVE::Storage::vdisk_free($storecfg, $drive->{file}) };
        warn $@ if $@;
    } elsif (!drive_is_cdrom($drive)) {
        my $volid = $drive->{file};
        PVE::QemuConfig->add_unused_volume($conf, $volid, $vmid)
            if vm_is_volid_owner($storecfg, $vmid, $volid);
    }
}
1823
# smbios: [manufacturer=str][,product=str][,version=str][,serial=str][,uuid=uuid][,sku=str][,family=str][,base64=bool]
my $smbios1_fmt = {
    uuid => {
        type => 'string',
        pattern => '[a-fA-F0-9]{8}(?:-[a-fA-F0-9]{4}){3}-[a-fA-F0-9]{12}',
        format_description => 'UUID',
        description => "Set SMBIOS1 UUID.",
        optional => 1,
    },
    # all text fields share one schema and differ only in their description
    (map {
        my ($field, $description) = @$_;
        ($field => +{
            type => 'string',
            pattern => '[A-Za-z0-9+\/]+={0,2}',
            format_description => 'Base64 encoded string',
            description => $description,
            optional => 1,
        });
    } (
        [ version => "Set SMBIOS1 version." ],
        [ serial => "Set SMBIOS1 serial number." ],
        [ manufacturer => "Set SMBIOS1 manufacturer." ],
        [ product => "Set SMBIOS1 product ID." ],
        [ sku => "Set SMBIOS1 SKU string." ],
        [ family => "Set SMBIOS1 family string." ],
    )),
    base64 => {
        type => 'boolean',
        description => 'Flag to indicate that the SMBIOS values are base64 encoded',
        optional => 1,
    },
};
1881
2796e7d5
DM
# Parse an 'smbios1' property string according to $smbios1_fmt.
# Parse errors are turned into a warning; undef is returned in that case.
sub parse_smbios1 {
    my ($data) = @_;

    my $parsed = eval { PVE::JSONSchema::parse_property_string($smbios1_fmt, $data) };
    if (my $err = $@) {
        warn $err;
    }

    return $parsed;
}
1889
cd11416f
DM
# Serialize a parsed smbios1 hash back into its property-string form
# (counterpart of parse_smbios1).
sub print_smbios1 {
    my ($smbios1) = @_;

    my $property_string = PVE::JSONSchema::print_property_string($smbios1, $smbios1_fmt);
    return $property_string;
}
1894
ff6ffe20 1895PVE::JSONSchema::register_format('pve-qm-smbios1', $smbios1_fmt);
2796e7d5 1896
0ea9541d
DM
# Parse a 'watchdog' property string according to $watchdog_fmt.
# Returns undef for an empty/false value. Parse errors are turned into a
# warning and also yield undef.
sub parse_watchdog {
    my ($value) = @_;

    return undef if !$value;

    my $parsed = eval { PVE::JSONSchema::parse_property_string($watchdog_fmt, $value) };
    if (my $err = $@) {
        warn $err;
    }

    return $parsed;
}
1906
9d66b397
SI
# Parse the 'agent' property of a VM configuration.
#
# Note that the argument is the hash containing the 'agent' key, not the
# property string itself. Returns an empty hash if no agent is configured,
# if parsing failed (a warning is emitted) or if the agent is not enabled.
sub parse_guest_agent {
    my ($value) = @_;

    my $agent = $value->{agent};
    return {} if !defined($agent);

    my $res = eval { PVE::JSONSchema::parse_property_string($agent_fmt, $agent) };
    warn $@ if $@;

    # if the agent is disabled ignore the other potentially set properties
    return $res->{enabled} ? $res : {};
}
1919
55655ebc
DC
# Parse a 'vga' property string according to $vga_fmt.
# Returns an empty hash for an empty/false value. Parse errors are turned
# into a warning and yield undef.
sub parse_vga {
    my ($value) = @_;

    return {} if !$value;

    my $parsed = eval { PVE::JSONSchema::parse_property_string($vga_fmt, $value) };
    if (my $err = $@) {
        warn $err;
    }

    return $parsed;
}
1928
2cf61f33
SR
# Parse an 'rng' property string according to $rng_fmt.
# Returns undef for an empty/false value. Parse errors are turned into a
# warning and also yield undef.
sub parse_rng {
    my ($value) = @_;

    return undef if !$value;

    my $parsed = eval { PVE::JSONSchema::parse_property_string($rng_fmt, $value) };
    if (my $err = $@) {
        warn $err;
    }

    return $parsed;
}
1938
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-usb-device', \&verify_usb_device);
# Format verifier for 'pve-qm-usb-device'.
# Returns $value if parse_usb_device() accepts it. Otherwise returns undef
# when $noerr is set, or dies.
sub verify_usb_device {
    my ($value, $noerr) = @_;

    if (!parse_usb_device($value)) {
        return undef if $noerr;
        die "unable to parse usb device\n";
    }

    return $value;
}
1949
1e3baf05
DM
# add JSON properties for create and set function
#
# Copies all entries of $confdesc into $prop (modified in place and returned),
# except for 'parent', 'snaptime', 'vmstate' and 'runningmachine'.
sub json_config_properties {
    my ($prop) = @_;

    my %skip = map { $_ => 1 } qw(parent snaptime vmstate runningmachine);

    for my $opt (grep { !$skip{$_} } keys %$confdesc) {
        $prop->{$opt} = $confdesc->{$opt};
    }

    return $prop;
}
1961
d41121fd
DM
# return copy of $confdesc_cloudinit to generate documentation
# (a deep copy, so callers cannot modify the original schema)
sub cloudinit_config_properties {
    my $copy = dclone($confdesc_cloudinit);
    return $copy;
}
1967
1e3baf05
DM
# Validate (and normalize) a single configuration value against $confdesc.
#
# Dies if $key is unknown, if $value is undefined or contains a CR/LF, or if
# the value does not match the type declared for $key. Returns:
#   boolean - 1 or 0 (accepts 1/on/yes/true and 0/off/no/false)
#   integer - the numeric value (unsigned decimal digits only)
#   number  - the value as given (unsigned, optional fractional part)
#   string  - the value as given if a 'format' is declared (after the format
#             check), otherwise the value with one pair of enclosing double
#             quotes stripped
sub check_type {
    my ($key, $value) = @_;

    my $desc = $confdesc->{$key};
    die "unknown setting '$key'\n" if !$desc;

    my $type = $desc->{type};

    die "got undefined value\n" if !defined($value);
    die "property contains a line feed\n" if $value =~ m/[\n\r]/;

    if ($type eq 'boolean') {
        return 1 if ($value eq '1') || ($value =~ m/^(on|yes|true)$/i);
        return 0 if ($value eq '0') || ($value =~ m/^(off|no|false)$/i);
        die "type check ('boolean') failed - got '$value'\n";
    }

    if ($type eq 'integer') {
        return int($1) if $value =~ m/^(\d+)$/;
        die "type check ('integer') failed - got '$value'\n";
    }

    if ($type eq 'number') {
        return $value if $value =~ m/^(\d+)(\.\d+)?$/;
        die "type check ('number') failed - got '$value'\n";
    }

    if ($type eq 'string') {
        if (my $fmt = $desc->{format}) {
            PVE::JSONSchema::check_format($fmt, $value);
            return $value;
        }
        $value =~ s/^\"(.*)\"$/$1/;
        return $value;
    }

    die "internal error"
}
2004
# Remove all disks of a VM and then either delete its configuration or
# replace it with $replacement_conf (if defined).
#
# - the config lock is checked unless $skiplock is set
# - for templates, dies if a base volume is still used by a linked clone
# - only volumes owned by $vmid are freed; failures to free a volume only
#   produce a warning
sub destroy_vm {
    my ($storecfg, $vmid, $skiplock, $replacement_conf) = @_;

    my $conf = PVE::QemuConfig->load_config($vmid);

    PVE::QemuConfig->check_lock($conf) unless $skiplock;

    if ($conf->{template}) {
        # check if any base image is still used by a linked clone
        my $assert_base_unused = sub {
            my ($ds, $drive) = @_;
            return if drive_is_cdrom($drive);

            my $volid = $drive->{file};
            return if !$volid || $volid =~ m|^/|;

            die "base volume '$volid' is still in use by linked cloned\n"
                if PVE::Storage::volume_is_base_and_used($storecfg, $volid);
        };
        foreach_drive($conf, $assert_base_unused);
    }

    # only remove disks owned by this VM
    my $free_owned_volume = sub {
        my ($ds, $drive) = @_;
        return if drive_is_cdrom($drive, 1);

        my $volid = $drive->{file};
        return if !$volid || $volid =~ m|^/|;

        my ($path, $owner) = PVE::Storage::path($storecfg, $volid);
        return if !$path || !$owner || ($owner != $vmid);

        eval { PVE::Storage::vdisk_free($storecfg, $volid) };
        warn "Could not remove disk '$volid', check manually: $@" if $@;
    };
    foreach_drive($conf, $free_owned_volume);

    # also remove unused disk
    my $vmdisks = PVE::Storage::vdisk_list($storecfg, undef, $vmid);
    PVE::Storage::foreach_volid($vmdisks, sub {
        my ($volid, $sid, $volname, $d) = @_;
        eval { PVE::Storage::vdisk_free($storecfg, $volid) };
        warn $@ if $@;
    });

    if (defined $replacement_conf) {
        PVE::QemuConfig->write_config($vmid, $replacement_conf);
    } else {
        PVE::QemuConfig->destroy_config($vmid);
    }
}
2056
1e3baf05
DM
# Parse the raw content of a VM configuration file.
#
# $filename must end in '/qemu-server/<vmid>.conf' (dies otherwise); it is only
# used to derive the VMID. Returns undef if $raw is undefined, otherwise a hash
# containing the top-level settings plus:
#   digest    - SHA1 hex digest of $raw
#   pending   - settings from the [PENDING] section
#   snapshots - one hash per [<snapshot name>] section
#
# Lines starting with '#' and 'description:' lines are collected into the
# 'description' of the section they belong to. Values that fail check_type()
# or drive parsing are skipped with a warning instead of aborting the parse.
sub parse_vm_config {
    my ($filename, $raw) = @_;

    return undef if !defined($raw);

    my $res = {
        digest => Digest::SHA::sha1_hex($raw),
        snapshots => {},
        pending => {},
    };

    $filename =~ m|/qemu-server/(\d+)\.conf$|
        || die "got strange filename '$filename'";

    my $vmid = $1;

    my $conf = $res; # hash of the section currently being filled
    my $descr;
    my $section = '';

    # store the description collected so far in the current section; must be
    # called before $conf is switched to a new section
    my $finish_description = sub {
        if (defined($descr)) {
            $descr =~ s/\s+$//;
            $conf->{description} = $descr;
        }
        $descr = undef;
    };

    my @lines = split(/\n/, $raw);
    foreach my $line (@lines) {
        next if $line =~ m/^\s*$/;

        if ($line =~ m/^\[PENDING\]\s*$/i) {
            $section = 'pending';
            $finish_description->();
            $conf = $res->{$section} = {};
            next;
        } elsif ($line =~ m/^\[([a-z][a-z0-9_\-]+)\]\s*$/i) {
            $section = $1;
            $finish_description->();
            $conf = $res->{snapshots}->{$section} = {};
            next;
        }

        if ($line =~ m/^\#(.*)\s*$/) {
            $descr = '' if !defined($descr);
            $descr .= PVE::Tools::decode_text($1) . "\n";
            next;
        }

        if ($line =~ m/^(description):\s*(.*\S)\s*$/) {
            $descr = '' if !defined($descr);
            $descr .= PVE::Tools::decode_text($2);
        } elsif ($line =~ m/^snapstate:\s*(prepare|delete)\s*$/) {
            # anchored at the start of the line, so that other settings whose
            # value merely ends in 'snapstate: ...' (e.g. 'args') are not
            # mistaken for a snapstate entry
            $conf->{snapstate} = $1;
        } elsif ($line =~ m/^(args):\s*(.*\S)\s*$/) {
            my $key = $1;
            my $value = $2;
            $conf->{$key} = $value;
        } elsif ($line =~ m/^delete:\s*(.*\S)\s*$/) {
            my $value = $1;
            if ($section eq 'pending') {
                $conf->{delete} = $value; # we parse this later
            } else {
                warn "vm $vmid - propertry 'delete' is only allowed in [PENDING]\n";
            }
        } elsif ($line =~ m/^([a-z][a-z_]*\d*):\s*(.+?)\s*$/) {
            my $key = $1;
            my $value = $2;
            eval { $value = check_type($key, $value); };
            if ($@) {
                warn "vm $vmid - unable to parse value of '$key' - $@";
            } else {
                # legacy alias: 'cdrom' is stored as 'ide2'
                $key = 'ide2' if $key eq 'cdrom';
                my $fmt = $confdesc->{$key}->{format};
                if ($fmt && $fmt =~ /^pve-qm-(?:ide|scsi|virtio|sata)$/) {
                    my $v = parse_drive($key, $value);
                    if (my $volid = filename_to_volume_id($vmid, $v->{file}, $v->{media})) {
                        $v->{file} = $volid;
                        $value = print_drive($v);
                    } else {
                        warn "vm $vmid - unable to parse value of '$key'\n";
                        next;
                    }
                }

                $conf->{$key} = $value;
            }
        }
    }

    # description of the last section
    $finish_description->();

    delete $res->{snapstate}; # just to be sure

    return $res;
}
2157
1858638f
DM
# Generate the raw file content for a VM configuration.
#
# $filename is not used. $conf is normalized in place before serialization:
#   - 'snapstate' is dropped from the top level
#   - the legacy 'cdrom' option is moved to 'ide2' (dies if both are set)
#   - the legacy 'smp' option is converted to 'sockets'
#   - all values are validated via check_type() (dies on invalid values)
#   - 'unusedN' entries referring to a volume that is used by a drive of the
#     current or pending configuration are removed
#
# Returns the raw text: top-level section, then [PENDING] (if not empty), then
# one section per snapshot, sorted by name.
sub write_vm_config {
    my ($filename, $conf) = @_;

    delete $conf->{snapstate}; # just to be sure

    if (my $cdrom = $conf->{cdrom}) {
        die "option ide2 conflicts with cdrom\n" if $conf->{ide2};
        $conf->{ide2} = $cdrom;
        delete $conf->{cdrom};
    }

    # we do not use 'smp' any longer
    if ($conf->{sockets}) {
        delete $conf->{smp};
    } elsif (my $smp = $conf->{smp}) {
        $conf->{sockets} = $smp;
        delete $conf->{cores};
        delete $conf->{smp};
    }

    my $used_volids = {};

    # keys that are structural and therefore not validated as settings
    my %structural = map { $_ => 1 } qw(digest description snapshots snapstate pending);

    my $cleanup_config = sub {
        my ($cref, $pending, $snapname) = @_;

        foreach my $key (keys %$cref) {
            next if $structural{$key};

            if ($key eq 'delete') {
                die "propertry 'delete' is only allowed in [PENDING]\n"
                    if !$pending;
                # fixme: check syntax?
                next;
            }

            my $value = $cref->{$key};
            eval { $value = check_type($key, $value); };
            die "unable to parse value of '$key' - $@" if $@;

            $cref->{$key} = $value;

            # volumes referenced by snapshots do not count as used
            next if $snapname || !is_valid_drivename($key);

            my $drive = parse_drive($key, $value);
            $used_volids->{$drive->{file}} = 1 if $drive && $drive->{file};
        }
    };

    $cleanup_config->($conf);

    $cleanup_config->($conf->{pending}, 1);

    foreach my $snapname (keys %{$conf->{snapshots}}) {
        die "internal error: snapshot name '$snapname' is forbidden" if lc($snapname) eq 'pending';
        $cleanup_config->($conf->{snapshots}->{$snapname}, undef, $snapname);
    }

    # remove 'unusedX' settings if we re-add a volume
    foreach my $key (keys %$conf) {
        delete $conf->{$key}
            if $key =~ m/^unused/ && $used_volids->{ $conf->{$key} };
    }

    my $generate_raw_config = sub {
        my ($cref, $pending) = @_;

        my $text = '';

        # add description as comment to top of file
        if (defined(my $descr = $cref->{description})) {
            if ($descr) {
                foreach my $cl (split(/\n/, $descr)) {
                    $text .= '#' . PVE::Tools::encode_text($cl) . "\n";
                }
            } else {
                # an empty description is only written to the pending section
                $text .= "#\n" if $pending;
            }
        }

        foreach my $key (sort keys %$cref) {
            next if $key eq 'digest' || $key eq 'description' || $key eq 'pending' || $key eq 'snapshots';
            $text .= "$key: $cref->{$key}\n";
        }

        return $text;
    };

    my $raw = $generate_raw_config->($conf);

    if (scalar(keys %{$conf->{pending}})){
        $raw .= "\n[PENDING]\n";
        $raw .= $generate_raw_config->($conf->{pending}, 1);
    }

    foreach my $snapname (sort keys %{$conf->{snapshots}}) {
        $raw .= "\n[$snapname]\n";
        $raw .= $generate_raw_config->($conf->{snapshots}->{$snapname});
    }

    return $raw;
}
1e3baf05 2259
# Return a hash with the default value of every option in $confdesc that
# declares one (we use static defaults from our JSON schema configuration).
sub load_defaults {
    my $res = {};

    foreach my $key (keys %$confdesc) {
        my $default = $confdesc->{$key}->{default};
        $res->{$key} = $default if defined($default);
    }

    return $res;
}
2273
# List the qemu guests located on the local node according to the cluster
# wide VM list. Returns a hash of the form { <vmid> => { exists => 1 } },
# which is empty if no VM list is available.
sub config_list {
    my $vmlist = PVE::Cluster::get_vmlist();
    my $res = {};
    return $res if !$vmlist || !$vmlist->{ids};

    my $ids = $vmlist->{ids};
    my $nodename = nodename();

    for my $vmid (keys %$ids) {
        my $d = $ids->{$vmid};
        my $is_local = $d->{node} && $d->{node} eq $nodename;
        my $is_qemu = $d->{type} && $d->{type} eq 'qemu';
        $res->{$vmid}->{exists} = 1 if $is_local && $is_qemu;
    }

    return $res;
}
2289
64e13401
DM
# test if VM uses local resources (to prevent migration)
#
# Returns a reference to the list of config keys considered local resources.
# Dies if that list is not empty, unless $noerr is set.
sub check_local_resources {
    my ($conf, $noerr) = @_;

    # 'hostusb' and 'hostpci' without index are the old syntax
    my @loc_res = grep { $conf->{$_} } qw(hostusb hostpci ivshmem);

    foreach my $key (keys %$conf) {
        my $value = $conf->{$key};

        # usb devices redirected via spice are not bound to this host
        next if $key =~ m/^usb/ && ($value =~ m/^spice(?![^,])/);
        # sockets are safe: they will be recreated on the target side post-migrate
        next if $key =~ m/^serial/ && ($value eq 'socket');

        push @loc_res, $key if $key =~ m/^(usb|hostpci|serial|parallel)\d+$/;
    }

    die "VM uses local resources\n" if scalar @loc_res && !$noerr;

    return \@loc_res;
}
2312
# check if used storages are available on all nodes (used by migrate)
#
# For every drive that references a storage volume, storage_check_node() is
# called for the local node and for $node.
# NOTE(review): presumably storage_check_node() dies if the storage is not
# usable on the given node - confirm in PVE::Storage.
sub check_storage_availability {
    my ($storecfg, $conf, $node) = @_;

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file} or return;

        my ($sid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        # check if storage is available on both nodes
        PVE::Storage::storage_check_node($storecfg, $sid);
        PVE::Storage::storage_check_node($storecfg, $sid, $node);
    });
}
2331
719893a9
DM
# list nodes where all VM images are available (used by has_feature API)
#
# Starts with all cluster nodes and narrows the set down for every drive that
# references a storage volume:
#   - disabled storage: no node remains
#   - storage restricted to certain nodes: only those nodes remain
#   - storage that is not shared: only the local node remains
# Returns a hash { <nodename> => 1 }.
sub shared_nodes {
    my ($conf, $storecfg) = @_;

    my $nodelist = PVE::Cluster::get_nodelist();
    my $nodehash = { map { $_ => 1 } @$nodelist };
    my $nodename = nodename();

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($storeid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
        if ($scfg->{disable}) {
            $nodehash = {};
        } elsif (my $avail = $scfg->{nodes}) {
            delete @$nodehash{ grep { !$avail->{$_} } keys %$nodehash };
        } elsif (!$scfg->{shared}) {
            delete @$nodehash{ grep { $_ ne $nodename } keys %$nodehash };
        }
    });

    return $nodehash
}
2365
f25852c2
TM
# Determine, for every cluster node, which storages used by the drives of
# $conf are not available there (storage disabled, or restricted to other
# nodes).
#
# Returns a hash { <nodename> => {} }; nodes with unavailable storages get
# an additional 'unavailable_storages' key holding the sorted list of storage
# IDs.
sub check_local_storage_availability {
    my ($conf, $storecfg) = @_;

    my $nodelist = PVE::Cluster::get_nodelist();
    my $nodehash = { map { $_ => {} } @$nodelist };

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($storeid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        my $scfg = PVE::Storage::storage_config($storecfg, $storeid);

        my @affected_nodes;
        if ($scfg->{disable}) {
            @affected_nodes = keys %$nodehash;
        } elsif (my $avail = $scfg->{nodes}) {
            @affected_nodes = grep { !$avail->{$_} } keys %$nodehash;
        }

        foreach my $node (@affected_nodes) {
            $nodehash->{$node}->{unavailable_storages}->{$storeid} = 1;
        }
    });

    # convert the collected storage ID sets into sorted lists
    foreach my $node (values %$nodehash) {
        my $unavail = $node->{unavailable_storages} or next;
        $node->{unavailable_storages} = [ sort keys %$unavail ];
    }

    return $nodehash
}
2404
# Compat only, use assert_config_exists_on_node and vm_running_locally where possible
#
# Unless $nocheck is set, first asserts that the config of $vmid exists on
# $node. Returns the result of vm_running_locally($vmid).
sub check_running {
    my ($vmid, $nocheck, $node) = @_;

    if (!$nocheck) {
        PVE::QemuConfig::assert_config_exists_on_node($vmid, $node);
    }

    return PVE::QemuServer::Helpers::vm_running_locally($vmid);
}
2412
# Return the list of local VMs (see config_list) and add the 'pid' of every VM
# that has a pid file in the runtime directory and is reported as running by
# check_running(). If the runtime directory cannot be opened, the plain list
# is returned.
sub vzlist {
    my $vzlist = config_list();

    my $fd = IO::Dir->new($PVE::QemuServer::Helpers::var_run_tmpdir) || return $vzlist;

    while (defined(my $de = $fd->read)) {
        my ($vmid) = $de =~ m/^(\d+)\.pid$/ or next;

        # ignore pid files of VMs we do not know about
        next if !defined($vzlist->{$vmid});

        my $pid = check_running($vmid);
        $vzlist->{$vmid}->{pid} = $pid if $pid;
    }

    return $vzlist;
}
2430
b1a70cab
DM
# JSON schema describing the properties of a single vmstatus() entry.
# Only 'vmid' and 'status' are mandatory.
our $vmstatus_return_properties = {
    vmid => get_standard_option('pve-vmid'),
    status => {
        description => "Qemu process status.",
        type => 'string',
        enum => ['stopped', 'running'],
    },

    # static information taken from the configuration
    name => {
        description => "VM name.",
        type => 'string',
        optional => 1,
    },
    maxmem => {
        description => "Maximum memory in bytes.",
        type => 'integer',
        optional => 1,
        renderer => 'bytes',
    },
    maxdisk => {
        description => "Root disk size in bytes.",
        type => 'integer',
        optional => 1,
        renderer => 'bytes',
    },
    cpus => {
        description => "Maximum usable CPUs.",
        type => 'number',
        optional => 1,
    },
    lock => {
        description => "The current config lock, if any.",
        type => 'string',
        optional => 1,
    },
    tags => {
        description => "The current configured tags, if any",
        type => 'string',
        optional => 1,
    },

    # runtime information
    qmpstatus => {
        description => "Qemu QMP agent status.",
        type => 'string',
        optional => 1,
    },
    pid => {
        description => "PID of running qemu process.",
        type => 'integer',
        optional => 1,
    },
    uptime => {
        description => "Uptime.",
        type => 'integer',
        optional => 1,
        renderer => 'duration',
    },
};
2487
1e3baf05
DM
2488my $last_proc_pid_stat;
2489
03a33f30
DM
# get VM status information
# This must be fast and should not block ($full == false)
# We only query KVM using QMP if $full == true (this can be slow)
#
# Returns a hash { <vmid> => <status hash> } for all local VMs, or only for
# $opt_vmid if given. CPU usage is computed relative to the values remembered
# in $last_proc_pid_stat from a previous call, so the first call for a process
# reports a cpu usage of 0.
sub vmstatus {
    my ($opt_vmid, $full) = @_;

    my $res = {};

    my $storecfg = PVE::Storage::config();

    my $list = vzlist();
    my $defaults = load_defaults();

    my ($uptime) = PVE::ProcFSTools::read_proc_uptime(1);

    my $cpucount = $cpuinfo->{cpus} || 1;

    # step 1: static information from the configuration
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);

        my $conf = PVE::QemuConfig->load_config($vmid);
        my $pid = $list->{$vmid}->{pid};

        my $d = { vmid => $vmid };
        $d->{pid} = $pid;

        # fixme: better status?
        $d->{status} = $pid ? 'running' : 'stopped';

        my $size = PVE::QemuServer::Drive::bootdisk_size($storecfg, $conf);
        $d->{disk} = 0; # no info available
        $d->{maxdisk} = $size // 0;

        my $cpus = ($conf->{sockets} || $defaults->{sockets})
            * ($conf->{cores} || $defaults->{cores});
        $cpus = $cpucount if $cpus > $cpucount;
        $cpus = $conf->{vcpus} if $conf->{vcpus};
        $d->{cpus} = $cpus;

        $d->{name} = $conf->{name} || "VM $vmid";
        $d->{maxmem} = ($conf->{memory} || $defaults->{memory}) * (1024*1024);

        if ($conf->{balloon}) {
            $d->{balloon_min} = $conf->{balloon}*(1024*1024);
            $d->{shares} = $conf->{shares} // $defaults->{shares};
        }

        # runtime values, filled in below for running VMs
        $d->{$_} = 0 for qw(uptime cpu mem netout netin diskread diskwrite);

        $d->{template} = PVE::QemuConfig->is_template($conf);

        $d->{serial} = 1 if conf_has_serial($conf);
        $d->{lock} = $conf->{lock} if $conf->{lock};
        $d->{tags} = $conf->{tags} if defined($conf->{tags});

        $res->{$vmid} = $d;
    }

    # step 2: network traffic, accounted via the tap devices of each VM
    my $netdev = PVE::ProcFSTools::read_proc_net_dev();
    foreach my $dev (keys %$netdev) {
        next if $dev !~ m/^tap([1-9]\d*)i/;
        my $vmid = $1;
        my $d = $res->{$vmid};
        next if !$d;

        # note: what the host receives on the tap device is what the VM sent
        my $stats = $netdev->{$dev};
        $d->{netout} += $stats->{receive};
        $d->{netin} += $stats->{transmit};

        if ($full) {
            $d->{nics}->{$dev}->{netout} = $stats->{receive};
            $d->{nics}->{$dev}->{netin} = $stats->{transmit};
        }
    }

    # step 3: uptime, memory and cpu usage from /proc
    my $ctime = gettimeofday;

    foreach my $vmid (keys %$list) {
        my $d = $res->{$vmid};
        my $pid = $d->{pid};
        next if !$pid;

        my $pstat = PVE::ProcFSTools::read_proc_pid_stat($pid);
        next if !$pstat; # not running

        my $used = $pstat->{utime} + $pstat->{stime};

        $d->{uptime} = int(($uptime - $pstat->{starttime})/$cpuinfo->{user_hz});

        if ($pstat->{vsize}) {
            $d->{mem} = int(($pstat->{rss}/$pstat->{vsize})*$d->{maxmem});
        }

        my $old = $last_proc_pid_stat->{$pid};
        if (!$old) {
            # first sample for this process, no usage can be computed yet
            $last_proc_pid_stat->{$pid} = {
                time => $ctime,
                used => $used,
                cpu => 0,
            };
            next;
        }

        my $dtime = ($ctime - $old->{time}) * $cpucount * $cpuinfo->{user_hz};

        if ($dtime > 1000) {
            my $dutime = $used - $old->{used};

            $d->{cpu} = (($dutime/$dtime)* $cpucount) / $d->{cpus};
            $last_proc_pid_stat->{$pid} = {
                time => $ctime,
                used => $used,
                cpu => $d->{cpu},
            };
        } else {
            # interval too short, reuse the previously computed value
            $d->{cpu} = $old->{cpu};
        }
    }

    return $res if !$full;

    # step 4 ($full only): query the running VMs via QMP
    my $qmpclient = PVE::QMPClient->new();

    my $ballooncb = sub {
        my ($vmid, $resp) = @_;

        my $info = $resp->{'return'};
        return if !$info->{max_mem};

        my $d = $res->{$vmid};

        # use memory assigned to VM
        $d->{maxmem} = $info->{max_mem};
        $d->{balloon} = $info->{actual};

        if (defined($info->{total_mem}) && defined($info->{free_mem})) {
            $d->{mem} = $info->{total_mem} - $info->{free_mem};
            $d->{freemem} = $info->{free_mem};
        }

        $d->{ballooninfo} = $info;
    };

    my $blockstatscb = sub {
        my ($vmid, $resp) = @_;
        my $data = $resp->{'return'} || [];
        my $totalrdbytes = 0;
        my $totalwrbytes = 0;

        for my $blockstat (@$data) {
            my $stats = $blockstat->{stats};
            $totalrdbytes += $stats->{rd_bytes};
            $totalwrbytes += $stats->{wr_bytes};

            $blockstat->{device} =~ s/drive-//;
            $res->{$vmid}->{blockstat}->{$blockstat->{device}} = $stats;
        }
        $res->{$vmid}->{diskread} = $totalrdbytes;
        $res->{$vmid}->{diskwrite} = $totalwrbytes;
    };

    my $statuscb = sub {
        my ($vmid, $resp) = @_;

        $qmpclient->queue_cmd($vmid, $blockstatscb, 'query-blockstats');
        # this fails if balloon driver is not loaded, so this must be
        # the last command (following commands are aborted if this fails).
        $qmpclient->queue_cmd($vmid, $ballooncb, 'query-balloon');

        my $status = $resp->{'return'}->{status};
        if (!defined($status)) {
            warn "unable to get VM status\n";
            return;
        }

        $res->{$vmid}->{qmpstatus} = $status;
    };

    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        next if !$res->{$vmid}->{pid}; # not running
        $qmpclient->queue_cmd($vmid, $statuscb, 'query-status');
    }

    $qmpclient->queue_execute(undef, 2);

    # fall back to the process status if QMP provided no status
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        my $d = $res->{$vmid};
        $d->{qmpstatus} = $d->{status} if !$d->{qmpstatus};
    }

    return $res;
}
2696
8107b378
DC
# Returns 1 if any 'serialN' option (N below $MAX_SERIAL_PORTS) is set in
# $conf, 0 otherwise.
sub conf_has_serial {
    my ($conf) = @_;

    foreach my $i (0 .. $MAX_SERIAL_PORTS - 1) {
        return 1 if $conf->{"serial$i"};
    }

    return 0;
}
2708
d5535a00
TL
# Describe the audio device 'audio$id' ($id defaults to 0) of $conf.
#
# Returns undef if no such device is configured, otherwise a hash with the
# device model ('dev'), its ID ('dev_id'), the backend driver ('backend',
# 'spice' if not configured) and the backend ID ('backend_id').
# Unlike the parse_* helpers, parse errors are not caught here.
sub conf_has_audio {
    my ($conf, $id) = @_;

    $id //= 0;

    my $audio = $conf->{"audio$id"};
    return undef if !defined($audio);

    my $props = PVE::JSONSchema::parse_property_string($audio_fmt, $audio);
    my $driver = $props->{driver} // 'spice';

    my $info = {
        dev => $props->{device},
        dev_id => "audiodev$id",
        backend => $driver,
        backend_id => "$driver-backend${id}",
    };

    return $info;
}
2726
86b8228b
DM
# Check whether the 'vga' property string selects a qxl display.
#
# Returns 0 if the type is not 'qxl', 'qxl2', 'qxl3' or 'qxl4'. Otherwise
# returns the digit following 'qxl', or 1 for plain 'qxl'.
sub vga_conf_has_spice {
    my ($vga) = @_;

    my $vgaconf = parse_vga($vga);
    my $vgatype = $vgaconf->{type};
    return 0 if !$vgatype;

    if ($vgatype =~ m/^qxl([234])?$/) {
        return $1 || 1;
    }

    return 0;
}
2736
d731ecbe
WB
# Returns true if $arch is the architecture of the host.
sub is_native($) {
    my ($arch) = @_;

    my $host_arch = get_host_arch();
    return $host_arch eq $arch;
}
2741
045749f2
TL
# Returns the architecture configured for the VM, falling back to the host
# architecture if 'arch' is not defined in $conf.
sub get_vm_arch {
    my ($conf) = @_;

    my $arch = $conf->{arch};
    return defined($arch) ? $arch : get_host_arch();
}
2746
d731ecbe
WB
# default machine type per architecture
my $default_machines = {
    x86_64 => 'pc',
    aarch64 => 'virt',
};

# Determine the machine type of a VM.
#
# $forcemachine takes precedence over the 'machine' setting in $conf. If
# neither is set, the default machine for $arch ('x86_64' if undefined) is
# used. With $add_pve_version set, unversioned types (none, 'pc', 'q35',
# 'virt') get '+pve<N>' appended, where N is determined from $kvmversion (the
# installed version if undefined); version-pinned machines lacking a
# '+pve<N>' suffix get '+pve0'.
sub get_vm_machine {
    my ($conf, $forcemachine, $arch, $add_pve_version, $kvmversion) = @_;

    my $machine = $forcemachine || $conf->{machine};

    my $is_unversioned = !$machine || $machine =~ m/^(?:pc|q35|virt)$/;
    if ($is_unversioned) {
        $arch //= 'x86_64';
        $machine ||= $default_machines->{$arch};

        if ($add_pve_version) {
            $kvmversion //= kvm_user_version();
            my $pvever = PVE::QemuServer::Machine::get_pve_version($kvmversion);
            $machine .= "+pve$pvever";
        }
    }

    # for version-pinned machines that do not include a pve-version (e.g.
    # pc-q35-4.1), we assume 0 to keep them stable in case we bump
    $machine .= '+pve0' if $add_pve_version && $machine !~ m/\+pve\d+$/;

    return $machine;
}
2775
96ed3574
WB
# Returns the list of OVMF image files registered in $OVMF for $arch.
# Dies if no images are known for the architecture.
sub get_ovmf_files($) {
    my ($arch) = @_;

    my $ovmf = $OVMF->{$arch};
    die "no OVMF images known for architecture '$arch'\n" if !$ovmf;

    return @$ovmf;
}
2784
6908fd9b
WB
# emulator binary per guest architecture (used for non-native guests)
my $Arch2Qemu = {
    aarch64 => '/usr/bin/qemu-system-aarch64',
    x86_64 => '/usr/bin/qemu-system-x86_64',
};

# Returns the QEMU binary to use for a guest of architecture $arch:
# '/usr/bin/kvm' for the host architecture, otherwise the matching emulator
# from $Arch2Qemu. Dies if the architecture is unknown.
sub get_command_for_arch($) {
    my ($arch) = @_;

    return '/usr/bin/kvm' if is_native($arch);

    my $cmd = $Arch2Qemu->{$arch};
    die "don't know how to emulate architecture '$arch'\n" if !$cmd;

    return $cmd;
}
2797
05a4c550
SR
# To use query_supported_cpu_flags and query_understood_cpu_flags to get flags
# to use in a QEMU command line (-cpu element), first array_intersect the result
# of query_supported_ with query_understood_. This is necessary because:
#
# a) query_understood_ returns flags the host cannot use and
# b) query_supported_ (rather the QMP call) doesn't actually return CPU
#    flags, but CPU settings - with most of them being flags. Those settings
#    (and some flags, curiously) cannot be specified as a "-cpu" argument.
#
# query_supported_ needs to start up to 2 temporary VMs and is therefore rather
# expensive. If you need the value returned from this, you can get it much
# cheaper from pmxcfs using PVE::Cluster::get_node_kv('cpuflags-$accel') with
# $accel being 'kvm' or 'tcg'.
#
# pvestatd calls this function on startup and whenever the QEMU/KVM version
# changes, automatically populating pmxcfs.
#
# Returns: { kvm => [ flagX, flagY, ... ], tcg => [ flag1, flag2, ... ] }
# since kvm and tcg machines support different flags
#
# $arch defaults to the host architecture. The 'kvm' entry is only present if
# kvm_version() returns a defined value. A failed query only produces a
# warning and leaves the respective entry undefined.
sub query_supported_cpu_flags {
    my ($arch) = @_;

    $arch //= get_host_arch();
    my $default_machine = $default_machines->{$arch};

    my $flags = {};

    # FIXME: Once this is merged, the code below should work for ARM as well:
    # https://lists.nongnu.org/archive/html/qemu-devel/2019-06/msg04947.html
    die "QEMU/KVM cannot detect CPU flags on ARM (aarch64)\n" if
        $arch eq "aarch64";

    my $kvm_supported = defined(kvm_version());
    my $qemu_cmd = get_command_for_arch($arch);
    my $fakevmid = -1;
    my $pidfile = PVE::QemuServer::Helpers::pidfile_name($fakevmid);

    # Start a temporary (frozen) VM with vmid -1 to allow sending a QMP command
    my $query_supported_run_qemu = sub {
        my ($kvm) = @_;

        my %enabled;
        my @cmd = (
            $qemu_cmd,
            '-machine', $default_machine,
            '-display', 'none',
            '-chardev', "socket,id=qmp,path=/var/run/qemu-server/$fakevmid.qmp,server,nowait",
            '-mon', 'chardev=qmp,mode=control',
            '-pidfile', $pidfile,
            '-S', '-daemonize'
        );
        push @cmd, '-accel', 'tcg' if !$kvm;

        my $rc = run_command(\@cmd, noerr => 1, quiet => 0);
        die "QEMU flag querying VM exited with code " . $rc if $rc;

        eval {
            my $cmd_result = mon_cmd(
                $fakevmid,
                'query-cpu-model-expansion',
                type => 'full',
                model => { name => 'host' }
            );

            my $props = $cmd_result->{model}->{props};
            foreach my $prop (keys %$props) {
                next if $props->{$prop} ne '1';
                # QEMU returns some flags multiple times, with '_', '.' or '-'
                # (e.g. lahf_lm and lahf-lm; sse4.2, sse4-2 and sse4_2; ...).
                # We only keep those with underscores, to match /proc/cpuinfo
                (my $flag = $prop) =~ s/\.|-/_/g;
                $enabled{$flag} = 1;
            }
        };
        my $err = $@;

        # force stop with 10 sec timeout and 'nocheck'
        # always stop, even if QMP failed
        vm_stop(undef, $fakevmid, 1, 1, 10, 0, 1);

        die $err if $err;

        return [ sort keys %enabled ];
    };

    # We need to query QEMU twice, since KVM and TCG have different supported flags
    PVE::QemuConfig->lock_config($fakevmid, sub {
        $flags->{tcg} = eval { $query_supported_run_qemu->(0) };
        warn "warning: failed querying supported tcg flags: $@\n" if $@;

        if ($kvm_supported) {
            $flags->{kvm} = eval { $query_supported_run_qemu->(1) };
            warn "warning: failed querying supported kvm flags: $@\n" if $@;
        }
    });

    return $flags;
}
2900
# Understood CPU flags are written to a file at 'pve-qemu' compile time
my $understood_cpu_flag_dir = "/usr/share/kvm";

# Read the whitespace-separated flag list for the host architecture from
# "$understood_cpu_flag_dir/recognized-CPUID-flags-$arch" and return it as an
# array ref. Dies if that file does not exist.
sub query_understood_cpu_flags {
    my $arch = get_host_arch();
    my $filepath = "$understood_cpu_flag_dir/recognized-CPUID-flags-$arch";

    if (! -e $filepath) {
        die "Cannot query understood QEMU CPU flags for architecture: $arch (file not found)\n";
    }

    my $content = file_get_contents($filepath);
    # strip surrounding whitespace so split() yields no empty leading field
    $content =~ s/^\s+|\s+$//g;

    return [ split(/\s+/, $content) ];
}
2916
# Build the QEMU command line for a VM from its configuration.
#
# Parameters:
#   $storecfg     - storage configuration, handed to the PVE::Storage helpers
#   $vmid         - ID of the VM
#   $conf         - VM configuration hash
#   $defaults     - fallback values (tablet, tdf and scsihw are read here)
#   $forcemachine - passed through to get_vm_machine()
#
# Returns the command as array ref in scalar context, and the list
# ($cmd, $vollist, $spice_port) in list context. $vollist collects the volume
# IDs referenced by drives and vmstate; $spice_port is only set when SPICE is
# configured.
#
# Dies on an unusable QEMU binary / machine version combination, on missing
# KVM support, and on several invalid device configurations (see the
# individual 'die' statements below).
sub config_to_command {
    my ($storecfg, $vmid, $conf, $defaults, $forcemachine) = @_;

    my $cmd = [];
    my $globalFlags = [];
    my $machineFlags = [];
    my $rtcFlags = [];
    my $devices = [];
    my $pciaddr = '';
    my $bridges = {};
    my $ostype = $conf->{ostype};
    my $winversion = windows_version($ostype);
    my $kvm = $conf->{kvm};
    my $nodename = nodename();

    my $arch = get_vm_arch($conf);
    my $kvm_binary = get_command_for_arch($arch);
    my $kvmver = kvm_user_version($kvm_binary);

    if (!$kvmver || $kvmver !~ m/^(\d+)\.(\d+)/ || $1 < 3) {
        $kvmver //= "undefined";
        die "Detected old QEMU binary ('$kvmver', at least 3.0 is required)\n";
    }

    my $add_pve_version = min_version($kvmver, 4, 1);

    my $machine_type = get_vm_machine($conf, $forcemachine, $arch, $add_pve_version);
    my $machine_version = PVE::QemuServer::Machine::extract_version($machine_type, $kvmver);
    $kvm //= 1 if is_native($arch);

    # Capture directly from the match instead of reading $1/$2 afterwards: on a
    # failed match those would still hold the values of the $kvmver match above.
    my ($machine_major, $machine_minor) = ($machine_version // '') =~ m/(\d+)\.(\d+)/;
    die "unable to determine machine version for machine type '$machine_type'\n"
        if !defined($machine_minor);

    die "Installed QEMU version '$kvmver' is too old to run machine type '$machine_type', please upgrade node '$nodename'\n"
        if !PVE::QemuServer::min_version($kvmver, $machine_major, $machine_minor);

    if (!PVE::QemuServer::Machine::can_run_pve_machine_version($machine_version, $kvmver)) {
        my $max_pve_version = PVE::QemuServer::Machine::get_pve_version($machine_version);
        die "Installed qemu-server (max feature level for $machine_major.$machine_minor is pve$max_pve_version)"
            . " is too old to run machine type '$machine_type', please upgrade node '$nodename'\n";
    }

    # if a specific +pve version is required for a feature, use $version_guard
    # instead of min_version to allow machines to be run with the minimum
    # required version
    my $required_pve_version = 0;
    my $version_guard = sub {
        my ($major, $minor, $pve) = @_;
        return 0 if !min_version($machine_version, $major, $minor, $pve);
        $required_pve_version = $pve if $pve && $pve > $required_pve_version;
        return 1;
    };

    if ($kvm) {
        die "KVM virtualisation configured, but not available. Either disable in VM configuration or enable in BIOS.\n"
            if !defined kvm_version();
    }

    my $q35 = PVE::QemuServer::Machine::machine_type_is_q35($conf);
    my $hotplug_features = parse_hotplug_features(defined($conf->{hotplug}) ? $conf->{hotplug} : '1');
    my $use_old_bios_files = undef;
    ($use_old_bios_files, $machine_type) = qemu_use_old_bios_files($machine_type);

    push @$cmd, $kvm_binary;

    push @$cmd, '-id', $vmid;

    my $vmname = $conf->{name} || "vm$vmid";

    push @$cmd, '-name', $vmname;

    my $qmpsocket = PVE::QemuServer::Helpers::qmp_socket($vmid);
    push @$cmd, '-chardev', "socket,id=qmp,path=$qmpsocket,server,nowait";
    push @$cmd, '-mon', "chardev=qmp,mode=control";

    if (min_version($machine_version, 2, 12)) {
        push @$cmd, '-chardev', "socket,id=qmp-event,path=/var/run/qmeventd.sock,reconnect=5";
        push @$cmd, '-mon', "chardev=qmp-event,mode=control";
    }

    push @$cmd, '-pidfile' , PVE::QemuServer::Helpers::pidfile_name($vmid);

    push @$cmd, '-daemonize';

    if ($conf->{smbios1}) {
        my $smbios_conf = parse_smbios1($conf->{smbios1});
        if ($smbios_conf->{base64}) {
            # Do not pass base64 flag to qemu
            delete $smbios_conf->{base64};
            my $smbios_string = "";
            foreach my $key (keys %$smbios_conf) {
                my $value;
                if ($key eq "uuid") {
                    $value = $smbios_conf->{uuid}
                } else {
                    $value = decode_base64($smbios_conf->{$key});
                }
                # qemu accepts any binary data, only commas need escaping by double comma
                $value =~ s/,/,,/g;
                $smbios_string .= "," . $key . "=" . $value if $value;
            }
            push @$cmd, '-smbios', "type=1" . $smbios_string;
        } else {
            push @$cmd, '-smbios', "type=1,$conf->{smbios1}";
        }
    }

    my ($ovmf_code, $ovmf_vars) = get_ovmf_files($arch);
    if ($conf->{bios} && $conf->{bios} eq 'ovmf') {
        die "uefi base image not found\n" if ! -f $ovmf_code;

        my $path;
        my $format;
        if (my $efidisk = $conf->{efidisk0}) {
            my $d = parse_drive('efidisk0', $efidisk);
            my ($storeid, $volname) = PVE::Storage::parse_volume_id($d->{file}, 1);
            $format = $d->{format};
            if ($storeid) {
                $path = PVE::Storage::path($storecfg, $d->{file});
                if (!defined($format)) {
                    my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
                    $format = qemu_img_format($scfg, $volname);
                }
            } else {
                $path = $d->{file};
                die "efidisk format must be specified\n"
                    if !defined($format);
            }
        } else {
            warn "no efidisk configured! Using temporary efivars disk.\n";
            $path = "/tmp/$vmid-ovmf.fd";
            PVE::Tools::file_copy($ovmf_vars, $path, -s $ovmf_vars);
            $format = 'raw';
        }

        push @$cmd, '-drive', "if=pflash,unit=0,format=raw,readonly,file=$ovmf_code";
        push @$cmd, '-drive', "if=pflash,unit=1,format=$format,id=drive-efidisk0,file=$path";
    }

    # load q35 config
    if ($q35) {
        # we use different pcie-port hardware for qemu >= 4.0 for passthrough
        if (min_version($machine_version, 4, 0)) {
            push @$devices, '-readconfig', '/usr/share/qemu-server/pve-q35-4.0.cfg';
        } else {
            push @$devices, '-readconfig', '/usr/share/qemu-server/pve-q35.cfg';
        }
    }

    if ($conf->{vmgenid}) {
        push @$devices, '-device', 'vmgenid,guid='.$conf->{vmgenid};
    }

    # add usb controllers
    my @usbcontrollers = PVE::QemuServer::USB::get_usb_controllers($conf, $bridges, $arch, $machine_type, $usbdesc->{format}, $MAX_USB_DEVICES);
    push @$devices, @usbcontrollers if @usbcontrollers;
    my $vga = parse_vga($conf->{vga});

    my $qxlnum = vga_conf_has_spice($conf->{vga});
    $vga->{type} = 'qxl' if $qxlnum;

    if (!$vga->{type}) {
        if ($arch eq 'aarch64') {
            $vga->{type} = 'virtio';
        } elsif (min_version($machine_version, 2, 9)) {
            $vga->{type} = (!$winversion || $winversion >= 6) ? 'std' : 'cirrus';
        } else {
            $vga->{type} = ($winversion >= 6) ? 'std' : 'cirrus';
        }
    }

    # enable absolute mouse coordinates (needed by vnc)
    my $tablet;
    if (defined($conf->{tablet})) {
        $tablet = $conf->{tablet};
    } else {
        $tablet = $defaults->{tablet};
        $tablet = 0 if $qxlnum; # disable for spice because it is not needed
        $tablet = 0 if $vga->{type} =~ m/^serial\d+$/; # disable if we use serial terminal (no vga card)
    }

    if ($tablet) {
        push @$devices, '-device', print_tabletdevice_full($conf, $arch);
        my $kbd = print_keyboarddevice_full($conf, $arch);
        push @$devices, '-device', $kbd if defined($kbd);
    }

    my $kvm_off = 0;
    my $gpu_passthrough;

    # host pci devices
    for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
        my $id = "hostpci$i";
        my $d = parse_hostpci($conf->{$id});
        next if !$d;

        if (my $pcie = $d->{pcie}) {
            die "q35 machine model is not enabled" if !$q35;
            # win7 wants to have the pcie devices directly on the pcie bus
            # instead of in the root port
            if ($winversion == 7) {
                $pciaddr = print_pcie_addr("${id}bus0");
            } else {
                # add more root ports if needed, 4 are present by default
                # by pve-q35 cfgs, rest added here on demand.
                if ($i > 3) {
                    push @$devices, '-device', print_pcie_root_port($i);
                }
                $pciaddr = print_pcie_addr($id);
            }
        } else {
            $pciaddr = print_pci_addr($id, $bridges, $arch, $machine_type);
        }

        my $xvga = '';
        if ($d->{'x-vga'}) {
            $xvga = ',x-vga=on' if !($conf->{bios} && $conf->{bios} eq 'ovmf');
            $kvm_off = 1;
            $vga->{type} = 'none' if !defined($conf->{vga});
            $gpu_passthrough = 1;
        }

        my $pcidevices = $d->{pciid};
        # plain boolean; 'my $x = 1 if COND' has undefined behaviour in Perl
        my $multifunction = @$pcidevices > 1;

        my $sysfspath;
        if ($d->{mdev} && scalar(@$pcidevices) == 1) {
            my $pci_id = $pcidevices->[0]->{id};
            my $uuid = PVE::SysFSTools::generate_mdev_uuid($vmid, $i);
            $sysfspath = "/sys/bus/pci/devices/$pci_id/$uuid";
        } elsif ($d->{mdev}) {
            warn "ignoring mediated device '$id' with multifunction device\n";
        }

        my $j=0;
        foreach my $pcidevice (@$pcidevices) {
            my $devicestr = "vfio-pci";

            if ($sysfspath) {
                $devicestr .= ",sysfsdev=$sysfspath";
            } else {
                $devicestr .= ",host=$pcidevice->{id}";
            }

            my $mf_addr = $multifunction ? ".$j" : '';
            $devicestr .= ",id=${id}${mf_addr}${pciaddr}${mf_addr}";

            # these options are only set on the first function
            if ($j == 0) {
                $devicestr .= ',rombar=0' if defined($d->{rombar}) && !$d->{rombar};
                $devicestr .= "$xvga";
                $devicestr .= ",multifunction=on" if $multifunction;
                $devicestr .= ",romfile=/usr/share/kvm/$d->{romfile}" if $d->{romfile};
            }

            push @$devices, '-device', $devicestr;
            $j++;
        }
    }

    # usb devices
    my $usb_dev_features = {};
    $usb_dev_features->{spice_usb3} = 1 if min_version($machine_version, 4, 0);

    my @usbdevices = PVE::QemuServer::USB::get_usb_devices($conf, $usbdesc->{format}, $MAX_USB_DEVICES, $usb_dev_features);
    push @$devices, @usbdevices if @usbdevices;
    # serial devices
    for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
        if (my $path = $conf->{"serial$i"}) {
            if ($path eq 'socket') {
                my $socket = "/var/run/qemu-server/${vmid}.serial$i";
                push @$devices, '-chardev', "socket,id=serial$i,path=$socket,server,nowait";
                # On aarch64, serial0 is the UART device. Qemu only allows
                # connecting UART devices via the '-serial' command line, as
                # the device has a fixed slot on the hardware...
                if ($arch eq 'aarch64' && $i == 0) {
                    push @$devices, '-serial', "chardev:serial$i";
                } else {
                    push @$devices, '-device', "isa-serial,chardev=serial$i";
                }
            } else {
                die "no such serial device\n" if ! -c $path;
                push @$devices, '-chardev', "tty,id=serial$i,path=$path";
                push @$devices, '-device', "isa-serial,chardev=serial$i";
            }
        }
    }

    # parallel devices
    for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
        if (my $path = $conf->{"parallel$i"}) {
            die "no such parallel device\n" if ! -c $path;
            my $devtype = $path =~ m!^/dev/usb/lp! ? 'tty' : 'parport';
            push @$devices, '-chardev', "$devtype,id=parallel$i,path=$path";
            push @$devices, '-device', "isa-parallel,chardev=parallel$i";
        }
    }

    if (my $audio = conf_has_audio($conf)) {

        my $audiopciaddr = print_pci_addr("audio0", $bridges, $arch, $machine_type);

        my $id = $audio->{dev_id};
        if ($audio->{dev} eq 'AC97') {
            push @$devices, '-device', "AC97,id=${id}${audiopciaddr}";
        } elsif ($audio->{dev} =~ /intel\-hda$/) {
            push @$devices, '-device', "$audio->{dev},id=${id}${audiopciaddr}";
            push @$devices, '-device', "hda-micro,id=${id}-codec0,bus=${id}.0,cad=0";
            push @$devices, '-device', "hda-duplex,id=${id}-codec1,bus=${id}.0,cad=1";
        } else {
            die "unkown audio device '$audio->{dev}', implement me!";
        }

        push @$devices, '-audiodev', "$audio->{backend},id=$audio->{backend_id}";
    }

    my $sockets = 1;
    $sockets = $conf->{smp} if $conf->{smp}; # old style - no longer used
    $sockets = $conf->{sockets} if $conf->{sockets};

    my $cores = $conf->{cores} || 1;

    my $maxcpus = $sockets * $cores;

    my $vcpus = $conf->{vcpus} ? $conf->{vcpus} : $maxcpus;

    my $allowed_vcpus = $cpuinfo->{cpus};

    die "MAX $allowed_vcpus vcpus allowed per VM on this node\n"
        if ($allowed_vcpus < $maxcpus);

    if($hotplug_features->{cpu} && min_version($machine_version, 2, 7)) {

        # start with a single CPU and add the remaining vcpus as devices
        push @$cmd, '-smp', "1,sockets=$sockets,cores=$cores,maxcpus=$maxcpus";
        for (my $i = 2; $i <= $vcpus; $i++) {
            my $cpustr = print_cpu_device($conf,$i);
            push @$cmd, '-device', $cpustr;
        }

    } else {

        push @$cmd, '-smp', "$vcpus,sockets=$sockets,cores=$cores,maxcpus=$maxcpus";
    }
    push @$cmd, '-nodefaults';

    my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};

    # map each boot order character to a base bootindex (100, 200, ...)
    my $bootindex_hash = {};
    my $i = 1;
    foreach my $o (split(//, $bootorder)) {
        $bootindex_hash->{$o} = $i*100;
        $i++;
    }

    push @$cmd, '-boot', "menu=on,strict=on,reboot-timeout=1000,splash=/usr/share/qemu-server/bootsplash.jpg";

    push @$cmd, '-no-acpi' if defined($conf->{acpi}) && $conf->{acpi} == 0;

    push @$cmd, '-no-reboot' if defined($conf->{reboot}) && $conf->{reboot} == 0;

    if ($vga->{type} && $vga->{type} !~ m/^serial\d+$/ && $vga->{type} ne 'none'){
        push @$devices, '-device', print_vga_device($conf, $vga, $arch, $machine_version, $machine_type, undef, $qxlnum, $bridges);
        my $socket = PVE::QemuServer::Helpers::vnc_socket($vmid);
        push @$cmd, '-vnc', "unix:$socket,password";
    } else {
        push @$cmd, '-vga', 'none' if $vga->{type} eq 'none';
        push @$cmd, '-nographic';
    }

    # time drift fix
    my $tdf = defined($conf->{tdf}) ? $conf->{tdf} : $defaults->{tdf};

    my $useLocaltime = $conf->{localtime};

    if ($winversion >= 5) { # windows
        $useLocaltime = 1 if !defined($conf->{localtime});

        # use time drift fix when acpi is enabled
        if (!(defined($conf->{acpi}) && $conf->{acpi} == 0)) {
            $tdf = 1 if !defined($conf->{tdf});
        }
    }

    if ($winversion >= 6) {
        push @$globalFlags, 'kvm-pit.lost_tick_policy=discard';
        push @$cmd, '-no-hpet';
    }

    push @$rtcFlags, 'driftfix=slew' if $tdf;

    if (($conf->{startdate}) && ($conf->{startdate} ne 'now')) {
        push @$rtcFlags, "base=$conf->{startdate}";
    } elsif ($useLocaltime) {
        push @$rtcFlags, 'base=localtime';
    }

    push @$cmd, get_cpu_options($conf, $arch, $kvm, $kvm_off, $machine_version, $winversion, $gpu_passthrough);

    PVE::QemuServer::Memory::config($conf, $vmid, $sockets, $cores, $defaults, $hotplug_features, $cmd);

    push @$cmd, '-S' if $conf->{freeze};

    push @$cmd, '-k', $conf->{keyboard} if defined($conf->{keyboard});

    my $guest_agent = parse_guest_agent($conf);

    if ($guest_agent->{enabled}) {
        my $qgasocket = PVE::QemuServer::Helpers::qmp_socket($vmid, 1);
        push @$devices, '-chardev', "socket,path=$qgasocket,server,nowait,id=qga0";

        if (!$guest_agent->{type} || $guest_agent->{type} eq 'virtio') {
            my $pciaddr = print_pci_addr("qga0", $bridges, $arch, $machine_type);
            push @$devices, '-device', "virtio-serial,id=qga0$pciaddr";
            push @$devices, '-device', 'virtserialport,chardev=qga0,name=org.qemu.guest_agent.0';
        } elsif ($guest_agent->{type} eq 'isa') {
            push @$devices, '-device', "isa-serial,chardev=qga0";
        }
    }

    # explicit ternary; 'my $x = ... if COND' has undefined behaviour in Perl
    my $rng = $conf->{rng0} ? parse_rng($conf->{rng0}) : undef;
    if ($rng && $version_guard->(4, 1, 2)) {
        my $max_bytes = $rng->{max_bytes} // $rng_fmt->{max_bytes}->{default};
        my $period = $rng->{period} // $rng_fmt->{period}->{default};

        my $limiter_str = "";
        if ($max_bytes) {
            $limiter_str = ",max-bytes=$max_bytes,period=$period";
        }

        # mostly relevant for /dev/hwrng, but doesn't hurt to check others too
        die "cannot create VirtIO RNG device: source file '$rng->{source}' doesn't exist\n"
            if ! -e $rng->{source};

        my $rng_addr = print_pci_addr("rng0", $bridges, $arch, $machine_type);

        push @$devices, '-object', "rng-random,filename=$rng->{source},id=rng0";
        push @$devices, '-device', "virtio-rng-pci,rng=rng0$limiter_str$rng_addr";
    }

    my $spice_port;

    if ($qxlnum) {
        if ($qxlnum > 1) {
            if ($winversion){
                for(my $i = 1; $i < $qxlnum; $i++){
                    push @$devices, '-device', print_vga_device($conf, $vga, $arch, $machine_version, $machine_type, $i, $qxlnum, $bridges);
                }
            } else {
                # assume other OS works like Linux
                my ($ram, $vram) = ("134217728", "67108864");
                if ($vga->{memory}) {
                    $ram = PVE::Tools::convert_size($qxlnum*4*$vga->{memory}, 'mb' => 'b');
                    $vram = PVE::Tools::convert_size($qxlnum*2*$vga->{memory}, 'mb' => 'b');
                }
                push @$cmd, '-global', "qxl-vga.ram_size=$ram";
                push @$cmd, '-global', "qxl-vga.vram_size=$vram";
            }
        }

        my $pciaddr = print_pci_addr("spice", $bridges, $arch, $machine_type);

        my $pfamily = PVE::Tools::get_host_address_family($nodename);
        my @nodeaddrs = PVE::Tools::getaddrinfo_all('localhost', family => $pfamily);
        die "failed to get an ip address of type $pfamily for 'localhost'\n" if !@nodeaddrs;

        push @$devices, '-device', "virtio-serial,id=spice$pciaddr";
        push @$devices, '-chardev', "spicevmc,id=vdagent,name=vdagent";
        push @$devices, '-device', "virtserialport,chardev=vdagent,name=com.redhat.spice.0";

        my $localhost = PVE::Network::addr_to_ip($nodeaddrs[0]->{addr});
        $spice_port = PVE::Tools::next_spice_port($pfamily, $localhost);

        my $spice_enhancement = PVE::JSONSchema::parse_property_string($spice_enhancements_fmt, $conf->{spice_enhancements} // '');
        if ($spice_enhancement->{foldersharing}) {
            push @$devices, '-chardev', "spiceport,id=foldershare,name=org.spice-space.webdav.0";
            push @$devices, '-device', "virtserialport,chardev=foldershare,name=org.spice-space.webdav.0";
        }

        my $spice_opts = "tls-port=${spice_port},addr=$localhost,tls-ciphers=HIGH,seamless-migration=on";
        $spice_opts .= ",streaming-video=$spice_enhancement->{videostreaming}" if $spice_enhancement->{videostreaming};
        push @$devices, '-spice', "$spice_opts";
    }

    # enable balloon by default, unless explicitly disabled
    if (!defined($conf->{balloon}) || $conf->{balloon}) {
        $pciaddr = print_pci_addr("balloon0", $bridges, $arch, $machine_type);
        push @$devices, '-device', "virtio-balloon-pci,id=balloon0$pciaddr";
    }

    if ($conf->{watchdog}) {
        my $wdopts = parse_watchdog($conf->{watchdog});
        $pciaddr = print_pci_addr("watchdog", $bridges, $arch, $machine_type);
        my $watchdog = $wdopts->{model} || 'i6300esb';
        push @$devices, '-device', "$watchdog$pciaddr";
        push @$devices, '-watchdog-action', $wdopts->{action} if $wdopts->{action};
    }

    my $vollist = [];
    my $scsicontroller = {};
    my $ahcicontroller = {};
    my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : $defaults->{scsihw};

    # Add iscsi initiator name if available
    if (my $initiator = get_initiator_name()) {
        push @$devices, '-iscsi', "initiator-name=$initiator";
    }

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        if (PVE::Storage::parse_volume_id($drive->{file}, 1)) {
            push @$vollist, $drive->{file};
        }

        # ignore efidisk here, already added in bios/fw handling code above
        return if $drive->{interface} eq 'efidisk';

        if (drive_is_cdrom ($drive)) {
            if ($bootindex_hash->{d}) {
                $drive->{bootindex} = $bootindex_hash->{d};
                $bootindex_hash->{d} += 1;
            }
        } else {
            if ($bootindex_hash->{c}) {
                # only the configured bootdisk gets a bootindex
                $drive->{bootindex} = $bootindex_hash->{c} if $conf->{bootdisk} && ($conf->{bootdisk} eq $ds);
                $bootindex_hash->{c} += 1;
            }
        }

        if($drive->{interface} eq 'virtio'){
            push @$cmd, '-object', "iothread,id=iothread-$ds" if $drive->{iothread};
        }

        if ($drive->{interface} eq 'scsi') {

            my ($maxdev, $controller, $controller_prefix) = scsihw_infos($conf, $drive);

            die "scsi$drive->{index}: machine version 4.1~pve2 or higher is required to use more than 14 SCSI disks\n"
                if $drive->{index} > 13 && !$version_guard->(4, 1, 2);

            $pciaddr = print_pci_addr("$controller_prefix$controller", $bridges, $arch, $machine_type);
            my $scsihw_type = $scsihw =~ m/^virtio-scsi-single/ ? "virtio-scsi-pci" : $scsihw;

            my $iothread = '';
            if($conf->{scsihw} && $conf->{scsihw} eq "virtio-scsi-single" && $drive->{iothread}){
                $iothread .= ",iothread=iothread-$controller_prefix$controller";
                push @$cmd, '-object', "iothread,id=iothread-$controller_prefix$controller";
            } elsif ($drive->{iothread}) {
                warn "iothread is only valid with virtio disk or virtio-scsi-single controller, ignoring\n";
            }

            my $queues = '';
            if($conf->{scsihw} && $conf->{scsihw} eq "virtio-scsi-single" && $drive->{queues}){
                $queues = ",num_queues=$drive->{queues}";
            }

            # add each controller only once
            push @$devices, '-device', "$scsihw_type,id=$controller_prefix$controller$pciaddr$iothread$queues" if !$scsicontroller->{$controller};
            $scsicontroller->{$controller}=1;
        }

        if ($drive->{interface} eq 'sata') {
            my $controller = int($drive->{index} / $PVE::QemuServer::Drive::MAX_SATA_DISKS);
            $pciaddr = print_pci_addr("ahci$controller", $bridges, $arch, $machine_type);
            # add each controller only once
            push @$devices, '-device', "ahci,id=ahci$controller,multifunction=on$pciaddr" if !$ahcicontroller->{$controller};
            $ahcicontroller->{$controller}=1;
        }

        my $drive_cmd = print_drive_commandline_full($storecfg, $vmid, $drive);
        push @$devices, '-drive',$drive_cmd;
        push @$devices, '-device', print_drivedevice_full($storecfg, $conf, $vmid, $drive, $bridges, $arch, $machine_type);
    });

    for (my $i = 0; $i < $MAX_NETS; $i++) {
        next if !$conf->{"net$i"};
        my $d = parse_net($conf->{"net$i"});
        next if !$d;

        if ($bootindex_hash->{n}) {
            $d->{bootindex} = $bootindex_hash->{n};
            $bootindex_hash->{n} += 1;
        }

        my $netdevfull = print_netdev_full($vmid, $conf, $arch, $d, "net$i");
        push @$devices, '-netdev', $netdevfull;

        my $netdevicefull = print_netdevice_full($vmid, $conf, $d, "net$i", $bridges, $use_old_bios_files, $arch, $machine_type);
        push @$devices, '-device', $netdevicefull;
    }

    if ($conf->{ivshmem}) {
        my $ivshmem = PVE::JSONSchema::parse_property_string($ivshmem_fmt, $conf->{ivshmem});

        my $bus;
        if ($q35) {
            $bus = print_pcie_addr("ivshmem");
        } else {
            $bus = print_pci_addr("ivshmem", $bridges, $arch, $machine_type);
        }

        my $ivshmem_name = $ivshmem->{name} // $vmid;
        my $path = '/dev/shm/pve-shm-' . $ivshmem_name;

        push @$devices, '-device', "ivshmem-plain,memdev=ivshmem$bus,";
        push @$devices, '-object', "memory-backend-file,id=ivshmem,share=on,mem-path=$path,size=$ivshmem->{size}M";
    }

    # pci.4 is nested in pci.1
    $bridges->{1} = 1 if $bridges->{4};

    if (!$q35) {
        # add pci bridges
        if (min_version($machine_version, 2, 3)) {
            $bridges->{1} = 1;
            $bridges->{2} = 1;
        }

        $bridges->{3} = 1 if $scsihw =~ m/^virtio-scsi-single/;

    }

    for my $k (sort {$b cmp $a} keys %$bridges) {
        next if $q35 && $k < 4; # q35.cfg already includes bridges up to 3
        $pciaddr = print_pci_addr("pci.$k", undef, $arch, $machine_type);
        my $devstr = "pci-bridge,id=pci.$k,chassis_nr=$k$pciaddr";
        if ($q35) {
            # add after -readconfig pve-q35.cfg
            splice @$devices, 2, 0, '-device', $devstr;
        } else {
            unshift @$devices, '-device', $devstr if $k > 0;
        }
    }

    if (!$kvm) {
        push @$machineFlags, 'accel=tcg';
    }

    # replace the +pveX suffix with the minimum version the used features need
    my $machine_type_min = $machine_type;
    if ($add_pve_version) {
        $machine_type_min =~ s/\+pve\d+$//;
        $machine_type_min .= "+pve$required_pve_version";
    }
    push @$machineFlags, "type=${machine_type_min}";

    push @$cmd, @$devices;
    push @$cmd, '-rtc', join(',', @$rtcFlags)
        if scalar(@$rtcFlags);
    push @$cmd, '-machine', join(',', @$machineFlags)
        if scalar(@$machineFlags);
    push @$cmd, '-global', join(',', @$globalFlags)
        if scalar(@$globalFlags);

    if (my $vmstate = $conf->{vmstate}) {
        my $statepath = PVE::Storage::path($storecfg, $vmstate);
        push @$vollist, $vmstate;
        push @$cmd, '-loadstate', $statepath;
        print "activating and using '$vmstate' as vmstate\n";
    }

    # add custom args
    if ($conf->{args}) {
        my $aa = PVE::Tools::split_args($conf->{args});
        push @$cmd, @$aa;
    }

    return wantarray ? ($cmd, $vollist, $spice_port) : $cmd;
}
19672434 3590
# Return the SPICE port of a running VM as reported by the 'query-spice'
# monitor command, preferring the TLS port over the plain one.
# Dies if neither is set.
sub spice_port {
    my ($vmid) = @_;

    my $spice_info = mon_cmd($vmid, 'query-spice');

    for my $key ('tls-port', 'port') {
        my $port = $spice_info->{$key};
        return $port if $port;
    }

    die "no spice port\n";
}
3598
86fdcfb2
DA
# Collect the IDs of devices currently present in a running VM.
#
# Queries the monitor for PCI devices (descending into PCI bridges), block
# devices named 'drive-<id>', the 'QEMU HID Tablet' mouse and USB peripherals
# named 'usb<N>'.
#
# Returns a hash ref keyed by device ID. Values are true; for PCI bridges the
# number of devices behind the bridge is added to the value.
sub vm_devices_list {
    my ($vmid) = @_;

    my $res = mon_cmd($vmid, 'query-pci');
    my $devices_to_check = [];
    my $devices = {};
    foreach my $pcibus (@$res) {
        push @$devices_to_check, @{$pcibus->{devices}};
    }

    # walk the PCI tree level by level, queueing devices found behind bridges
    while (@$devices_to_check) {
        my $to_check = [];
        for my $d (@$devices_to_check) {
            $devices->{$d->{'qdev_id'}} = 1 if $d->{'qdev_id'};

            # 'devices' is optional for a bridge; dereferencing an undefined
            # value here would die under 'use strict'
            my $bridge = $d->{'pci_bridge'};
            next if !$bridge || !$bridge->{devices};

            $devices->{$d->{'qdev_id'}} += scalar(@{$bridge->{devices}});
            push @$to_check, @{$bridge->{devices}};
        }
        $devices_to_check = $to_check;
    }

    my $resblock = mon_cmd($vmid, 'query-block');
    foreach my $block (@$resblock) {
        if($block->{device} =~ m/^drive-(\S+)/){
            $devices->{$1} = 1;
        }
    }

    my $resmice = mon_cmd($vmid, 'query-mice');
    foreach my $mice (@$resmice) {
        if ($mice->{name} eq 'QEMU HID Tablet') {
            $devices->{tablet} = 1;
            last;
        }
    }

    # for usb devices there is no query-usb
    # but we can iterate over the entries in
    # qom-list path=/machine/peripheral
    my $resperipheral = mon_cmd($vmid, 'qom-list', path => '/machine/peripheral');
    foreach my $per (@$resperipheral) {
        if ($per->{name} =~ m/^usb\d+$/) {
            $devices->{$per->{name}} = 1;
        }
    }

    return $devices;
}
3648
# Hot-plug the device $deviceid into the running VM $vmid.
#
# The branch taken depends on the form of $deviceid (tablet, keyboard,
# usb<N>, virtio<N>, virtioscsi<N>/scsihw<N>, scsi<N>, net<N>, pci.<N>).
#
# Returns 1 when the device is plugged or was already listed by
# vm_devices_list, undef when qemu_netdevadd reports failure for a net
# device. Dies for device ids that cannot be hot-plugged and when one of
# the plug steps fails.
sub vm_deviceplug {
    my ($storecfg, $conf, $vmid, $deviceid, $device, $arch, $machine_type) = @_;

    my $is_q35 = PVE::QemuServer::Machine::machine_type_is_q35($conf);

    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$deviceid});

    # add PCI bridge if we need it for the device
    qemu_add_pci_bridge($storecfg, $conf, $vmid, $deviceid, $arch, $machine_type);

    if ($deviceid eq 'tablet') {

        qemu_deviceadd($vmid, print_tabletdevice_full($conf, $arch));

    } elsif ($deviceid eq 'keyboard') {

        qemu_deviceadd($vmid, print_keyboarddevice_full($conf, $arch));

    } elsif ($deviceid =~ m/^usb(\d+)$/) {

        # since we can't reliably hot unplug all added usb devices
        # and usb passthrough disables live migration
        # we disable usb hotplugging for now
        die "usb hotplug currently not reliable\n";
        qemu_deviceadd($vmid, PVE::QemuServer::USB::print_usbdevice_full($conf, $deviceid, $device));

    } elsif ($deviceid =~ m/^(virtio)(\d+)$/) {

        qemu_iothread_add($vmid, $deviceid, $device);

        qemu_driveadd($storecfg, $vmid, $device);
        my $drive_device = print_drivedevice_full($storecfg, $conf, $vmid, $device, $arch, $machine_type);

        qemu_deviceadd($vmid, $drive_device);
        eval { qemu_deviceaddverify($vmid, $deviceid); };
        if (my $err = $@) {
            # roll back the drive that was added above
            eval { qemu_drivedel($vmid, $deviceid); };
            warn $@ if $@;
            die $err;
        }

    } elsif ($deviceid =~ m/^(virtioscsi|scsihw)(\d+)$/) {

        my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : "lsi";
        my $pciaddr = print_pci_addr($deviceid, undef, $arch, $machine_type);
        my $scsihw_type = $scsihw eq 'virtio-scsi-single' ? "virtio-scsi-pci" : $scsihw;

        my $controller_device = "$scsihw_type,id=$deviceid$pciaddr";

        my $is_virtioscsi = $deviceid =~ m/^virtioscsi(\d+)$/;

        if ($is_virtioscsi && $device->{iothread}) {
            qemu_iothread_add($vmid, $deviceid, $device);
            $controller_device .= ",iothread=iothread-$deviceid";
        }

        if ($is_virtioscsi && $device->{queues}) {
            $controller_device .= ",num_queues=$device->{queues}";
        }

        qemu_deviceadd($vmid, $controller_device);
        qemu_deviceaddverify($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        qemu_findorcreatescsihw($storecfg, $conf, $vmid, $device, $arch, $machine_type);
        qemu_driveadd($storecfg, $vmid, $device);

        my $drive_device = print_drivedevice_full($storecfg, $conf, $vmid, $device, $arch, $machine_type);
        eval { qemu_deviceadd($vmid, $drive_device); };
        if (my $err = $@) {
            # roll back the drive that was added above
            eval { qemu_drivedel($vmid, $deviceid); };
            warn $@ if $@;
            die $err;
        }

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        return undef if !qemu_netdevadd($vmid, $conf, $arch, $device, $deviceid);

        # the net device is built with the machine type reported by
        # qemu_machine_pxe, not with the one passed in by the caller
        my $pxe_machine_type = PVE::QemuServer::Machine::qemu_machine_pxe($vmid, $conf);
        my $use_old_bios_files = undef;
        ($use_old_bios_files, $pxe_machine_type) = qemu_use_old_bios_files($pxe_machine_type);

        my $net_device = print_netdevice_full(
            $vmid, $conf, $device, $deviceid, undef, $use_old_bios_files, $arch, $pxe_machine_type);
        qemu_deviceadd($vmid, $net_device);
        eval {
            qemu_deviceaddverify($vmid, $deviceid);
            qemu_set_link_status($vmid, $deviceid, !$device->{link_down});
        };
        if (my $err = $@) {
            # roll back the netdev backend that was added above
            eval { qemu_netdevdel($vmid, $deviceid); };
            warn $@ if $@;
            die $err;
        }

    } elsif (!$is_q35 && $deviceid =~ m/^(pci\.)(\d+)$/) {

        my $bridgeid = $2;
        my $pciaddr = print_pci_addr($deviceid, undef, $arch, $machine_type);
        my $bridge_device = "pci-bridge,id=pci.$bridgeid,chassis_nr=$bridgeid$pciaddr";

        qemu_deviceadd($vmid, $bridge_device);
        qemu_deviceaddverify($vmid, $deviceid);

    } else {
        die "can't hotplug device '$deviceid'\n";
    }

    return 1;
}
3759
3eec5767 3760# fixme: this should raise exceptions on error!
# Hot-unplug the device $deviceid from the running VM $vmid.
#
# Returns 1 when the device was removed or is not listed by
# vm_devices_list. Dies when $deviceid is the configured bootdisk, when
# the device id cannot be unplugged, or when one of the unplug steps dies.
sub vm_deviceunplug {
    my ($vmid, $conf, $deviceid) = @_;

    my $present = vm_devices_list($vmid);
    return 1 if !defined($present->{$deviceid});

    die "can't unplug bootdisk" if $conf->{bootdisk} && $conf->{bootdisk} eq $deviceid;

    if ($deviceid eq 'tablet' || $deviceid eq 'keyboard') {

        qemu_devicedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^usb\d+$/) {

        # when unplugging usb devices this way,
        # there may be remaining usb controllers/hubs
        # so we disable it for now
        die "usb hotplug currently not reliable\n";
        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(virtio)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);
        qemu_drivedel($vmid, $deviceid);
        qemu_iothread_del($conf, $vmid, $deviceid);

    } elsif ($deviceid =~ m/^(virtioscsi|scsihw)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);
        qemu_iothread_del($conf, $vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);
        qemu_drivedel($vmid, $deviceid);
        qemu_deletescsihw($conf, $vmid, $deviceid);

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);
        qemu_netdevdel($vmid, $deviceid);

    } else {
        die "can't unplug device '$deviceid'\n";
    }

    return 1;
}
3813
# Send 'device_add' to the monitor of VM $vmid.
#
# $devicefull is a device string of the form "<driver>,key=value,...". It
# is prefixed with "driver=" and split on '=' and ',' into the option list
# passed to the monitor command.
sub qemu_deviceadd {
    my ($vmid, $devicefull) = @_;

    my %options = split(/[=,]/, "driver=" . $devicefull);

    mon_cmd($vmid, "device_add", %options);
}
afdb31d5 3822
# Send 'device_del' for device id $deviceid to the monitor of VM $vmid and
# return the monitor's answer.
sub qemu_devicedel {
    my ($vmid, $deviceid) = @_;

    my $answer = mon_cmd($vmid, "device_del", id => $deviceid);
    return $answer;
}
3828
22de899a
AD
# Create the iothread object "iothread-$deviceid" in VM $vmid when $device
# has 'iothread' set and vm_iothreads_list does not list that object yet.
sub qemu_iothread_add {
    my ($vmid, $deviceid, $device) = @_;

    if ($device->{iothread}) {
        my $object_id = "iothread-$deviceid";
        my $existing = vm_iothreads_list($vmid);
        qemu_objectadd($vmid, $object_id, "iothread") if !$existing->{$object_id};
    }
}
3837
# Remove the iothread object "iothread-$deviceid" from VM $vmid when the
# matching drive in $conf has 'iothread' set and vm_iothreads_list still
# lists the object.
#
# For virtioscsi<N>/scsihw<N> device ids the drive configuration is looked
# up under the config key scsi<N>.
sub qemu_iothread_del {
    my ($conf, $vmid, $deviceid) = @_;

    my $confid = $deviceid =~ m/^(?:virtioscsi|scsihw)(\d+)$/ ? 'scsi' . $1 : $deviceid;

    my $drive = parse_drive($confid, $conf->{$confid});
    if ($drive->{iothread}) {
        my $object_id = "iothread-$deviceid";
        my $existing = vm_iothreads_list($vmid);
        qemu_objectdel($vmid, $object_id) if $existing->{$object_id};
    }
}
3851
4d3f29ed
AD
# Send 'object-add' to the monitor of VM $vmid, creating object $objectid
# of QOM type $qomtype. Returns 1.
sub qemu_objectadd {
    my ($vmid, $objectid, $qomtype) = @_;

    my %object_args = (id => $objectid, "qom-type" => $qomtype);
    mon_cmd($vmid, "object-add", id => $object_args{id}, "qom-type" => $object_args{"qom-type"});

    return 1;
}
3859
# Send 'object-del' for object $objectid to the monitor of VM $vmid.
# Returns 1.
sub qemu_objectdel {
    my ($vmid, $objectid) = @_;

    my @del_args = (id => $objectid);
    mon_cmd($vmid, "object-del", @del_args);

    return 1;
}
3867
# Add the drive described by $device to VM $vmid with the human monitor
# command 'drive_add'. Backslashes in the drive string are doubled before
# it is embedded in the quoted command argument.
#
# Returns 1 when the monitor answer contains "OK", dies otherwise.
sub qemu_driveadd {
    my ($storecfg, $vmid, $device) = @_;

    my $drive = print_drive_commandline_full($storecfg, $vmid, $device);
    $drive =~ s/\\/\\\\/g;

    my $answer = PVE::QemuServer::Monitor::hmp_cmd($vmid, "drive_add auto \"$drive\"");

    # If the command succeeds qemu prints: "OK"
    die "adding drive failed: $answer\n" if $answer !~ m/OK/s;

    return 1;
}
afdb31d5 3880
5e5dcb73
DA
# Remove the drive "drive-$deviceid" from VM $vmid with the human monitor
# command 'drive_del'.
#
# Returns 1 when the answer is empty (after stripping leading whitespace)
# or reports that the device was not found; dies with the answer otherwise.
sub qemu_drivedel {
    my ($vmid, $deviceid) = @_;

    my $answer = PVE::QemuServer::Monitor::hmp_cmd($vmid, "drive_del drive-$deviceid");
    $answer =~ s/^\s+//;

    # NB: device not found errors mean the drive was auto-deleted and we ignore the error
    my $gone = $answer eq "" || $answer =~ m/Device \'.*?\' not found/s;
    return 1 if $gone;

    die "deleting drive $deviceid failed : $answer\n";
}
f19d1c47 3894
# Poll vm_devices_list until $deviceid shows up in VM $vmid.
#
# Checks up to six times, sleeping one second after each unsuccessful
# check. Returns 1 once the device is listed, dies otherwise.
sub qemu_deviceaddverify {
    my ($vmid, $deviceid) = @_;

    for my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if defined($present->{$deviceid});
        sleep 1;
    }

    die "error on hotplug device '$deviceid'\n";
}
afdb31d5 3906
5e5dcb73
DA
3907
# Poll vm_devices_list until $deviceid has disappeared from VM $vmid.
#
# Checks up to six times, sleeping one second after each unsuccessful
# check. Returns 1 once the device is no longer listed, dies otherwise.
sub qemu_devicedelverify {
    my ($vmid, $deviceid) = @_;

    # need to verify that the device is correctly removed as device_del
    # is async and empty return is not reliable
    for my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if !defined($present->{$deviceid});
        sleep 1;
    }

    die "error on hot-unplugging device '$deviceid'\n";
}
3922
# Make sure the SCSI controller that $device belongs to exists in VM $vmid.
#
# The controller id is built from the prefix and controller number returned
# by scsihw_infos; the controller is hot-plugged via vm_deviceplug when
# vm_devices_list does not list it. Returns 1.
sub qemu_findorcreatescsihw {
    my ($storecfg, $conf, $vmid, $device, $arch, $machine_type) = @_;

    my ($maxdev, $controller, $controller_prefix) = scsihw_infos($conf, $device);
    my $controller_id = "$controller_prefix$controller";

    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$controller_id});

    vm_deviceplug($storecfg, $conf, $vmid, $controller_id, $device, $arch, $machine_type);

    return 1;
}
3937
8ce30dde
AD
# Unplug the SCSI controller belonging to the drive configured as $opt,
# unless another plugged SCSI drive still falls below the index limit
# computed from scsihw_infos.
#
# With scsihw 'virtio-scsi-single' the per-drive controller
# "virtioscsi<index>" is unplugged unconditionally. Returns 1.
sub qemu_deletescsihw {
    my ($conf, $vmid, $opt) = @_;

    my $device = parse_drive($opt, $conf->{$opt});

    if ($conf->{scsihw} && ($conf->{scsihw} eq 'virtio-scsi-single')) {
        vm_deviceunplug($vmid, $conf, "virtioscsi$device->{index}");
        return 1;
    }

    my ($maxdev, $controller, $controller_prefix) = scsihw_infos($conf, $device);

    my $present = vm_devices_list($vmid);
    foreach my $plugged_id (keys %{$present}) {
        next if !is_valid_drivename($plugged_id);

        my $drive = parse_drive($plugged_id, $conf->{$plugged_id});
        next if $drive->{interface} ne 'scsi';

        # keep the controller while a plugged scsi drive is below the limit
        return 1 if $drive->{index} < (($maxdev-1)*($controller+1));
    }

    vm_deviceunplug($vmid, $conf, "scsihw$controller");

    return 1;
}
3966
# Hot-plug the PCI bridge that device id $device needs, if any.
#
# print_pci_addr is called with an empty $bridges hash and records the
# bridge id the device address requires. Nothing is done when no bridge is
# recorded or the bridge id is below 1; otherwise bridge "pci.<id>" is
# plugged via vm_deviceplug unless vm_devices_list already lists it.
# Returns 1.
sub qemu_add_pci_bridge {
    my ($storecfg, $conf, $vmid, $device, $arch, $machine_type) = @_;

    my $bridges = {};

    my $bridgeid;

    print_pci_addr($device, $bridges, $arch, $machine_type);

    while (my ($k, $v) = each %$bridges) {
        $bridgeid = $k;
    }
    return 1 if !defined($bridgeid) || $bridgeid < 1;

    my $bridge = "pci.$bridgeid";
    my $devices_list = vm_devices_list($vmid);

    if (!defined($devices_list->{$bridge})) {
        # vm_deviceplug takes ($storecfg, $conf, $vmid, $deviceid, $device,
        # $arch, $machine_type). A bridge has no device description, so an
        # empty hash is passed to keep $arch and $machine_type in their slots.
        vm_deviceplug($storecfg, $conf, $vmid, $bridge, {}, $arch, $machine_type);
    }

    return 1;
}
3990
25088687
DM
# Send 'set_link' to the monitor of VM $vmid, setting the link of network
# device $device up when $up is true and down otherwise.
sub qemu_set_link_status {
    my ($vmid, $device, $up) = @_;

    my $link_state = $up ? JSON::true : JSON::false;

    mon_cmd($vmid, "set_link", name => $device, up => $link_state);
}
3997
# Send 'netdev_add' to the monitor of VM $vmid.
#
# The netdev string produced by print_netdev_full is split on '=' and ','
# into the option list passed to the monitor command. Returns 1.
sub qemu_netdevadd {
    my ($vmid, $conf, $arch, $device, $deviceid) = @_;

    my $netdev_string = print_netdev_full($vmid, $conf, $arch, $device, $deviceid, 1);
    my %netdev_options = split(/[=,]/, $netdev_string);

    mon_cmd($vmid, "netdev_add", %netdev_options);

    return 1;
}
4007
# Send 'netdev_del' for netdev id $deviceid to the monitor of VM $vmid.
sub qemu_netdevdel {
    my ($vmid, $deviceid) = @_;

    my @del_args = (id => $deviceid);
    mon_cmd($vmid, "netdev_del", @del_args);
}
4013
# Replace the USB device $deviceid of VM $vmid with the one described by
# $device: unplug the old device, add an xhci controller when the new
# device has 'usb3' set and no 'xhci' device is listed, then plug the new
# device. Does nothing when $device is false.
sub qemu_usb_hotplug {
    my ($storecfg, $conf, $vmid, $deviceid, $device, $arch, $machine_type) = @_;

    return if !$device;

    # remove the old one first
    vm_deviceunplug($vmid, $conf, $deviceid);

    # check if xhci controller is necessary and available
    if ($device->{usb3} && !vm_devices_list($vmid)->{xhci}) {
        my $pciaddr = print_pci_addr("xhci", undef, $arch, $machine_type);
        qemu_deviceadd($vmid, "nec-usb-xhci,id=xhci$pciaddr");
    }

    my $usb_device = parse_usb_device($device->{host});
    $usb_device->{usb3} = $device->{usb3};

    # add the new one
    vm_deviceplug($storecfg, $conf, $vmid, $deviceid, $usb_device, $arch, $machine_type);
}
4038
# Change the number of vcpus of the running VM $vmid to $vcpus.
#
# A false $vcpus means "all": sockets * cores from $conf. Dies when $vcpus
# exceeds that maximum. $conf->{vcpus} is updated and written with
# PVE::QemuConfig->write_config after every cpu that was plugged or
# unplugged as a device.
#
# Unplugging requires a machine version of at least 2.7. Plugging on older
# machine versions falls back to the 'cpu-add' monitor command.
sub qemu_cpu_hotplug {
    my ($vmid, $conf, $vcpus) = @_;

    my $machine_type = PVE::QemuServer::Machine::get_current_qemu_machine($vmid);

    # 'smp' is the old style socket count (no longer used), 'sockets' wins
    my $sockets = $conf->{sockets} || $conf->{smp} || 1;
    my $cores = $conf->{cores} || 1;
    my $maxcpus = $sockets * $cores;

    $vcpus = $maxcpus if !$vcpus;

    die "you can't add more vcpus than maxcpus\n"
        if $vcpus > $maxcpus;

    my $currentvcpus = $conf->{vcpus} || $maxcpus;

    if ($vcpus < $currentvcpus) {

        die "cpu hot-unplugging requires qemu version 2.7 or higher\n"
            if !PVE::QemuServer::Machine::machine_version($machine_type, 2, 7);

        # remove the highest numbered cpus first
        for my $i (reverse(($vcpus + 1) .. $currentvcpus)) {
            qemu_devicedel($vmid, "cpu$i");

            my $retry = 0;
            my $running_cpus = undef;
            while (1) {
                $running_cpus = mon_cmd($vmid, "query-cpus-fast");
                last if scalar(@{$running_cpus}) == $i-1;
                raise_param_exc({ vcpus => "error unplugging cpu$i" }) if $retry > 5;
                $retry++;
                sleep 1;
            }

            # update conf after each successful cpu unplug
            $conf->{vcpus} = scalar(@{$running_cpus});
            PVE::QemuConfig->write_config($vmid, $conf);
        }

        return;
    }

    my $running_cpus = mon_cmd($vmid, "query-cpus-fast");
    die "vcpus in running vm does not match its configuration\n"
        if scalar(@{$running_cpus}) != $currentvcpus;

    if (PVE::QemuServer::Machine::machine_version($machine_type, 2, 7)) {

        for my $i (($currentvcpus + 1) .. $vcpus) {
            my $cpustr = print_cpu_device($conf, $i);
            qemu_deviceadd($vmid, $cpustr);

            my $retry = 0;
            my $plugged_cpus = undef;
            while (1) {
                $plugged_cpus = mon_cmd($vmid, "query-cpus-fast");
                last if scalar(@{$plugged_cpus}) == $i;
                raise_param_exc({ vcpus => "error hotplugging cpu$i" }) if $retry > 10;
                sleep 1;
                $retry++;
            }

            # update conf after each successful cpu hotplug
            $conf->{vcpus} = scalar(@{$plugged_cpus});
            PVE::QemuConfig->write_config($vmid, $conf);
        }
    } else {

        for my $i ($currentvcpus .. ($vcpus - 1)) {
            mon_cmd($vmid, "cpu-add", id => int($i));
        }
    }
}
4113
# Send 'block_set_io_throttle' for block device $deviceid to the monitor of
# VM $vmid. Does nothing when check_running reports the VM as not running.
#
# Arguments after $vmid and $deviceid are positional, in this order:
#   bps, bps_rd, bps_wr, iops, iops_rd, iops_wr,
#   bps_max, bps_rd_max, bps_wr_max, iops_max, iops_rd_max, iops_wr_max,
#   bps_max_length, bps_rd_max_length, bps_wr_max_length,
#   iops_max_length, iops_rd_max_length, iops_wr_max_length
# Every value is converted with int() before it is sent.
sub qemu_block_set_io_throttle {
    my ($vmid, $deviceid, @limits) = @_;

    # monitor argument names, in the positional order of @limits
    my @limit_names = qw(
        bps bps_rd bps_wr iops iops_rd iops_wr
        bps_max bps_rd_max bps_wr_max iops_max iops_rd_max iops_wr_max
        bps_max_length bps_rd_max_length bps_wr_max_length
        iops_max_length iops_rd_max_length iops_wr_max_length
    );

    return if !check_running($vmid);

    my @throttle_args = map { ($limit_names[$_], int($limits[$_])) } 0 .. $#limit_names;

    mon_cmd($vmid, "block_set_io_throttle", device => $deviceid, @throttle_args);
}
4145
f5eb281a 4146# old code, only used to shutdown old VM after update
dab36e1e
DM
# Read monitor output from $fh until the "(qemu) " prompt ends the output
# or the handle reaches end of file.
#
# $timeout is passed to IO::Select::can_read for every wait. Returns the
# collected text without the trailing prompt. Dies with "monitor read
# timeout" when a wait times out, and with the system error message when
# sysread fails.
sub __read_avail {
    my ($fh, $timeout) = @_;

    my $sel = IO::Select->new();
    $sel->add($fh);

    my $res = '';
    my $buf;

    my @ready;
    while (scalar (@ready = $sel->can_read($timeout))) {
        my $count;
        if ($count = $fh->sysread($buf, 8192)) {
            # match against everything read so far, so that a prompt which
            # arrives split over two reads is still recognized
            $res .= $buf;
            if ($res =~ /^(.*)\(qemu\) $/s) {
                $res = $1;
                last;
            }
        } else {
            if (!defined($count)) {
                die "$!\n";
            }
            last; # end of file
        }
    }

    die "monitor read timeout\n" if !scalar(@ready);

    return $res;
}
4178
c1175c92
AD
# Resize volume $volid to $size through PVE::Storage::volume_resize and,
# when the VM is running, send 'block_resize' for $deviceid to the monitor.
#
# When volume_resize returns false the size sent to the monitor is 0. The
# size sent to the monitor is rounded up to a multiple of 1024.
sub qemu_block_resize {
    my ($vmid, $deviceid, $storecfg, $volid, $size) = @_;

    my $running = check_running($vmid);

    my $resized = PVE::Storage::volume_resize($storecfg, $volid, $size, $running);
    $size = 0 if !$resized;

    return if !$running;

    # round up to the next multiple of 1024
    my $padding = (1024 - $size % 1024) % 1024;
    $size += $padding;

    mon_cmd($vmid, "block_resize", device => $deviceid, size => int($size));
}
4194
1ab0057c
AD
# Create snapshot $snap of volume $volid.
#
# When the VM is running and do_snapshots_with_qemu is true for the volume,
# the snapshot is taken through the monitor
# ('blockdev-snapshot-internal-sync'); otherwise through
# PVE::Storage::volume_snapshot.
sub qemu_volume_snapshot {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $running = check_running($vmid);
    my $via_qemu = $running && do_snapshots_with_qemu($storecfg, $volid);

    if ($via_qemu) {
        mon_cmd($vmid, 'blockdev-snapshot-internal-sync', device => $deviceid, name => $snap);
    } else {
        PVE::Storage::volume_snapshot($storecfg, $volid, $snap);
    }
}
4206
fc46aff9
AD
# Delete snapshot $snap of volume $volid.
#
# The volume only counts as "running" when the VM is running and one of
# the drives in its current config uses $volid as its file. In that case,
# and when do_snapshots_with_qemu is true for the volume, the snapshot is
# deleted through the monitor; otherwise through
# PVE::Storage::volume_snapshot_delete.
sub qemu_volume_snapshot_delete {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $running = check_running($vmid);

    if ($running) {
        # re-evaluate: only true when a configured drive uses the volume
        $running = undef;
        my $conf = PVE::QemuConfig->load_config($vmid);
        my $mark_if_used = sub {
            my ($ds, $drive) = @_;
            $running = 1 if $drive->{file} eq $volid;
        };
        foreach_drive($conf, $mark_if_used);
    }

    my $via_qemu = $running && do_snapshots_with_qemu($storecfg, $volid);

    if ($via_qemu) {
        mon_cmd($vmid, 'blockdev-snapshot-delete-internal-sync', device => $deviceid, name => $snap);
    } else {
        PVE::Storage::volume_snapshot_delete($storecfg, $volid, $snap, $running);
    }
}
4228
264e519f
DM
# Set the state of every migration capability reported by
# 'query-migrate-capabilities' for VM $vmid.
#
# Capabilities with a true value in the table below are switched on; all
# other reported capabilities are switched off.
sub set_migration_caps {
    my ($vmid) = @_;

    my %wanted_state = (
        "auto-converge" => 1,
        "xbzrle" => 1,
        "x-rdma-pin-all" => 0,
        "zero-blocks" => 0,
        "compress" => 0,
    );

    my $supported = mon_cmd($vmid, "query-migrate-capabilities");

    my @capabilities = map {
        +{
            capability => $_->{capability},
            state => $wanted_state{$_->{capability}} ? JSON::true : JSON::false,
        }
    } @$supported;

    mon_cmd($vmid, "migrate-set-capabilities", capabilities => \@capabilities);
}
a89fded1 4253
# Options that vmconfig_hotplug_pending copies from the pending section
# into the config without touching the running VM.
my $fast_plug_option = {
    map { $_ => 1 } qw(
        lock
        name
        onboot
        shares
        startup
        description
        protection
        vmstatestorage
        hookscript
        tags
    )
};
4266
3a11fadb
DM
4267# hotplug changes in [PENDING]
4268# $selection hash can be used to only apply specified options, for
4269# example: { cores => 1 } (only apply changed 'cores')
4270# $errors ref is used to return error messages
c427973b 4271sub vmconfig_hotplug_pending {
3a11fadb 4272 my ($vmid, $conf, $storecfg, $selection, $errors) = @_;
c427973b 4273
8e90138a 4274 my $defaults = load_defaults();
045749f2
TL
4275 my $arch = get_vm_arch($conf);
4276 my $machine_type = get_vm_machine($conf, undef, $arch);
c427973b
DM
4277
4278 # commit values which do not have any impact on running VM first
3a11fadb
DM
4279 # Note: those option cannot raise errors, we we do not care about
4280 # $selection and always apply them.
4281
4282 my $add_error = sub {
4283 my ($opt, $msg) = @_;
4284 $errors->{$opt} = "hotplug problem - $msg";
4285 };
c427973b
DM
4286
4287 my $changes = 0;
4288 foreach my $opt (keys %{$conf->{pending}}) { # add/change
81d95ae1 4289 if ($fast_plug_option->{$opt}) {
c427973b
DM
4290 $conf->{$opt} = $conf->{pending}->{$opt};
4291 delete $conf->{pending}->{$opt};
4292 $changes = 1;
4293 }
4294 }
4295
4296 if ($changes) {
ffda963f 4297 PVE::QemuConfig->write_config($vmid, $conf);
c427973b
DM
4298 }
4299
b3c2bdd1 4300 my $hotplug_features = parse_hotplug_features(defined($conf->{hotplug}) ? $conf->{hotplug} : '1');
c427973b 4301
98bc3aeb 4302 my $pending_delete_hash = PVE::QemuConfig->parse_pending_delete($conf->{pending}->{delete});
d321c4a9 4303 foreach my $opt (sort keys %$pending_delete_hash) {
3a11fadb 4304 next if $selection && !$selection->{$opt};
d321c4a9 4305 my $force = $pending_delete_hash->{$opt}->{force};
3a11fadb 4306 eval {
51a6f637
AD
4307 if ($opt eq 'hotplug') {
4308 die "skip\n" if ($conf->{hotplug} =~ /memory/);
4309 } elsif ($opt eq 'tablet') {
b3c2bdd1 4310 die "skip\n" if !$hotplug_features->{usb};
3a11fadb 4311 if ($defaults->{tablet}) {
d559309f
WB
4312 vm_deviceplug($storecfg, $conf, $vmid, 'tablet', $arch, $machine_type);
4313 vm_deviceplug($storecfg, $conf, $vmid, 'keyboard', $arch, $machine_type)
4314 if $arch eq 'aarch64';
3a11fadb 4315 } else {
d559309f
WB
4316 vm_deviceunplug($vmid, $conf, 'tablet');
4317 vm_deviceunplug($vmid, $conf, 'keyboard') if $arch eq 'aarch64';
3a11fadb 4318 }
4eb68604 4319 } elsif ($opt =~ m/^usb\d+/) {
f745762b
DC
4320 die "skip\n";
4321 # since we cannot reliably hot unplug usb devices
4322 # we are disabling it
4eb68604
DC
4323 die "skip\n" if !$hotplug_features->{usb} || $conf->{$opt} =~ m/spice/i;
4324 vm_deviceunplug($vmid, $conf, $opt);
8edc9c08 4325 } elsif ($opt eq 'vcpus') {
b3c2bdd1 4326 die "skip\n" if !$hotplug_features->{cpu};
8edc9c08 4327 qemu_cpu_hotplug($vmid, $conf, undef);
9c2f7069 4328 } elsif ($opt eq 'balloon') {
81d95ae1 4329 # enable balloon device is not hotpluggable
75b51053
DC
4330 die "skip\n" if defined($conf->{balloon}) && $conf->{balloon} == 0;
4331 # here we reset the ballooning value to memory
4332 my $balloon = $conf->{memory} || $defaults->{memory};
0a13e08e 4333 mon_cmd($vmid, "balloon", value => $balloon*1024*1024);
81d95ae1
DM
4334 } elsif ($fast_plug_option->{$opt}) {
4335 # do nothing
3eec5767 4336 } elsif ($opt =~ m/^net(\d+)$/) {
b3c2bdd1 4337 die "skip\n" if !$hotplug_features->{network};
3eec5767 4338 vm_deviceunplug($vmid, $conf, $opt);
74479ee9 4339 } elsif (is_valid_drivename($opt)) {
b3c2bdd1 4340 die "skip\n" if !$hotplug_features->{disk} || $opt =~ m/(ide|sata)(\d+)/;
19120f99 4341 vm_deviceunplug($vmid, $conf, $opt);
3dc38fbb 4342 vmconfig_delete_or_detach_drive($vmid, $storecfg, $conf, $opt, $force);
4d3f29ed
AD
4343 } elsif ($opt =~ m/^memory$/) {
4344 die "skip\n" if !$hotplug_features->{memory};
6779f1ac 4345 PVE::QemuServer::Memory::qemu_memory_hotplug($vmid, $conf, $defaults, $opt);
c8effec3
AD
4346 } elsif ($opt eq 'cpuunits') {
4347 cgroups_write("cpu", $vmid, "cpu.shares", $defaults->{cpuunits});
58be00f1
AD
4348 } elsif ($opt eq 'cpulimit') {
4349 cgroups_write("cpu", $vmid, "cpu.cfs_quota_us", -1);
3d7389fe 4350 } else {
e56beeda 4351 die "skip\n";
3d7389fe 4352 }
3a11fadb
DM
4353 };
4354 if (my $err = $@) {
e56beeda
DM
4355 &$add_error($opt, $err) if $err ne "skip\n";
4356 } else {
3a11fadb 4357 delete $conf->{$opt};
98bc3aeb 4358 PVE::QemuConfig->remove_from_pending_delete($conf, $opt);
3d7389fe 4359 }
3d7389fe
DM
4360 }
4361
e5a66e48 4362 my ($apply_pending_cloudinit, $apply_pending_cloudinit_done);
9ed7a77c 4363 $apply_pending_cloudinit = sub {
e5a66e48
WB
4364 return if $apply_pending_cloudinit_done; # once is enough
4365 $apply_pending_cloudinit_done = 1; # once is enough
4366
9ed7a77c 4367 my ($key, $value) = @_;
9ed7a77c
WB
4368
4369 my @cloudinit_opts = keys %$confdesc_cloudinit;
4370 foreach my $opt (keys %{$conf->{pending}}) {
4371 next if !grep { $_ eq $opt } @cloudinit_opts;
4372 $conf->{$opt} = delete $conf->{pending}->{$opt};
4373 }
4374
4375 my $new_conf = { %$conf };
4376 $new_conf->{$key} = $value;
4377 PVE::QemuServer::Cloudinit::generate_cloudinitconfig($new_conf, $vmid);
4378 };
4379
3d7389fe 4380 foreach my $opt (keys %{$conf->{pending}}) {
3a11fadb 4381 next if $selection && !$selection->{$opt};
3d7389fe 4382 my $value = $conf->{pending}->{$opt};
3a11fadb 4383 eval {
51a6f637
AD
4384 if ($opt eq 'hotplug') {
4385 die "skip\n" if ($value =~ /memory/) || ($value !~ /memory/ && $conf->{hotplug} =~ /memory/);
4386 } elsif ($opt eq 'tablet') {
b3c2bdd1 4387 die "skip\n" if !$hotplug_features->{usb};
3a11fadb 4388 if ($value == 1) {
d559309f
WB
4389 vm_deviceplug($storecfg, $conf, $vmid, 'tablet', $arch, $machine_type);
4390 vm_deviceplug($storecfg, $conf, $vmid, 'keyboard', $arch, $machine_type)
4391 if $arch eq 'aarch64';
3a11fadb 4392 } elsif ($value == 0) {
d559309f
WB
4393 vm_deviceunplug($vmid, $conf, 'tablet');
4394 vm_deviceunplug($vmid, $conf, 'keyboard') if $arch eq 'aarch64';
3a11fadb 4395 }
4eb68604 4396 } elsif ($opt =~ m/^usb\d+$/) {
f745762b
DC
4397 die "skip\n";
4398 # since we cannot reliably hot unplug usb devices
4399 # we are disabling it
4eb68604
DC
4400 die "skip\n" if !$hotplug_features->{usb} || $value =~ m/spice/i;
4401 my $d = eval { PVE::JSONSchema::parse_property_string($usbdesc->{format}, $value) };
4402 die "skip\n" if !$d;
d559309f 4403 qemu_usb_hotplug($storecfg, $conf, $vmid, $opt, $d, $arch, $machine_type);
8edc9c08 4404 } elsif ($opt eq 'vcpus') {
b3c2bdd1 4405 die "skip\n" if !$hotplug_features->{cpu};
3a11fadb
DM
4406 qemu_cpu_hotplug($vmid, $conf, $value);
4407 } elsif ($opt eq 'balloon') {
81d95ae1 4408 # enable/disable balloning device is not hotpluggable
8fe689e7 4409 my $old_balloon_enabled = !!(!defined($conf->{balloon}) || $conf->{balloon});
a1b7d579 4410 my $new_balloon_enabled = !!(!defined($conf->{pending}->{balloon}) || $conf->{pending}->{balloon});
81d95ae1
DM
4411 die "skip\n" if $old_balloon_enabled != $new_balloon_enabled;
4412
3a11fadb 4413 # allow manual ballooning if shares is set to zero
4cc1efa6 4414 if ((defined($conf->{shares}) && ($conf->{shares} == 0))) {
9c2f7069 4415 my $balloon = $conf->{pending}->{balloon} || $conf->{memory} || $defaults->{memory};
0a13e08e 4416 mon_cmd($vmid, "balloon", value => $balloon*1024*1024);
9c2f7069 4417 }
a1b7d579 4418 } elsif ($opt =~ m/^net(\d+)$/) {
3eec5767 4419 # some changes can be done without hotplug
a1b7d579 4420 vmconfig_update_net($storecfg, $conf, $hotplug_features->{network},
d559309f 4421 $vmid, $opt, $value, $arch, $machine_type);
74479ee9 4422 } elsif (is_valid_drivename($opt)) {
7a4bdb36 4423 die "skip\n" if $opt eq 'efidisk0';
a05cff86 4424 # some changes can be done without hotplug
9ed7a77c
WB
4425 my $drive = parse_drive($opt, $value);
4426 if (drive_is_cloudinit($drive)) {
4427 &$apply_pending_cloudinit($opt, $value);
4428 }
b3c2bdd1 4429 vmconfig_update_disk($storecfg, $conf, $hotplug_features->{disk},
9e7bce2c 4430 $vmid, $opt, $value, $arch, $machine_type);
4d3f29ed
AD
4431 } elsif ($opt =~ m/^memory$/) { #dimms
4432 die "skip\n" if !$hotplug_features->{memory};
6779f1ac 4433 $value = PVE::QemuServer::Memory::qemu_memory_hotplug($vmid, $conf, $defaults, $opt, $value);
c8effec3
AD
4434 } elsif ($opt eq 'cpuunits') {
4435 cgroups_write("cpu", $vmid, "cpu.shares", $conf->{pending}->{$opt});
58be00f1 4436 } elsif ($opt eq 'cpulimit') {
c6f773b8 4437 my $cpulimit = $conf->{pending}->{$opt} == 0 ? -1 : int($conf->{pending}->{$opt} * 100000);
58be00f1 4438 cgroups_write("cpu", $vmid, "cpu.cfs_quota_us", $cpulimit);
3a11fadb 4439 } else {
e56beeda 4440 die "skip\n"; # skip non-hot-pluggable options
3d7389fe 4441 }
3a11fadb
DM
4442 };
4443 if (my $err = $@) {
e56beeda
DM
4444 &$add_error($opt, $err) if $err ne "skip\n";
4445 } else {
3a11fadb
DM
4446 $conf->{$opt} = $value;
4447 delete $conf->{pending}->{$opt};
3d7389fe 4448 }
3d7389fe 4449 }
4df15a03
OB
4450
4451 PVE::QemuConfig->write_config($vmid, $conf);
c427973b 4452}
055d554d 4453
3dc38fbb
WB
# Free the volume behind $drive when it may be removed.
#
# Only acts when $force is set or $key starts with 'unused', and the drive
# is not a cdrom according to drive_is_cdrom. Returns undef when it does
# not act.
#
# When the VM owns the volume, the caller needs 'Datastore.AllocateSpace'
# on the storage and the volume must not be in use any more (otherwise
# this dies); the volume is then freed. Returns 1 after freeing, and also
# when the VM is not the owner of the volume.
sub try_deallocate_drive {
    my ($storecfg, $vmid, $conf, $key, $drive, $rpcenv, $authuser, $force) = @_;

    return undef if (!$force && $key !~ /^unused/) || drive_is_cdrom($drive, 1);

    my $volid = $drive->{file};

    # If vm is not owner of this disk remove from config
    return 1 if !vm_is_volid_owner($storecfg, $vmid, $volid);

    my $sid = PVE::Storage::parse_volume_id($volid);
    $rpcenv->check($authuser, "/storage/$sid", ['Datastore.AllocateSpace']);

    # check if the disk is really unused
    die "unable to delete '$volid' - volume is still in use (snapshot?)\n"
        if PVE::QemuServer::Drive::is_volume_in_use($storecfg, $conf, $key, $volid);

    PVE::Storage::vdisk_free($storecfg, $volid);

    return 1;
}
4476
# Handle removal of the drive configured as $opt.
#
# With $force the current user needs 'VM.Config.Disk' on the VM and the
# drive is handed to try_deallocate_drive; without $force the drive is
# registered as unused via vmconfig_register_unused_drive.
sub vmconfig_delete_or_detach_drive {
    my ($vmid, $storecfg, $conf, $opt, $force) = @_;

    my $drive = parse_drive($opt, $conf->{$opt});

    my $rpcenv = PVE::RPCEnvironment::get();
    my $authuser = $rpcenv->get_user();

    if (!$force) {
        vmconfig_register_unused_drive($storecfg, $vmid, $conf, $drive);
    } else {
        $rpcenv->check_vm_perm($authuser, $vmid, undef, ['VM.Config.Disk']);
        try_deallocate_drive($storecfg, $vmid, $conf, $opt, $drive, $rpcenv, $authuser, $force);
    }
}
4492
98bc3aeb
OB
4493
4494
# Apply all pending configuration changes in one go ("cold plug").
#
# Parameters:
#   $vmid     - ID of the VM
#   $conf     - VM config hash; modified in place and written at the end
#   $storecfg - storage configuration
#   $errors   - optional hash ref; receives one message per option that
#               could not be applied (keyed by option name)
#
# Pending deletions are processed first, then every remaining pending value
# is moved into the live config. A failure for one option is recorded and
# warned about, the option stays pending, and processing continues.
sub vmconfig_apply_pending {
    my ($vmid, $conf, $storecfg, $errors) = @_;

    my $add_apply_error = sub {
        my ($opt, $msg) = @_;
        my $err_msg = "unable to apply pending change $opt : $msg";
        $errors->{$opt} = $err_msg;
        warn $err_msg;
    };

    # cold plug

    my $pending_delete_hash = PVE::QemuConfig->parse_pending_delete($conf->{pending}->{delete});
    foreach my $opt (sort keys %$pending_delete_hash) {
        my $force = $pending_delete_hash->{$opt}->{force};
        eval {
            if ($opt =~ m/^unused/) {
                die "internal error";
            } elsif (defined($conf->{$opt}) && is_valid_drivename($opt)) {
                vmconfig_delete_or_detach_drive($vmid, $storecfg, $conf, $opt, $force);
            }
        };
        if (my $err = $@) {
            $add_apply_error->($opt, $err);
        } else {
            PVE::QemuConfig->remove_from_pending_delete($conf, $opt);
            delete $conf->{$opt};
        }
    }

    PVE::QemuConfig->cleanup_pending($conf);

    # add/change
    # Iterate in sorted order, like the delete loop above: replaced drives
    # are registered as unused drives in iteration order, so a fixed order
    # keeps the resulting config reproducible instead of depending on Perl's
    # randomized hash ordering.
    foreach my $opt (sort keys %{$conf->{pending}}) {
        next if $opt eq 'delete'; # just to be sure
        eval {
            if (defined($conf->{$opt}) && is_valid_drivename($opt)) {
                # the old volume of a replaced drive is kept as unused drive
                vmconfig_register_unused_drive($storecfg, $vmid, $conf, parse_drive($opt, $conf->{$opt}));
            }
        };
        if (my $err = $@) {
            $add_apply_error->($opt, $err);
        } else {
            $conf->{$opt} = delete $conf->{pending}->{$opt};
        }
    }

    # write all changes at once to avoid unnecessary i/o
    PVE::QemuConfig->write_config($vmid, $conf);
}
4544
# Apply a changed or new network device option ($opt => $value) to a VM.
#
# If only bridge/tag/trunks/firewall/rate/link_down differ from the current
# setting, the existing tap interface is reconfigured in place and 1 is
# returned. If model, macaddr or queues differ, or either side has no
# bridge, the device is unplugged and plugged again, which requires
# $hotplug. Dies with "skip\n" when hot(un)plugging would be needed but
# $hotplug is not set.
sub vmconfig_update_net {
    my ($storecfg, $conf, $hotplug, $vmid, $opt, $value, $arch, $machine_type) = @_;

    my $newnet = parse_net($value);

    if ($conf->{$opt}) {
        my $oldnet = parse_net($conf->{$opt});

        my $needs_replug =
            safe_string_ne($oldnet->{model}, $newnet->{model})
            || safe_string_ne($oldnet->{macaddr}, $newnet->{macaddr})
            || safe_num_ne($oldnet->{queues}, $newnet->{queues})
            || !($newnet->{bridge} && $oldnet->{bridge}); # bridge/nat mode change

        if (!$needs_replug) {
            my ($index) = $opt =~ m/net(\d+)/;
            die "internal error" if !defined($index);
            my $iface = "tap${vmid}i${index}";

            my $replug_tap =
                safe_string_ne($oldnet->{bridge}, $newnet->{bridge})
                || safe_num_ne($oldnet->{tag}, $newnet->{tag})
                || safe_string_ne($oldnet->{trunks}, $newnet->{trunks})
                || safe_num_ne($oldnet->{firewall}, $newnet->{firewall});

            if ($replug_tap) {
                PVE::Network::tap_unplug($iface);

                my @plug_args = (
                    $iface,
                    $newnet->{bridge},
                    $newnet->{tag},
                    $newnet->{firewall},
                    $newnet->{trunks},
                    $newnet->{rate},
                );
                if ($have_sdn) {
                    PVE::Network::SDN::Zones::tap_plug(@plug_args);
                } else {
                    PVE::Network::tap_plug(@plug_args);
                }
            } elsif (safe_num_ne($oldnet->{rate}, $newnet->{rate})) {
                # Rate can be applied on its own but any change above needs to
                # include the rate in tap_plug since OVS resets everything.
                PVE::Network::tap_rate_limit($iface, $newnet->{rate});
            }

            if (safe_string_ne($oldnet->{link_down}, $newnet->{link_down})) {
                qemu_set_link_status($vmid, $opt, !$newnet->{link_down});
            }

            return 1;
        }

        # for non online change, we try to hot-unplug
        die "skip\n" if !$hotplug;
        vm_deviceunplug($vmid, $conf, $opt);
    }

    die "skip\n" if !$hotplug;

    return vm_deviceplug($storecfg, $conf, $vmid, $opt, $newnet, $arch, $machine_type);
}
4597
# Apply a changed or new drive option ($opt => $value) to a VM.
#
# Existing drive, same volume: dies with "skip\n" if one of discard,
# iothread, queues, cache or ssd changed; otherwise re-applies the I/O
# throttle settings if any of them changed and returns 1.
# Existing drive, different volume: the old device is unplugged and its
# volume registered as unused, then the new drive is plugged (needs
# $hotplug).
# Existing CD-ROM drive: the medium is ejected and, if a new one is
# configured, changed; returns 1.
# New drive: plugged if $hotplug is set and $opt does not match ide/sata.
# Changing the media type is always refused.
sub vmconfig_update_disk {
    my ($storecfg, $conf, $hotplug, $vmid, $opt, $value, $arch, $machine_type) = @_;

    my $drive = parse_drive($opt, $value);

    my $old_drive;
    $old_drive = parse_drive($opt, $conf->{$opt}) if $conf->{$opt};

    if ($old_drive) {
        my $media = $drive->{media} || 'disk';
        my $oldmedia = $old_drive->{media} || 'disk';
        die "unable to change media type\n" if $media ne $oldmedia;

        if (drive_is_cdrom($old_drive)) {
            if ($drive->{file} eq 'none') {
                mon_cmd($vmid, "eject", force => JSON::true, id => "$opt");
                vmconfig_register_unused_drive($storecfg, $vmid, $conf, $old_drive)
                    if drive_is_cloudinit($old_drive);
            } else {
                my $path = get_iso_path($storecfg, $vmid, $drive->{file});

                # force eject if locked
                mon_cmd($vmid, "eject", force => JSON::true, id => "$opt");

                mon_cmd($vmid, "blockdev-change-medium", id => "$opt", filename => "$path")
                    if $path;
            }

            return 1;
        }

        if ($drive->{file} eq $old_drive->{file}) {
            # update existing disk

            # skip non hotpluggable value
            for my $key (qw(discard iothread queues cache ssd)) {
                die "skip\n" if safe_string_ne($drive->{$key}, $old_drive->{$key});
            }

            # throttle settings, grouped in the order in which they are
            # passed to qemu_block_set_io_throttle below
            my @mbps_keys = qw(mbps mbps_rd mbps_wr);
            my @iops_keys = qw(iops iops_rd iops_wr);
            my @mbps_max_keys = qw(mbps_max mbps_rd_max mbps_wr_max);
            my @iops_max_keys = qw(iops_max iops_rd_max iops_wr_max);
            my @length_keys = qw(
                bps_max_length bps_rd_max_length bps_wr_max_length
                iops_max_length iops_rd_max_length iops_wr_max_length
            );

            my $throttle_changed = 0;
            for my $key (@mbps_keys, @iops_keys, @mbps_max_keys, @iops_max_keys, @length_keys) {
                next if !safe_num_ne($drive->{$key}, $old_drive->{$key});
                $throttle_changed = 1;
                last;
            }

            # apply throttle
            if ($throttle_changed) {
                # mbps values are scaled by 1024*1024; unset limits are
                # passed as 0, unset *_length values as 1
                qemu_block_set_io_throttle(
                    $vmid,
                    "drive-$opt",
                    (map { ($drive->{$_} || 0) * 1024 * 1024 } @mbps_keys),
                    (map { ($drive->{$_} || 0) } @iops_keys),
                    (map { ($drive->{$_} || 0) * 1024 * 1024 } @mbps_max_keys),
                    (map { ($drive->{$_} || 0) } @iops_max_keys),
                    (map { ($drive->{$_} || 1) } @length_keys),
                );
            }

            return 1;
        }

        die "skip\n" if !$hotplug;

        # unplug and register as unused
        vm_deviceunplug($vmid, $conf, $opt);
        vmconfig_register_unused_drive($storecfg, $vmid, $conf, $old_drive);
    }

    die "skip\n" if !$hotplug || $opt =~ m/(ide|sata)(\d+)/;

    # hotplug new disks
    if ($drive->{file} !~ m|^/dev/.+|) {
        PVE::Storage::activate_volumes($storecfg, [$drive->{file}]);
    }

    return vm_deviceplug($storecfg, $conf, $vmid, $opt, $drive, $arch, $machine_type);
}
4707
# Start VM $vmid. Everything runs while holding the VM config lock.
#
# Parameters (as used by the code below):
#   $storecfg          - storage configuration
#   $statefile         - 'tcp' or 'unix' to start as incoming migration
#                        target, otherwise an existing file or a volume ID
#                        that is passed to QEMU via -loadstate
#   $skiplock          - skip the config lock check
#   $migratedfrom      - source node when started as migration target
#   $paused            - start with -S when no $statefile is given
#   $forcemachine      - machine type handed to config_to_command();
#                        replaced by the stored 'runningmachine' when the VM
#                        is resumed from a 'suspended' lock
#   $spice_ticket      - SPICE password to set on a migrated-in VM
#   $migration_network - CIDR used to select the local migration address
#   $migration_type    - 'secure' or 'insecure'; falls back to
#                        datacenter.cfg, then to 'secure'
#   $targetstorage     - enables storage migration: new volumes are
#                        allocated for the non-shared disks and exported via
#                        NBD; "1" keeps each disk's storage ID
#   $timeout           - start timeout; defaults to config_aware_timeout()
sub vm_start {
    my ($storecfg, $vmid, $statefile, $skiplock, $migratedfrom, $paused,
        $forcemachine, $spice_ticket, $migration_network, $migration_type, $targetstorage, $timeout) = @_;

    PVE::QemuConfig->lock_config($vmid, sub {
        my $conf = PVE::QemuConfig->load_config($vmid, $migratedfrom);

        if (PVE::QemuConfig->is_template($conf)) {
            die "you can't start a vm if it's a template\n";
        }

        my $is_suspended = PVE::QemuConfig->has_lock($conf, 'suspended');

        if (!$skiplock && !$is_suspended) {
            PVE::QemuConfig->check_lock($conf);
        }

        if (check_running($vmid, undef, $migratedfrom)) {
            die "VM $vmid already running\n";
        }

        # clean up leftover reboot request files
        eval { clear_reboot_request($vmid); };
        warn $@ if $@;

        if (!$statefile && scalar(keys %{$conf->{pending}})) {
            vmconfig_apply_pending($vmid, $conf, $storecfg);
            $conf = PVE::QemuConfig->load_config($vmid); # update/reload
        }

        PVE::QemuServer::Cloudinit::generate_cloudinitconfig($conf, $vmid);

        my $defaults = load_defaults();

        # set environment variable useful inside network script
        $ENV{PVE_MIGRATED_FROM} = $migratedfrom if $migratedfrom;

        # drive name => [volid, storeid, volname]; replaced by the new drive
        # string once the target volume has been allocated
        my $local_volumes = {};

        if ($targetstorage) {
            foreach_drive($conf, sub {
                my ($ds, $drive) = @_;

                return if drive_is_cdrom($drive);

                my $volid = $drive->{file};
                return if !$volid;

                my ($storeid, $volname) = PVE::Storage::parse_volume_id($volid);

                my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
                return if $scfg->{shared};

                $local_volumes->{$ds} = [$volid, $storeid, $volname];
            });

            my $format = undef;

            foreach my $opt (sort keys %$local_volumes) {
                my ($volid, $storeid, $volname) = @{$local_volumes->{$opt}};
                my $drive = parse_drive($opt, $conf->{$opt});

                # If a remote storage is specified and the format of the original
                # volume is not available there, fall back to the default format.
                # Otherwise use the same format as the original.
                if ($targetstorage ne "1") {
                    $storeid = $targetstorage;
                    my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($storecfg, $storeid);
                    my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
                    my $fileFormat = qemu_img_format($scfg, $volname);
                    if (grep { $fileFormat eq $_ } @{$validFormats}) {
                        $format = $fileFormat;
                    } else {
                        $format = $defFormat;
                    }
                } else {
                    my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
                    $format = qemu_img_format($scfg, $volname);
                }

                my $newvolid = PVE::Storage::vdisk_alloc(
                    $storecfg, $storeid, $vmid, $format, undef, ($drive->{size}/1024));

                # note: $newdrive is the same hash as $drive, not a copy
                my $newdrive = $drive;
                $newdrive->{format} = $format;
                $newdrive->{file} = $newvolid;

                my $drivestr = print_drive($newdrive);
                $local_volumes->{$opt} = $drivestr;
                #pass drive to conf for command line
                $conf->{$opt} = $drivestr;
            }
        }

        PVE::GuestHelpers::exec_hookscript($conf, $vmid, 'pre-start', 1);

        if ($is_suspended) {
            # enforce machine type on suspended vm to ensure HW compatibility
            $forcemachine = $conf->{runningmachine};
            print "Resuming suspended VM\n";
        }

        my ($cmd, $vollist, $spice_port) = config_to_command($storecfg, $vmid, $conf, $defaults, $forcemachine);

        # The migration address is resolved once and then cached.
        my $migration_ip;
        my $get_migration_ip = sub {
            my ($cidr, $nodename) = @_;

            return $migration_ip if defined($migration_ip);

            if (!defined($cidr)) {
                my $dc_conf = PVE::Cluster::cfs_read_file('datacenter.cfg');
                $cidr = $dc_conf->{migration}->{network};
            }

            if (defined($cidr)) {
                my $ips = PVE::Network::get_local_ip_from_cidr($cidr);
                my $ip_count = scalar(@$ips);

                die "could not get IP: no address configured on local " .
                    "node for network '$cidr'\n" if $ip_count == 0;

                die "could not get IP: multiple addresses configured on local " .
                    "node for network '$cidr'\n" if $ip_count > 1;

                $migration_ip = $ips->[0];
            }

            $migration_ip = PVE::Cluster::remote_node_ip($nodename, 1)
                if !defined($migration_ip);

            return $migration_ip;
        };

        my $migrate_uri;
        if ($statefile) {
            if ($statefile eq 'tcp') {
                my $localip = "localhost";
                my $datacenterconf = PVE::Cluster::cfs_read_file('datacenter.cfg');
                my $nodename = nodename();

                $migration_type //= $datacenterconf->{migration}->{type} // 'secure';

                if ($migration_type eq 'insecure') {
                    $localip = $get_migration_ip->($migration_network, $nodename);
                    $localip = "[$localip]" if Net::IP::ip_is_ipv6($localip);
                }

                my $pfamily = PVE::Tools::get_host_address_family($nodename);
                my $migrate_port = PVE::Tools::next_migrate_port($pfamily);
                $migrate_uri = "tcp:${localip}:${migrate_port}";
                push @$cmd, '-incoming', $migrate_uri;
                push @$cmd, '-S';

            } elsif ($statefile eq 'unix') {
                # should be default for secure migrations as a ssh TCP forward
                # tunnel is not deterministically ready and regularly fails
                # to set up in time, so use UNIX socket forwards
                my $socket_addr = "/run/qemu-server/$vmid.migrate";
                unlink $socket_addr;

                $migrate_uri = "unix:$socket_addr";

                push @$cmd, '-incoming', $migrate_uri;
                push @$cmd, '-S';

            } elsif (-e $statefile) {
                push @$cmd, '-loadstate', $statefile;
            } else {
                my $statepath = PVE::Storage::path($storecfg, $statefile);
                push @$vollist, $statefile;
                push @$cmd, '-loadstate', $statepath;
            }
        } elsif ($paused) {
            push @$cmd, '-S';
        }

        # host pci devices
        for my $i (0 .. $MAX_HOSTPCI_DEVICES - 1) {
            my $d = parse_hostpci($conf->{"hostpci$i"});
            next if !$d;

            my $pcidevices = $d->{pciid};
            foreach my $pcidevice (@$pcidevices) {
                my $pciid = $pcidevice->{id};

                my $info = PVE::SysFSTools::pci_device_info("$pciid");
                die "IOMMU not present\n" if !PVE::SysFSTools::check_iommu_support();
                die "no pci device info for device '$pciid'\n" if !$info;

                if ($d->{mdev}) {
                    my $uuid = PVE::SysFSTools::generate_mdev_uuid($vmid, $i);
                    PVE::SysFSTools::pci_create_mdev_device($pciid, $uuid, $d->{mdev});
                    next;
                }

                die "can't unbind/bind pci group to vfio '$pciid'\n"
                    if !PVE::SysFSTools::pci_dev_group_bind_to_vfio($pciid);
                die "can't reset pci device '$pciid'\n"
                    if $info->{has_fl_reset} and !PVE::SysFSTools::pci_dev_reset($info);
            }
        }

        PVE::Storage::activate_volumes($storecfg, $vollist);

        # errors from stopping the scope unit are deliberately ignored
        eval {
            run_command(
                ['/bin/systemctl', 'stop', "$vmid.scope"],
                outfunc => sub {},
                errfunc => sub {},
            );
        };
        # Issues with the above 'stop' not being fully completed are extremely rare, a very low
        # timeout should be more than enough here...
        PVE::Systemd::wait_for_unit_removed("$vmid.scope", 5);

        my $cpuunits = $conf->{cpuunits} // $defaults->{cpuunits};

        my $start_timeout = $timeout // config_aware_timeout($conf, $is_suspended);
        my %run_params = (
            timeout => $statefile ? undef : $start_timeout,
            umask => 0077,
            noerr => 1,
        );

        # when migrating, prefix QEMU output so other side can pick up any
        # errors that might occur and show the user
        if ($migratedfrom) {
            $run_params{quiet} = 1;
            $run_params{logfunc} = sub { print "QEMU: $_[0]\n" };
        }

        my %properties = (
            Slice => 'qemu.slice',
            KillMode => 'none',
            CPUShares => $cpuunits,
        );

        if (my $cpulimit = $conf->{cpulimit}) {
            $properties{CPUQuota} = int($cpulimit * 100);
        }
        $properties{timeout} = 10 if $statefile; # setting up the scope should be quick

        my $run_qemu = sub {
            PVE::Tools::run_fork(sub {
                PVE::Systemd::enter_systemd_scope($vmid, "Proxmox VE VM $vmid", %properties);

                my $exitcode = run_command($cmd, %run_params);
                die "QEMU exited with code $exitcode\n" if $exitcode;
            });
        };

        if ($conf->{hugepages}) {

            my $code = sub {
                my $hugepages_topology = PVE::QemuServer::Memory::hugepages_topology($conf);
                my $hugepages_host_topology = PVE::QemuServer::Memory::hugepages_host_topology();

                PVE::QemuServer::Memory::hugepages_mount();
                PVE::QemuServer::Memory::hugepages_allocate($hugepages_topology, $hugepages_host_topology);

                eval { $run_qemu->() };
                if (my $err = $@) {
                    PVE::QemuServer::Memory::hugepages_reset($hugepages_host_topology);
                    die $err;
                }

                PVE::QemuServer::Memory::hugepages_pre_deallocate($hugepages_topology);
            };
            eval { PVE::QemuServer::Memory::hugepages_update_locked($code); };

        } else {
            eval { $run_qemu->() };
        }

        # $@ comes from whichever of the two evals above was executed
        if (my $err = $@) {
            # deactivate volumes if start fails
            eval { PVE::Storage::deactivate_volumes($storecfg, $vollist); };
            die "start failed: $err";
        }

        print "migration listens on $migrate_uri\n" if $migrate_uri;

        if ($statefile && $statefile ne 'tcp' && $statefile ne 'unix') {
            eval { mon_cmd($vmid, "cont"); };
            warn $@ if $@;
        }

        #start nbd server for storage migration
        if ($targetstorage) {
            my $nodename = nodename();
            my $localip = $get_migration_ip->($migration_network, $nodename);
            my $pfamily = PVE::Tools::get_host_address_family($nodename);
            my $storage_migrate_port = PVE::Tools::next_migrate_port($pfamily);

            mon_cmd(
                $vmid,
                "nbd-server-start",
                addr => {
                    type => 'inet',
                    data => { host => "${localip}", port => "${storage_migrate_port}" },
                },
            );

            # the bracketed form is only used for the printed URI
            $localip = "[$localip]" if Net::IP::ip_is_ipv6($localip);

            foreach my $opt (sort keys %$local_volumes) {
                my $drivestr = $local_volumes->{$opt};
                mon_cmd($vmid, "nbd-server-add", device => "drive-$opt", writable => JSON::true);
                my $migrate_storage_uri = "nbd:${localip}:${storage_migrate_port}:exportname=drive-$opt";
                print "storage migration listens on $migrate_storage_uri volume:$drivestr\n";
            }
        }

        if ($migratedfrom) {
            eval { set_migration_caps($vmid); };
            warn $@ if $@;

            if ($spice_port) {
                print "spice listens on port $spice_port\n";
                if ($spice_ticket) {
                    mon_cmd($vmid, "set_password", protocol => 'spice', password => $spice_ticket);
                    mon_cmd($vmid, "expire_password", protocol => 'spice', time => "+30");
                }
            }

        } else {
            if (!$statefile && $conf->{balloon}) {
                mon_cmd($vmid, "balloon", value => $conf->{balloon}*1024*1024);
            }

            foreach my $opt (grep { m/^net\d+$/ } keys %$conf) {
                my $nicconf = parse_net($conf->{$opt});
                qemu_set_link_status($vmid, $opt, 0) if $nicconf->{link_down};
            }
        }

        if (!defined($conf->{balloon}) || $conf->{balloon}) {
            mon_cmd(
                $vmid,
                'qom-set',
                path => "machine/peripheral/balloon0",
                property => "guest-stats-polling-interval",
                value => 2,
            );
        }

        if ($is_suspended) {
            print "Resumed VM, removing state\n";
            if (my $vmstate = $conf->{vmstate}) {
                PVE::Storage::deactivate_volumes($storecfg, [$vmstate]);
                PVE::Storage::vdisk_free($storecfg, $vmstate);
            }
            delete @{$conf}{qw(lock vmstate runningmachine)};
            PVE::QemuConfig->write_config($vmid, $conf);
        }

        PVE::GuestHelpers::exec_hookscript($conf, $vmid, 'post-start');
    });
}
5048
# Return the QEMU command line for VM $vmid as a single string.
#
# With $snapname the command line is built from that snapshot's config
# (dies if the snapshot does not exist); a 'runningmachine' stored in the
# snapshot is passed on as forced machine type.
sub vm_commandline {
    my ($storecfg, $vmid, $snapname) = @_;

    my $conf = PVE::QemuConfig->load_config($vmid);
    my $forcemachine;

    if ($snapname) {
        my $snapshot = $conf->{snapshots}->{$snapname};
        if (!defined($snapshot)) {
            die "snapshot '$snapname' does not exist\n";
        }

        # check for a 'runningmachine' in snapshot
        if (my $running_machine = $snapshot->{runningmachine}) {
            $forcemachine = $running_machine;
        }

        # keep file digest for API
        $snapshot->{digest} = $conf->{digest};

        $conf = $snapshot;
    }

    my $defaults = load_defaults();

    # scalar context on purpose, as in the call this was derived from
    my $cmd = config_to_command($storecfg, $vmid, $conf, $defaults, $forcemachine);

    return PVE::Tools::cmd2string($cmd);
}
5073
# Send 'system_reset' to VM $vmid while holding the config lock.
# The config lock check is skipped when $skiplock is set.
sub vm_reset {
    my ($vmid, $skiplock) = @_;

    my $do_reset = sub {
        my $conf = PVE::QemuConfig->load_config($vmid);

        if (!$skiplock) {
            PVE::QemuConfig->check_lock($conf);
        }

        mon_cmd($vmid, "system_reset");
    };

    PVE::QemuConfig->lock_config($vmid, $do_reset);
}
5086
# Collect the volume IDs referenced by $conf into an array ref.
#
# Entries starting with '/' and entries that cannot be parsed as a volume
# ID are left out.
sub get_vm_volumes {
    my ($conf) = @_;

    my @volumes;

    my $collect = sub {
        my ($volid, $attr) = @_;

        # absolute paths are not storage volumes
        return if $volid =~ m|^/|;

        my ($sid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        push @volumes, $volid;
    };

    foreach_volid($conf, $collect);

    return \@volumes;
}
5104
# Clean up after a VM has stopped: deactivate its volumes (unless
# $keepActive), remove its runtime files below /var/run/qemu-server, remove
# the ivshmem file, clean up mediated PCI devices and, if
# $apply_pending_changes is set, apply the pending config changes.
#
# Errors are only warned about, never propagated.
sub vm_stop_cleanup {
    my ($storecfg, $vmid, $conf, $keepActive, $apply_pending_changes) = @_;

    eval {
        if (!$keepActive) {
            my $vollist = get_vm_volumes($conf);
            PVE::Storage::deactivate_volumes($storecfg, $vollist);
        }

        for my $suffix (qw(mon qmp pid vnc qga)) {
            unlink "/var/run/qemu-server/${vmid}.$suffix";
        }

        if ($conf->{ivshmem}) {
            my $ivshmem = PVE::JSONSchema::parse_property_string($ivshmem_fmt, $conf->{ivshmem});
            # just delete it for now, VMs which have this already open are
            # not affected, but new VMs will get a separate one. If this
            # becomes an issue we either add some sort of ref-counting or just
            # add a "don't delete on stop" flag to the ivshmem format.
            my $shm_name = $ivshmem->{name} // $vmid;
            unlink '/dev/shm/pve-shm-' . $shm_name;
        }

        for my $key (keys %$conf) {
            next if $key !~ m/^hostpci(\d+)$/;
            my $index = $1;

            my $device = parse_hostpci($conf->{$key});
            my $uuid = PVE::SysFSTools::generate_mdev_uuid($vmid, $index);

            for my $pci (@{$device->{pciid}}) {
                PVE::SysFSTools::pci_cleanup_mdev_device($pci->{id}, $uuid);
            }
        }

        if ($apply_pending_changes) {
            vmconfig_apply_pending($vmid, $conf, $storecfg);
        }
    };
    warn $@ if $@; # avoid errors - just warn
}
5144
575d19da
DC
# Stop or shut down a running VM. Call only in locked context.
#
# Parameters:
#   $storecfg   - storage configuration, passed on to vm_stop_cleanup()
#   $vmid       - ID of the VM
#   $skiplock   - skip the config lock check
#   $nocheck    - do not load the VM config; no hookscript and no cleanup
#                 is run in that case
#   $timeout    - seconds to wait for the VM to exit; defaults to the
#                 'down' value of the startup option (shutdown only),
#                 otherwise to 60
#   $shutdown   - request a guest shutdown instead of quitting QEMU
#   $force      - on failure or timeout, terminate the process with SIGTERM
#                 (and SIGKILL after 10 more seconds) instead of dying
#   $keepActive - passed on to vm_stop_cleanup()
#
# Returns early without doing anything if the VM is not running.
sub _do_vm_stop {
    my ($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive) = @_;

    my $pid = check_running($vmid, $nocheck);
    return if !$pid;

    my $conf;
    if (!$nocheck) {
        $conf = PVE::QemuConfig->load_config($vmid);
        PVE::QemuConfig->check_lock($conf) if !$skiplock;
        if (!defined($timeout) && $shutdown && $conf->{startup}) {
            my $opts = PVE::JSONSchema::pve_parse_startup_order($conf->{startup});
            $timeout = $opts->{down} if $opts->{down};
        }
        PVE::GuestHelpers::exec_hookscript($conf, $vmid, 'pre-stop');
    }

    # Poll once per second for up to $limit seconds. Returns true if the VM
    # is no longer running. The state is checked again after the final
    # sleep, so a VM that exits during the last second is not mistaken for
    # one that is still running.
    my $wait_for_exit = sub {
        my ($limit) = @_;

        for (my $elapsed = 0; $elapsed < $limit; $elapsed++) {
            return 1 if !check_running($vmid, $nocheck);
            sleep 1;
        }

        return !check_running($vmid, $nocheck);
    };

    eval {
        if ($shutdown) {
            if (defined($conf) && parse_guest_agent($conf)->{enabled}) {
                mon_cmd($vmid, "guest-shutdown", timeout => $timeout);
            } else {
                mon_cmd($vmid, "system_powerdown");
            }
        } else {
            mon_cmd($vmid, "quit");
        }
    };
    my $err = $@;

    if (!$err) {
        $timeout = 60 if !defined($timeout);

        if ($wait_for_exit->($timeout)) {
            vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive, 1) if $conf;
            return;
        }

        die "VM quit/powerdown failed - got timeout\n" if !$force;

        warn "VM still running - terminating now with SIGTERM\n";
        kill 15, $pid;
    } else {
        die "VM quit/powerdown failed\n" if !$force;

        warn "VM quit/powerdown failed - terminating now with SIGTERM\n";
        kill 15, $pid;
    }

    # wait again
    if (!$wait_for_exit->(10)) {
        warn "VM still running - terminating now with SIGKILL\n";
        kill 9, $pid;
        sleep 1;
    }

    vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive, 1) if $conf;
}
5222
# Stop VM $vmid.
#
# Note: use $nocheck to skip the tests whether the VM configuration file
# exists. We need that when migrating VMs to other nodes (files already
# moved).
# Note: we set $keepActive in vzdump stop mode - volumes need to stay active
#
# $force defaults to 1 unless $shutdown is requested. With $migratedfrom the
# process is sent SIGTERM and cleaned up directly, without taking the
# config lock and without applying pending changes.
sub vm_stop {
    my ($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive, $migratedfrom) = @_;

    if (!defined($force) && !$shutdown) {
        $force = 1;
    }

    if ($migratedfrom) {
        my $pid = check_running($vmid, $nocheck, $migratedfrom);
        if ($pid) {
            kill 15, $pid;
        }

        my $conf = PVE::QemuConfig->load_config($vmid, $migratedfrom);
        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive, 0);
        return;
    }

    my $stop_locked = sub {
        _do_vm_stop($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive);
    };

    PVE::QemuConfig->lock_config($vmid, $stop_locked);
}
5243
165411f0
DC
# Reboot VM $vmid: create a reboot request and shut the VM down while
# holding the config lock. Does nothing if the VM is not running. If the
# shutdown fails, the reboot request is cleared and the error re-thrown.
sub vm_reboot {
    my ($vmid, $timeout) = @_;

    my $reboot_locked = sub {
        eval {
            # only reboot if running, as qmeventd starts it again on a stop event
            return if !check_running($vmid);

            create_reboot_request($vmid);

            my $storecfg = PVE::Storage::config();
            _do_vm_stop($storecfg, $vmid, undef, undef, $timeout, 1);
        };
        my $err = $@;
        if ($err) {
            # avoid that the next normal shutdown will be confused for a reboot
            clear_reboot_request($vmid);
            die $err;
        }
    };

    PVE::QemuConfig->lock_config($vmid, $reboot_locked);
}
5266
# Suspend VM $vmid.
#
# Without $includestate the VM is only paused via the 'stop' monitor
# command. With $includestate the VM state is saved to a state volume, QEMU
# is quit and the config lock is set to 'suspended'.
#
# note: if using the statestorage parameter, the caller has to check privileges
sub vm_suspend {
    my ($vmid, $skiplock, $includestate, $statestorage) = @_;

    my ($conf, $path, $storecfg, $vmstate);

    PVE::QemuConfig->lock_config($vmid, sub {
        $conf = PVE::QemuConfig->load_config($vmid);

        my $is_backing_up = PVE::QemuConfig->has_lock($conf, 'backup');
        if (!$skiplock && !$is_backing_up) {
            PVE::QemuConfig->check_lock($conf);
        }

        die "cannot suspend to disk during backup\n"
            if $is_backing_up && $includestate;

        if (!$includestate) {
            mon_cmd($vmid, "stop");
            return;
        }

        $conf->{lock} = 'suspending';
        my $date = strftime("%Y-%m-%d", localtime(time()));
        $storecfg = PVE::Storage::config();

        if (!$statestorage) {
            $statestorage = find_vmstate_storage($conf, $storecfg);

            # check permissions for the storage
            my $rpcenv = PVE::RPCEnvironment::get();
            if ($rpcenv->{type} ne 'cli') {
                my $authuser = $rpcenv->get_user();
                $rpcenv->check($authuser, "/storage/$statestorage", ['Datastore.AllocateSpace']);
            }
        }

        $vmstate = PVE::QemuConfig->__snapshot_save_vmstate(
            $vmid, $conf, "suspend-$date", $storecfg, $statestorage, 1);
        $path = PVE::Storage::path($storecfg, $vmstate);
        PVE::QemuConfig->write_config($vmid, $conf);
    });

    if ($includestate) {
        # save vm state
        PVE::Storage::activate_volumes($storecfg, [$vmstate]);

        eval {
            mon_cmd($vmid, "savevm-start", statefile => $path);

            # poll until the state has been written completely
            while (1) {
                my $state = mon_cmd($vmid, "query-savevm");
                my $status = $state->{status};

                die "savevm not active\n" if !$status;

                if ($status eq 'active') {
                    sleep(1);
                    next;
                }

                if ($status eq 'completed') {
                    print "State saved, quitting\n";
                    last;
                }

                die "query-savevm failed with error '$state->{error}'\n"
                    if $status eq 'failed' && $state->{error};

                die "query-savevm returned status '$status'\n";
            }
        };
        my $err = $@;

        PVE::QemuConfig->lock_config($vmid, sub {
            $conf = PVE::QemuConfig->load_config($vmid);

            if ($err) {
                # cleanup, but leave suspending lock, to indicate something went wrong
                eval {
                    mon_cmd($vmid, "savevm-end");
                    PVE::Storage::deactivate_volumes($storecfg, [$vmstate]);
                    PVE::Storage::vdisk_free($storecfg, $vmstate);
                    delete @{$conf}{qw(vmstate runningmachine)};
                    PVE::QemuConfig->write_config($vmid, $conf);
                };
                warn $@ if $@;
                die $err;
            }

            if (!PVE::QemuConfig->has_lock($conf, 'suspending')) {
                die "lock changed unexpectedly\n";
            }

            mon_cmd($vmid, "quit");
            $conf->{lock} = 'suspended';
            PVE::QemuConfig->write_config($vmid, $conf);
        });
    }
}
5359
# Resume a paused or guest-suspended VM while holding the VM config lock.
#
# $vmid     - ID of the VM to resume
# $skiplock - if true, do not fail on a config lock
# $nocheck  - if true, skip loading the config and the lock check entirely
#
# A guest reported as 'suspended' by 'query-status' is woken with
# 'system_wakeup'; every other state is resumed with 'cont'.
sub vm_resume {
    my ($vmid, $skiplock, $nocheck) = @_;

    my $do_resume = sub {
        my $status = mon_cmd($vmid, 'query-status');

        my $is_suspended = $status->{status} && $status->{status} eq 'suspended';
        my $qmp_command = $is_suspended ? 'system_wakeup' : 'cont';

        if (!$nocheck) {
            my $conf = PVE::QemuConfig->load_config($vmid);

            # a 'backup' lock is tolerated here, any other lock is only
            # tolerated when the caller asked for $skiplock
            my $lock_ok = $skiplock || PVE::QemuConfig->has_lock($conf, 'backup');
            PVE::QemuConfig->check_lock($conf) if !$lock_ok;
        }

        mon_cmd($vmid, $qmp_command);
    };

    PVE::QemuConfig->lock_config($vmid, $do_resume);
}
5382
5fdbe4f0
DM
# Send a key event to the guest while holding the VM config lock.
#
# $vmid     - ID of the target VM
# $skiplock - accepted for interface compatibility, not used in this function
# $key      - key specification handed to the monitor's 'sendkey' command
#
# Dies with the monitor's reply if that reply is not the empty string.
sub vm_sendkey {
    my ($vmid, $skiplock, $key) = @_;

    my $send = sub {
        # the result is not used below - presumably loaded so that a missing
        # VM config is noticed before talking to the monitor (TODO confirm)
        my $conf = PVE::QemuConfig->load_config($vmid);

        # there is no qmp command, so we use the human monitor command
        my $reply = PVE::QemuServer::Monitor::hmp_cmd($vmid, "sendkey $key");
        die $reply if $reply ne '';
    };

    PVE::QemuConfig->lock_config($vmid, $send);
}
5395
3e16d5fc
DM
5396# vzdump restore implementation
5397
# Return the name of the first member of a tar archive.
#
# $archive - path to an existing regular file
#
# Runs 'tar tf' on the archive, reads only the first line of its listing
# and then terminates the tar process, so the archive is not read to the end.
#
# Dies if the file does not exist, if tar cannot be started, or if the
# listing is empty.
sub tar_archive_read_firstfile {
    my $archive = shift;

    die "ERROR: file '$archive' does not exist\n" if ! -f $archive;

    # try to detect archive type first
    my $pid = open(my $fh, '-|', 'tar', 'tf', $archive)
        or die "unable to open file '$archive'\n";
    my $firstfile = <$fh>;

    # we only need the first entry - stop tar instead of listing everything
    kill 15, $pid;
    close $fh;

    die "ERROR: archive contains no data\n" if !$firstfile;
    chomp $firstfile;

    return $firstfile;
}
5415
ed221350
DM
# Remove the temporary volumes recorded in a restore stat file.
#
# $storecfg - storage configuration, passed on to PVE::Storage::vdisk_free
# $statfile - path of the stat file; lines of the form
#             'vzdump:<name>:<volid>' name the volumes to remove
#
# Absolute paths are unlinked directly, everything else is freed through the
# storage layer. Failures are reported on STDERR and do not abort the
# cleanup of the remaining volumes. A stat file that cannot be opened is
# silently ignored.
sub tar_restore_cleanup {
    my ($storecfg, $statfile) = @_;

    print STDERR "starting cleanup\n";

    if (my $fd = IO::File->new($statfile, "r")) {
        while (defined(my $line = <$fd>)) {
            if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                my $volid = $2;
                eval {
                    if ($volid =~ m|^/|) {
                        # parenthesize the call: 'unlink $volid || die' would
                        # bind '||' to $volid and never report a failure
                        unlink($volid) or die "unlink failed - $!\n";
                    } else {
                        PVE::Storage::vdisk_free($storecfg, $volid);
                    }
                    print STDERR "temporary volume '$volid' successfully removed\n";
                };
                print STDERR "unable to cleanup '$volid' - $@" if $@;
            } else {
                print STDERR "unable to parse line in statfile - $line";
            }
        }
        $fd->close();
    }
}
5441
# Restore a VM from a backup archive, dispatching on the archive format.
#
# $archive - path of the archive
# $vmid    - ID of the VM to restore
# $user    - user the restore is performed for
# $opts    - option hash; $opts->{format} overrides the format that would
#            otherwise be derived from the file name
#
# The file extension selects the compression and, unless given explicitly,
# the format. Unknown extensions are treated as uncompressed 'vma'.
# Returns whatever the format specific restore function returns.
sub restore_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    my $format = $opts->{format};
    my $comp;

    if ($archive =~ m/\.tgz$/ || $archive =~ m/\.tar\.gz$/) {
        $format = 'tar' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.tar$/) {
        $format = 'tar' if !$format;
    } elsif ($archive =~ m/\.tar\.lzo$/) {
        # dots are escaped so that only a real '.tar.lzo' suffix matches
        $format = 'tar' if !$format;
        $comp = 'lzop';
    } elsif ($archive =~ m/\.vma$/) {
        $format = 'vma' if !$format;
    } elsif ($archive =~ m/\.vma\.gz$/) {
        $format = 'vma' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.vma\.lzo$/) {
        $format = 'vma' if !$format;
        $comp = 'lzop';
    } else {
        $format = 'vma' if !$format; # default
    }

    # the tar restore path does its own decompression, so $comp is only
    # handed to the vma restore
    if ($format eq 'tar') {
        return restore_tar_archive($archive, $vmid, $user, $opts);
    } else {
        return restore_vma_archive($archive, $vmid, $user, $opts, $comp);
    }
}
5475
# Rewrite a single line of a backed-up VM config and print the result to
# $outfd.
#
# $outfd  - output file handle for the new config
# $cookie - state shared between calls; {netcount} numbers the net devices
#           generated from old 'vlanN' entries
# $vmid   - ID of the restored VM (not used in this function)
# $map    - hash mapping drive names to the newly allocated volume IDs
# $line   - config line, including its trailing newline
# $unique - if true, generate new MAC addresses and a new SMBIOS UUID
#
# Backup metadata, lock, unused and parent entries are dropped; lines that
# need no special handling are copied unchanged.
sub restore_update_config_line {
    my ($outfd, $cookie, $vmid, $map, $line, $unique) = @_;

    # entries that must never be carried over into the restored config
    for my $dropped (qr/^\#qmdump\#/, qr/^\#vzdump\#/, qr/^lock:/, qr/^unused\d+:/, qr/^parent:/) {
        return if $line =~ $dropped;
    }

    my $dc = PVE::Cluster::cfs_read_file('datacenter.cfg');
    my $new_mac = sub { return PVE::Tools::random_ether_addr($dc->{mac_prefix}); };

    if (($line =~ m/^(vlan(\d+)):\s*(\S+)\s*$/)) {
        # try to convert old 1.X settings
        my ($bridge_index, $ethcfg) = ($2, $3);
        foreach my $devconfig (PVE::Tools::split_list($ethcfg)) {
            my ($model, $macaddr) = split(/\=/, $devconfig);
            $macaddr = $new_mac->() if !$macaddr || $unique;

            my $netstr = print_net({
                model => $model,
                bridge => "vmbr$bridge_index",
                macaddr => $macaddr,
            });

            print $outfd "net$cookie->{netcount}: $netstr\n";
            $cookie->{netcount}++;
        }
    } elsif (($line =~ m/^(net\d+):\s*(\S+)\s*$/) && $unique) {
        my ($netid, $old_netstr) = ($1, $2);
        my $net = parse_net($old_netstr);
        # only replace an address that was configured in the first place
        $net->{macaddr} = $new_mac->() if $net->{macaddr};
        my $netstr = print_net($net);
        print $outfd "$netid: $netstr\n";
    } elsif ($line =~ m/^((ide|scsi|virtio|sata|efidisk)\d+):\s*(\S+)\s*$/) {
        my ($virtdev, $value) = ($1, $3);
        my $di = parse_drive($virtdev, $value);
        if (defined($di->{backup}) && !$di->{backup}) {
            # drive was excluded from the backup - keep it as a comment only
            print $outfd "#$line";
        } elsif (my $new_volid = $map->{$virtdev}) {
            delete $di->{format}; # format can change on restore
            $di->{file} = $new_volid;
            $value = print_drive($di);
            print $outfd "$virtdev: $value\n";
        } else {
            print $outfd $line;
        }
    } elsif (($line =~ m/^vmgenid: (.*)/)) {
        my $vmgenid = $1;
        # always generate a new vmgenid if there was a valid one setup
        $vmgenid = generate_uuid() if $vmgenid ne '0';
        print $outfd "vmgenid: $vmgenid\n";
    } elsif (($line =~ m/^(smbios1: )(.*)/) && $unique) {
        my ($key, $old_value) = ($1, $2);

        my ($uuid, $uuid_str);
        UUID::generate($uuid);
        UUID::unparse($uuid, $uuid_str);

        my $smbios1 = parse_smbios1($old_value);
        $smbios1->{uuid} = $uuid_str;
        print $outfd $key.print_smbios1($smbios1)."\n";
    } else {
        print $outfd $line;
    }
}
5540
# Collect all volumes reported by the storage layer, indexed by volume ID.
#
# $cfg  - storage configuration
# $vmid - passed on to PVE::Storage::vdisk_list
#
# Entries without a volid or without a (non-zero) size are skipped. Each
# remaining entry gets a 'path' member with its resolved path.
# Returns a hash reference mapping volid => volume info.
sub scan_volids {
    my ($cfg, $vmid) = @_;

    my $listing = PVE::Storage::vdisk_list($cfg, undef, $vmid);

    my %by_volid;
    for my $volumes (values %$listing) {
        for my $entry (@$volumes) {
            my $volid = $entry->{volid};
            next unless $volid && $entry->{size};

            $entry->{path} = PVE::Storage::path($cfg, $volid);
            $by_volid{$volid} = $entry;
        }
    }

    return \%by_volid;
}
5557
# Synchronize the drive entries of a VM config with the volumes that exist
# on storage.
#
# $vmid       - ID of the VM, used for messages and to recognize state volumes
# $conf       - VM config hash, modified in place
# $volid_hash - hash of existing volumes (volid => info with 'path')
#
# Three steps are performed:
#  1. update the size of configured disks
#  2. drop 'unusedN' entries whose volume is referenced elsewhere
#  3. add volumes that are not referenced at all as new 'unusedN' entries
#
# Returns a true value if $conf was changed, undef otherwise. Progress is
# printed to STDOUT.
sub update_disk_config {
    my ($vmid, $conf, $volid_hash) = @_;

    my $changes;
    my $prefix = "VM $vmid:";

    # used and unused disks
    my $referenced = {};

    # Note: it is allowed to define multiple storages with same path (alias), so
    # we need to check both 'volid' and real 'path' (two different volid can point
    # to the same path).

    my $referencedpath = {};

    # update size info
    foreach my $opt (keys %$conf) {
        if (is_valid_drivename($opt)) {
            my $drive = parse_drive($opt, $conf->{$opt});
            my $volid = $drive->{file};
            next if !$volid;

            # mark volid as "in-use" for next step
            $referenced->{$volid} = 1;
            if ($volid_hash->{$volid} &&
                (my $path = $volid_hash->{$volid}->{path})) {
                $referencedpath->{$path} = 1;
            }

            next if drive_is_cdrom($drive);
            next if !$volid_hash->{$volid};

            my ($updated, $old_size, $new_size) = PVE::QemuServer::Drive::update_disksize($drive, $volid_hash);
            if (defined($updated)) {
                $changes = 1;
                $conf->{$opt} = print_drive($updated);
                print "$prefix size of disk '$volid' ($opt) updated from $old_size to $new_size\n";
            }
        }
    }

    # remove 'unusedX' entry if volume is used
    foreach my $opt (keys %$conf) {
        next if $opt !~ m/^unused\d+$/;
        my $volid = $conf->{$opt};

        # declared unconditionally: 'my $x = ... if COND' has undefined
        # behaviour and could leak the path of a previous iteration
        my $path = $volid_hash->{$volid} ? $volid_hash->{$volid}->{path} : undef;

        if ($referenced->{$volid} || ($path && $referencedpath->{$path})) {
            print "$prefix remove entry '$opt', its volume '$volid' is in use\n";
            $changes = 1;
            delete $conf->{$opt};
        }

        # an unused entry counts as a reference too, so the same volume is
        # neither listed twice nor added again below
        $referenced->{$volid} = 1;
        $referencedpath->{$path} = 1 if $path;
    }

    foreach my $volid (sort keys %$volid_hash) {
        next if $volid =~ m/vm-$vmid-state-/;
        next if $referenced->{$volid};
        my $path = $volid_hash->{$volid}->{path};
        next if !$path; # just to be sure
        next if $referencedpath->{$path};
        $changes = 1;
        my $key = PVE::QemuConfig->add_unused_volume($conf, $volid);
        print "$prefix add unreferenced volume '$volid' as '$key' to config\n";
        $referencedpath->{$path} = 1; # avoid to add more than once (aliases)
    }

    return $changes;
}
5628
# Rescan the storages and update the disk entries of one or all VM configs.
#
# $vmid   - ID of the VM to update; all VMs from config_list() if undefined
# $nolock - if true, update the config without taking the config lock
# $dryrun - if true, report changes but do not write the config
sub rescan {
    my ($vmid, $nolock, $dryrun) = @_;

    my $cfg = PVE::Storage::config();

    # FIXME: Remove once our RBD plugin can handle CT and VM on a single storage
    # see: https://pve.proxmox.com/pipermail/pve-devel/2018-July/032900.html
    my $storages = $cfg->{ids};
    my @without_images = grep { !$storages->{$_}->{content}->{images} } keys %$storages;
    delete $storages->{$_} for @without_images;

    print "rescan volumes...\n";
    my $volid_hash = scan_volids($cfg, $vmid);

    my $updatefn = sub {
        my ($id) = @_;

        my $conf = PVE::QemuConfig->load_config($id);

        PVE::QemuConfig->check_lock($conf);

        # only look at the volumes owned by this VM
        my $vm_volids = {};
        while (my ($volid, $info) = each %$volid_hash) {
            next unless $info->{vmid} && $info->{vmid} == $id;
            $vm_volids->{$volid} = $info;
        }

        my $changes = update_disk_config($id, $conf, $vm_volids);

        PVE::QemuConfig->write_config($id, $conf) if $changes && !$dryrun;
    };

    my @targets = defined($vmid) ? ($vmid) : keys %{ config_list() };

    for my $target (@targets) {
        if ($nolock) {
            $updatefn->($target);
        } else {
            PVE::QemuConfig->lock_config($target, $updatefn, $target);
        }
    }
}
5678
# Restore a VM from a (possibly compressed) VMA archive.
#
# $archive - path of the archive, or '-' to read it from STDIN
# $vmid    - ID of the VM to restore
# $user    - user the restore runs for; storage permissions are checked for
#            everyone but 'root@pam'
# $opts    - option hash; the keys read here are 'bwlimit', 'storage',
#            'pool' and 'unique'
# $comp    - compression of the archive: 'gzip', 'lzop' or undef
#
# The archive is piped through optional rate limiting and decompression into
# 'vma extract'. Once vma has printed the device list, the target volumes are
# allocated and their mapping is written to a fifo that vma reads. On
# success the rewritten config replaces the VM config file; on failure all
# newly allocated volumes are removed again and the error is re-thrown.
sub restore_vma_archive {
    my ($archive, $vmid, $user, $opts, $comp) = @_;

    my $readfrom = $archive;

    my $cfg = PVE::Storage::config();
    my $commands = [];
    my $bwlimit = $opts->{bwlimit};

    my $dbg_cmdstring = '';
    # append a command to the pipeline; every later stage reads from STDIN
    my $add_pipe = sub {
        my ($cmd) = @_;
        push @$commands, $cmd;
        $dbg_cmdstring .= ' | ' if length($dbg_cmdstring);
        $dbg_cmdstring .= PVE::Tools::cmd2string($cmd);
        $readfrom = '-';
    };

    my $input = undef;
    if ($archive eq '-') {
        $input = '<&STDIN';
    } else {
        # If we use a backup from a PVE defined storage we also consider that
        # storage's rate limit:
        my (undef, $volid) = PVE::Storage::path_to_volume_id($cfg, $archive);
        if (defined($volid)) {
            my ($sid, undef) = PVE::Storage::parse_volume_id($volid);
            my $readlimit = PVE::Storage::get_bandwidth_limit('restore', [$sid], $bwlimit);
            if ($readlimit) {
                print STDERR "applying read rate limit: $readlimit\n";
                my $cstream = ['cstream', '-t', $readlimit*1024, '--', $readfrom];
                $add_pipe->($cstream);
            }
        }
    }

    if ($comp) {
        my $cmd;
        if ($comp eq 'gzip') {
            $cmd = ['zcat', $readfrom];
        } elsif ($comp eq 'lzop') {
            $cmd = ['lzop', '-d', '-c', $readfrom];
        } else {
            die "unknown compression method '$comp'\n";
        }
        $add_pipe->($cmd);
    }

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    rmtree $tmpdir;

    # disable interrupts (always do cleanups)
    local $SIG{INT} =
        local $SIG{TERM} =
        local $SIG{QUIT} =
        local $SIG{HUP} = sub { warn "got interrupt - ignored\n"; };

    my $mapfifo = "/var/tmp/vzdumptmp$$.fifo";
    POSIX::mkfifo($mapfifo, 0600);
    my $fifofh;

    # handed to run_command as 'afterfork' callback, which is where the write
    # end of the fifo gets opened
    my $openfifo = sub {
        open($fifofh, '>', $mapfifo) || die $!;
    };

    $add_pipe->(['vma', 'extract', '-v', '-r', $mapfifo, $readfrom, $tmpdir]);

    my $oldtimeout;
    my $timeout = 5;

    my $devinfo = {};

    my $rpcenv = PVE::RPCEnvironment::get();

    my $conffile = PVE::QemuConfig->config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # Note: $oldconf is undef if VM does not exist
    my $cfs_path = PVE::QemuConfig->cfs_config_path($vmid);
    my $oldconf = PVE::Cluster::cfs_read_file($cfs_path);

    my %storage_limits;

    # allocate the target volumes, tell vma where to write each device and
    # write the adapted config to $tmpfn
    my $print_devmap = sub {
        my $virtdev_hash = {};

        my $cfgfn = "$tmpdir/qemu-server.conf";

        # we can read the config - that is already extracted
        my $fh = IO::File->new($cfgfn, "r") ||
            die "unable to read qemu-server.conf - $!\n";

        my $fwcfgfn = "$tmpdir/qemu-server.fw";
        if (-f $fwcfgfn) {
            my $pve_firewall_dir = '/etc/pve/firewall';
            mkdir $pve_firewall_dir; # make sure the dir exists
            PVE::Tools::file_copy($fwcfgfn, "${pve_firewall_dir}/$vmid.fw");
        }

        while (defined(my $line = <$fh>)) {
            if ($line =~ m/^\#qmdump\#map:(\S+):(\S+):(\S*):(\S*):$/) {
                my ($virtdev, $devname, $storeid, $format) = ($1, $2, $3, $4);
                die "archive does not contain data for drive '$virtdev'\n"
                    if !$devinfo->{$devname};
                if (defined($opts->{storage})) {
                    $storeid = $opts->{storage} || 'local';
                } elsif (!$storeid) {
                    $storeid = 'local';
                }
                $format = 'raw' if !$format;
                $devinfo->{$devname}->{devname} = $devname;
                $devinfo->{$devname}->{virtdev} = $virtdev;
                $devinfo->{$devname}->{format} = $format;
                $devinfo->{$devname}->{storeid} = $storeid;

                # check permission on storage
                my $pool = $opts->{pool}; # todo: do we need that?
                if ($user ne 'root@pam') {
                    $rpcenv->check($user, "/storage/$storeid", ['Datastore.AllocateSpace']);
                }

                $storage_limits{$storeid} = $bwlimit;

                $virtdev_hash->{$virtdev} = $devinfo->{$devname};
            } elsif ($line =~ m/^((?:ide|sata|scsi)\d+):\s*(.*)\s*$/) {
                my $virtdev = $1;
                my $drive = parse_drive($virtdev, $2);
                if (drive_is_cloudinit($drive)) {
                    my ($storeid, $volname) = PVE::Storage::parse_volume_id($drive->{file});
                    my $scfg = PVE::Storage::storage_config($cfg, $storeid);
                    my $format = qemu_img_format($scfg, $volname); # has 'raw' fallback

                    # cloudinit disks are not part of the archive data, they
                    # are only allocated again below
                    my $d = {
                        format => $format,
                        storeid => $opts->{storage} // $storeid,
                        size => PVE::QemuServer::Cloudinit::CLOUDINIT_DISK_SIZE,
                        file => $drive->{file}, # to make drive_is_cloudinit check possible
                        name => "vm-$vmid-cloudinit",
                        is_cloudinit => 1,
                    };
                    $virtdev_hash->{$virtdev} = $d;
                }
            }
        }

        foreach my $key (keys %storage_limits) {
            my $limit = PVE::Storage::get_bandwidth_limit('restore', [$key], $bwlimit);
            next if !$limit;
            print STDERR "rate limit for storage $key: $limit KiB/s\n";
            $storage_limits{$key} = $limit * 1024;
        }

        foreach my $devname (keys %$devinfo) {
            die "found no device mapping information for device '$devname'\n"
                if !$devinfo->{$devname}->{virtdev};
        }

        # create empty/temp config
        if ($oldconf) {
            PVE::Tools::file_set_contents($conffile, "memory: 128\n");
            foreach_drive($oldconf, sub {
                my ($ds, $drive) = @_;

                return if drive_is_cdrom($drive, 1);

                my $volid = $drive->{file};
                return if !$volid || $volid =~ m|^/|;

                my ($path, $owner) = PVE::Storage::path($cfg, $volid);
                return if !$path || !$owner || ($owner != $vmid);

                # Note: only delete disk we want to restore
                # other volumes will become unused
                if ($virtdev_hash->{$ds}) {
                    eval { PVE::Storage::vdisk_free($cfg, $volid); };
                    if (my $err = $@) {
                        warn $err;
                    }
                }
            });

            # delete vmstate files, after the restore we have no snapshots anymore
            foreach my $snapname (keys %{$oldconf->{snapshots}}) {
                my $snap = $oldconf->{snapshots}->{$snapname};
                if ($snap->{vmstate}) {
                    eval { PVE::Storage::vdisk_free($cfg, $snap->{vmstate}); };
                    if (my $err = $@) {
                        warn $err;
                    }
                }
            }
        }

        my $map = {};
        foreach my $virtdev (sort keys %$virtdev_hash) {
            my $d = $virtdev_hash->{$virtdev};
            my $alloc_size = int(($d->{size} + 1024 - 1)/1024);
            my $storeid = $d->{storeid};
            my $scfg = PVE::Storage::storage_config($cfg, $storeid);

            my $map_opts = '';
            if (my $limit = $storage_limits{$storeid}) {
                $map_opts .= "throttling.bps=$limit:throttling.group=$storeid:";
            }

            # test if requested format is supported
            my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($cfg, $storeid);
            my $supported = grep { $_ eq $d->{format} } @$validFormats;
            $d->{format} = $defFormat if !$supported;

            my $name;
            if ($d->{is_cloudinit}) {
                $name = $d->{name};
                $name .= ".$d->{format}" if $d->{format} ne 'raw';
            }

            my $volid = PVE::Storage::vdisk_alloc($cfg, $storeid, $vmid, $d->{format}, $name, $alloc_size);
            print STDERR "new volume ID is '$volid'\n";
            $d->{volid} = $volid;

            PVE::Storage::activate_volumes($cfg, [$volid]);

            my $write_zeros = 1;
            if (PVE::Storage::volume_has_feature($cfg, 'sparseinit', $volid)) {
                $write_zeros = 0;
            }

            if (!$d->{is_cloudinit}) {
                my $path = PVE::Storage::path($cfg, $volid);

                print $fifofh "${map_opts}format=$d->{format}:${write_zeros}:$d->{devname}=$path\n";

                print "map '$d->{devname}' to '$path' (write zeros = ${write_zeros})\n";
            }
            $map->{$virtdev} = $volid;
        }

        # second pass over the archived config, now with the volume mapping
        $fh->seek(0, 0) || die "seek failed - $!\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined(my $line = <$fh>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $fh->close();
        $outfd->close();
    };

    eval {
        # enable interrupts
        local $SIG{INT} =
            local $SIG{TERM} =
            local $SIG{QUIT} =
            local $SIG{HUP} =
            local $SIG{PIPE} = sub { die "interrupted by signal\n"; };
        local $SIG{ALRM} = sub { die "got timeout\n"; };

        $oldtimeout = alarm($timeout);

        my $parser = sub {
            my $line = shift;

            print "$line\n";

            if ($line =~ m/^DEV:\sdev_id=(\d+)\ssize:\s(\d+)\sdevname:\s(\S+)$/) {
                my ($dev_id, $size, $devname) = ($1, $2, $3);
                $devinfo->{$devname} = { size => $size, dev_id => $dev_id };
            } elsif ($line =~ m/^CTIME: /) {
                # we correctly received the vma config, so we can disable
                # the timeout now for disk allocation (set to 10 minutes, so
                # that we always timeout if something goes wrong)
                alarm(600);
                &$print_devmap();
                print $fifofh "done\n";
                my $tmp = $oldtimeout || 0;
                $oldtimeout = undef;
                alarm($tmp);
                close($fifofh);
            }
        };

        print "restore vma archive: $dbg_cmdstring\n";
        run_command($commands, input => $input, outfunc => $parser, afterfork => $openfifo);
    };
    my $err = $@;

    alarm($oldtimeout) if $oldtimeout;

    my $vollist = [];
    foreach my $devname (keys %$devinfo) {
        my $volid = $devinfo->{$devname}->{volid};
        push @$vollist, $volid if $volid;
    }

    PVE::Storage::deactivate_volumes($cfg, $vollist);

    unlink $mapfifo;

    if ($err) {
        rmtree $tmpdir;
        unlink $tmpfn;

        foreach my $devname (keys %$devinfo) {
            my $volid = $devinfo->{$devname}->{volid};
            next if !$volid;
            eval {
                if ($volid =~ m|^/|) {
                    # parenthesize the call: 'unlink $volid || die' would
                    # bind '||' to $volid and never report a failure
                    unlink($volid) or die "unlink failed - $!\n";
                } else {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
                print STDERR "temporary volume '$volid' successfully removed\n";
            };
            print STDERR "unable to cleanup '$volid' - $@" if $@;
        }
        die $err;
    }

    rmtree $tmpdir;

    rename($tmpfn, $conffile) ||
        die "unable to commit configuration file '$conffile'\n";

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
6010
# Restore a VM from a tar based vzdump archive.
#
# $archive - path of the archive, or '-' to read it from STDIN
# $vmid    - ID of the VM to restore
# $user    - user the restore runs for, exported as VZDUMP_USER
# $opts    - option hash; the keys read here are 'storage', 'pool',
#            'prealloc', 'info' and 'unique'
#
# The archive members are piped to the qmextract helper, which records the
# volumes it created in a stat file. That mapping is then used to rewrite
# the archived config. On failure the recorded volumes are removed again and
# the error is re-thrown.
sub restore_tar_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    if ($archive ne '-') {
        my $firstfile = tar_archive_read_firstfile($archive);
        die "ERROR: file '$archive' does not look like a QemuServer vzdump backup\n"
            if $firstfile ne 'qemu-server.conf';
    }

    my $storecfg = PVE::Storage::config();

    # avoid zombie disks when restoring over an existing VM -> cleanup first
    # pass keep_empty_config=1 to keep the config (thus VMID) reserved for us
    # skiplock=1 because qmrestore has set the 'create' lock itself already
    my $vmcfgfn = PVE::QemuConfig->config_file($vmid);
    destroy_vm($storecfg, $vmid, 1, { lock => 'restore' }) if -f $vmcfgfn;

    my $tocmd = "/usr/lib/qemu-server/qmextract";

    $tocmd .= " --storage " . PVE::Tools::shellquote($opts->{storage}) if $opts->{storage};
    $tocmd .= " --pool " . PVE::Tools::shellquote($opts->{pool}) if $opts->{pool};
    $tocmd .= ' --prealloc' if $opts->{prealloc};
    $tocmd .= ' --info' if $opts->{info};

    # tar option "xf" does not autodetect compression when read from STDIN,
    # so we pipe to zcat
    my $cmd = "zcat -f|tar xf " . PVE::Tools::shellquote($archive) . " " .
        PVE::Tools::shellquote("--to-command=$tocmd");

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    mkpath $tmpdir;

    local $ENV{VZDUMP_TMPDIR} = $tmpdir;
    local $ENV{VZDUMP_VMID} = $vmid;
    local $ENV{VZDUMP_USER} = $user;

    my $conffile = PVE::QemuConfig->config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # disable interrupts (always do cleanups)
    local $SIG{INT} =
        local $SIG{TERM} =
        local $SIG{QUIT} =
        local $SIG{HUP} = sub { print STDERR "got interrupt - ignored\n"; };

    eval {
        # enable interrupts
        local $SIG{INT} =
            local $SIG{TERM} =
            local $SIG{QUIT} =
            local $SIG{HUP} =
            local $SIG{PIPE} = sub { die "interrupted by signal\n"; };

        if ($archive eq '-') {
            print "extracting archive from STDIN\n";
            run_command($cmd, input => "<&STDIN");
        } else {
            print "extracting archive '$archive'\n";
            run_command($cmd);
        }

        # in info mode no config is written, so leave the eval block here
        return if $opts->{info};

        # read new mapping
        my $map = {};
        my $statfile = "$tmpdir/qmrestore.stat";
        if (my $fd = IO::File->new($statfile, "r")) {
            while (defined (my $line = <$fd>)) {
                if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                    $map->{$1} = $2 if $1;
                } else {
                    print STDERR "unable to parse line in statfile - $line\n";
                }
            }
            $fd->close();
        }

        my $confsrc = "$tmpdir/qemu-server.conf";

        my $srcfd = IO::File->new($confsrc, "r") ||
            die "unable to open file '$confsrc'\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined (my $line = <$srcfd>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $srcfd->close();
        $outfd->close();
    };
    if (my $err = $@) {
        unlink $tmpfn;
        tar_restore_cleanup($storecfg, "$tmpdir/qmrestore.stat") if !$opts->{info};
        die $err;
    }

    rmtree $tmpdir;

    # There is no temporary config to commit in info mode. For a real restore
    # a failed rename must be fatal; the call is parenthesized because
    # 'rename $a, $b || die' binds '||' to $b and never reports a failure.
    if (!$opts->{info}) {
        rename($tmpfn, $conffile)
            or die "unable to commit configuration file '$conffile'\n";
    }

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
6120
# Call $func once for every storage that holds a non-cdrom drive of the VM.
#
# $conf - VM config hash
# $func - callback, invoked with the storage ID as its only argument
#
# Drives whose volume ID does not yield a storage ID are ignored. The
# storages are visited in sorted order, each one only once.
sub foreach_storage_used_by_vm {
    my ($conf, $func) = @_;

    my %seen;

    my $collect = sub {
        my ($ds, $drive) = @_;
        return if drive_is_cdrom($drive);

        my ($sid) = PVE::Storage::parse_volume_id($drive->{file}, 1);
        $seen{$sid} = $sid if $sid;
    };
    foreach_drive($conf, $collect);

    for my $storeid (sort keys %seen) {
        $func->($storeid);
    }
}
6140
6c9f59c1
TL
# storage types whose snapshots are taken by QEMU itself
my $qemu_snap_storage = {
    rbd => 1,
};

# Tell whether snapshots of a volume are handled by QEMU.
#
# $storecfg - storage configuration (its 'ids' hash is consulted)
# $volid    - volume ID
#
# Returns 1 for volumes on a storage type listed in $qemu_snap_storage that
# does not have 'krbd' set, and for volume IDs ending in '.qcow2' or '.qed'.
# Returns undef otherwise.
sub do_snapshots_with_qemu {
    my ($storecfg, $volid) = @_;

    my $storage_name = PVE::Storage::parse_volume_id($volid);
    my $scfg = $storecfg->{ids}->{$storage_name};

    return 1 if $qemu_snap_storage->{$scfg->{type}} && !$scfg->{krbd};
    return 1 if $volid =~ m/\.(qcow2|qed)$/;

    return undef;
}
6160
# Check whether the guest agent of a VM answers a 'guest-ping'.
#
# $vmid   - ID of the VM
# $nowarn - if true, do not emit a warning when the ping fails
#
# Returns 1 if the ping succeeded within its 3 second timeout, 0 otherwise.
sub qga_check_running {
    my ($vmid, $nowarn) = @_;

    eval { mon_cmd($vmid, "guest-ping", timeout => 3); };
    my $ping_error = $@;

    return 1 if !$ping_error;

    warn "Qemu Guest Agent is not running - $ping_error" if !$nowarn;
    return 0;
}
6171
04a69bb4
AD
# Convert the disks of a VM into base volumes.
#
# $vmid - ID of the VM
# $conf - VM config hash, updated in place
# $disk - optional drive name; if given, only that drive is converted
#
# Cdrom drives and volumes whose storage lacks the 'template' feature are
# skipped. The config is written after every converted drive.
sub template_create {
    my ($vmid, $conf, $disk) = @_;

    my $storecfg = PVE::Storage::config();

    my $convert_drive = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);
        return if $disk && $ds ne $disk;

        my $volid = $drive->{file};
        my $can_template = PVE::Storage::volume_has_feature($storecfg, 'template', $volid);
        return if !$can_template;

        $drive->{file} = PVE::Storage::vdisk_create_base($storecfg, $volid);
        $conf->{$ds} = print_drive($drive);
        PVE::QemuConfig->write_config($vmid, $conf);
    };

    foreach_drive($conf, $convert_drive);
}
6192
92bdc3f0
DC
# Convert an 'iscsi://<portal>/<target>/<lun>' URL into the option string
# form used with qemu-img's '--image-opts' / '--target-image-opts'.
#
# $path - iSCSI URL
#
# Returns the option string, which includes the local initiator name.
# Dies if $path is not of the expected form.
sub convert_iscsi_path {
    my ($path) = @_;

    if ($path =~ m|^iscsi://([^/]+)/([^/]+)/(.+)$|) {
        my $portal = $1;
        my $target = $2;
        my $lun = $3;

        my $initiator_name = get_initiator_name();

        return "file.driver=iscsi,file.transport=tcp,file.initiator-name=$initiator_name,".
            "file.portal=$portal,file.target=$target,file.lun=$lun,driver=raw";
    }

    die "cannot convert iscsi path '$path', unknown format\n";
}
6209
# Copy a volume (or a snapshot of it) to another volume with
# 'qemu-img convert'.
#
# $src_volid           - source volume ID, or path of an existing file
# $dst_volid           - destination volume ID (must be a valid volid)
# $size                - size in bytes, only used for the progress output
# $snapname            - optional snapshot of the source to copy from
# $is_zero_initialized - if true, the destination is opened through the
#                        'zeroinit:' driver (not for iSCSI targets)
#
# Dies if source or destination cannot be resolved, or with
# 'copy failed: ...' if qemu-img fails.
sub qemu_img_convert {
    my ($src_volid, $dst_volid, $size, $snapname, $is_zero_initialized) = @_;

    my $storecfg = PVE::Storage::config();
    my ($src_storeid, $src_volname) = PVE::Storage::parse_volume_id($src_volid, 1);
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid, 1);

    die "destination '$dst_volid' is not a valid volid form qemu-img convert\n" if !$dst_storeid;

    my ($cachemode, $src_path, $src_format);
    my $src_is_iscsi = 0;

    if ($src_storeid) {
        # source is a volume on a configured storage
        PVE::Storage::activate_volumes($storecfg, [$src_volid], $snapname);
        my $src_scfg = PVE::Storage::storage_config($storecfg, $src_storeid);
        $src_format = qemu_img_format($src_scfg, $src_volname);
        $src_path = PVE::Storage::path($storecfg, $src_volid, $snapname);
        $src_is_iscsi = ($src_path =~ m|^iscsi://|);
        $cachemode = 'none' if $src_scfg->{type} eq 'zfspool';
    } elsif (-f $src_volid) {
        # source is a plain file, take the format from its extension
        $src_path = $src_volid;
        if ($src_path =~ m/\.($PVE::QemuServer::Drive::QEMU_FORMAT_RE)$/) {
            $src_format = $1;
        }
    }

    die "source '$src_volid' is not a valid volid nor path for qemu-img convert\n" if !$src_path;

    my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);
    my $dst_format = qemu_img_format($dst_scfg, $dst_volname);
    my $dst_path = PVE::Storage::path($storecfg, $dst_volid);
    my $dst_is_iscsi = ($dst_path =~ m|^iscsi://|);

    my @convert = ('/usr/bin/qemu-img', 'convert', '-p', '-n');

    my $use_snapshot = $snapname && $src_format && $src_format eq "qcow2";
    push @convert, '-l', "snapshot.name=$snapname" if $use_snapshot;
    push @convert, '-t', 'none' if $dst_scfg->{type} eq 'zfspool';
    push @convert, '-T', $cachemode if defined($cachemode);

    # iSCSI endpoints are described by option strings instead of a format
    if ($src_is_iscsi) {
        push @convert, '--image-opts';
        $src_path = convert_iscsi_path($src_path);
    } elsif ($src_format) {
        push @convert, '-f', $src_format;
    }

    if ($dst_is_iscsi) {
        push @convert, '--target-image-opts';
        $dst_path = convert_iscsi_path($dst_path);
    } else {
        push @convert, '-O', $dst_format;
    }

    my $zeroinit = !$dst_is_iscsi && $is_zero_initialized;
    push @convert, $src_path, ($zeroinit ? "zeroinit:$dst_path" : $dst_path);

    # turn the percentage printed by 'qemu-img convert -p' into byte counts
    my $report_progress = sub {
        my $line = shift;
        return if $line !~ m/\((\S+)\/100\%\)/;

        my $percent = $1;
        my $transferred = int($size * $percent / 100);
        my $remaining = $size - $transferred;

        print "transferred: $transferred bytes remaining: $remaining bytes total: $size bytes progression: $percent %\n";
    };

    eval { run_command(\@convert, timeout => undef, outfunc => $report_progress); };
    my $err = $@;
    die "copy failed: $err" if $err;
}
6290
# Determine the image format name to use for a volume.
#
# $scfg    - storage configuration hash of the storage holding the volume
# $volname - volume name
#
# Returns the file extension of $volname if the storage has a 'path' property
# and the extension matches $PVE::QemuServer::Drive::QEMU_FORMAT_RE; in every
# other case "raw" is returned.
sub qemu_img_format {
    my ($scfg, $volname) = @_;

    # storages without a 'path' property are always treated as raw
    return "raw" if !$scfg->{path};

    return $volname =~ m/\.($PVE::QemuServer::Drive::QEMU_FORMAT_RE)$/ ? $1 : "raw";
}
6300
# Start a QMP 'drive-mirror' job for one drive of a running VM and then hand
# over to qemu_drive_mirror_monitor() to follow the job.
#
# $vmid                - VM the mirror job is started on
# $drive               - drive name; the QEMU device used is "drive-$drive"
# $dst_volid           - target: either a volume ID or an 'nbd:' target, which
#                        is passed to QEMU unchanged
# $vmiddst             - passed through to qemu_drive_mirror_monitor()
# $is_zero_initialized - if true, a non-NBD target path gets a 'zeroinit:' prefix
# $jobs                - hash of block jobs keyed by device name; an entry for
#                        this drive is (re)initialised here
# $skipcomplete, $qga  - passed through to qemu_drive_mirror_monitor()
# $bwlimit             - optional limit; multiplied by 1024 for the QMP 'speed'
#                        option
#
# Dies with "mirroring error: ..." if the job cannot be started; in that case
# the jobs in $jobs are cancelled first.
sub qemu_drive_mirror {
    my ($vmid, $drive, $dst_volid, $vmiddst, $is_zero_initialized, $jobs, $skipcomplete, $qga, $bwlimit) = @_;

    $jobs = {} if !$jobs;

    my $device = "drive-$drive";
    $jobs->{$device} = {};

    my ($qemu_target, $format);
    if ($dst_volid =~ /^nbd:/) {
        ($qemu_target, $format) = ($dst_volid, "nbd");
    } else {
        my $storecfg = PVE::Storage::config();
        my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid);
        my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

        $format = qemu_img_format($dst_scfg, $dst_volname);

        my $dst_path = PVE::Storage::path($storecfg, $dst_volid);
        $qemu_target = $is_zero_initialized ? "zeroinit:$dst_path" : $dst_path;
    }

    my $opts = {
        timeout => 10,
        device => $device,
        mode => "existing",
        sync => "full",
        target => $qemu_target,
    };
    $opts->{format} = $format if $format;

    if (!defined($bwlimit)) {
        print "drive mirror is starting for drive-$drive\n";
    } else {
        $opts->{speed} = $bwlimit * 1024;
        print "drive mirror is starting for drive-$drive with bandwidth limit: ${bwlimit} KB/s\n";
    }

    # if a job already runs for this device we get an error, catch it for cleanup
    eval { mon_cmd($vmid, "drive-mirror", %$opts); };
    if (my $err = $@) {
        eval { PVE::QemuServer::qemu_blockjobs_cancel($vmid, $jobs) };
        warn "$@\n" if $@;
        die "mirroring error: $err\n";
    }

    qemu_drive_mirror_monitor($vmid, $vmiddst, $jobs, $skipcomplete, $qga);
}
6346
# Follow the mirror block jobs listed in $jobs until they are finished.
#
# $vmid         - VM the block jobs run on
# $vmiddst      - target VM ID; if set and different from $vmid the disks are
#                 cloned for another guest and the jobs get cancelled instead
#                 of completed once they are ready
# $jobs         - hash keyed by QEMU device name; entries are removed as jobs
#                 finish and get a 'complete' flag once block-job-complete was
#                 issued for them
# $skipcomplete - if true, return as soon as all jobs are ready and leave
#                 completing them to the caller
# $qga          - if true and the guest agent answers, the guest filesystems
#                 are frozen around the cancel; otherwise the VM is suspended
#
# Once per second 'query-block-jobs' is polled and the progress of each job is
# printed. On any error all jobs in $jobs are cancelled and the function dies
# with "mirroring error: ...".
sub qemu_drive_mirror_monitor {
    my ($vmid, $vmiddst, $jobs, $skipcomplete, $qga) = @_;

    eval {
        # counts failed 'block-job-complete' attempts
        my $err_complete = 0;

        while (1) {
            die "storage migration timed out\n" if $err_complete > 300;

            my $stats = mon_cmd($vmid, "query-block-jobs");

            my $running_mirror_jobs = {};
            foreach my $stat (@$stats) {
                next if $stat->{type} ne 'mirror';
                $running_mirror_jobs->{$stat->{device}} = $stat;
            }

            my $readycounter = 0;

            foreach my $job (keys %$jobs) {

                # a job we asked to complete and that vanished is done
                if (defined($jobs->{$job}->{complete}) && !defined($running_mirror_jobs->{$job})) {
                    print "$job : finished\n";
                    delete $jobs->{$job};
                    next;
                }

                die "$job: mirroring has been cancelled\n" if !defined($running_mirror_jobs->{$job});

                my $busy = $running_mirror_jobs->{$job}->{busy};
                my $ready = $running_mirror_jobs->{$job}->{ready};
                if (my $total = $running_mirror_jobs->{$job}->{len}) {
                    my $transferred = $running_mirror_jobs->{$job}->{offset} || 0;
                    my $remaining = $total - $transferred;
                    my $percent = sprintf "%.2f", ($transferred * 100 / $total);

                    print "$job: transferred: $transferred bytes remaining: $remaining bytes total: $total bytes progression: $percent % busy: $busy ready: $ready \n";
                }

                $readycounter++ if $running_mirror_jobs->{$job}->{ready};
            }

            last if scalar(keys %$jobs) == 0;

            if ($readycounter == scalar(keys %$jobs)) {
                print "all mirroring jobs are ready \n";
                last if $skipcomplete; #do the complete later

                if ($vmiddst && $vmiddst != $vmid) {
                    my $agent_running = $qga && qga_check_running($vmid);
                    if ($agent_running) {
                        print "freeze filesystem\n";
                        eval { mon_cmd($vmid, "guest-fsfreeze-freeze"); };
                        warn $@ if $@;
                    } else {
                        print "suspend vm\n";
                        eval { PVE::QemuServer::vm_suspend($vmid, 1); };
                        warn $@ if $@;
                    }

                    # if we clone a disk for a new target vm, we don't switch the disk
                    # NOTE: the error is kept and re-thrown only after the guest
                    # was thawed/resumed, so a failing cancel cannot leave the
                    # guest frozen or suspended.
                    eval { PVE::QemuServer::qemu_blockjobs_cancel($vmid, $jobs); };
                    my $cancel_err = $@;

                    if ($agent_running) {
                        print "unfreeze filesystem\n";
                        eval { mon_cmd($vmid, "guest-fsfreeze-thaw"); };
                        warn $@ if $@;
                    } else {
                        print "resume vm\n";
                        eval { PVE::QemuServer::vm_resume($vmid, 1, 1); };
                        warn $@ if $@;
                    }

                    die $cancel_err if $cancel_err;

                    last;
                } else {

                    foreach my $job (keys %$jobs) {
                        # try to switch the disk if source and destination are on the same guest
                        print "$job: Completing block job...\n";

                        eval { mon_cmd($vmid, "block-job-complete", device => $job) };
                        if ($@ =~ m/cannot be completed/) {
                            print "$job: Block job cannot be completed, try again.\n";
                            $err_complete++;
                        } else {
                            print "$job: Completed successfully.\n";
                            $jobs->{$job}->{complete} = 1;
                        }
                    }
                }
            }
            sleep 1;
        }
    };
    my $err = $@;

    if ($err) {
        # best-effort cleanup; report a failing cancel but keep the original error
        eval { PVE::QemuServer::qemu_blockjobs_cancel($vmid, $jobs) };
        warn $@ if $@;
        die "mirroring error: $err";
    }

}
6445
# Cancel all block jobs listed in $jobs and wait until they are gone.
#
# $vmid - VM the block jobs run on
# $jobs - hash keyed by QEMU device name; every entry gets a 'cancel' flag and
#         is deleted from the hash once 'query-block-jobs' no longer lists it
#
# Errors of the individual 'block-job-cancel' commands are ignored. The
# function polls once per second and only returns when $jobs is empty.
sub qemu_blockjobs_cancel {
    my ($vmid, $jobs) = @_;

    foreach my $device (keys %$jobs) {
        print "$device: Cancelling block job\n";
        eval { mon_cmd($vmid, "block-job-cancel", device => $device); };
        $jobs->{$device}->{cancel} = 1;
    }

    while (1) {
        my $stats = mon_cmd($vmid, "query-block-jobs");

        # index the jobs QEMU still knows about by device name
        my %active;
        foreach my $stat (@$stats) {
            $active{$stat->{device}} = $stat;
        }

        foreach my $device (keys %$jobs) {
            next if !defined($jobs->{$device}->{cancel});
            next if defined($active{$device});

            print "$device: Done.\n";
            delete $jobs->{$device};
        }

        last if scalar(keys %$jobs) == 0;

        sleep 1;
    }
}
6476
# Clone one drive of a VM, either as linked clone or as full copy.
#
# $storecfg    - storage configuration
# $vmid        - source VM ID
# $running     - true if the source VM is running
# $drivename   - name of the drive, e.g. used for the mirror job device name
# $drive       - parsed drive hash; NOTE: this hash is modified and returned
# $snapname    - optional snapshot to clone from
# $newvmid     - VM ID the new volume is allocated for
# $storage     - optional target storage (defaults to the source storage)
# $format      - optional target format, see resolve_dst_disk_format()
# $full        - true for a full copy, false for a linked clone
# $newvollist  - array ref; the new volume ID is pushed onto it
# $jobs, $skipcomplete, $qga, $bwlimit - passed on to qemu_drive_mirror()
#
# A full clone of a cloud-init drive only allocates a fresh volume, no data is
# copied. Other drives are copied with qemu_img_convert() if the VM is not
# running or a snapshot is cloned, and with qemu_drive_mirror() otherwise.
#
# Returns the drive hash with 'file' and 'size' pointing at the new volume and
# 'format' reset to undef.
sub clone_disk {
    my ($storecfg, $vmid, $running, $drivename, $drive, $snapname,
        $newvmid, $storage, $format, $full, $newvollist, $jobs, $skipcomplete, $qga, $bwlimit) = @_;

    my $newvolid;

    if (!$full) {
        print "create linked clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_clone($storecfg, $drive->{file}, $newvmid, $snapname);
        push @$newvollist, $newvolid;
    } else {

        my ($storeid, $volname) = PVE::Storage::parse_volume_id($drive->{file});
        $storeid = $storage if $storage;

        my $dst_format = resolve_dst_disk_format($storecfg, $storeid, $volname, $format);
        my ($size) = PVE::Storage::volume_size_info($storecfg, $drive->{file}, 3);

        print "create full clone of drive $drivename ($drive->{file})\n";

        my $is_cloudinit = drive_is_cloudinit($drive);

        my $name = undef;
        if ($is_cloudinit) {
            $name = "vm-$newvmid-cloudinit";
            $name .= ".$dst_format" if $dst_format ne 'raw';
            $snapname = undef;
            $size = PVE::QemuServer::Cloudinit::CLOUDINIT_DISK_SIZE;
        }
        $newvolid = PVE::Storage::vdisk_alloc($storecfg, $storeid, $newvmid, $dst_format, $name, ($size/1024));
        push @$newvollist, $newvolid;

        PVE::Storage::activate_volumes($storecfg, [$newvolid]);

        # cloud-init drives only get a freshly allocated volume, no data copy
        if (!$is_cloudinit) {
            my $sparseinit = PVE::Storage::volume_has_feature($storecfg, 'sparseinit', $newvolid);
            if (!$running || $snapname) {
                # TODO: handle bwlimits
                qemu_img_convert($drive->{file}, $newvolid, $size, $snapname, $sparseinit);
            } else {

                my $kvmver = get_running_qemu_version($vmid);
                if (!min_version($kvmver, 2, 7)) {
                    die "drive-mirror with iothread requires qemu version 2.7 or higher\n"
                        if $drive->{iothread};
                }

                qemu_drive_mirror($vmid, $drivename, $newvolid, $newvmid, $sparseinit, $jobs, $skipcomplete, $qga, $bwlimit);
            }
        }
    }

    my ($size) = PVE::Storage::volume_size_info($storecfg, $newvolid, 3);

    # $disk is the same hash as $drive, so the caller's drive is updated too
    my $disk = $drive;
    $disk->{format} = undef;
    $disk->{file} = $newvolid;
    $disk->{size} = $size;

    return $disk;
}
6538
98cfd8b6
AD
# Ask the running QEMU process of VM $vmid for its version via the QMP
# 'query-version' command and return it as "<major>.<minor>" string.
sub get_running_qemu_version {
    my ($vmid) = @_;

    my $res = mon_cmd($vmid, "query-version");

    return sprintf("%s.%s", $res->{qemu}->{major}, $res->{qemu}->{minor});
}
6544
249c4a6c
AD
# Decide whether the old (non-EFI) PXE BIOS files have to be used for a
# machine type.
#
# Returns nothing if $machine_type is empty. Otherwise returns the list
# ($use_old_bios_files, $machine_type), where a '.pxe' suffix is stripped from
# the returned machine type.
sub qemu_use_old_bios_files {
    my ($machine_type) = @_;

    return if !$machine_type;

    # an explicit '.pxe' suffix always selects the old files
    if ($machine_type =~ m/^(\S+)\.pxe$/) {
        my $base_type = $1;
        return (1, $base_type);
    }

    my $version = PVE::QemuServer::Machine::extract_version($machine_type, kvm_user_version());

    # Note: kvm version < 2.4 use non-efi pxe files, and have problems when we
    # load new efi bios files on migration. So this hack is required to allow
    # live migration from qemu-2.2 to qemu-2.4, which is sometimes used when
    # upgrading from proxmox-ve-3.X to proxmox-ve 4.0
    my $use_old_bios_files = !min_version($version, 2, 4);

    return ($use_old_bios_files, $machine_type);
}
6566
96ed3574
WB
# Allocate a new EFI vars disk and initialise it from the default OVMF vars
# image of the given architecture.
#
# $storecfg - storage configuration
# $storeid  - storage to allocate the volume on
# $vmid     - owner of the new volume
# $fmt      - image format of the new volume
# $arch     - architecture used to look up the OVMF files
#
# Dies if the default vars image does not exist. Returns the list
# ($volid, $size / 1024), with $size as reported by volume_size_info().
sub create_efidisk($$$$$) {
    my ($storecfg, $storeid, $vmid, $fmt, $arch) = @_;

    # only the second file returned by get_ovmf_files() (the vars image) is needed
    my $ovmf_vars = (get_ovmf_files($arch))[1];
    die "EFI vars default image not found\n" if ! -f $ovmf_vars;

    my $vars_size_b = -s $ovmf_vars;
    my $vars_size = PVE::Tools::convert_size($vars_size_b, 'b' => 'kb');

    my $volid = PVE::Storage::vdisk_alloc($storecfg, $storeid, $vmid, $fmt, undef, $vars_size);
    PVE::Storage::activate_volumes($storecfg, [$volid]);

    # copy the default vars image into the freshly allocated volume
    qemu_img_convert($ovmf_vars, $volid, $vars_size_b, undef, 0);

    my ($size) = PVE::Storage::volume_size_info($storecfg, $volid, 3);

    return ($volid, $size/1024);
}
6583
22de899a
AD
# Query the iothreads of VM $vmid via the QMP 'query-iothreads' command.
#
# Returns a hash ref mapping each iothread 'id' to its 'thread-id'.
sub vm_iothreads_list {
    my ($vmid) = @_;

    my $res = mon_cmd($vmid, 'query-iothreads');

    my $thread_id_of = {};
    foreach my $entry (@$res) {
        my $id = $entry->{id};
        $thread_id_of->{$id} = $entry->{"thread-id"};
    }

    return $thread_id_of;
}
6596
ee034f5c
AD
# Compute SCSI controller information for a drive.
#
# $conf  - VM configuration; only the 'scsihw' property is read
# $drive - drive hash; only the 'index' property is read
#
# Returns the list ($maxdev, $controller, $controller_prefix):
#   $maxdev            - devices per controller: 7 if 'scsihw' is unset or
#                        starts with "lsi", 1 for 'virtio-scsi-single', 256
#                        otherwise
#   $controller        - int(index / $maxdev)
#   $controller_prefix - "virtioscsi" for 'virtio-scsi-single', else "scsihw"
sub scsihw_infos {
    my ($conf, $drive) = @_;

    my $scsihw = $conf->{scsihw};
    my $is_single = $scsihw && $scsihw eq 'virtio-scsi-single';

    my $maxdev;
    if (!$scsihw || $scsihw =~ m/^lsi/) {
        $maxdev = 7;
    } else {
        $maxdev = $is_single ? 1 : 256;
    }

    my $controller = int($drive->{index} / $maxdev);
    my $controller_prefix = $is_single ? "virtioscsi" : "scsihw";

    return ($maxdev, $controller, $controller_prefix);
}
a1511b3c 6615
4317f69f
AD
# Map an 'ostype' value to a Windows major version number.
#
# Returns 5 for 'wxp', 'w2k3' and 'w2k', 6 for 'w2k8' and 'wvista', the
# number N for 'winN', and 0 for everything else (including an empty or
# undefined $ostype).
sub windows_version {
    my ($ostype) = @_;

    return 0 if !$ostype;

    my %version_of = (
        wxp => 5,
        w2k3 => 5,
        w2k => 5,
        w2k8 => 6,
        wvista => 6,
    );
    return $version_of{$ostype} if exists($version_of{$ostype});

    my ($number) = $ostype =~ m/^win(\d+)$/;
    return $number if defined($number);

    return 0;
}
6633
44549149
EK
# Pick the image format for a new volume on storage $storeid.
#
# $storecfg    - storage configuration
# $storeid     - target storage
# $src_volname - optional source volume name, used as format hint if no
#                $format was requested
# $format      - optional requested format
#
# Returns the requested (or hinted) format if the storage lists it as valid,
# otherwise the default format of the storage.
sub resolve_dst_disk_format {
    my ($storecfg, $storeid, $src_volname, $format) = @_;

    my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($storecfg, $storeid);

    if (!$format) {
        # nothing requested and no source volume to take a hint from
        return $defFormat if !$src_volname;

        # if no target format is specified, use the source disk format as hint
        my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
        $format = qemu_img_format($scfg, $src_volname);
    }

    # test if requested format is supported - else use default
    return (grep { $_ eq $format } @$validFormats) ? $format : $defFormat;
}
6653
66cebc46
DC
# NOTE: if this logic changes, please update docs & possibly gui logic
#
# Select the storage used for saving the VM state. In order of preference:
#   1. the 'vmstatestorage' set in the VM configuration
#   2. a shared storage where the VM has at least one disk
#   3. a non-shared storage where the VM has at least one disk
#   4. the storage named 'local'
# Within 2. and 3. a storage with a 'path' property replaces an earlier pick.
sub find_vmstate_storage {
    my ($conf, $storecfg) = @_;

    # first, return storage from conf if set
    return $conf->{vmstatestorage} if $conf->{vmstatestorage};

    my %candidate;

    foreach_storage_used_by_vm($conf, sub {
        my ($sid) = @_;
        my $scfg = PVE::Storage::storage_config($storecfg, $sid);
        my $kind = $scfg->{shared} ? 'shared' : 'local';
        # prefer file based storage
        $candidate{$kind} = $sid if !$candidate{$kind} || $scfg->{path};
    });

    return $candidate{shared} // $candidate{local} // 'local';
}
6677
# Generate a new UUID with the UUID module and return its string form as
# produced by UUID::unparse().
sub generate_uuid {
    my $binary;
    UUID::generate($binary);

    my $text;
    UUID::unparse($binary, $text);

    return $text;
}
6684
# Return a "uuid=<uuid>" string built from a freshly generated UUID.
sub generate_smbios1_uuid {
    my $uuid = generate_uuid();
    return "uuid=$uuid";
}
6688
9c152e87
TL
# Send the QMP 'nbd-server-stop' command to VM $vmid.
sub nbd_stop {
    my ($vmid) = @_;

    return mon_cmd($vmid, 'nbd-server-stop');
}
6694
dae98db9
DC
# Create the (empty) reboot trigger file /run/qemu-server/<vmid>.reboot.
# Dies if the file cannot be opened for writing.
sub create_reboot_request {
    my ($vmid) = @_;

    my $trigger_file = "/run/qemu-server/$vmid.reboot";

    open(my $fh, '>', $trigger_file)
        or die "failed to create reboot trigger file: $!\n";
    close($fh);
}
6701
# Remove the reboot trigger file /run/qemu-server/<vmid>.reboot.
#
# Returns the result of unlink(), i.e. a true value if the file was removed
# and 0 if it did not exist. Dies if removing fails for any reason other than
# ENOENT.
sub clear_reboot_request {
    my ($vmid) = @_;

    my $removed = unlink("/run/qemu-server/$vmid.reboot");

    # a missing trigger file is not an error
    if (!$removed && $! != POSIX::ENOENT) {
        die "could not remove reboot request for $vmid: $!";
    }

    return $removed;
}
6713
65e866e5
DM
6714# bash completion helper
6715
# Completion helper returning the volume IDs of backup archives.
#
# $cmdname, $pname - unused
# $cvalue          - value typed so far; a leading "<storeid>:" restricts the
#                    lookup to that storage
#
# Only entries whose format is 'vma.gz' or 'vma.lzo' and which have a volid
# are returned (as array ref).
sub complete_backup_archives {
    my ($cmdname, $pname, $cvalue) = @_;

    my $cfg = PVE::Storage::config();

    # stays undef if no storage prefix was typed yet
    my ($storeid) = $cvalue =~ m/^([^:]+):/;

    my $data = PVE::Storage::template_list($cfg, $storeid, 'backup');

    my $res = [];
    foreach my $items (values %$data) {
        foreach my $item (@$items) {
            next if $item->{format} !~ m/^vma\.(gz|lzo)$/;
            next if !defined($item->{volid});
            push @$res, $item->{volid};
        }
    }

    return $res;
}
6739
# Return an array ref with the IDs of the VMs listed by vmstatus().
#
# $running - undef: all VMs
#            true:  only non-template VMs whose status is 'running'
#            false: only non-template VMs whose status is not 'running'
my $complete_vmid_full = sub {
    my ($running) = @_;

    my $idlist = vmstatus();

    my $res = [];

    foreach my $id (keys %$idlist) {
        my $d = $idlist->{$id};
        if (defined($running)) {
            next if $d->{template};

            my $is_running = $d->{status} eq 'running';
            next if $running ? !$is_running : $is_running;
        }
        push @$res, $id;
    }

    return $res;
};
6759
# Completion helper: IDs of all VMs.
sub complete_vmid {
    return $complete_vmid_full->();
}
6763
# Completion helper: IDs of all non-template VMs that are not running.
sub complete_vmid_stopped {
    return $complete_vmid_full->(0);
}
6767
# Completion helper: IDs of all non-template VMs that are running.
sub complete_vmid_running {
    return $complete_vmid_full->(1);
}
6771
335af808
DM
# Completion helper: IDs of all storages that pass
# PVE::Storage::storage_check_enabled() for the local node and have the
# 'images' content type configured.
sub complete_storage {

    my $cfg = PVE::Storage::config();
    my $ids = $cfg->{ids};

    my @usable = grep {
        PVE::Storage::storage_check_enabled($cfg, $_, undef, 1)
            && $ids->{$_}->{content}->{images}
    } keys %$ids;

    return [ @usable ];
}
6786
255e9c54
AL
# Completion helper: IDs of all storages usable as migration target.
#
# $cmd, $param, $current_value - unused
# $all_args                    - array ref of the arguments given so far; the
#                                element at index 1 is used as target node
#
# Returns an array ref with the IDs of all storages that pass
# PVE::Storage::storage_check_enabled() for the target node and have the
# 'images' content type configured.
sub complete_migration_storage {
    my ($cmd, $param, $current_value, $all_args) = @_;

    # plain element access instead of the one-element slice '@$all_args[1]'
    my $targetnode = $all_args->[1];

    my $cfg = PVE::Storage::config();
    my $ids = $cfg->{ids};

    my $res = [];
    foreach my $sid (keys %$ids) {
        next if !PVE::Storage::storage_check_enabled($cfg, $sid, $targetnode, 1);
        next if !$ids->{$sid}->{content}->{images};
        push @$res, $sid;
    }

    return $res;
}
6804
1e3baf05 68051;