]> git.proxmox.com Git - qemu-server.git/blame - PVE/QemuServer.pm
don't use cirrus by default for sane OS'
[qemu-server.git] / PVE / QemuServer.pm
CommitLineData
1e3baf05
DM
1package PVE::QemuServer;
2
3use strict;
990fc5e2 4use warnings;
1e3baf05
DM
5use POSIX;
6use IO::Handle;
7use IO::Select;
8use IO::File;
9use IO::Dir;
10use IO::Socket::UNIX;
11use File::Basename;
12use File::Path;
13use File::stat;
14use Getopt::Long;
fc1ddcdc 15use Digest::SHA;
1e3baf05
DM
16use Fcntl ':flock';
17use Cwd 'abs_path';
18use IPC::Open3;
c971c4f2 19use JSON;
1e3baf05
DM
20use Fcntl;
21use PVE::SafeSyslog;
22use Storable qw(dclone);
23use PVE::Exception qw(raise raise_param_exc);
24use PVE::Storage;
4543ecf0 25use PVE::Tools qw(run_command lock_file lock_file_full file_read_firstline dir_glob_foreach);
b7ba6b79 26use PVE::JSONSchema qw(get_standard_option);
1e3baf05
DM
27use PVE::Cluster qw(cfs_register_file cfs_read_file cfs_write_file cfs_lock_file);
28use PVE::INotify;
29use PVE::ProcFSTools;
ffda963f 30use PVE::QemuConfig;
26f11676 31use PVE::QMPClient;
91bd6c90 32use PVE::RPCEnvironment;
de9768f0 33use PVE::QemuServer::PCI qw(print_pci_addr print_pcie_addr);
3f669af2 34use PVE::QemuServer::Memory;
d40e5e18 35use PVE::QemuServer::USB qw(parse_usb_device);
6b64503e 36use Time::HiRes qw(gettimeofday);
a783c78e 37use File::Copy qw(copy);
46630a5f 38use URI::Escape;
1e3baf05 39
2ddc0a5c
DC
40my $OVMF_CODE = '/usr/share/kvm/OVMF_CODE-pure-efi.fd';
41my $OVMF_VARS = '/usr/share/kvm/OVMF_VARS-pure-efi.fd';
42my $OVMF_IMG = '/usr/share/kvm/OVMF-pure-efi.fd';
43
e5eaa028
WL
44my $qemu_snap_storage = {rbd => 1, sheepdog => 1};
45
7f0b5beb 46my $cpuinfo = PVE::ProcFSTools::read_cpuinfo();
1e3baf05 47
# Note about locking: we use flock on the config file to protect
# against concurrent actions.
# Additionally, we have a 'lock' setting in the config file. This
# can be set to 'migrate', 'backup', 'snapshot' or 'rollback'. Most actions are not
# allowed when such lock is set. But you can ignore this kind of
# lock with the --skiplock flag.
54
97d62eb7 55cfs_register_file('/qemu-server/',
1858638f
DM
56 \&parse_vm_config,
57 \&write_vm_config);
1e3baf05 58
3ea94c60
DM
59PVE::JSONSchema::register_standard_option('pve-qm-stateuri', {
60 description => "Some command save/restore state from this location.",
61 type => 'string',
62 maxLength => 128,
63 optional => 1,
64});
65
8abd398b
DM
66PVE::JSONSchema::register_standard_option('pve-snapshot-name', {
67 description => "The name of the snapshot.",
68 type => 'string', format => 'pve-configid',
69 maxLength => 40,
70});
71
c7d2b650
DM
72PVE::JSONSchema::register_standard_option('pve-qm-image-format', {
73 type => 'string',
74 enum => [qw(raw cow qcow qed qcow2 vmdk cloop)],
75 description => "The drive's backing file's data format.",
76 optional => 1,
77});
78
1e3baf05
DM
79#no warnings 'redefine';
80
c8effec3
AD
# Write a single value to a cgroup control file of a VM's scope.
#
# Parameters:
#   $controller - cgroup controller directory name (first path component
#                 below /sys/fs/cgroup)
#   $vmid       - VM id; the scope directory is "$vmid.scope" inside qemu.slice
#   $option     - name of the control file inside the scope directory
#   $value      - value handed to the writer
#
# Returns whatever PVE::ProcFSTools::write_proc_entry() returns; any
# exception raised by that helper propagates to the caller.
sub cgroups_write {
    my ($controller, $vmid, $option, $value) = @_;

    # "$vmid.scope" interpolates $vmid followed by the literal ".scope"
    my $path = "/sys/fs/cgroup/$controller/qemu.slice/$vmid.scope/$option";

    return PVE::ProcFSTools::write_proc_entry($path, $value);
}
88
1e3baf05
DM
89my $nodename = PVE::INotify::nodename();
90
91mkdir "/etc/pve/nodes/$nodename";
92my $confdir = "/etc/pve/nodes/$nodename/qemu-server";
93mkdir $confdir;
94
95my $var_run_tmpdir = "/var/run/qemu-server";
96mkdir $var_run_tmpdir;
97
98my $lock_dir = "/var/lock/qemu-server";
99mkdir $lock_dir;
100
101my $pcisysfs = "/sys/bus/pci";
102
8930da74
DM
103my $cpu_vendor_list = {
104 # Intel CPUs
105 486 => 'GenuineIntel',
106 pentium => 'GenuineIntel',
107 pentium2 => 'GenuineIntel',
108 pentium3 => 'GenuineIntel',
109 coreduo => 'GenuineIntel',
110 core2duo => 'GenuineIntel',
111 Conroe => 'GenuineIntel',
112 Penryn => 'GenuineIntel',
113 Nehalem => 'GenuineIntel',
114 Westmere => 'GenuineIntel',
115 SandyBridge => 'GenuineIntel',
116 IvyBridge => 'GenuineIntel',
117 Haswell => 'GenuineIntel',
118 'Haswell-noTSX' => 'GenuineIntel',
119 Broadwell => 'GenuineIntel',
120 'Broadwell-noTSX' => 'GenuineIntel',
3db920fc 121 'Skylake-Client' => 'GenuineIntel',
8930da74
DM
122
123 # AMD CPUs
124 athlon => 'AuthenticAMD',
125 phenom => 'AuthenticAMD',
126 Opteron_G1 => 'AuthenticAMD',
127 Opteron_G2 => 'AuthenticAMD',
128 Opteron_G3 => 'AuthenticAMD',
129 Opteron_G4 => 'AuthenticAMD',
130 Opteron_G5 => 'AuthenticAMD',
131
132 # generic types, use vendor from host node
133 host => 'default',
134 kvm32 => 'default',
135 kvm64 => 'default',
136 qemu32 => 'default',
137 qemu64 => 'default',
138};
139
ff6ffe20 140my $cpu_fmt = {
16a91d65
WB
141 cputype => {
142 description => "Emulated CPU type.",
143 type => 'string',
7f694a71 144 enum => [ sort { "\L$a" cmp "\L$b" } keys %$cpu_vendor_list ],
16a91d65
WB
145 default => 'kvm64',
146 default_key => 1,
147 },
148 hidden => {
149 description => "Do not identify as a KVM virtual machine.",
150 type => 'boolean',
151 optional => 1,
152 default => 0
153 },
154};
155
ec3582b5
WB
156my $watchdog_fmt = {
157 model => {
158 default_key => 1,
159 type => 'string',
160 enum => [qw(i6300esb ib700)],
161 description => "Watchdog type to emulate.",
162 default => 'i6300esb',
163 optional => 1,
164 },
165 action => {
166 type => 'string',
167 enum => [qw(reset shutdown poweroff pause debug none)],
168 description => "The action to perform if after activation the guest fails to poll the watchdog in time.",
169 optional => 1,
170 },
171};
172PVE::JSONSchema::register_format('pve-qm-watchdog', $watchdog_fmt);
173
1e3baf05
DM
174my $confdesc = {
175 onboot => {
176 optional => 1,
177 type => 'boolean',
178 description => "Specifies whether a VM will be started during system bootup.",
179 default => 0,
180 },
181 autostart => {
182 optional => 1,
183 type => 'boolean',
184 description => "Automatic restart after crash (currently ignored).",
185 default => 0,
186 },
2ff09f52
DA
187 hotplug => {
188 optional => 1,
b3c2bdd1
DM
189 type => 'string', format => 'pve-hotplug-features',
190 description => "Selectively enable hotplug features. This is a comma separated list of hotplug features: 'network', 'disk', 'cpu', 'memory' and 'usb'. Use '0' to disable hotplug completely. Value '1' is an alias for the default 'network,disk,usb'.",
191 default => 'network,disk,usb',
2ff09f52 192 },
1e3baf05
DM
193 reboot => {
194 optional => 1,
195 type => 'boolean',
196 description => "Allow reboot. If set to '0' the VM exit on reboot.",
197 default => 1,
198 },
199 lock => {
200 optional => 1,
201 type => 'string',
202 description => "Lock/unlock the VM.",
22c377f0 203 enum => [qw(migrate backup snapshot rollback)],
1e3baf05
DM
204 },
205 cpulimit => {
206 optional => 1,
c6f773b8 207 type => 'number',
52261945
DM
208 description => "Limit of CPU usage.",
209 verbose_description => "Limit of CPU usage.\n\nNOTE: If the computer has 2 CPUs, it has total of '2' CPU time. Value '0' indicates no CPU limit.",
1e3baf05 210 minimum => 0,
c6f773b8 211 maximum => 128,
52261945 212 default => 0,
1e3baf05
DM
213 },
214 cpuunits => {
215 optional => 1,
216 type => 'integer',
52261945
DM
217 description => "CPU weight for a VM.",
218 verbose_description => "CPU weight for a VM. Argument is used in the kernel fair scheduler. The larger the number is, the more CPU time this VM gets. Number is relative to weights of all the other running VMs.\n\nNOTE: You can disable fair-scheduler configuration by setting this to 0.",
1e3baf05
DM
219 minimum => 0,
220 maximum => 500000,
613d76a1 221 default => 1024,
1e3baf05
DM
222 },
223 memory => {
224 optional => 1,
225 type => 'integer',
7878afeb 226 description => "Amount of RAM for the VM in MB. This is the maximum available memory when you use the balloon device.",
1e3baf05
DM
227 minimum => 16,
228 default => 512,
229 },
13a48620
DA
230 balloon => {
231 optional => 1,
232 type => 'integer',
8b1accf7
DM
233 description => "Amount of target RAM for the VM in MB. Using zero disables the ballon driver.",
234 minimum => 0,
235 },
236 shares => {
237 optional => 1,
238 type => 'integer',
239 description => "Amount of memory shares for auto-ballooning. The larger the number is, the more memory this VM gets. Number is relative to weights of all other running VMs. Using zero disables auto-ballooning",
240 minimum => 0,
241 maximum => 50000,
242 default => 1000,
13a48620 243 },
1e3baf05
DM
244 keyboard => {
245 optional => 1,
246 type => 'string',
fad17f04 247 description => "Keybord layout for vnc server. Default is read from the '/etc/pve/datacenter.conf' configuration file.",
e95fe75f 248 enum => PVE::Tools::kvmkeymaplist(),
1e3baf05
DM
249 default => 'en-us',
250 },
251 name => {
252 optional => 1,
7fabe17d 253 type => 'string', format => 'dns-name',
1e3baf05
DM
254 description => "Set a name for the VM. Only used on the configuration web interface.",
255 },
cdd20088
AD
256 scsihw => {
257 optional => 1,
258 type => 'string',
52261945 259 description => "SCSI controller model",
6731a4cf 260 enum => [qw(lsi lsi53c810 virtio-scsi-pci virtio-scsi-single megasas pvscsi)],
cdd20088
AD
261 default => 'lsi',
262 },
1e3baf05
DM
263 description => {
264 optional => 1,
265 type => 'string',
0581fe4f 266 description => "Description for the VM. Only used on the configuration web interface. This is saved as comment inside the configuration file.",
1e3baf05
DM
267 },
268 ostype => {
269 optional => 1,
270 type => 'string',
0cb9971e 271 enum => [qw(other wxp w2k w2k3 w2k8 wvista win7 win8 win10 l24 l26 solaris)],
52261945
DM
272 description => "Specify guest operating system.",
273 verbose_description => <<EODESC,
274Specify guest operating system. This is used to enable special
275optimization/features for specific operating systems:
276
277[horizontal]
278other;; unspecified OS
279wxp;; Microsoft Windows XP
280w2k;; Microsoft Windows 2000
281w2k3;; Microsoft Windows 2003
282w2k8;; Microsoft Windows 2008
283wvista;; Microsoft Windows Vista
284win7;; Microsoft Windows 7
285win8;; Microsoft Windows 8/2012
286l24;; Linux 2.4 Kernel
287l26;; Linux 2.6/3.X Kernel
288solaris;; Solaris/OpenSolaris/OpenIndiania kernel
1e3baf05
DM
289EODESC
290 },
291 boot => {
292 optional => 1,
293 type => 'string',
294 description => "Boot on floppy (a), hard disk (c), CD-ROM (d), or network (n).",
295 pattern => '[acdn]{1,4}',
32baffb4 296 default => 'cdn',
1e3baf05
DM
297 },
298 bootdisk => {
299 optional => 1,
300 type => 'string', format => 'pve-qm-bootdisk',
301 description => "Enable booting from specified disk.",
03e480fc 302 pattern => '(ide|sata|scsi|virtio)\d+',
1e3baf05
DM
303 },
304 smp => {
305 optional => 1,
306 type => 'integer',
307 description => "The number of CPUs. Please use option -sockets instead.",
308 minimum => 1,
309 default => 1,
310 },
311 sockets => {
312 optional => 1,
313 type => 'integer',
314 description => "The number of CPU sockets.",
315 minimum => 1,
316 default => 1,
317 },
318 cores => {
319 optional => 1,
320 type => 'integer',
321 description => "The number of cores per socket.",
322 minimum => 1,
323 default => 1,
324 },
8a010eae
AD
325 numa => {
326 optional => 1,
327 type => 'boolean',
1917695c 328 description => "Enable/disable NUMA.",
8a010eae
AD
329 default => 0,
330 },
7023f3ea
AD
331 hugepages => {
332 optional => 1,
333 type => 'string',
334 description => "Enable/disable hugepages memory.",
335 enum => [qw(any 2 1024)],
336 },
de9d1e55 337 vcpus => {
3bd18e48
AD
338 optional => 1,
339 type => 'integer',
de9d1e55 340 description => "Number of hotplugged vcpus.",
3bd18e48 341 minimum => 1,
de9d1e55 342 default => 0,
3bd18e48 343 },
1e3baf05
DM
344 acpi => {
345 optional => 1,
346 type => 'boolean',
347 description => "Enable/disable ACPI.",
348 default => 1,
349 },
bc84dcca 350 agent => {
ab6a046f
AD
351 optional => 1,
352 type => 'boolean',
353 description => "Enable/disable Qemu GuestAgent.",
be79c214 354 default => 0,
ab6a046f 355 },
1e3baf05
DM
356 kvm => {
357 optional => 1,
358 type => 'boolean',
359 description => "Enable/disable KVM hardware virtualization.",
360 default => 1,
361 },
362 tdf => {
363 optional => 1,
364 type => 'boolean',
8c559505
DM
365 description => "Enable/disable time drift fix.",
366 default => 0,
1e3baf05 367 },
19672434 368 localtime => {
1e3baf05
DM
369 optional => 1,
370 type => 'boolean',
371 description => "Set the real time clock to local time. This is enabled by default if ostype indicates a Microsoft OS.",
372 },
373 freeze => {
374 optional => 1,
375 type => 'boolean',
376 description => "Freeze CPU at startup (use 'c' monitor command to start execution).",
377 },
378 vga => {
379 optional => 1,
380 type => 'string',
52261945
DM
381 description => "Select the VGA type.",
382 verbose_description => "Select the VGA type. If you want to use high resolution" .
1917695c
TL
383 " modes (>= 1280x1024x16) then you should use the options " .
384 "'std' or 'vmware'. Default is 'std' for win8/win7/w2k8, and " .
385 "'cirrus' for other OS types. The 'qxl' option enables the SPICE " .
386 "display sever. For win* OS you can select how many independent " .
387 "displays you want, Linux guests can add displays them self. " .
388 "You can also run without any graphic card, using a serial device" .
389 " as terminal.",
2fa3151e 390 enum => [qw(std cirrus vmware qxl serial0 serial1 serial2 serial3 qxl2 qxl3 qxl4)],
1e3baf05 391 },
0ea9541d
DM
392 watchdog => {
393 optional => 1,
394 type => 'string', format => 'pve-qm-watchdog',
52261945
DM
395 description => "Create a virtual hardware watchdog device.",
396 verbose_description => "Create a virtual hardware watchdog device. Once enabled" .
1917695c
TL
397 " (by a guest action), the watchdog must be periodically polled " .
398 "by an agent inside the guest or else the watchdog will reset " .
399 "the guest (or execute the respective action specified)",
0ea9541d 400 },
1e3baf05
DM
401 startdate => {
402 optional => 1,
19672434 403 type => 'string',
1e3baf05
DM
404 typetext => "(now | YYYY-MM-DD | YYYY-MM-DDTHH:MM:SS)",
405 description => "Set the initial date of the real time clock. Valid format for date are: 'now' or '2006-06-17T16:01:21' or '2006-06-17'.",
406 pattern => '(now|\d{4}-\d{1,2}-\d{1,2}(T\d{1,2}:\d{1,2}:\d{1,2})?)',
407 default => 'now',
408 },
43574f73 409 startup => get_standard_option('pve-startup-order'),
68eda3ab
AD
410 template => {
411 optional => 1,
412 type => 'boolean',
413 description => "Enable/disable Template.",
414 default => 0,
415 },
1e3baf05
DM
416 args => {
417 optional => 1,
418 type => 'string',
52261945
DM
419 description => "Arbitrary arguments passed to kvm.",
420 verbose_description => <<EODESCR,
c7a8aad6 421Arbitrary arguments passed to kvm, for example:
1e3baf05
DM
422
423args: -no-reboot -no-hpet
c7a8aad6
FG
424
425NOTE: this option is for experts only.
1e3baf05
DM
426EODESCR
427 },
428 tablet => {
429 optional => 1,
430 type => 'boolean',
431 default => 1,
52261945
DM
432 description => "Enable/disable the USB tablet device.",
433 verbose_description => "Enable/disable the USB tablet device. This device is " .
1917695c
TL
434 "usually needed to allow absolute mouse positioning with VNC. " .
435 "Else the mouse runs out of sync with normal VNC clients. " .
436 "If you're running lots of console-only guests on one host, " .
437 "you may consider disabling this to save some context switches. " .
438 "This is turned off by default if you use spice (-vga=qxl).",
1e3baf05
DM
439 },
440 migrate_speed => {
441 optional => 1,
442 type => 'integer',
443 description => "Set maximum speed (in MB/s) for migrations. Value 0 is no limit.",
444 minimum => 0,
445 default => 0,
446 },
447 migrate_downtime => {
448 optional => 1,
04432191 449 type => 'number',
1e3baf05
DM
450 description => "Set maximum tolerated downtime (in seconds) for migrations.",
451 minimum => 0,
04432191 452 default => 0.1,
1e3baf05
DM
453 },
454 cdrom => {
455 optional => 1,
b799312f 456 type => 'string', format => 'pve-qm-ide',
8485b9ba 457 typetext => '<volume>',
1e3baf05
DM
458 description => "This is an alias for option -ide2",
459 },
460 cpu => {
461 optional => 1,
462 description => "Emulated CPU type.",
463 type => 'string',
ff6ffe20 464 format => $cpu_fmt,
1e3baf05 465 },
b7ba6b79
DM
466 parent => get_standard_option('pve-snapshot-name', {
467 optional => 1,
468 description => "Parent snapshot name. This is used internally, and should not be modified.",
469 }),
982c7f12
DM
470 snaptime => {
471 optional => 1,
472 description => "Timestamp for snapshots.",
473 type => 'integer',
474 minimum => 0,
475 },
18bfb361
DM
476 vmstate => {
477 optional => 1,
478 type => 'string', format => 'pve-volume-id',
479 description => "Reference to a volume which stores the VM state. This is used internally for snapshots.",
480 },
3bafc510
DM
481 machine => {
482 description => "Specific the Qemu machine type.",
483 type => 'string',
7bac824e 484 pattern => '(pc|pc(-i440fx)?-\d+\.\d+(\.pxe)?|q35|pc-q35-\d+\.\d+(\.pxe)?)',
3bafc510
DM
485 maxLength => 40,
486 optional => 1,
487 },
2796e7d5
DM
488 smbios1 => {
489 description => "Specify SMBIOS type 1 fields.",
490 type => 'string', format => 'pve-qm-smbios1',
2796e7d5
DM
491 maxLength => 256,
492 optional => 1,
493 },
cb0e4540
AG
494 protection => {
495 optional => 1,
496 type => 'boolean',
52261945 497 description => "Sets the protection flag of the VM. This will disable the remove VM and remove disk operations.",
cb0e4540
AG
498 default => 0,
499 },
3edb45e7 500 bios => {
a783c78e 501 optional => 1,
3edb45e7
DM
502 type => 'string',
503 enum => [ qw(seabios ovmf) ],
504 description => "Select BIOS implementation.",
505 default => 'seabios',
a783c78e 506 },
1e3baf05
DM
507};
508
509# what about other qemu settings ?
510#cpu => 'string',
511#machine => 'string',
512#fda => 'file',
513#fdb => 'file',
514#mtdblock => 'file',
515#sd => 'file',
516#pflash => 'file',
517#snapshot => 'bool',
518#bootp => 'file',
519##tftp => 'dir',
520##smb => 'dir',
521#kernel => 'file',
522#append => 'string',
523#initrd => 'file',
524##soundhw => 'string',
525
526while (my ($k, $v) = each %$confdesc) {
527 PVE::JSONSchema::register_standard_option("pve-qm-$k", $v);
528}
529
530my $MAX_IDE_DISKS = 4;
f62db2a4 531my $MAX_SCSI_DISKS = 14;
a2650619 532my $MAX_VIRTIO_DISKS = 16;
cdb0931f 533my $MAX_SATA_DISKS = 6;
1e3baf05 534my $MAX_USB_DEVICES = 5;
5bdcf937 535my $MAX_NETS = 32;
1e3baf05 536my $MAX_UNUSED_DISKS = 8;
5cffb2d2 537my $MAX_HOSTPCI_DEVICES = 4;
bae179aa 538my $MAX_SERIAL_PORTS = 4;
1989a89c 539my $MAX_PARALLEL_PORTS = 3;
2ed5d572
AD
540my $MAX_NUMA = 8;
541
ffc0d8c7
WB
542my $numa_fmt = {
543 cpus => {
544 type => "string",
545 pattern => qr/\d+(?:-\d+)?(?:;\d+(?:-\d+)?)*/,
52261945 546 description => "CPUs accessing this NUMA node.",
ffc0d8c7
WB
547 format_description => "id[-id];...",
548 },
549 memory => {
550 type => "number",
52261945 551 description => "Amount of memory this NUMA node provides.",
ffc0d8c7
WB
552 optional => 1,
553 },
554 hostnodes => {
555 type => "string",
556 pattern => qr/\d+(?:-\d+)?(?:;\d+(?:-\d+)?)*/,
52261945 557 description => "Host NUMA nodes to use.",
ffc0d8c7
WB
558 format_description => "id[-id];...",
559 optional => 1,
560 },
561 policy => {
562 type => 'string',
563 enum => [qw(preferred bind interleave)],
52261945 564 description => "NUMA allocation policy.",
ffc0d8c7
WB
565 optional => 1,
566 },
567};
568PVE::JSONSchema::register_format('pve-qm-numanode', $numa_fmt);
2ed5d572
AD
569my $numadesc = {
570 optional => 1,
ffc0d8c7 571 type => 'string', format => $numa_fmt,
52261945 572 description => "NUMA topology.",
2ed5d572
AD
573};
574PVE::JSONSchema::register_standard_option("pve-qm-numanode", $numadesc);
575
576for (my $i = 0; $i < $MAX_NUMA; $i++) {
577 $confdesc->{"numa$i"} = $numadesc;
578}
1e3baf05
DM
579
580my $nic_model_list = ['rtl8139', 'ne2k_pci', 'e1000', 'pcnet', 'virtio',
55034103
KT
581 'ne2k_isa', 'i82551', 'i82557b', 'i82559er', 'vmxnet3',
582 'e1000-82540em', 'e1000-82544gc', 'e1000-82545em'];
6b64503e 583my $nic_model_list_txt = join(' ', sort @$nic_model_list);
1e3baf05 584
52261945
DM
585my $net_fmt_bridge_descr = <<__EOD__;
586Bridge to attach the network device to. The Proxmox VE standard bridge
587is called 'vmbr0'.
588
589If you do not specify a bridge, we create a kvm user (NATed) network
590device, which provides DHCP and DNS services. The following addresses
591are used:
592
593 10.0.2.2 Gateway
594 10.0.2.3 DNS Server
595 10.0.2.4 SMB Server
596
597The DHCP server assign addresses to the guest starting from 10.0.2.15.
598__EOD__
599
cd9c34d1
WB
600my $net_fmt = {
601 macaddr => {
602 type => 'string',
603 pattern => qr/[0-9a-f]{2}(?::[0-9a-f]{2}){5}/i,
52261945 604 description => "MAC address. That address must be unique withing your network. This is automatically generated if not specified.",
cd9c34d1
WB
605 format_description => "XX:XX:XX:XX:XX:XX",
606 optional => 1,
607 },
7f694a71
DM
608 model => {
609 type => 'string',
52261945 610 description => "Network Card Model. The 'virtio' model provides the best performance with very low CPU overhead. If your guest does not support this driver, it is usually best to use 'e1000'.",
7f694a71
DM
611 enum => $nic_model_list,
612 default_key => 1,
613 },
614 (map { $_ => { keyAlias => 'model', alias => 'macaddr' }} @$nic_model_list),
cd9c34d1
WB
615 bridge => {
616 type => 'string',
52261945 617 description => $net_fmt_bridge_descr,
cd9c34d1
WB
618 format_description => 'bridge',
619 optional => 1,
620 },
621 queues => {
622 type => 'integer',
623 minimum => 0, maximum => 16,
624 description => 'Number of packet queues to be used on the device.',
cd9c34d1
WB
625 optional => 1,
626 },
627 rate => {
628 type => 'number',
629 minimum => 0,
52261945 630 description => "Rate limit in mbps (megabytes per second) as floating point number.",
cd9c34d1
WB
631 optional => 1,
632 },
633 tag => {
634 type => 'integer',
9f41a659 635 minimum => 1, maximum => 4094,
cd9c34d1 636 description => 'VLAN tag to apply to packets on this interface.',
cd9c34d1
WB
637 optional => 1,
638 },
639 trunks => {
640 type => 'string',
641 pattern => qr/\d+(?:-\d+)?(?:;\d+(?:-\d+)?)*/,
642 description => 'VLAN trunks to pass through this interface.',
7f694a71 643 format_description => 'vlanid[;vlanid...]',
cd9c34d1
WB
644 optional => 1,
645 },
646 firewall => {
647 type => 'boolean',
648 description => 'Whether this interface should be protected by the firewall.',
cd9c34d1
WB
649 optional => 1,
650 },
651 link_down => {
652 type => 'boolean',
52261945 653 description => 'Whether this interface should be disconnected (like pulling the plug).',
cd9c34d1
WB
654 optional => 1,
655 },
656};
52261945 657
1e3baf05
DM
658my $netdesc = {
659 optional => 1,
7f694a71 660 type => 'string', format => $net_fmt,
52261945 661 description => "Specify network devices.",
1e3baf05 662};
52261945 663
1e3baf05
DM
664PVE::JSONSchema::register_standard_option("pve-qm-net", $netdesc);
665
666for (my $i = 0; $i < $MAX_NETS; $i++) {
667 $confdesc->{"net$i"} = $netdesc;
668}
669
ffa42b86
DC
670PVE::JSONSchema::register_format('pve-volume-id-or-qm-path', \&verify_volume_id_or_qm_path);
# Verifier for the 'pve-volume-id-or-qm-path' format.
#
# Accepts the special values 'none' and 'cdrom', any string starting with
# '/', or anything that passes the 'pve-volume-id' format check.
#
# Parameters:
#   $volid - the value to verify
#   $noerr - if true, return undef instead of dying on an invalid value
#
# Returns the accepted value (for volume ids: whatever check_format()
# returns). Dies with the error from check_format() when the value is
# invalid and $noerr is not set.
sub verify_volume_id_or_qm_path {
    my ($volid, $noerr) = @_;

    if ($volid eq 'none' || $volid eq 'cdrom' || $volid =~ m|^/|) {
        return $volid;
    }

    # if it's neither 'none' nor 'cdrom' nor a path, check if it's a volume-id
    $volid = eval { PVE::JSONSchema::check_format('pve-volume-id', $volid, '') };
    # capture $@ right away so nothing in between can clobber it
    if (my $err = $@) {
        return undef if $noerr;
        die $err;
    }
    return $volid;
}
686
1e3baf05 687my $drivename_hash;
19672434 688
0541eeb8
WB
689my %drivedesc_base = (
690 volume => { alias => 'file' },
691 file => {
93c0971c 692 type => 'string',
ffa42b86 693 format => 'pve-volume-id-or-qm-path',
0541eeb8
WB
694 default_key => 1,
695 format_description => 'volume',
696 description => "The drive's backing volume.",
697 },
698 media => {
699 type => 'string',
0541eeb8
WB
700 enum => [qw(cdrom disk)],
701 description => "The drive's media type.",
702 default => 'disk',
703 optional => 1
704 },
705 cyls => {
706 type => 'integer',
0541eeb8
WB
707 description => "Force the drive's physical geometry to have a specific cylinder count.",
708 optional => 1
709 },
710 heads => {
711 type => 'integer',
0541eeb8
WB
712 description => "Force the drive's physical geometry to have a specific head count.",
713 optional => 1
714 },
715 secs => {
716 type => 'integer',
0541eeb8
WB
717 description => "Force the drive's physical geometry to have a specific sector count.",
718 optional => 1
719 },
720 trans => {
721 type => 'string',
0541eeb8
WB
722 enum => [qw(none lba auto)],
723 description => "Force disk geometry bios translation mode.",
724 optional => 1,
725 },
726 snapshot => {
727 type => 'boolean',
0541eeb8
WB
728 description => "Whether the drive should be included when making snapshots.",
729 optional => 1,
730 },
731 cache => {
732 type => 'string',
0541eeb8
WB
733 enum => [qw(none writethrough writeback unsafe directsync)],
734 description => "The drive's cache mode",
735 optional => 1,
736 },
c7d2b650 737 format => get_standard_option('pve-qm-image-format'),
0541eeb8 738 size => {
47c28a68
WB
739 type => 'string',
740 format => 'disk-size',
7f694a71 741 format_description => 'DiskSize',
0541eeb8
WB
742 description => "Disk size. This is purely informational and has no effect.",
743 optional => 1,
744 },
745 backup => {
746 type => 'boolean',
0541eeb8
WB
747 description => "Whether the drive should be included when making backups.",
748 optional => 1,
749 },
8557d01f 750 replicate => {
9edac22f 751 type => 'boolean',
3ab7663a 752 description => 'Whether the drive should considered for replication jobs.',
9edac22f
WL
753 optional => 1,
754 default => 1,
755 },
6e9d2550
AD
756 rerror => {
757 type => 'string',
758 enum => [qw(ignore report stop)],
759 description => 'Read error action.',
760 optional => 1,
761 },
0541eeb8
WB
762 werror => {
763 type => 'string',
0541eeb8
WB
764 enum => [qw(enospc ignore report stop)],
765 description => 'Write error action.',
766 optional => 1,
767 },
768 aio => {
769 type => 'string',
0541eeb8
WB
770 enum => [qw(native threads)],
771 description => 'AIO type to use.',
772 optional => 1,
773 },
774 discard => {
775 type => 'string',
0541eeb8
WB
776 enum => [qw(ignore on)],
777 description => 'Controls whether to pass discard/trim requests to the underlying storage.',
778 optional => 1,
779 },
780 detect_zeroes => {
781 type => 'boolean',
782 description => 'Controls whether to detect and try to optimize writes of zeroes.',
783 optional => 1,
784 },
785 serial => {
786 type => 'string',
46630a5f 787 format => 'urlencoded',
0541eeb8 788 format_description => 'serial',
ba8fc5d1
WB
789 maxLength => 20*3, # *3 since it's %xx url enoded
790 description => "The drive's reported serial number, url-encoded, up to 20 bytes long.",
0541eeb8
WB
791 optional => 1,
792 }
793);
794
0541eeb8
WB
795my %iothread_fmt = ( iothread => {
796 type => 'boolean',
0541eeb8
WB
797 description => "Whether to use iothreads for this drive",
798 optional => 1,
799});
800
801my %model_fmt = (
802 model => {
803 type => 'string',
46630a5f 804 format => 'urlencoded',
0541eeb8 805 format_description => 'model',
ba8fc5d1
WB
806 maxLength => 40*3, # *3 since it's %xx url enoded
807 description => "The drive's reported model name, url-encoded, up to 40 bytes long.",
0541eeb8
WB
808 optional => 1,
809 },
810);
811
812my %queues_fmt = (
813 queues => {
814 type => 'integer',
0541eeb8
WB
815 description => "Number of queues.",
816 minimum => 2,
817 optional => 1
818 }
819);
820
8e3c33ab
FG
821my %scsiblock_fmt = (
822 scsiblock => {
823 type => 'boolean',
824 description => "whether to use scsi-block for full passthrough of host block device\n\nWARNING: can lead to I/O errors in combination with low memory or high memory fragmentation on host",
825 optional => 1,
826 default => 0,
827 },
828);
829
# Register one throttling option in %drivedesc_base.
#
# Parameters:
#   $key      - option name; used as the key in %drivedesc_base
#   $type     - schema type of the option (callers pass 'integer' or 'number')
#   $what     - short phrase describing the limited quantity (goes into the
#               description text)
#   $unit     - short unit name, stored as format_description
#   $longunit - spelled-out unit, used in the description text
#   $minimum  - optional lower bound; only stored when defined
#
# Every generated entry is optional. An existing entry for $key is replaced.
my $add_throttle_desc = sub {
    my ($key, $type, $what, $unit, $longunit, $minimum) = @_;

    my $d = {
        type => $type,
        format_description => $unit,
        description => "Maximum $what in $longunit.",
        optional => 1,
    };
    # leave 'minimum' out entirely when no bound was requested
    $d->{minimum} = $minimum if defined($minimum);

    $drivedesc_base{$key} = $d;
};
841# throughput: (leaky bucket)
d3f3f1b3
DM
842$add_throttle_desc->('bps', 'integer', 'r/w speed', 'bps', 'bytes per second');
843$add_throttle_desc->('bps_rd', 'integer', 'read speed', 'bps', 'bytes per second');
844$add_throttle_desc->('bps_wr', 'integer', 'write speed', 'bps', 'bytes per second');
845$add_throttle_desc->('mbps', 'number', 'r/w speed', 'mbps', 'megabytes per second');
846$add_throttle_desc->('mbps_rd', 'number', 'read speed', 'mbps', 'megabytes per second');
847$add_throttle_desc->('mbps_wr', 'number', 'write speed', 'mbps', 'megabytes per second');
848$add_throttle_desc->('iops', 'integer', 'r/w I/O', 'iops', 'operations per second');
849$add_throttle_desc->('iops_rd', 'integer', 'read I/O', 'iops', 'operations per second');
850$add_throttle_desc->('iops_wr', 'integer', 'write I/O', 'iops', 'operations per second');
0541eeb8
WB
851
852# pools: (pool of IO before throttling starts taking effect)
d3f3f1b3
DM
853$add_throttle_desc->('mbps_max', 'number', 'unthrottled r/w pool', 'mbps', 'megabytes per second');
854$add_throttle_desc->('mbps_rd_max', 'number', 'unthrottled read pool', 'mbps', 'megabytes per second');
855$add_throttle_desc->('mbps_wr_max', 'number', 'unthrottled write pool', 'mbps', 'megabytes per second');
856$add_throttle_desc->('iops_max', 'integer', 'unthrottled r/w I/O pool', 'iops', 'operations per second');
857$add_throttle_desc->('iops_rd_max', 'integer', 'unthrottled read I/O pool', 'iops', 'operations per second');
858$add_throttle_desc->('iops_wr_max', 'integer', 'unthrottled write I/O pool', 'iops', 'operations per second');
9196a8ec
WB
859
860# burst lengths
fb8e95a2
WB
861$add_throttle_desc->('bps_max_length', 'integer', 'length of I/O bursts', 'seconds', 'seconds', 1);
862$add_throttle_desc->('bps_rd_max_length', 'integer', 'length of read I/O bursts', 'seconds', 'seconds', 1);
863$add_throttle_desc->('bps_wr_max_length', 'integer', 'length of write I/O bursts', 'seconds', 'seconds', 1);
864$add_throttle_desc->('iops_max_length', 'integer', 'length of I/O bursts', 'seconds', 'seconds', 1);
865$add_throttle_desc->('iops_rd_max_length', 'integer', 'length of read I/O bursts', 'seconds', 'seconds', 1);
866$add_throttle_desc->('iops_wr_max_length', 'integer', 'length of write I/O bursts', 'seconds', 'seconds', 1);
867
868# legacy support
869$drivedesc_base{'bps_rd_length'} = { alias => 'bps_rd_max_length' };
870$drivedesc_base{'bps_wr_length'} = { alias => 'bps_wr_max_length' };
871$drivedesc_base{'iops_rd_length'} = { alias => 'iops_rd_max_length' };
872$drivedesc_base{'iops_wr_length'} = { alias => 'iops_wr_max_length' };
0541eeb8
WB
873
874my $ide_fmt = {
875 %drivedesc_base,
0541eeb8
WB
876 %model_fmt,
877};
b799312f 878PVE::JSONSchema::register_format("pve-qm-ide", $ide_fmt);
0541eeb8 879
1e3baf05
DM
880my $idedesc = {
881 optional => 1,
0541eeb8 882 type => 'string', format => $ide_fmt,
3c770faa 883 description => "Use volume as IDE hard disk or CD-ROM (n is 0 to " .($MAX_IDE_DISKS -1) . ").",
1e3baf05
DM
884};
885PVE::JSONSchema::register_standard_option("pve-qm-ide", $idedesc);
886
0541eeb8
WB
887my $scsi_fmt = {
888 %drivedesc_base,
889 %iothread_fmt,
890 %queues_fmt,
8e3c33ab 891 %scsiblock_fmt,
0541eeb8 892};
1e3baf05
DM
893my $scsidesc = {
894 optional => 1,
0541eeb8 895 type => 'string', format => $scsi_fmt,
3c770faa 896 description => "Use volume as SCSI hard disk or CD-ROM (n is 0 to " . ($MAX_SCSI_DISKS - 1) . ").",
1e3baf05
DM
897};
898PVE::JSONSchema::register_standard_option("pve-qm-scsi", $scsidesc);
899
0541eeb8
WB
# Property-string format for sataN drives: only the shared drive options.
my $sata_fmt = { %drivedesc_base };

# Schema entry shared by all sataN configuration options.
my $satadesc = {
    type => 'string', format => $sata_fmt,
    optional => 1,
    description => "Use volume as SATA hard disk or CD-ROM (n is 0 to " . ($MAX_SATA_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-sata", $satadesc);
909
0541eeb8
WB
# Property-string format for virtioN drives: the shared drive options plus
# the iothread option group.
my $virtio_fmt = { %drivedesc_base, %iothread_fmt };

# Schema entry shared by all virtioN configuration options.
my $virtiodesc = {
    type => 'string', format => $virtio_fmt,
    optional => 1,
    description => "Use volume as VIRTIO hard disk (n is 0 to " . ($MAX_VIRTIO_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-virtio", $virtiodesc);
920
0541eeb8
WB
# Union of every per-bus drive option group. parse_drive() uses it for
# "unusedN" keys and print_drive() uses it to serialize any drive.
my $alldrive_fmt = {
    %drivedesc_base,
    %iothread_fmt, %model_fmt, %queues_fmt, %scsiblock_fmt,
};
928
6470743f
DC
# Property-string format of the EFI vars disk: a backing volume (default key
# 'file', with 'volume' as alias), an image format and an informational size.
my $efidisk_fmt = {
    file => {
        type => 'string',
        format => 'pve-volume-id-or-qm-path',
        format_description => 'volume',
        description => "The drive's backing volume.",
        default_key => 1,
    },
    volume => { alias => 'file' },
    format => get_standard_option('pve-qm-image-format'),
    size => {
        type => 'string',
        format => 'disk-size',
        format_description => 'DiskSize',
        description => "Disk size. This is purely informational and has no effect.",
        optional => 1,
    },
};

# Schema entry for the efidisk0 configuration option.
my $efidisk_desc = {
    type => 'string', format => $efidisk_fmt,
    optional => 1,
    description => "Configure a Disk for storing EFI vars",
};

PVE::JSONSchema::register_standard_option("pve-qm-efidisk", $efidisk_desc);
955
# Property-string format of a usbN entry: the host device (default key) and
# an optional usb3 flag.
my $usb_fmt = {
    host => {
        type => 'string', format => 'pve-qm-usb-device',
        format_description => 'HOSTUSBDEVICE|spice',
        default_key => 1,
        description => <<EODESCR,
The Host USB device or port or the value 'spice'. HOSTUSBDEVICE syntax is:

 'bus-port(.port)*' (decimal numbers) or
 'vendor_id:product_id' (hexadeciaml numbers) or
 'spice'

You can use the 'lsusb -t' command to list existing usb devices.

NOTE: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

The value 'spice' can be used to add a usb redirection devices for spice.
EODESCR
    },
    usb3 => {
        type => 'boolean',
        optional => 1,
        default => 0,
        description => "Specifies whether if given host option is a USB3 device or port (this does currently not work reliably with spice redirection and is then ignored).",
    },
};

# Schema entry shared by all usbN configuration options.
my $usbdesc = {
    type => 'string', format => $usb_fmt,
    optional => 1,
    description => "Configure an USB device (n is 0 to 4).",
};
PVE::JSONSchema::register_standard_option("pve-qm-usb", $usbdesc);
989
1f4f447b
WB
# One host PCI id: "bus:dev" with an optional ".func" suffix.
# NOTE: the match-groups of this regex are used in parse_hostpci
my $PCIRE = qr/([a-f0-9]{2}:[a-f0-9]{2})(?:\.([a-f0-9]))?/;

# Property-string format of a hostpciN entry.
my $hostpci_fmt = {
    host => {
        type => 'string',
        pattern => qr/$PCIRE(;$PCIRE)*/,
        format_description => 'HOSTPCIID[;HOSTPCIID2...]',
        default_key => 1,
        description => <<EODESCR,
Host PCI device pass through. The PCI ID of a host's PCI device or a list
of PCI virtual functions of the host. HOSTPCIID syntax is:

'bus:dev.func' (hexadecimal numbers)

You can us the 'lspci' command to list existing PCI devices.
EODESCR
    },
    rombar => {
        type => 'boolean',
        optional => 1,
        default => 1,
        description => "Specify whether or not the device's ROM will be visible in the guest's memory map.",
    },
    romfile => {
        type => 'string',
        pattern => '[^,;]+',
        format_description => 'string',
        optional => 1,
        description => "Custom pci device rom filename (must be located in /usr/share/kvm/).",
    },
    pcie => {
        type => 'boolean',
        optional => 1,
        default => 0,
        description => "Choose the PCI-express bus (needs the 'q35' machine model).",
    },
    'x-vga' => {
        type => 'boolean',
        optional => 1,
        default => 0,
        description => "Enable vfio-vga device support.",
    },
};
PVE::JSONSchema::register_format('pve-qm-hostpci', $hostpci_fmt);
1034
040b06b7
DA
# Schema entry shared by all hostpciN configuration options; refers to the
# registered 'pve-qm-hostpci' format by name.
my $hostpcidesc = {
    type => 'string', format => 'pve-qm-hostpci',
    optional => 1,
    description => "Map host PCI devices into guest.",
    verbose_description => <<EODESCR,
Map host PCI devices into guest.

NOTE: This option allows direct access to host hardware. So it is no longer
possible to migrate such machines - use with special care.

CAUTION: Experimental! User reported problems with this option.
EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-hostpci", $hostpcidesc);
1049
bae179aa
DA
# Schema entry shared by all serialN options: either a /dev/... path or the
# literal word 'socket'.
my $serialdesc = {
    type => 'string',
    pattern => '(/dev/.+|socket)',
    optional => 1,
    description => "Create a serial device inside the VM (n is 0 to 3)",
    verbose_description => <<EODESCR,
Create a serial device inside the VM (n is 0 to 3), and pass through a
host serial device (i.e. /dev/ttyS0), or create a unix socket on the
host side (use 'qm terminal' to open a terminal connection).

NOTE: If you pass through a host serial device, it is no longer possible to migrate such machines - use with special care.

CAUTION: Experimental! User reported problems with this option.
EODESCR
};
bae179aa 1065
1989a89c
DA
# Schema entry shared by all parallelN options: a /dev/parportN or
# /dev/usb/lpN device path.
my $paralleldesc = {
    type => 'string',
    pattern => '/dev/parport\d+|/dev/usb/lp\d+',
    optional => 1,
    description => "Map host parallel devices (n is 0 to 2).",
    verbose_description => <<EODESCR,
Map host parallel devices (n is 0 to 2).

NOTE: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

CAUTION: Experimental! User reported problems with this option.
EODESCR
};
1989a89c
DA
1079
# Register the indexed configuration options (parallelN, serialN, hostpciN,
# ideN, sataN, scsiN, virtioN, usbN, unusedN) in $confdesc. Drive buses are
# additionally recorded in $drivename_hash, which is_valid_drivename() reads.

foreach my $i (0 .. $MAX_PARALLEL_PORTS - 1) {
    $confdesc->{"parallel$i"} = $paralleldesc;
}

foreach my $i (0 .. $MAX_SERIAL_PORTS - 1) {
    $confdesc->{"serial$i"} = $serialdesc;
}

foreach my $i (0 .. $MAX_HOSTPCI_DEVICES - 1) {
    $confdesc->{"hostpci$i"} = $hostpcidesc;
}

foreach my $i (0 .. $MAX_IDE_DISKS - 1) {
    $drivename_hash->{"ide$i"} = 1;
    $confdesc->{"ide$i"} = $idedesc;
}

foreach my $i (0 .. $MAX_SATA_DISKS - 1) {
    $drivename_hash->{"sata$i"} = 1;
    $confdesc->{"sata$i"} = $satadesc;
}

foreach my $i (0 .. $MAX_SCSI_DISKS - 1) {
    $drivename_hash->{"scsi$i"} = 1;
    $confdesc->{"scsi$i"} = $scsidesc;
}

foreach my $i (0 .. $MAX_VIRTIO_DISKS - 1) {
    $drivename_hash->{"virtio$i"} = 1;
    $confdesc->{"virtio$i"} = $virtiodesc;
}

# there is exactly one EFI vars disk
$drivename_hash->{efidisk0} = 1;
$confdesc->{efidisk0} = $efidisk_desc;

foreach my $i (0 .. $MAX_USB_DEVICES - 1) {
    $confdesc->{"usb$i"} = $usbdesc;
}

# Schema entry shared by all unusedN configuration options.
my $unuseddesc = {
    type => 'string', format => 'pve-volume-id',
    optional => 1,
    description => "Reference to unused volumes. This is used internally, and should not be modified manually.",
};

foreach my $i (0 .. $MAX_UNUSED_DISKS - 1) {
    $confdesc->{"unused$i"} = $unuseddesc;
}
1128
# Cached result of the KVM_GET_API_VERSION ioctl (0 = not determined yet).
my $kvm_api_version = 0;

# Return the KVM API version reported by /dev/kvm.
#
# The value is cached after the first successful query. Returns 0 when
# /dev/kvm cannot be opened, and the (still zero) cache value when the ioctl
# yields a false result.
sub kvm_version {

    if (!$kvm_api_version) {
        my $kvm = IO::File->new("</dev/kvm");
        return 0 if !$kvm;

        my $version = $kvm->ioctl(KVM_GET_API_VERSION(), 0);
        $kvm_api_version = $version if $version;

        $kvm->close();
    }

    return $kvm_api_version;
}
1146
# Cached version string of the kvm userspace binary.
my $kvm_user_version;

# Return the version printed by "kvm -version" (e.g. "2.5" or "2.5.1").
#
# The result is cached. If the command fails (a warning is emitted) or its
# output does not match the expected pattern, the string 'unknown' is
# returned and cached.
sub kvm_user_version {

    return $kvm_user_version if $kvm_user_version;

    $kvm_user_version = 'unknown';

    # invoked by run_command for every output line
    my $parse_version_line = sub {
        my ($line) = @_;
        return if $line !~ m/^QEMU( PC)? emulator version (\d+\.\d+(\.\d+)?)(\.\d+)?[,\s]/;
        $kvm_user_version = $2;
    };

    eval { run_command("kvm -version", outfunc => $parse_version_line); };
    warn $@ if $@;

    return $kvm_user_version;
}
1168
# True when /dev/vhost-net exists as a character device; evaluated once at
# load time and consulted by print_netdev_full().
my $kernel_has_vhost_net = (-c '/dev/vhost-net');
1170
# Return the list of all valid drive option names: ide*, scsi*, virtio*,
# sata* (each 0 .. MAX-1) followed by 'efidisk0'.
sub valid_drive_names {
    # order is important - used to autoselect boot disk
    my @buses = (
        [ide => $MAX_IDE_DISKS],
        [scsi => $MAX_SCSI_DISKS],
        [virtio => $MAX_VIRTIO_DISKS],
        [sata => $MAX_SATA_DISKS],
    );

    return ((map {
                my ($bus, $count) = @$_;
                map { "$bus$_" } (0 .. ($count - 1));
            } @buses),
            'efidisk0');
}
1179
# Return true if $dev is registered as a drive option name in
# $drivename_hash (e.g. "ide0", "scsi3", "efidisk0").
sub is_valid_drivename {
    my ($dev) = @_;

    return defined($drivename_hash->{$dev});
}
1185
# Return true if $key has an entry in the configuration schema $confdesc.
sub option_exists {
    my ($key) = @_;

    return defined($confdesc->{$key});
}
1e3baf05
DM
1190
# Accessor for the file-level $nic_model_list (returned as-is, not copied).
sub nic_models {
    return $nic_model_list;
}
1194
# Return a new hash reference mapping each known ostype key to its
# human-readable name.
sub os_list_description {

    my %name_of = (
        other  => 'Other',
        wxp    => 'Windows XP',
        w2k    => 'Windows 2000',
        w2k3   => 'Windows 2003',
        w2k8   => 'Windows 2008',
        wvista => 'Windows Vista',
        win7   => 'Windows 7',
        win8   => 'Windows 8/2012',
        win10  => 'Windows 10/2016',
        l24    => 'Linux 2.4',
        l26    => 'Linux 2.6',
    );

    return { %name_of };
}
1211
1e3baf05
DM
# Cached path of the host CD-ROM device symlink.
my $cdrom_path;

# Return the first of /dev/cdrom, /dev/cdrom1, /dev/cdrom2 that exists as a
# symbolic link, caching the answer for later calls.
#
# Returns undef when none of the candidates is a symlink. (Previously the
# sub fell off its end in that case and returned whatever the last file test
# evaluated to, which was false as well.)
sub get_cdrom_path {

    return $cdrom_path if $cdrom_path;

    foreach my $candidate ('/dev/cdrom', '/dev/cdrom1', '/dev/cdrom2') {
        return $cdrom_path = $candidate if -l $candidate;
    }

    return undef;
}
1222
# Resolve the 'file' value of a CD-ROM drive to a path.
#
#   'cdrom'        -> host CD-ROM device as found by get_cdrom_path()
#   'none'         -> empty string (no medium)
#   absolute path  -> returned unchanged
#   anything else  -> treated as a volume ID and resolved via PVE::Storage::path
#
# $vmid is accepted but not used here.
sub get_iso_path {
    my ($storecfg, $vmid, $cdrom) = @_;

    return get_cdrom_path() if $cdrom eq 'cdrom';
    return '' if $cdrom eq 'none';
    return $cdrom if $cdrom =~ m|^/|;

    return PVE::Storage::path($storecfg, $cdrom);
}
1236
# try to convert old style file names to volume IDs
#
# 'none', 'cdrom', "/dev/..." paths and anything already of the form
# "storage:volume" are returned unchanged. Any other name that contains a
# slash yields undef. A plain file name becomes "local:iso/<name>" when
# $media is 'cdrom', and "local:<vmid>/<name>" otherwise.
sub filename_to_volume_id {
    my ($vmid, $file, $media) = @_;

    # nothing to convert
    return $file if $file eq 'none' || $file eq 'cdrom';
    return $file if $file =~ m|^/dev/.+| || $file =~ m/^([^:]+):(.+)$/;

    # a path outside /dev cannot be mapped
    return undef if $file =~ m|/|;

    my $is_cdrom = $media && $media eq 'cdrom';

    return $is_cdrom ? "local:iso/$file" : "local:$vmid/$file";
}
1255
# Check that the storage content type $vtype fits the drive's $media
# setting: 'disk' expects 'images', 'cdrom' expects 'iso'.
#
# Returns nothing when $media is unset or the types agree. Raises a
# parameter exception keyed on $opt on a mismatch, and dies with
# "internal error" for any other $media value.
sub verify_media_type {
    my ($opt, $vtype, $media) = @_;

    return if !$media;

    my %expected_type_for = (
        disk => 'images',
        cdrom => 'iso',
    );

    my $etype = $expected_type_for{$media};
    die "internal error" if !defined($etype);

    return if ($vtype eq $etype);

    raise_param_exc({ $opt => "unexpected media type ($vtype != $etype)" });
}
1274
# Normalize $drive->{file} and $drive->{media} in place.
#
# A file value that is not 'cdrom'/'none', not a /dev/ path, not already a
# "storage:volume" ID and not purely numeric is treated as a filesystem path
# and converted to a volume ID via PVE::Storage::path_to_volume_id. A
# parameter exception keyed on $opt is raised if no storage matches or the
# resulting content type contradicts the media setting. Finally, media
# defaults to 'cdrom' for ISO volumes and for the 'cdrom'/'none' keywords.
sub cleanup_drive_path {
    my ($opt, $storecfg, $drive) = @_;

    # try to convert filesystem paths to volume IDs

    my $is_plain_path =
        ($drive->{file} !~ m/^(cdrom|none)$/) &&
        ($drive->{file} !~ m|^/dev/.+|) &&
        ($drive->{file} !~ m/^([^:]+):(.+)$/) &&
        ($drive->{file} !~ m/^\d+$/);

    if ($is_plain_path) {
        my ($vtype, $volid) = PVE::Storage::path_to_volume_id($storecfg, $drive->{file});
        raise_param_exc({ $opt => "unable to associate path '$drive->{file}' to any storage"}) if !$vtype;
        if (!$drive->{media} && $vtype eq 'iso') {
            $drive->{media} = 'cdrom';
        }
        verify_media_type($opt, $vtype, $drive->{media});
        $drive->{file} = $volid;
    }

    if (!$drive->{media} && $drive->{file} =~ m/^(cdrom|none)$/) {
        $drive->{media} = 'cdrom';
    }
}
1293
b3c2bdd1
DM
# Parse the 'hotplug' option value into a hash of enabled features.
#
# '0' yields an empty hash; '1' is replaced by the schema default of the
# hotplug option before parsing. The value is split with
# PVE::Tools::split_list and every element must be one of network, disk,
# cpu, memory or usb; anything else makes the sub die.
sub parse_hotplug_features {
    my ($data) = @_;

    my $enabled = {};

    return $enabled if $data eq '0';

    if ($data eq '1') {
        $data = $confdesc->{hotplug}->{default};
    }

    foreach my $feature (PVE::Tools::split_list($data)) {
        die "invalid hotplug feature '$feature'\n"
            if $feature !~ m/^(network|disk|cpu|memory|usb)$/;
        $enabled->{$1} = 1;
    }

    return $enabled;
}
1312
PVE::JSONSchema::register_format('pve-hotplug-features', \&pve_verify_hotplug_features);

# Format verifier for the 'pve-hotplug-features' schema format.
#
# Returns $value when parse_hotplug_features() accepts it. On failure it
# returns undef if $noerr is set, and otherwise re-throws the parser's error
# message.
#
# parse_hotplug_features() dies on invalid input, so it has to be called
# inside an eval: without it the $noerr flag was never honored.
sub pve_verify_hotplug_features {
    my ($value, $noerr) = @_;

    my $features = eval { parse_hotplug_features($value) };
    my $err = $@;

    return $value if $features;

    return undef if $noerr;

    die($err || "unable to parse hotplug option\n");
}
1323
1e3baf05
DM
# ideX = [volume=]volume-id[,media=d][,cyls=c,heads=h,secs=s[,trans=t]]
#        [,snapshot=on|off][,cache=on|off][,format=f][,backup=yes|no]
#        [,rerror=ignore|report|stop][,werror=enospc|ignore|report|stop]
#        [,aio=native|threads][,discard=ignore|on][,detect_zeroes=on|off]
#        [,iothread=on][,serial=serial][,model=model]

# Parse the property string $data of the drive option $key (e.g. "scsi0").
#
# Returns a hash reference with the parsed options plus 'interface' (the
# non-numeric key prefix) and 'index' (the numeric suffix), or undef when
# the key or the value is invalid. Problems are reported with warn, the
# sub itself does not die.
#
# Legacy bps/bps_rd/bps_wr values (bytes per second) are converted to the
# corresponding mbps* entries. A parsable 'size' is normalized through
# PVE::JSONSchema::parse_size.
sub parse_drive {
    my ($key, $data) = @_;

    my ($interface, $index);

    if ($key =~ m/^([^\d]+)(\d+)$/) {
        $interface = $1;
        $index = $2;
    } else {
        return undef;
    }

    # Look the option up without "->{format}" chained onto a possibly
    # missing entry, so unknown keys are not autovivified into $confdesc.
    my $desc;
    if ($key =~ /^unused\d+$/) {
        $desc = $alldrive_fmt;
    } elsif (my $option = $confdesc->{$key}) {
        $desc = $option->{format};
    }
    if (!$desc) {
        warn "invalid drive key: $key\n";
        return undef;
    }
    my $res = eval { PVE::JSONSchema::parse_property_string($desc, $data) };
    return undef if !$res;
    $res->{interface} = $interface;
    $res->{index} = $index;

    my $error = 0;
    foreach my $opt (qw(bps bps_rd bps_wr)) {
        # keep the deleted value itself (not the result of defined()), it
        # is the number that gets converted below
        my $bps = delete $res->{$opt};
        next if !defined($bps);

        if (defined($res->{"m$opt"})) {
            warn "both $opt and m$opt specified\n";
            ++$error;
            next;
        }
        $res->{"m$opt"} = sprintf("%.3f", $bps / (1024*1024.0));
    }

    # can't use the schema's 'requires' because of the mbps* => bps* "transforming aliases"
    # NOTE(review): no 'miops*' options are defined in the part of the file
    # visible here; confirm whether those three rules were meant to be
    # iops*_max => iops*.
    for my $requirement (
        [mbps_max => 'mbps'],
        [mbps_rd_max => 'mbps_rd'],
        [mbps_wr_max => 'mbps_wr'],
        [miops_max => 'miops'],
        [miops_rd_max => 'miops_rd'],
        [miops_wr_max => 'miops_wr'],
        [bps_max_length => 'mbps_max'],
        [bps_rd_max_length => 'mbps_rd_max'],
        [bps_wr_max_length => 'mbps_wr_max'],
        [iops_max_length => 'iops_max'],
        [iops_rd_max_length => 'iops_rd_max'],
        [iops_wr_max_length => 'iops_wr_max']) {
        my ($option, $requires) = @$requirement;
        if ($res->{$option} && !$res->{$requires}) {
            warn "$option requires $requires\n";
            ++$error;
        }
    }

    return undef if $error;

    # a total limit excludes separate read/write limits
    return undef if $res->{mbps_rd} && $res->{mbps};
    return undef if $res->{mbps_wr} && $res->{mbps};
    return undef if $res->{iops_rd} && $res->{iops};
    return undef if $res->{iops_wr} && $res->{iops};

    # options that are rejected for CD-ROM drives
    if ($res->{media} && ($res->{media} eq 'cdrom')) {
        return undef if $res->{snapshot} || $res->{trans} || $res->{format};
        return undef if $res->{heads} || $res->{secs} || $res->{cyls};
        return undef if $res->{interface} eq 'virtio';
    }

    if (my $size = $res->{size}) {
        return undef if !defined($res->{size} = PVE::JSONSchema::parse_size($size));
    }

    return $res;
}
1405
1e3baf05
DM
# Serialize a parsed drive hash back into a property string using
# $alldrive_fmt. The bookkeeping keys 'index' and 'interface' are left out;
# the caller's hash is not modified. $vmid is accepted but not used.
sub print_drive {
    my ($vmid, $drive) = @_;

    my %printable = %$drive;
    delete @printable{qw(index interface)};

    return PVE::JSONSchema::print_property_string(\%printable, $alldrive_fmt);
}
1412
28ef82d3
DM
# Send a SCSI INQUIRY to the device behind file handle $fh using the SG_IO
# ioctl and return the decoded answer.
#
# Returns a hash reference with the keys vendor, product, revision,
# removable (0/1, taken from bit 7 of byte 1) and type (low 5 bits of
# byte 0). On any failure the sub dies, unless $noerr is true, in which
# case it returns undef.
sub scsi_inquiry {
    my($fh, $noerr) = @_;

    my $SG_IO = 0x2285;
    my $SG_GET_VERSION_NUM = 0x2282;

    my $versionbuf = "\x00" x 8;
    my $ret = ioctl($fh, $SG_GET_VERSION_NUM, $versionbuf);
    if (!$ret) {
        die "scsi ioctl SG_GET_VERSION_NUM failed - $!\n" if !$noerr;
        return undef;
    }
    my $version = unpack("I", $versionbuf);
    if ($version < 30000) {
        die "scsi generic interface too old\n" if !$noerr;
        return undef;
    }

    # 36 byte data buffer, 8 byte sense buffer and a 6 byte command whose
    # first byte is 0x12 and whose fifth byte is the buffer length
    my $buf = "\x00" x 36;
    my $sensebuf = "\x00" x 8;
    my $cmd = pack("C x3 C x1", 0x12, 36);

    # see /usr/include/scsi/sg.h
    my $sg_io_hdr_t = "i i C C s I P P P I I i P C C C C S S i I I";

    # the "P" entries pack pointers to $buf, $cmd and $sensebuf, so those
    # variables must stay untouched until the ioctl has returned
    my $packet = pack($sg_io_hdr_t, ord('S'), -3, length($cmd),
                      length($sensebuf), 0, length($buf), $buf,
                      $cmd, $sensebuf, 6000);

    $ret = ioctl($fh, $SG_IO, $packet);
    if (!$ret) {
        die "scsi ioctl SG_IO failed - $!\n" if !$noerr;
        return undef;
    }

    # fields 17 and 18 of the header are the two "S" (unsigned short)
    # entries; presumably host_status and driver_status - confirm in sg.h
    my @res = unpack($sg_io_hdr_t, $packet);
    if ($res[17] || $res[18]) {
        die "scsi ioctl SG_IO status error - $!\n" if !$noerr;
        return undef;
    }

    my $res = {};
    (my $byte0, my $byte1, $res->{vendor},
     $res->{product}, $res->{revision}) = unpack("C C x6 A8 A16 A4", $buf);

    $res->{removable} = $byte1 & 128 ? 1 : 0;
    $res->{type} = $byte0 & 31;

    return $res;
}
1463
# Open $path read/write and run scsi_inquiry() on it in no-error mode.
# Returns the inquiry result, or undef when the path cannot be opened or
# the inquiry fails.
sub path_is_scsi {
    my ($path) = @_;

    my $fh = IO::File->new("+<$path");
    return undef if !$fh;

    my $info = scsi_inquiry($fh, 1);
    close($fh);

    return $info;
}
1473
db656e5f
DM
# Return 1 if the VM's 'machine' setting contains "q35", otherwise 0.
sub machine_type_is_q35 {
    my ($conf) = @_;

    my $machine = $conf->{machine};
    return 0 if !$machine;

    return ($machine =~ m/q35/) ? 1 : 0;
}
1479
# Build the device string for the USB tablet. The tablet is attached to
# the "ehci" bus on q35 machines and to "uhci" otherwise.
sub print_tabletdevice_full {
    my ($conf) = @_;

    # we use uhci for old VMs because tablet driver was buggy in older qemu
    my $usbbus = "uhci";
    $usbbus = "ehci" if machine_type_is_q35($conf);

    return "usb-tablet,id=tablet,bus=$usbbus.0,port=1";
}
1490
# Build the device string (the guest-visible side) for a parsed drive.
#
# Supported interfaces are virtio, scsi, ide and sata; 'usb' and any other
# interface make the sub die. ",bootindex=N" is appended when the drive
# carries a true 'bootindex'. $vmid is accepted but not used.
sub print_drivedevice_full {
    my ($storecfg, $conf, $vmid, $drive, $bridges) = @_;

    my $interface = $drive->{interface};
    my $index = $drive->{index};
    my $drive_id = "$interface$index";

    my $device = '';

    if ($interface eq 'virtio') {
        my $pciaddr = print_pci_addr($drive_id, $bridges);
        $device = "virtio-blk-pci,drive=drive-$drive_id,id=$drive_id$pciaddr";
        $device .= ",iothread=iothread-$drive_id" if $drive->{iothread};
    } elsif ($interface eq 'scsi') {

        my ($maxdev, $controller, $controller_prefix) = scsihw_infos($conf, $drive);
        my $unit = $index % $maxdev;

        # pick scsi-hd / scsi-cd / scsi-block / scsi-generic
        my $devicetype = 'hd';
        if (drive_is_cdrom($drive)) {
            $devicetype = 'cd';
        } else {
            my $path = '';
            if ($drive->{file} =~ m|^/|) {
                $path = $drive->{file};
                my $info = path_is_scsi($path);
                if ($info) {
                    if ($info->{type} == 0 && $drive->{scsiblock}) {
                        $devicetype = 'block';
                    } elsif ($info->{type} == 1) { # tape
                        $devicetype = 'generic';
                    }
                }
            } else {
                $path = PVE::Storage::path($storecfg, $drive->{file});
            }

            $devicetype = 'generic' if $path =~ m/^iscsi\:\/\//;
        }

        my $bus = "$controller_prefix$controller.0";
        if (!$conf->{scsihw} || ($conf->{scsihw} =~ m/^lsi/)) {
            $device = "scsi-$devicetype,bus=$bus,scsi-id=$unit,drive=drive-$drive_id,id=$drive_id";
        } else {
            $device = "scsi-$devicetype,bus=$bus,channel=0,scsi-id=0,lun=$index,drive=drive-$drive_id,id=$drive_id";
        }

    } elsif ($interface eq 'ide') {
        # two units per IDE controller
        my $maxdev = 2;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;

        my $devicetype = "hd";
        $devicetype = "cd" if $drive->{media} && $drive->{media} eq 'cdrom';

        $device = "ide-$devicetype,bus=ide.$controller,unit=$unit,drive=drive-$drive_id,id=$drive_id";

        # the model string is stored URI-escaped and only applies to disks
        if ($devicetype eq 'hd' && (my $model = $drive->{model})) {
            $model = URI::Escape::uri_unescape($model);
            $device .= ",model=$model";
        }
    } elsif ($interface eq 'sata') {
        my $controller = int($index / $MAX_SATA_DISKS);
        my $unit = $index % $MAX_SATA_DISKS;
        $device = "ide-drive,bus=ahci$controller.$unit,drive=drive-$drive_id,id=$drive_id";
    } elsif ($interface eq 'usb') {
        die "implement me";
        # -device ide-drive,bus=ide.1,unit=0,drive=drive-ide0-1-0,id=ide0-1-0
    } else {
        die "unsupported interface type";
    }

    $device .= ",bootindex=$drive->{bootindex}" if $drive->{bootindex};

    return $device;
}
1560
# Read the iSCSI initiator name from /etc/iscsi/initiatorname.iscsi.
#
# Returns the value of the first "InitiatorName = ..." line, or undef when
# the file cannot be opened or contains no such line.
sub get_initiator_name {
    my $fh = IO::File->new('/etc/iscsi/initiatorname.iscsi') || return undef;

    my $initiator;
    while (defined(my $line = <$fh>)) {
        if ($line =~ m/^\s*InitiatorName\s*=\s*([\.\-:\w]+)/) {
            $initiator = $1;
            last;
        }
    }
    $fh->close();

    return $initiator;
}
1574
1e3baf05
DM
# Build the drive string (the host/backend side) for a parsed drive.
#
# The result has the form "file=PATH,if=none,id=drive-<interface><index>"
# followed by the drive options; the "file=" part is omitted when no path
# could be determined. Defaults added here when the drive does not set them:
# image format, cache=none for non-CD-ROM drives, aio (native with direct
# cache modes, threads otherwise) and detect-zeroes for non-CD-ROM drives.
sub print_drive_full {
    my ($storecfg, $vmid, $drive) = @_;

    my $path;
    my $volid = $drive->{file};
    my $format;

    if (drive_is_cdrom($drive)) {
        $path = get_iso_path($storecfg, $vmid, $volid);
    } else {
        my ($storeid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        if ($storeid) {
            $path = PVE::Storage::path($storecfg, $volid);
            my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
            $format = qemu_img_format($scfg, $volname);
        } else {
            # not a volume ID: use the value as path and assume a raw image
            $path = $volid;
            $format = "raw";
        }
    }

    my $opts = '';
    my @qemu_drive_options = qw(heads secs cyls trans media format cache snapshot rerror werror aio discard);
    foreach my $o (@qemu_drive_options) {
        $opts .= ",$o=$drive->{$o}" if $drive->{$o};
    }

    # Throttling: every option is written as "throttling.<name>=<value>".
    # The burst variants previously came out as "...=-max<value>" and
    # "...=-max-length<value>", i.e. with the '=' in the wrong place.
    foreach my $type (['', '-total'], [_rd => '-read'], [_wr => '-write']) {
        my ($dir, $qmpname) = @$type;
        if (my $v = $drive->{"mbps$dir"}) {
            $opts .= ",throttling.bps$qmpname=".int($v*1024*1024);
        }
        if (my $v = $drive->{"mbps${dir}_max"}) {
            $opts .= ",throttling.bps$qmpname-max=".int($v*1024*1024);
        }
        if (my $v = $drive->{"bps${dir}_max_length"}) {
            $opts .= ",throttling.bps$qmpname-max-length=$v";
        }
        if (my $v = $drive->{"iops${dir}"}) {
            $opts .= ",throttling.iops$qmpname=$v";
        }
        if (my $v = $drive->{"iops${dir}_max"}) {
            $opts .= ",throttling.iops$qmpname-max=$v";
        }
        if (my $v = $drive->{"iops${dir}_max_length"}) {
            $opts .= ",throttling.iops$qmpname-max-length=$v";
        }
    }

    # the serial is stored URI-escaped in the configuration
    if (my $serial = $drive->{serial}) {
        $serial = URI::Escape::uri_unescape($serial);
        $opts .= ",serial=$serial";
    }

    $opts .= ",format=$format" if $format && !$drive->{format};

    my $cache_direct = 0;

    if (my $cache = $drive->{cache}) {
        $cache_direct = $cache =~ /^(?:off|none|directsync)$/;
    } elsif (!drive_is_cdrom($drive)) {
        $opts .= ",cache=none";
        $cache_direct = 1;
    }

    # aio native works only with O_DIRECT
    if (!$drive->{aio}) {
        if($cache_direct) {
            $opts .= ",aio=native";
        } else {
            $opts .= ",aio=threads";
        }
    }

    if (!drive_is_cdrom($drive)) {
        my $detectzeroes;
        if (defined($drive->{detect_zeroes}) && !$drive->{detect_zeroes}) {
            $detectzeroes = 'off';
        } elsif ($drive->{discard}) {
            $detectzeroes = $drive->{discard} eq 'on' ? 'unmap' : 'on';
        } else {
            # This used to be our default with discard not being specified:
            $detectzeroes = 'on';
        }
        $opts .= ",detect-zeroes=$detectzeroes" if $detectzeroes;
    }

    my $pathinfo = $path ? "file=$path," : '';

    return "${pathinfo}if=none,id=drive-$drive->{interface}$drive->{index}$opts";
}
1665
# Build the device string (the guest-visible NIC) for a parsed net entry.
#
# The model 'virtio' is mapped to the device 'virtio-net-pci'; every other
# model name is used as the device name unchanged. With more than one queue
# on a virtio NIC, multiqueue and the matching vector count are added. When
# $use_old_bios_files is set, the PXE ROM file belonging to the device is
# added as well. $vmid and $conf are accepted but not used here.
#
# The previous version also computed a local boot order value from $conf
# that was never read; that dead assignment has been dropped.
sub print_netdevice_full {
    my ($vmid, $conf, $net, $netid, $bridges, $use_old_bios_files) = @_;

    my $device = $net->{model};
    if ($net->{model} eq 'virtio') {
        $device = 'virtio-net-pci';
    }

    my $pciaddr = print_pci_addr("$netid", $bridges);
    my $tmpstr = "$device,mac=$net->{macaddr},netdev=$netid$pciaddr,id=$netid";
    if ($net->{queues} && $net->{queues} > 1 && $net->{model} eq 'virtio') {
        #Consider we have N queues, the number of vectors needed is 2*N + 2 (plus one config interrupt and control vq)
        my $vectors = $net->{queues} * 2 + 2;
        $tmpstr .= ",vectors=$vectors,mq=on";
    }
    $tmpstr .= ",bootindex=$net->{bootindex}" if $net->{bootindex};

    if ($use_old_bios_files) {
        my %pxe_rom_for = (
            'virtio-net-pci' => 'pxe-virtio.rom',
            'e1000' => 'pxe-e1000.rom',
            'ne2k' => 'pxe-ne2k_pci.rom',
            'pcnet' => 'pxe-pcnet.rom',
            'rtl8139' => 'pxe-rtl8139.rom',
        );
        my $romfile = $pxe_rom_for{$device};
        $tmpstr .= ",romfile=$romfile" if $romfile;
    }

    return $tmpstr;
}
1703
# Build the netdev string (the host/backend side) for a parsed net entry.
#
# $netid must have the form "net<N>" with N below $MAX_NETS, otherwise the
# sub dies. A bridged NIC becomes a tap device named "tap<vmid>i<N>" that
# uses the pve-bridge (or, with $hotplug, pve-bridge-hotplug) script; a NIC
# without bridge uses user-mode networking with the VM name as hostname.
sub print_netdev_full {
    my ($vmid, $conf, $net, $netid, $hotplug) = @_;

    # An id that does not match used to leave $i as '' which compares as 0
    # and slipped through the range check; treat it as invalid instead.
    my $i = '';
    my $id_ok = 0;
    if ($netid =~ m/^net(\d+)$/) {
        $i = int($1);
        $id_ok = 1;
    }

    die "got strange net id '$i'\n" if !$id_ok || $i >= ${MAX_NETS};

    my $ifname = "tap${vmid}i$i";

    # kvm uses TUNSETIFF ioctl, and that limits ifname length
    die "interface name '$ifname' is too long (max 15 character)\n"
        if length($ifname) >= 16;

    my $vhostparam = '';
    $vhostparam = ',vhost=on' if $kernel_has_vhost_net && $net->{model} eq 'virtio';

    my $vmname = $conf->{name} || "vm$vmid";

    my $netdev = "";
    my $script = $hotplug ? "pve-bridge-hotplug" : "pve-bridge";

    if ($net->{bridge}) {
        $netdev = "type=tap,id=$netid,ifname=${ifname},script=/var/lib/qemu-server/$script,downscript=/var/lib/qemu-server/pve-bridgedown$vhostparam";
    } else {
        $netdev = "type=user,id=$netid,hostname=$vmname";
    }

    $netdev .= ",queues=$net->{queues}" if ($net->{queues} && $net->{model} eq 'virtio');

    return $netdev;
}
1e3baf05 1738
0efb537e
AD
1739
# Build the device string for the hot-pluggable CPU number $id (1-based).
#
# The CPU model is the 'cputype' of the configured 'cpu' property string,
# or else "qemu64" when kvm is explicitly disabled and "kvm64" otherwise.
# Socket and core ids are derived from $id and the configured core count
# (default 1); the thread id is always 0. Dies if the cpu property string
# cannot be parsed.
sub print_cpu_device {
    my ($conf, $id) = @_;

    my $kvm_disabled = defined($conf->{kvm}) && $conf->{kvm} == 0 ? 1 : 0;

    my $model = "kvm64";
    $model = "qemu64" if $kvm_disabled;

    if (my $cputype = $conf->{cpu}) {
        my $cpuconf = PVE::JSONSchema::parse_property_string($cpu_fmt, $cputype)
            or die "Cannot parse cpu description: $cputype\n";
        $model = $cpuconf->{cputype};
    }

    my $cores = $conf->{cores} || 1;

    my $zero_based_id = $id - 1;
    my $core_id = $zero_based_id % $cores;
    my $socket_id = int(($zero_based_id - $core_id)/$cores);

    return "$model-x86_64-cpu,id=cpu$id,socket-id=$socket_id,core-id=$core_id,thread-id=0";
}
1758
1e3baf05
DM
# Return a true value if $drive is set and its media is 'cdrom'; otherwise
# the false value that ended the check is returned.
sub drive_is_cdrom {
    my ($drive) = @_;

    return $drive if !$drive;

    my $media = $drive->{media};
    return $media if !$media;

    return ($media eq 'cdrom');
}
1765
ffc0d8c7
WB
# Parse a ';'-separated list of numbers and ranges ("0-3;5") into an array
# reference of [start, end] pairs; 'end' is undef for a single number.
# Dies on malformed parts and on ranges whose end is below their start.
sub parse_number_sets {
    my ($set) = @_;

    my @ranges;
    foreach my $part (split(/;/, $set)) {
        die "invalid range: $part\n"
            if $part !~ /^\s*(\d+)(?:-(\d+))?\s*$/;

        my ($first, $last) = ($1, $2);
        die "invalid range: $part ($last < $first)\n"
            if defined($last) && $last < $first;

        push @ranges, [ $first, $last ];
    }

    return \@ranges;
}
2ed5d572 1779
ffc0d8c7
WB
# Parse a numaN property string. The 'cpus' and 'hostnodes' values, when
# present, are replaced by the range lists from parse_number_sets().
sub parse_numa {
    my ($data) = @_;

    my $res = PVE::JSONSchema::parse_property_string($numa_fmt, $data);

    foreach my $list_key (qw(cpus hostnodes)) {
        next if !defined($res->{$list_key});
        $res->{$list_key} = parse_number_sets($res->{$list_key});
    }

    return $res;
}
1788
040b06b7
DA
# Parse a hostpciN property string.
#
# Returns undef for an empty value. Otherwise the 'host' entry is removed
# from the parsed result and replaced by 'pciid': ids given with a function
# number are appended as { id, function } hashes, ids without one are
# looked up through lspci().
sub parse_hostpci {
    my ($value) = @_;

    return undef if !$value;

    my $res = PVE::JSONSchema::parse_property_string($hostpci_fmt, $value);

    my @idlist = split(/;/, delete $res->{host});

    foreach my $id (@idlist) {
        # should have been caught by parse_property_string already
        die "failed to parse PCI id: $id\n" if $id !~ /^$PCIRE$/;

        my ($device, $function) = ($1, $2);
        if (defined($function)) {
            push @{$res->{pciid}}, { id => $device, function => $function };
        } else {
            # NOTE(review): this assignment replaces anything collected in
            # 'pciid' so far - confirm that mixing both id forms in one
            # list is not expected to work.
            my $pcidevices = lspci($device);
            $res->{pciid} = $pcidevices->{$device};
        }
    }

    return $res;
}
1813
1e3baf05
DM
# netX: e1000=XX:XX:XX:XX:XX:XX,bridge=vmbr0,rate=<mbps>
#
# Parse a netN property string. On a parse error the message is emitted as
# a warning and undef is returned. If no MAC address was given, a random
# one is generated using the mac_prefix from datacenter.cfg.
sub parse_net {
    my ($data) = @_;

    my $net = eval { PVE::JSONSchema::parse_property_string($net_fmt, $data) };
    if (my $err = $@) {
        warn $err;
        return undef;
    }

    if (!defined($net->{macaddr})) {
        my $dc = PVE::Cluster::cfs_read_file('datacenter.cfg');
        $net->{macaddr} = PVE::Tools::random_ether_addr($dc->{mac_prefix});
    }

    return $net;
}
1829
# Serialize a parsed net hash back into its property string ($net_fmt).
sub print_net {
    my ($net) = @_;

    return PVE::JSONSchema::print_property_string($net, $net_fmt);
}
1835
# Rewrite every parsable netN entry of $settings in place by parsing it and
# printing it again; parse_net() fills in a MAC address where none was set.
# Entries that fail to parse are left untouched.
sub add_random_macs {
    my ($settings) = @_;

    foreach my $opt (keys %$settings) {
        if ($opt =~ m/^net(\d+)$/) {
            my $net = parse_net($settings->{$opt});
            $settings->{$opt} = print_net($net) if $net;
        }
    }
}
1846
055d554d
DM
# Return 1 if the storage layer reports $vmid as owner of volume $volid,
# undef otherwise. Absolute paths are never owned; errors from
# PVE::Storage::path are swallowed and count as "not owned".
sub vm_is_volid_owner {
    my ($storecfg, $vmid, $volid) = @_;

    return undef if $volid =~ m|^/|;

    my ($path, $owner);
    eval { ($path, $owner) = PVE::Storage::path($storecfg, $volid); };

    return 1 if $owner && ($owner == $vmid);

    return undef;
}
1860
3dc38fbb
WB
# Split a list separated by commas, semicolons or whitespace into a hash
# reference mapping each item to its flag: '!' when the item was written
# with a leading '!', the empty string otherwise. An undefined or empty
# argument yields an empty hash.
sub split_flagged_list {
    my ($text) = @_;
    $text ||= '';

    $text =~ s/[,;]/ /g;
    $text =~ s/^\s+//;

    my %flag_of;
    foreach my $item ($text =~ /\S+/g) {
        if ($item =~ /^(!?)(.*)$/) {
            $flag_of{$2} = $1;
        }
    }

    return \%flag_of;
}
1867
# Inverse of split_flagged_list(): prefix every key of $lst with its flag
# and join the results with $how. The order follows the hash iteration
# order.
sub join_flagged_list {
    my ($how, $lst) = @_;

    my @items;
    foreach my $name (keys %$lst) {
        push @items, $lst->{$name} . $name;
    }

    return join($how, @items);
}
1872
# Mark option $key for deletion in the pending section of $conf: a pending
# value for the key is dropped and the key is added to the pending 'delete'
# list, flagged with '!' when $force is set.
sub vmconfig_delete_pending_option {
    my ($conf, $key, $force) = @_;

    delete $conf->{pending}->{$key};

    my $to_delete = split_flagged_list($conf->{pending}->{delete});
    $to_delete->{$key} = $force ? '!' : '';

    $conf->{pending}->{delete} = join_flagged_list(',', $to_delete);
}
1881
# Remove $key from the pending 'delete' list of $conf. The 'delete' entry
# itself is removed when the list becomes empty.
sub vmconfig_undelete_pending_option {
    my ($conf, $key) = @_;

    my $marked = split_flagged_list($conf->{pending}->{delete});
    delete $marked->{$key};

    if (!%$marked) {
        delete $conf->{pending}->{delete};
    } else {
        $conf->{pending}->{delete} = join_flagged_list(',', $marked);
    }
}
1894
# Record the volume of $drive as unused in $conf, but only when the drive is
# not a cdrom and the volume is owned by this VM.
sub vmconfig_register_unused_drive {
    my ($storecfg, $vmid, $conf, $drive) = @_;

    if (!drive_is_cdrom($drive) && vm_is_volid_owner($storecfg, $vmid, $drive->{file})) {
        PVE::QemuConfig->add_unused_volume($conf, $drive->{file}, $vmid);
    }
}
1905
c750e90a
DM
# Remove pending entries that would not change anything:
#  - pending values equal to the current value of the same option
#  - pending deletions of options that are not set in the current config
# Returns 1 if anything was removed, undef otherwise.
sub vmconfig_cleanup_pending {
    my ($conf) = @_;

    my $changes;

    # remove pending changes when nothing changed
    foreach my $opt (keys %{$conf->{pending}}) {
        next if !defined($conf->{$opt});
        next if $conf->{pending}->{$opt} ne $conf->{$opt};

        $changes = 1;
        delete $conf->{pending}->{$opt};
    }

    my $requested = split_flagged_list($conf->{pending}->{delete});
    my $still_needed = {};
    foreach my $opt (keys %$requested) {
        if (defined($conf->{$opt})) {
            $still_needed->{$opt} = $requested->{$opt};
        } else {
            $changes = 1;
        }
    }

    if (!%$still_needed) {
        delete $conf->{pending}->{delete};
    } else {
        $conf->{pending}->{delete} = join_flagged_list(',', $still_needed);
    }

    return $changes;
}
1936
# smbios: [manufacturer=str][,product=str][,version=str][,serial=str][,uuid=uuid][,sku=str][,family=str]
#
# Property string schema for the smbios1 option. All fields are optional.
my $smbios1_fmt = do {
    # every field except 'uuid' uses the same schema, only the description
    # text differs
    my $text_field = sub {
        my ($what) = @_;
        return {
            type => 'string',
            pattern => '\S+',
            format_description => 'string',
            description => "Set SMBIOS1 $what.",
            optional => 1,
        };
    };

    +{
        uuid => {
            type => 'string',
            pattern => '[a-fA-F0-9]{8}(?:-[a-fA-F0-9]{4}){3}-[a-fA-F0-9]{12}',
            format_description => 'UUID',
            description => "Set SMBIOS1 UUID.",
            optional => 1,
        },
        version => $text_field->('version'),
        serial => $text_field->('serial number'),
        manufacturer => $text_field->('manufacturer'),
        product => $text_field->('product ID'),
        sku => $text_field->('SKU string'),
        family => $text_field->('family string'),
    };
};
1989
2796e7d5
DM
# Parse an smbios1 property string using $smbios1_fmt. Parser errors are
# emitted as warnings; in that case the returned value is undef.
sub parse_smbios1 {
    my ($data) = @_;

    my $parsed = eval { PVE::JSONSchema::parse_property_string($smbios1_fmt, $data) };
    if (my $err = $@) {
        warn $err;
    }

    return $parsed;
}
1997
cd11416f
DM
# Serialize a parsed smbios1 hash into its property string form.
sub print_smbios1 {
    my $smbios1 = shift;

    return PVE::JSONSchema::print_property_string($smbios1, $smbios1_fmt);
}

# make the smbios1 schema available under a format name
PVE::JSONSchema::register_format('pve-qm-smbios1', $smbios1_fmt);
2796e7d5 2004
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-bootdisk', \&verify_bootdisk);
# Format verifier for 'pve-qm-bootdisk': returns $value when it is a valid
# drive name. Otherwise returns undef if $noerr is set, and dies if not.
sub verify_bootdisk {
    my ($value, $noerr) = @_;

    if (!is_valid_drivename($value)) {
        return undef if $noerr;
        die "invalid boot disk '$value'\n";
    }

    return $value;
}
2015
0ea9541d
DM
# Parse a watchdog property string using $watchdog_fmt. Returns undef for an
# empty/false value. Parser errors are emitted as warnings, and the returned
# value is undef in that case.
sub parse_watchdog {
    my ($value) = @_;

    return undef if !$value;

    my $parsed = eval { PVE::JSONSchema::parse_property_string($watchdog_fmt, $value) };
    if (my $err = $@) {
        warn $err;
    }

    return $parsed;
}
2025
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-usb-device', \&verify_usb_device);
# Format verifier for 'pve-qm-usb-device': returns $value when
# parse_usb_device accepts it. Otherwise returns undef if $noerr is set,
# and dies if not.
sub verify_usb_device {
    my ($value, $noerr) = @_;

    if (!parse_usb_device($value)) {
        return undef if $noerr;
        die "unable to parse usb device\n";
    }

    return $value;
}
2036
1e3baf05
DM
# add JSON properties for create and set function
#
# Copies every option description from $confdesc into $prop, except the
# 'parent', 'snaptime' and 'vmstate' entries, and returns $prop.
sub json_config_properties {
    my $prop = shift;

    my %skipped = map { $_ => 1 } qw(parent snaptime vmstate);

    foreach my $opt (keys %$confdesc) {
        next if $skipped{$opt};
        $prop->{$opt} = $confdesc->{$opt};
    }

    return $prop;
}
2048
# Validate $value against the type declared for option $key in $confdesc and
# return the normalized value:
#   boolean - 1 for '1'/on/yes/true, 0 for '0'/off/no/false (case-insensitive)
#   integer - unsigned decimal digits, returned via int()
#   number  - unsigned decimal with optional fraction, returned unchanged
#   string  - checked with PVE::JSONSchema::check_format when a format is
#             declared; otherwise one pair of surrounding double quotes is
#             stripped
# Dies for unknown keys, undefined values, values containing CR/LF and
# values that do not match the declared type.
sub check_type {
    my ($key, $value) = @_;

    my $desc = $confdesc->{$key};
    die "unknown setting '$key'\n" if !$desc;

    my $type = $desc->{type};

    die "got undefined value\n" if !defined($value);
    die "property contains a line feed\n" if $value =~ m/[\n\r]/;

    if ($type eq 'boolean') {
        return 1 if ($value eq '1') || ($value =~ m/^(on|yes|true)$/i);
        return 0 if ($value eq '0') || ($value =~ m/^(off|no|false)$/i);
        die "type check ('boolean') failed - got '$value'\n";
    }

    if ($type eq 'integer') {
        return int($1) if $value =~ m/^(\d+)$/;
        die "type check ('integer') failed - got '$value'\n";
    }

    if ($type eq 'number') {
        return $value if $value =~ m/^(\d+)(\.\d+)?$/;
        die "type check ('number') failed - got '$value'\n";
    }

    if ($type eq 'string') {
        my $fmt = $desc->{format};
        if ($fmt) {
            PVE::JSONSchema::check_format($fmt, $value);
        } else {
            $value =~ s/^\"(.*)\"$/$1/;
        }
        return $value;
    }

    die "internal error"
}
2085
040b06b7
DA
# Report whether IOMMU support is available. Currently a stub that always
# returns 1.
sub check_iommu_support {
    #fixme : need to check IOMMU support
    #http://www.linux-kvm.org/page/How_to_assign_devices_with_VT-d_in_KVM

    return 1;
}
2094
1e3baf05
DM
# Set access and modification time of the VM's config file to the current
# time.
sub touch_config {
    my ($vmid) = @_;

    my $conffile = PVE::QemuConfig->config_file($vmid);
    utime(undef, undef, $conffile);
}
2101
# Destroy VM $vmid: free all disks owned by the VM, then remove its config
# file (or replace it with a minimal one when $keep_empty_config is set),
# and finally free every remaining volume the storage layer lists for this
# VM. The config lock is checked unless $skiplock is set. Failures to free
# individual volumes are reported as warnings only.
sub destroy_vm {
    my ($storecfg, $vmid, $keep_empty_config, $skiplock) = @_;

    my $conffile = PVE::QemuConfig->config_file($vmid);
    my $conf = PVE::QemuConfig->load_config($vmid);

    PVE::QemuConfig->check_lock($conf) if !$skiplock;

    # only remove disks owned by this VM
    my $free_owned_disk = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};
        return if !$volid || $volid =~ m|^/|;

        my ($path, $owner) = PVE::Storage::path($storecfg, $volid);
        return if !$path || !$owner || ($owner != $vmid);

        eval { PVE::Storage::vdisk_free($storecfg, $volid); };
        warn "Could not remove disk '$volid', check manually: $@" if $@;
    };
    foreach_drive($conf, $free_owned_disk);

    if (!$keep_empty_config) {
        unlink $conffile;
    } else {
        PVE::Tools::file_set_contents($conffile, "memory: 128\n");
    }

    # also remove unused disk
    eval {
        my $dl = PVE::Storage::vdisk_list($storecfg, undef, $vmid);

        eval {
            PVE::Storage::foreach_volid($dl, sub {
                my ($volid, $sid, $volname, $d) = @_;
                PVE::Storage::vdisk_free($storecfg, $volid);
            });
        };
        warn $@ if $@;
    };
    warn $@ if $@;
}
2152
1e3baf05
DM
# Parse the raw text of a VM configuration file.
#
# $filename must end in '/qemu-server/<vmid>.conf' (dies otherwise); the VMID
# is only used for warnings and for resolving drive file names.
# Returns undef when $raw is undefined, otherwise a hash reference holding
# the options of the main section plus:
#   digest    - SHA1 hex digest of $raw
#   pending   - options of the [PENDING] section
#   snapshots - one hash per remaining [name] section
# Lines starting with '#' and 'description:' lines are collected into the
# 'description' of the section they appear in. Values that fail validation
# are skipped with a warning.
sub parse_vm_config {
    my ($filename, $raw) = @_;

    return undef if !defined($raw);

    my $res = {
        digest => Digest::SHA::sha1_hex($raw),
        snapshots => {},
        pending => {},
    };

    $filename =~ m|/qemu-server/(\d+)\.conf$|
        || die "got strange filename '$filename'";

    my $vmid = $1;

    my $conf = $res;
    my $descr;
    my $section = '';

    # store the description collected so far in the current section and
    # start over; must be called before $conf is switched to a new section
    my $finish_description = sub {
        if (defined($descr)) {
            $descr =~ s/\s+$//;
            $conf->{description} = $descr;
        }
        $descr = undef;
    };

    foreach my $line (split(/\n/, $raw)) {
        next if $line =~ m/^\s*$/;

        if ($line =~ m/^\[PENDING\]\s*$/i) {
            $finish_description->();
            $section = 'pending';
            $conf = $res->{$section} = {};
            next;
        } elsif ($line =~ m/^\[([a-z][a-z0-9_\-]+)\]\s*$/i) {
            my $snapname = $1; # save before the helper runs its own regex
            $finish_description->();
            $section = $snapname;
            $conf = $res->{snapshots}->{$section} = {};
            next;
        }

        if ($line =~ m/^\#(.*)\s*$/) {
            $descr = '' if !defined($descr);
            $descr .= PVE::Tools::decode_text($1) . "\n";
            next;
        }

        if ($line =~ m/^(description):\s*(.*\S)\s*$/) {
            $descr = '' if !defined($descr);
            $descr .= PVE::Tools::decode_text($2);
        } elsif ($line =~ m/^snapstate:\s*(prepare|delete)\s*$/) {
            # anchored, so that only a real 'snapstate' key matches and not
            # any line that merely ends in 'snapstate: <value>'
            $conf->{snapstate} = $1;
        } elsif ($line =~ m/^(args):\s*(.*\S)\s*$/) {
            # 'args' may contain whitespace and is stored unchecked
            my $key = $1;
            my $value = $2;
            $conf->{$key} = $value;
        } elsif ($line =~ m/^delete:\s*(.*\S)\s*$/) {
            my $value = $1;
            if ($section eq 'pending') {
                $conf->{delete} = $value; # we parse this later
            } else {
                warn "vm $vmid - property 'delete' is only allowed in [PENDING]\n";
            }
        } elsif ($line =~ m/^([a-z][a-z_]*\d*):\s*(\S+)\s*$/) {
            my $key = $1;
            my $value = $2;
            eval { $value = check_type($key, $value); };
            if ($@) {
                warn "vm $vmid - unable to parse value of '$key' - $@";
            } else {
                # legacy alias
                $key = 'ide2' if $key eq 'cdrom';
                my $fmt = $confdesc->{$key}->{format};
                if ($fmt && $fmt =~ /^pve-qm-(?:ide|scsi|virtio|sata)$/) {
                    # normalize the drive's file name to a volume ID
                    my $v = parse_drive($key, $value);
                    if (my $volid = filename_to_volume_id($vmid, $v->{file}, $v->{media})) {
                        $v->{file} = $volid;
                        $value = print_drive($vmid, $v);
                    } else {
                        warn "vm $vmid - unable to parse value of '$key'\n";
                        next;
                    }
                }

                $conf->{$key} = $value;
            }
        }
    }

    $finish_description->();

    delete $res->{snapstate}; # just to be sure

    return $res;
}
2253
1858638f
DM
# Validate $conf and serialize it into the raw text of a VM configuration
# file, which is returned. $filename is not used by this function.
#
# $conf is normalized in place: 'snapstate' is removed from the main section,
# 'cdrom' is renamed to 'ide2', the legacy 'smp' option is converted to
# 'sockets', all values are passed through check_type, and 'unusedX' entries
# whose volume is referenced by a drive of the main or pending section are
# dropped. Dies when a value fails validation, when both 'cdrom' and 'ide2'
# are set, or when 'delete' appears outside the pending section.
sub write_vm_config {
    my ($filename, $conf) = @_;

    delete $conf->{snapstate}; # just to be sure

    if ($conf->{cdrom}) {
        die "option ide2 conflicts with cdrom\n" if $conf->{ide2};
        $conf->{ide2} = $conf->{cdrom};
        delete $conf->{cdrom};
    }

    # we do not use 'smp' any longer
    if ($conf->{sockets}) {
        delete $conf->{smp};
    } elsif ($conf->{smp}) {
        $conf->{sockets} = $conf->{smp};
        delete $conf->{cores};
        delete $conf->{smp};
    }

    my $used_volids = {};

    # type-check all options of one section in place and collect the volumes
    # used by its drives (snapshot sections are not collected)
    my $cleanup_config = sub {
        my ($cref, $pending, $snapname) = @_;

        foreach my $key (keys %$cref) {
            next if $key eq 'digest' || $key eq 'description' || $key eq 'snapshots' ||
                $key eq 'snapstate' || $key eq 'pending';
            my $value = $cref->{$key};
            if ($key eq 'delete') {
                die "property 'delete' is only allowed in [PENDING]\n"
                    if !$pending;
                # fixme: check syntax?
                next;
            }
            eval { $value = check_type($key, $value); };
            die "unable to parse value of '$key' - $@" if $@;

            $cref->{$key} = $value;

            if (!$snapname && is_valid_drivename($key)) {
                my $drive = parse_drive($key, $value);
                $used_volids->{$drive->{file}} = 1 if $drive && $drive->{file};
            }
        }
    };

    $cleanup_config->($conf);

    $cleanup_config->($conf->{pending}, 1);

    foreach my $snapname (keys %{$conf->{snapshots}}) {
        die "internal error" if $snapname eq 'pending';
        $cleanup_config->($conf->{snapshots}->{$snapname}, undef, $snapname);
    }

    # remove 'unusedX' settings if we re-add a volume
    foreach my $key (keys %$conf) {
        my $value = $conf->{$key};
        if ($key =~ m/^unused/ && $used_volids->{$value}) {
            delete $conf->{$key};
        }
    }

    # render one section as text: description as leading comment lines,
    # followed by the sorted 'key: value' lines
    my $generate_raw_config = sub {
        my ($section, $pending) = @_;

        my $text = '';

        # add description as comment to top of file
        if (defined(my $descr = $section->{description})) {
            if ($descr) {
                foreach my $cl (split(/\n/, $descr)) {
                    $text .= '#' . PVE::Tools::encode_text($cl) . "\n";
                }
            } else {
                # an empty pending description is written as a bare comment
                $text .= "#\n" if $pending;
            }
        }

        foreach my $key (sort keys %$section) {
            next if $key eq 'digest' || $key eq 'description' || $key eq 'pending' || $key eq 'snapshots';
            $text .= "$key: $section->{$key}\n";
        }
        return $text;
    };

    my $raw = $generate_raw_config->($conf);

    if (scalar(keys %{$conf->{pending}})){
        $raw .= "\n[PENDING]\n";
        $raw .= $generate_raw_config->($conf->{pending}, 1);
    }

    foreach my $snapname (sort keys %{$conf->{snapshots}}) {
        $raw .= "\n[$snapname]\n";
        $raw .= $generate_raw_config->($conf->{snapshots}->{$snapname});
    }

    return $raw;
}
1e3baf05 2355
# Return a hash reference with the default value of every option that
# declares one in $confdesc. 'keyboard' is overridden by the value from
# datacenter.cfg when one is set there.
sub load_defaults {
    my $res = {};

    # we use static defaults from our JSON schema configuration
    foreach my $key (keys %$confdesc) {
        my $default = $confdesc->{$key}->{default};
        next if !defined($default);
        $res->{$key} = $default;
    }

    my $dc_conf = PVE::Cluster::cfs_read_file('datacenter.cfg');
    if ($dc_conf->{keyboard}) {
        $res->{keyboard} = $dc_conf->{keyboard};
    }

    return $res;
}
2372
# Return a hash reference { vmid => { exists => 1 } } for every entry of the
# cluster VM list that has type 'qemu' and whose node equals $nodename.
sub config_list {
    my $res = {};

    my $vmlist = PVE::Cluster::get_vmlist();
    return $res if !$vmlist || !$vmlist->{ids};

    my $ids = $vmlist->{ids};

    foreach my $vmid (keys %$ids) {
        my $entry = $ids->{$vmid};

        my $on_this_node = $entry->{node} && $entry->{node} eq $nodename;
        next if !$on_this_node;

        my $is_qemu = $entry->{type} && $entry->{type} eq 'qemu';
        next if !$is_qemu;

        $res->{$vmid}->{exists} = 1;
    }

    return $res;
}
2387
64e13401
DM
# test if VM uses local resources (to prevent migration)
#
# Returns 1 when $conf contains a usbN, hostpciN, serialN or parallelN entry
# (or the old-style 'hostusb'/'hostpci' keys), 0 otherwise. USB entries set
# to 'spice' and serial entries set to 'socket' do not count. Dies instead
# of returning 1 unless $noerr is set.
sub check_local_resources {
    my ($conf, $noerr) = @_;

    # old syntax
    my $loc_res = ($conf->{hostusb} || $conf->{hostpci}) ? 1 : 0;

    foreach my $k (keys %$conf) {
        next if $k =~ m/^usb/ && ($conf->{$k} eq 'spice');
        # sockets are safe: they will be recreated on the target side post-migrate
        next if $k =~ m/^serial/ && ($conf->{$k} eq 'socket');

        if ($k =~ m/^(usb|hostpci|serial|parallel)\d+$/) {
            $loc_res = 1;
        }
    }

    die "VM uses local resources\n" if $loc_res && !$noerr;

    return $loc_res;
}
2408
# check if used storages are available on all nodes (use by migrate)
#
# For every drive of $conf whose file is a storage volume ID,
# PVE::Storage::storage_check_node is called once without a node argument
# and once for $node.
sub check_storage_availability {
    my ($storecfg, $conf, $node) = @_;

    my $check_drive = sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($sid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        # check if storage is available on both nodes
        PVE::Storage::storage_check_node($storecfg, $sid);
        PVE::Storage::storage_check_node($storecfg, $sid, $node);
    };

    foreach_drive($conf, $check_drive);
}
2427
719893a9
DM
# list nodes where all VM images are available (used by has_feature API)
#
# Starts with all cluster nodes and narrows the set for every drive volume:
# a disabled storage removes all nodes, a storage restricted to certain
# nodes removes the others, and a non-shared storage leaves only the local
# node. Returns a hash reference { nodename => 1 }.
sub shared_nodes {
    my ($conf, $storecfg) = @_;

    my $nodelist = PVE::Cluster::get_nodelist();
    my $nodehash = { map { $_ => 1 } @$nodelist };
    my $nodename = PVE::INotify::nodename();

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($storeid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
        if ($scfg->{disable}) {
            $nodehash = {};
            return;
        }

        my @unavailable;
        if (my $avail = $scfg->{nodes}) {
            @unavailable = grep { !$avail->{$_} } keys %$nodehash;
        } elsif (!$scfg->{shared}) {
            @unavailable = grep { $_ ne $nodename } keys %$nodehash;
        }
        delete $nodehash->{$_} foreach @unavailable;
    });

    return $nodehash
}
2461
1e3baf05
DM
# Check /proc/$pid/cmdline: return 1 if the process' first argument ends in
# 'kvm' or 'qemu-system-x86_64' and the argument following its first
# '-pidfile'/'--pidfile' option equals $pidfile. Returns a false value in
# every other case, including when the cmdline cannot be read.
sub check_cmdline {
    my ($pidfile, $pid) = @_;

    my $fh = IO::File->new("/proc/$pid/cmdline", "r");
    return undef if !defined($fh);

    my $line = <$fh>;
    $fh->close;
    return undef if !$line;

    # arguments are separated by NUL bytes
    my @param = split(/\0/, $line);

    my $cmd = $param[0];
    return if !$cmd || ($cmd !~ m|kvm$| && $cmd !~ m|qemu-system-x86_64$|);

    foreach my $i (0 .. $#param) {
        my $arg = $param[$i];
        next if !$arg;
        next if ($arg ne '-pidfile') && ($arg ne '--pidfile');

        # only the first pidfile option is considered
        my $value = $param[$i+1];
        return 1 if $value && ($value eq $pidfile);
        return undef;
    }

    return undef;
}
2487
# Return the PID of the running KVM process of VM $vmid, or undef when the
# VM is not running.
#
# Dies when the VM's config file (looked up on $node) does not exist, unless
# $nocheck is set. The PID is read from the VM's pid file and only accepted
# when check_cmdline confirms that the process was started with this pid
# file and the process is still running.
sub check_running {
    my ($vmid, $nocheck, $node) = @_;

    my $filename = PVE::QemuConfig->config_file($vmid, $node);

    die "unable to find configuration file for VM $vmid - no such machine\n"
        if !$nocheck && ! -f $filename;

    my $pidfile = pidfile_name($vmid);

    # explicit read mode instead of a "<$pidfile" mode prefix
    my $fd = IO::File->new($pidfile, 'r');
    return undef if !$fd;

    my $st = stat($fd);
    my $line = <$fd>;
    close($fd);

    # the timestamp belongs to the pid file, so report that file
    if ($st && $st->mtime > time()) {
        warn "file '$pidfile' modified in future\n";
    }

    # an empty pid file yields an undefined line
    my ($pid) = defined($line) ? ($line =~ m/^(\d+)$/) : ();
    return undef if !defined($pid);

    if (check_cmdline($pidfile, $pid)) {
        if (my $pinfo = PVE::ProcFSTools::check_process_running($pid)) {
            return $pid;
        }
    }

    return undef;
}
2520
# Return the list from config_list(), with the 'pid' of each VM that has a
# '<vmid>.pid' file in $var_run_tmpdir and is reported as running by
# check_running. If that directory cannot be opened, the plain list is
# returned.
sub vzlist {

    my $vzlist = config_list();

    my $dir = IO::Dir->new($var_run_tmpdir) || return $vzlist;

    while (defined(my $entry = $dir->read)) {
        next if $entry !~ m/^(\d+)\.pid$/;
        my $vmid = $1;

        next if !defined($vzlist->{$vmid});

        my $pid = check_running($vmid);
        $vzlist->{$vmid}->{pid} = $pid if $pid;
    }

    return $vzlist;
}
2538
1e3baf05
DM
# Return the 'size' property of the VM's boot disk as stored in $conf, or
# undef when there is no valid boot disk, the disk is a cdrom, or it has no
# file. $storecfg is accepted but not used.
sub disksize {
    my ($storecfg, $conf) = @_;

    my $bootdisk = $conf->{bootdisk};
    return undef if !$bootdisk || !is_valid_drivename($bootdisk);

    my $raw = $conf->{$bootdisk};
    return undef if !$raw;

    my $drive = parse_drive($bootdisk, $raw);
    return undef if !defined($drive) || drive_is_cdrom($drive);

    return undef if !$drive->{file};

    return $drive->{size};
}
2558
# CPU accounting of the previous vmstatus() call, indexed by PID
my $last_proc_pid_stat;

# get VM status information
# This must be fast and should not block ($full == false)
# We only query KVM using QMP if $full == true (this can be slow)
#
# Returns a hash reference indexed by VMID. When $opt_vmid is set, only that
# VM is included.
sub vmstatus {
    my ($opt_vmid, $full) = @_;

    my $res = {};

    my $storecfg = PVE::Storage::config();

    my $list = vzlist();
    my ($uptime) = PVE::ProcFSTools::read_proc_uptime(1);

    my $cpucount = $cpuinfo->{cpus} || 1;

    # values taken from the configuration, counters start at zero
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);

        my $cfspath = PVE::QemuConfig->cfs_config_path($vmid);
        my $conf = PVE::Cluster::cfs_read_file($cfspath) || {};

        my $d = {};
        $d->{pid} = $list->{$vmid}->{pid};

        # fixme: better status?
        $d->{status} = $d->{pid} ? 'running' : 'stopped';

        my $size = disksize($storecfg, $conf);
        $d->{disk} = 0; # no info available
        $d->{maxdisk} = defined($size) ? $size : 0;

        my $cpus = ($conf->{sockets} || 1) * ($conf->{cores} || 1);
        $cpus = $cpucount if $cpus > $cpucount;
        $cpus = $conf->{vcpus} if $conf->{vcpus};
        $d->{cpus} = $cpus;

        $d->{name} = $conf->{name} || "VM $vmid";
        $d->{maxmem} = $conf->{memory} ? $conf->{memory}*(1024*1024) : 0;

        if ($conf->{balloon}) {
            $d->{balloon_min} = $conf->{balloon}*(1024*1024);
            $d->{shares} = defined($conf->{shares}) ? $conf->{shares} : 1000;
        }

        $d->{$_} = 0 foreach qw(uptime cpu mem netout netin diskread diskwrite);

        $d->{template} = PVE::QemuConfig->is_template($conf);

        $res->{$vmid} = $d;
    }

    # network counters of the tap devices; the host's 'receive' counter is
    # accounted as the VM's 'netout' and 'transmit' as 'netin'
    my $netdev = PVE::ProcFSTools::read_proc_net_dev();
    foreach my $dev (keys %$netdev) {
        next if $dev !~ m/^tap([1-9]\d*)i/;
        my $vmid = $1;
        my $d = $res->{$vmid};
        next if !$d;

        my $counters = $netdev->{$dev};

        $d->{netout} += $counters->{receive};
        $d->{netin} += $counters->{transmit};

        if ($full) {
            $d->{nics}->{$dev}->{netout} = $counters->{receive};
            $d->{nics}->{$dev}->{netin} = $counters->{transmit};
        }
    }

    my $ctime = gettimeofday;

    # uptime, memory and CPU usage from /proc/<pid>/stat
    foreach my $vmid (keys %$list) {

        my $d = $res->{$vmid};
        my $pid = $d->{pid};
        next if !$pid;

        my $pstat = PVE::ProcFSTools::read_proc_pid_stat($pid);
        next if !$pstat; # not running

        my $used = $pstat->{utime} + $pstat->{stime};

        $d->{uptime} = int(($uptime - $pstat->{starttime})/$cpuinfo->{user_hz});

        if ($pstat->{vsize}) {
            $d->{mem} = int(($pstat->{rss}/$pstat->{vsize})*$d->{maxmem});
        }

        my $old = $last_proc_pid_stat->{$pid};
        if (!$old) {
            # first sample for this process, no CPU usage available yet
            $last_proc_pid_stat->{$pid} = {
                time => $ctime,
                used => $used,
                cpu => 0,
            };
            next;
        }

        my $dtime = ($ctime - $old->{time}) * $cpucount * $cpuinfo->{user_hz};

        if ($dtime <= 1000) {
            # interval too short, reuse the previous value
            $d->{cpu} = $old->{cpu};
            next;
        }

        my $dutime = $used - $old->{used};

        $d->{cpu} = (($dutime/$dtime)* $cpucount) / $d->{cpus};
        $last_proc_pid_stat->{$pid} = {
            time => $ctime,
            used => $used,
            cpu => $d->{cpu},
        };
    }

    return $res if !$full;

    my $qmpclient = PVE::QMPClient->new();

    my $ballooncb = sub {
        my ($vmid, $resp) = @_;

        my $info = $resp->{'return'};
        return if !$info->{max_mem};

        my $d = $res->{$vmid};

        # use memory assigned to VM
        $d->{maxmem} = $info->{max_mem};
        $d->{balloon} = $info->{actual};

        if (defined($info->{total_mem}) && defined($info->{free_mem})) {
            $d->{mem} = $info->{total_mem} - $info->{free_mem};
            $d->{freemem} = $info->{free_mem};
        }

        $d->{ballooninfo} = $info;
    };

    my $blockstatscb = sub {
        my ($vmid, $resp) = @_;
        my $data = $resp->{'return'} || [];
        my $totalrdbytes = 0;
        my $totalwrbytes = 0;

        for my $blockstat (@$data) {
            my $stats = $blockstat->{stats};
            $totalrdbytes += $stats->{rd_bytes};
            $totalwrbytes += $stats->{wr_bytes};

            $blockstat->{device} =~ s/drive-//;
            $res->{$vmid}->{blockstat}->{$blockstat->{device}} = $stats;
        }
        $res->{$vmid}->{diskread} = $totalrdbytes;
        $res->{$vmid}->{diskwrite} = $totalwrbytes;
    };

    my $statuscb = sub {
        my ($vmid, $resp) = @_;

        $qmpclient->queue_cmd($vmid, $blockstatscb, 'query-blockstats');
        # this fails if balloon driver is not loaded, so this must be
        # the last command (following commands are aborted if this fails).
        $qmpclient->queue_cmd($vmid, $ballooncb, 'query-balloon');

        my $status = $resp->{'return'}->{status};
        if (!defined($status)) {
            warn "unable to get VM status\n";
            return;
        }

        $res->{$vmid}->{qmpstatus} = $status;
    };

    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        next if !$res->{$vmid}->{pid}; # not running
        $qmpclient->queue_cmd($vmid, $statuscb, 'query-status');
    }

    $qmpclient->queue_execute(undef, 2);

    # fall back to the process based status when QMP gave no answer
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        my $d = $res->{$vmid};
        $d->{qmpstatus} = $d->{status} if !$d->{qmpstatus};
    }

    return $res;
}
2759
# Call $func->($drivename, $drive, @param) for every valid drive name that is
# defined in $conf and whose value parse_drive accepts.
sub foreach_drive {
    my ($conf, $func, @param) = @_;

    for my $ds (valid_drive_names()) {
        my $raw = $conf->{$ds};
        next if !defined($raw);

        my $drive = parse_drive($ds, $raw);
        next if !$drive;

        $func->($ds, $drive, @param);
    }
}
2772
# Call $func->($volid, $attr, @param) once for every volume referenced by the
# drives of $conf, by the drives of its snapshots, or as a snapshot 'vmstate'.
# $attr is a hash with:
#   cdrom                  - 1 only if every reference is a cdrom drive
#   replicate              - 1 if any reference has replication enabled
#                            (drives default to enabled)
#   referenced_in_config   - 1 if used by the current configuration
#   referenced_in_snapshot - { snapname => 1 } for each referencing snapshot
sub foreach_volid {
    my ($conf, $func, @param) = @_;

    my $volhash = {};

    my $record = sub {
        my ($volid, $is_cdrom, $replicate, $snapname) = @_;

        return if !$volid;

        my $attr = ($volhash->{$volid} //= {});

        $attr->{cdrom} //= 1;
        $attr->{cdrom} = 0 if !$is_cdrom;

        $attr->{replicate} //= 0;
        $attr->{replicate} = 1 if $replicate;

        $attr->{referenced_in_config} //= 0;
        if (defined($snapname)) {
            $attr->{referenced_in_snapshot}->{$snapname} = 1;
        } else {
            $attr->{referenced_in_config} = 1;
        }
    };

    # record all drives of one config section
    my $scan_drives = sub {
        my ($section, $snapname) = @_;

        foreach_drive($section, sub {
            my ($ds, $drive) = @_;
            $record->($drive->{file}, drive_is_cdrom($drive), $drive->{replicate} // 1, $snapname);
        });
    };

    $scan_drives->($conf, undef);

    foreach my $snapname (keys %{$conf->{snapshots}}) {
        my $snap = $conf->{snapshots}->{$snapname};
        $record->($snap->{vmstate}, 0, 1, $snapname);
        $scan_drives->($snap, $snapname);
    }

    foreach my $volid (keys %$volhash) {
        $func->($volid, $volhash->{$volid}, @param);
    }
}
2814
86b8228b
DM
# Return 0 unless $vga is 'qxl', 'qxl2', 'qxl3' or 'qxl4'. Otherwise return
# the numeric suffix, or 1 for plain 'qxl'.
sub vga_conf_has_spice {
    my ($vga) = @_;

    if ($vga && $vga =~ m/^qxl([234])?$/) {
        return $1 || 1;
    }

    return 0;
}
2822
1e3baf05 2823sub config_to_command {
67812f9c 2824 my ($storecfg, $vmid, $conf, $defaults, $forcemachine) = @_;
1e3baf05
DM
2825
2826 my $cmd = [];
8c559505
DM
2827 my $globalFlags = [];
2828 my $machineFlags = [];
2829 my $rtcFlags = [];
519ed28c 2830 my $cpuFlags = [];
5bdcf937 2831 my $devices = [];
b78ebef7 2832 my $pciaddr = '';
5bdcf937 2833 my $bridges = {};
1e3baf05
DM
2834 my $kvmver = kvm_user_version();
2835 my $vernum = 0; # unknown
b42d3cf9 2836 my $ostype = $conf->{ostype};
4317f69f
AD
2837 my $winversion = windows_version($ostype);
2838
a3c52213
DM
2839 if ($kvmver =~ m/^(\d+)\.(\d+)$/) {
2840 $vernum = $1*1000000+$2*1000;
2841 } elsif ($kvmver =~ m/^(\d+)\.(\d+)\.(\d+)$/) {
1e3baf05
DM
2842 $vernum = $1*1000000+$2*1000+$3;
2843 }
2844
a3c52213 2845 die "detected old qemu-kvm binary ($kvmver)\n" if $vernum < 15000;
1e3baf05
DM
2846
2847 my $have_ovz = -f '/proc/vz/vestat';
2848
db656e5f 2849 my $q35 = machine_type_is_q35($conf);
4d3f29ed 2850 my $hotplug_features = parse_hotplug_features(defined($conf->{hotplug}) ? $conf->{hotplug} : '1');
23f73120 2851 my $machine_type = $forcemachine || $conf->{machine};
249c4a6c
AD
2852 my $use_old_bios_files = undef;
2853 ($use_old_bios_files, $machine_type) = qemu_use_old_bios_files($machine_type);
db656e5f 2854
f08e17c7
AD
2855 my $cpuunits = defined($conf->{cpuunits}) ?
2856 $conf->{cpuunits} : $defaults->{cpuunits};
2857
1e3baf05
DM
2858 push @$cmd, '/usr/bin/kvm';
2859
2860 push @$cmd, '-id', $vmid;
2861
2862 my $use_virtio = 0;
2863
c971c4f2
AD
2864 my $qmpsocket = qmp_socket($vmid);
2865 push @$cmd, '-chardev', "socket,id=qmp,path=$qmpsocket,server,nowait";
2866 push @$cmd, '-mon', "chardev=qmp,mode=control";
2867
1e3baf05 2868
6b64503e 2869 push @$cmd, '-pidfile' , pidfile_name($vmid);
19672434 2870
1e3baf05
DM
2871 push @$cmd, '-daemonize';
2872
2796e7d5
DM
2873 if ($conf->{smbios1}) {
2874 push @$cmd, '-smbios', "type=1,$conf->{smbios1}";
2875 }
2876
3edb45e7 2877 if ($conf->{bios} && $conf->{bios} eq 'ovmf') {
2ddc0a5c
DC
2878 my $ovmfbase;
2879
2880 # prefer the OVMF_CODE variant
2881 if (-f $OVMF_CODE) {
2882 $ovmfbase = $OVMF_CODE;
2883 } elsif (-f $OVMF_IMG) {
2884 $ovmfbase = $OVMF_IMG;
2885 }
2886
2887 die "no uefi base img found\n" if !$ovmfbase;
2888 push @$cmd, '-drive', "if=pflash,unit=0,format=raw,readonly,file=$ovmfbase";
4a5cf64a
WL
2889
2890 if (defined($conf->{efidisk0}) && ($ovmfbase eq $OVMF_CODE)) {
2891 my $d = PVE::JSONSchema::parse_property_string($efidisk_fmt, $conf->{efidisk0});
2ddc0a5c
DC
2892 my $format = $d->{format} // 'raw';
2893 my $path;
2894 my ($storeid, $volname) = PVE::Storage::parse_volume_id($d->{file}, 1);
2895 if ($storeid) {
2896 $path = PVE::Storage::path($storecfg, $d->{file});
2897 my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
2898 $format = qemu_img_format($scfg, $volname);
2899 } else {
2900 $path = $d->{file};
2901 $format = "raw";
2902 }
2903 push @$cmd, '-drive', "if=pflash,unit=1,id=drive-efidisk0,format=$format,file=$path";
2904 } elsif ($ovmfbase eq $OVMF_CODE) {
2905 warn "using uefi without permanent efivars disk\n";
2906 my $ovmfvar_dst = "/tmp/$vmid-ovmf.fd";
2907 PVE::Tools::file_copy($OVMF_VARS, $ovmfvar_dst, 256*1024);
2908 push @$cmd, '-drive', "if=pflash,unit=1,format=raw,file=$ovmfvar_dst";
2909 } else {
2910 # if the base img is not OVMF_CODE, we do not have to bother
2911 # to create/use a vars image, since it will not be used anyway
2912 # this can only happen if someone manually deletes the OVMF_CODE image
2913 # or has an old pve-qemu-kvm version installed.
2914 # both should not happen, but we ignore it here
2915 }
a783c78e
AD
2916 }
2917
da8b4189 2918
d40e5e18
DC
2919 # add usb controllers
2920 my @usbcontrollers = PVE::QemuServer::USB::get_usb_controllers($conf, $bridges, $q35, $usbdesc->{format}, $MAX_USB_DEVICES);
2921 push @$devices, @usbcontrollers if @usbcontrollers;
5acbfe9e 2922 my $vga = $conf->{vga};
2fa3151e 2923
590e698c
DM
2924 my $qxlnum = vga_conf_has_spice($vga);
2925 $vga = 'qxl' if $qxlnum;
2fa3151e 2926
5acbfe9e 2927 if (!$vga) {
85909c04 2928 $vga = (!$winversion || $winversion >= 6) ? 'std' : 'cirrus';
5acbfe9e
DM
2929 }
2930
1e3baf05 2931 # enable absolute mouse coordinates (needed by vnc)
5acbfe9e
DM
2932 my $tablet;
2933 if (defined($conf->{tablet})) {
2934 $tablet = $conf->{tablet};
2935 } else {
2936 $tablet = $defaults->{tablet};
590e698c 2937 $tablet = 0 if $qxlnum; # disable for spice because it is not needed
ef5e2be2 2938 $tablet = 0 if $vga =~ m/^serial\d+$/; # disable if we use serial terminal (no vga card)
5acbfe9e
DM
2939 }
2940
db656e5f 2941 push @$devices, '-device', print_tabletdevice_full($conf) if $tablet;
b467f79a 2942
16a91d65 2943 my $kvm_off = 0;
4317f69f
AD
2944 my $gpu_passthrough;
2945
1e3baf05 2946 # host pci devices
040b06b7 2947 for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
2e3b7e2a
AD
2948 my $d = parse_hostpci($conf->{"hostpci$i"});
2949 next if !$d;
2950
2951 my $pcie = $d->{pcie};
2952 if($pcie){
2953 die "q35 machine model is not enabled" if !$q35;
2954 $pciaddr = print_pcie_addr("hostpci$i");
2955 }else{
2956 $pciaddr = print_pci_addr("hostpci$i", $bridges);
2957 }
2958
1f4f447b 2959 my $rombar = defined($d->{rombar}) && !$d->{rombar} ? ',rombar=0' : '';
9009150b 2960 my $romfile = $d->{romfile};
456a6fec 2961
1f4f447b
WB
2962 my $xvga = '';
2963 if ($d->{'x-vga'}) {
2964 $xvga = ',x-vga=on';
16a91d65 2965 $kvm_off = 1;
137483c0 2966 $vga = 'none';
4317f69f
AD
2967 $gpu_passthrough = 1;
2968
230a4382
AD
2969 if ($conf->{bios} && $conf->{bios} eq 'ovmf') {
2970 $xvga = "";
2971 }
137483c0 2972 }
4543ecf0
AD
2973 my $pcidevices = $d->{pciid};
2974 my $multifunction = 1 if @$pcidevices > 1;
2e3b7e2a 2975
4543ecf0
AD
2976 my $j=0;
2977 foreach my $pcidevice (@$pcidevices) {
2e3b7e2a 2978
4543ecf0
AD
2979 my $id = "hostpci$i";
2980 $id .= ".$j" if $multifunction;
2981 my $addr = $pciaddr;
2982 $addr .= ".$j" if $multifunction;
6ea8cd3b 2983 my $devicestr = "vfio-pci,host=$pcidevice->{id}.$pcidevice->{function},id=$id$addr";
4543ecf0
AD
2984
2985 if($j == 0){
2986 $devicestr .= "$rombar$xvga";
2987 $devicestr .= ",multifunction=on" if $multifunction;
456a6fec 2988 $devicestr .= ",romfile=/usr/share/kvm/$romfile" if $romfile;
4543ecf0
AD
2989 }
2990
2991 push @$devices, '-device', $devicestr;
2992 $j++;
2993 }
1e3baf05
DM
2994 }
2995
2996 # usb devices
d40e5e18
DC
2997 my @usbdevices = PVE::QemuServer::USB::get_usb_devices($conf, $usbdesc->{format}, $MAX_USB_DEVICES);
2998 push @$devices, @usbdevices if @usbdevices;
1e3baf05 2999 # serial devices
bae179aa 3000 for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
34978be3 3001 if (my $path = $conf->{"serial$i"}) {
9f9d2fb2
DM
3002 if ($path eq 'socket') {
3003 my $socket = "/var/run/qemu-server/${vmid}.serial$i";
3004 push @$devices, '-chardev', "socket,id=serial$i,path=$socket,server,nowait";
3005 push @$devices, '-device', "isa-serial,chardev=serial$i";
3006 } else {
3007 die "no such serial device\n" if ! -c $path;
3008 push @$devices, '-chardev', "tty,id=serial$i,path=$path";
3009 push @$devices, '-device', "isa-serial,chardev=serial$i";
3010 }
34978be3 3011 }
1e3baf05
DM
3012 }
3013
3014 # parallel devices
1989a89c 3015 for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
34978be3 3016 if (my $path = $conf->{"parallel$i"}) {
19672434 3017 die "no such parallel device\n" if ! -c $path;
32e69805 3018 my $devtype = $path =~ m!^/dev/usb/lp! ? 'tty' : 'parport';
4c5dbaf6 3019 push @$devices, '-chardev', "$devtype,id=parallel$i,path=$path";
5bdcf937 3020 push @$devices, '-device', "isa-parallel,chardev=parallel$i";
34978be3 3021 }
1e3baf05
DM
3022 }
3023
3024 my $vmname = $conf->{name} || "vm$vmid";
3025
3026 push @$cmd, '-name', $vmname;
19672434 3027
1e3baf05
DM
3028 my $sockets = 1;
3029 $sockets = $conf->{smp} if $conf->{smp}; # old style - no longer iused
3030 $sockets = $conf->{sockets} if $conf->{sockets};
3031
3032 my $cores = $conf->{cores} || 1;
3bd18e48 3033
de9d1e55 3034 my $maxcpus = $sockets * $cores;
76267728 3035
de9d1e55 3036 my $vcpus = $conf->{vcpus} ? $conf->{vcpus} : $maxcpus;
76267728 3037
de9d1e55
AD
3038 my $allowed_vcpus = $cpuinfo->{cpus};
3039
6965d5d1 3040 die "MAX $allowed_vcpus vcpus allowed per VM on this node\n"
de9d1e55
AD
3041 if ($allowed_vcpus < $maxcpus);
3042
69c81430 3043 if($hotplug_features->{cpu} && qemu_machine_feature_enabled ($machine_type, $kvmver, 2, 7)) {
1e3baf05 3044
69c81430
AD
3045 push @$cmd, '-smp', "1,sockets=$sockets,cores=$cores,maxcpus=$maxcpus";
3046 for (my $i = 2; $i <= $vcpus; $i++) {
3047 my $cpustr = print_cpu_device($conf,$i);
3048 push @$cmd, '-device', $cpustr;
3049 }
3050
3051 } else {
3052
3053 push @$cmd, '-smp', "$vcpus,sockets=$sockets,cores=$cores,maxcpus=$maxcpus";
3054 }
1e3baf05
DM
3055 push @$cmd, '-nodefaults';
3056
32baffb4 3057 my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};
3b408e82 3058
0888fdce
DM
3059 my $bootindex_hash = {};
3060 my $i = 1;
3061 foreach my $o (split(//, $bootorder)) {
3062 $bootindex_hash->{$o} = $i*100;
3063 $i++;
afdb31d5 3064 }
3b408e82 3065
dbea4415 3066 push @$cmd, '-boot', "menu=on,strict=on,reboot-timeout=1000,splash=/usr/share/qemu-server/bootsplash.jpg";
1e3baf05 3067
6b64503e 3068 push @$cmd, '-no-acpi' if defined($conf->{acpi}) && $conf->{acpi} == 0;
1e3baf05 3069
6b64503e 3070 push @$cmd, '-no-reboot' if defined($conf->{reboot}) && $conf->{reboot} == 0;
1e3baf05 3071
ef5e2be2 3072 push @$cmd, '-vga', $vga if $vga && $vga !~ m/^serial\d+$/; # for kvm 77 and later
1e3baf05 3073
b7be4ba9
AD
3074 if ($vga && $vga !~ m/^serial\d+$/ && $vga ne 'none'){
3075 my $socket = vnc_socket($vmid);
3076 push @$cmd, '-vnc', "unix:$socket,x509,password";
3077 } else {
3078 push @$cmd, '-nographic';
3079 }
3080
1e3baf05 3081 # time drift fix
6b64503e 3082 my $tdf = defined($conf->{tdf}) ? $conf->{tdf} : $defaults->{tdf};
1e3baf05 3083
6b64503e 3084 my $nokvm = defined($conf->{kvm}) && $conf->{kvm} == 0 ? 1 : 0;
8c559505 3085 my $useLocaltime = $conf->{localtime};
1e3baf05 3086
4317f69f
AD
3087 if ($winversion >= 5) { # windows
3088 $useLocaltime = 1 if !defined($conf->{localtime});
7a131888 3089
4317f69f
AD
3090 # use time drift fix when acpi is enabled
3091 if (!(defined($conf->{acpi}) && $conf->{acpi} == 0)) {
3092 $tdf = 1 if !defined($conf->{tdf});
462e8d19 3093 }
4317f69f 3094 }
462e8d19 3095
4317f69f
AD
3096 if ($winversion >= 6) {
3097 push @$globalFlags, 'kvm-pit.lost_tick_policy=discard';
3098 push @$cmd, '-no-hpet';
1e3baf05
DM
3099 }
3100
8c559505
DM
3101 push @$rtcFlags, 'driftfix=slew' if $tdf;
3102
7f0b5beb 3103 if ($nokvm) {
8c559505 3104 push @$machineFlags, 'accel=tcg';
7f0b5beb
DM
3105 } else {
3106 die "No accelerator found!\n" if !$cpuinfo->{hvm};
3107 }
1e3baf05 3108
952958bc
DM
3109 if ($machine_type) {
3110 push @$machineFlags, "type=${machine_type}";
3bafc510
DM
3111 }
3112
8c559505
DM
3113 if ($conf->{startdate}) {
3114 push @$rtcFlags, "base=$conf->{startdate}";
3115 } elsif ($useLocaltime) {
3116 push @$rtcFlags, 'base=localtime';
3117 }
1e3baf05 3118
519ed28c 3119 my $cpu = $nokvm ? "qemu64" : "kvm64";
16a91d65 3120 if (my $cputype = $conf->{cpu}) {
ff6ffe20 3121 my $cpuconf = PVE::JSONSchema::parse_property_string($cpu_fmt, $cputype)
16a91d65
WB
3122 or die "Cannot parse cpu description: $cputype\n";
3123 $cpu = $cpuconf->{cputype};
3124 $kvm_off = 1 if $cpuconf->{hidden};
3125 }
519ed28c 3126
4dc339e7
AD
3127 push @$cpuFlags , '+lahf_lm' if $cpu eq 'kvm64';
3128
d853f40a
DM
3129 push @$cpuFlags , '-x2apic'
3130 if $conf->{ostype} && $conf->{ostype} eq 'solaris';
519ed28c 3131
2e1a5389
AD
3132 push @$cpuFlags, '+sep' if $cpu eq 'kvm64' || $cpu eq 'kvm32';
3133
0dc48c3d
AD
3134 push @$cpuFlags, '-rdtscp' if $cpu =~ m/^Opteron/;
3135
117a0414
AD
3136 if (qemu_machine_feature_enabled ($machine_type, $kvmver, 2, 3)) {
3137
3138 push @$cpuFlags , '+kvm_pv_unhalt' if !$nokvm;
0da5a08c 3139 push @$cpuFlags , '+kvm_pv_eoi' if !$nokvm;
117a0414
AD
3140 }
3141
4317f69f
AD
3142 add_hyperv_enlighments($cpuFlags, $winversion, $machine_type, $kvmver, $nokvm, $conf->{bios}, $gpu_passthrough);
3143
f1f7ea88 3144 push @$cpuFlags, 'enforce' if $cpu ne 'host' && !$nokvm;
dac7c619 3145
16a91d65
WB
3146 push @$cpuFlags, 'kvm=off' if $kvm_off;
3147
8930da74
DM
3148 my $cpu_vendor = $cpu_vendor_list->{$cpu} ||
3149 die "internal error"; # should not happen
3150
3151 push @$cpuFlags, "vendor=${cpu_vendor}"
3152 if $cpu_vendor ne 'default';
3153
be190583 3154 $cpu .= "," . join(',', @$cpuFlags) if scalar(@$cpuFlags);
519ed28c 3155
dac7c619 3156 push @$cmd, '-cpu', $cpu;
519ed28c 3157
0567a4d5
AD
3158 PVE::QemuServer::Memory::config($conf, $vmid, $sockets, $cores, $defaults, $hotplug_features, $cmd);
3159
1e3baf05
DM
3160 push @$cmd, '-S' if $conf->{freeze};
3161
3162 # set keyboard layout
3163 my $kb = $conf->{keyboard} || $defaults->{keyboard};
3164 push @$cmd, '-k', $kb if $kb;
3165
3166 # enable sound
3167 #my $soundhw = $conf->{soundhw} || $defaults->{soundhw};
3168 #push @$cmd, '-soundhw', 'es1370';
3169 #push @$cmd, '-soundhw', $soundhw if $soundhw;
ab6a046f 3170
bc84dcca 3171 if($conf->{agent}) {
7a6c2150 3172 my $qgasocket = qmp_socket($vmid, 1);
ab6a046f
AD
3173 my $pciaddr = print_pci_addr("qga0", $bridges);
3174 push @$devices, '-chardev', "socket,path=$qgasocket,server,nowait,id=qga0";
3175 push @$devices, '-device', "virtio-serial,id=qga0$pciaddr";
3176 push @$devices, '-device', 'virtserialport,chardev=qga0,name=org.qemu.guest_agent.0';
3177 }
3178
1d794448 3179 my $spice_port;
2fa3151e 3180
590e698c
DM
3181 if ($qxlnum) {
3182 if ($qxlnum > 1) {
ac087616 3183 if ($winversion){
590e698c
DM
3184 for(my $i = 1; $i < $qxlnum; $i++){
3185 my $pciaddr = print_pci_addr("vga$i", $bridges);
3186 push @$cmd, '-device', "qxl,id=vga$i,ram_size=67108864,vram_size=33554432$pciaddr";
3187 }
3188 } else {
3189 # assume other OS works like Linux
3190 push @$cmd, '-global', 'qxl-vga.ram_size=134217728';
3191 push @$cmd, '-global', 'qxl-vga.vram_size=67108864';
2fa3151e
AD
3192 }
3193 }
3194
1011b570 3195 my $pciaddr = print_pci_addr("spice", $bridges);
95a4b4a9 3196
af0eba7e
WB
3197 my $nodename = PVE::INotify::nodename();
3198 my $pfamily = PVE::Tools::get_host_address_family($nodename);
91152441
WB
3199 my @nodeaddrs = PVE::Tools::getaddrinfo_all('localhost', family => $pfamily);
3200 die "failed to get an ip address of type $pfamily for 'localhost'\n" if !@nodeaddrs;
3201 my $localhost = PVE::Network::addr_to_ip($nodeaddrs[0]->{addr});
3202 $spice_port = PVE::Tools::next_spice_port($pfamily, $localhost);
943340a6 3203
91152441 3204 push @$devices, '-spice', "tls-port=${spice_port},addr=$localhost,tls-ciphers=HIGH,seamless-migration=on";
1011b570 3205
d2da6d9b
AD
3206 push @$devices, '-device', "virtio-serial,id=spice$pciaddr";
3207 push @$devices, '-chardev', "spicevmc,id=vdagent,name=vdagent";
3208 push @$devices, '-device', "virtserialport,chardev=vdagent,name=com.redhat.spice.0";
1011b570
DM
3209 }
3210
8d9ae0d2
DM
3211 # enable balloon by default, unless explicitly disabled
3212 if (!defined($conf->{balloon}) || $conf->{balloon}) {
3213 $pciaddr = print_pci_addr("balloon0", $bridges);
3214 push @$devices, '-device', "virtio-balloon-pci,id=balloon0$pciaddr";
3215 }
1e3baf05 3216
0ea9541d
DM
3217 if ($conf->{watchdog}) {
3218 my $wdopts = parse_watchdog($conf->{watchdog});
5bdcf937 3219 $pciaddr = print_pci_addr("watchdog", $bridges);
0a40e8ea 3220 my $watchdog = $wdopts->{model} || 'i6300esb';
5bdcf937
AD
3221 push @$devices, '-device', "$watchdog$pciaddr";
3222 push @$devices, '-watchdog-action', $wdopts->{action} if $wdopts->{action};
0ea9541d
DM
3223 }
3224
1e3baf05 3225 my $vollist = [];
941e0c42 3226 my $scsicontroller = {};
26ee04b6 3227 my $ahcicontroller = {};
cdd20088 3228 my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : $defaults->{scsihw};
1e3baf05 3229
5881b913
DM
3230 # Add iscsi initiator name if available
3231 if (my $initiator = get_initiator_name()) {
3232 push @$devices, '-iscsi', "initiator-name=$initiator";
3233 }
3234
1e3baf05
DM
3235 foreach_drive($conf, sub {
3236 my ($ds, $drive) = @_;
3237
ff1a2432 3238 if (PVE::Storage::parse_volume_id($drive->{file}, 1)) {
1e3baf05 3239 push @$vollist, $drive->{file};
ff1a2432 3240 }
afdb31d5 3241
1e3baf05 3242 $use_virtio = 1 if $ds =~ m/^virtio/;
3b408e82
DM
3243
3244 if (drive_is_cdrom ($drive)) {
3245 if ($bootindex_hash->{d}) {
3246 $drive->{bootindex} = $bootindex_hash->{d};
3247 $bootindex_hash->{d} += 1;
3248 }
3249 } else {
3250 if ($bootindex_hash->{c}) {
3251 $drive->{bootindex} = $bootindex_hash->{c} if $conf->{bootdisk} && ($conf->{bootdisk} eq $ds);
3252 $bootindex_hash->{c} += 1;
3253 }
3254 }
3255
51f492cd
AD
3256 if($drive->{interface} eq 'virtio'){
3257 push @$cmd, '-object', "iothread,id=iothread-$ds" if $drive->{iothread};
3258 }
3259
941e0c42 3260 if ($drive->{interface} eq 'scsi') {
cdd20088 3261
ee034f5c 3262 my ($maxdev, $controller, $controller_prefix) = scsihw_infos($conf, $drive);
6731a4cf 3263
6731a4cf 3264 $pciaddr = print_pci_addr("$controller_prefix$controller", $bridges);
a1b7d579 3265 my $scsihw_type = $scsihw =~ m/^virtio-scsi-single/ ? "virtio-scsi-pci" : $scsihw;
fc8b40fd
AD
3266
3267 my $iothread = '';
3268 if($conf->{scsihw} && $conf->{scsihw} eq "virtio-scsi-single" && $drive->{iothread}){
3269 $iothread .= ",iothread=iothread-$controller_prefix$controller";
3270 push @$cmd, '-object', "iothread,id=iothread-$controller_prefix$controller";
e7a5104d
DC
3271 } elsif ($drive->{iothread}) {
3272 warn "iothread is only valid with virtio disk or virtio-scsi-single controller, ignoring\n";
fc8b40fd
AD
3273 }
3274
6e11f143
AD
3275 my $queues = '';
3276 if($conf->{scsihw} && $conf->{scsihw} eq "virtio-scsi-single" && $drive->{queues}){
3277 $queues = ",num_queues=$drive->{queues}";
3278 }
3279
3280 push @$devices, '-device', "$scsihw_type,id=$controller_prefix$controller$pciaddr$iothread$queues" if !$scsicontroller->{$controller};
cdd20088 3281 $scsicontroller->{$controller}=1;
941e0c42 3282 }
3b408e82 3283
26ee04b6
DA
3284 if ($drive->{interface} eq 'sata') {
3285 my $controller = int($drive->{index} / $MAX_SATA_DISKS);
5bdcf937
AD
3286 $pciaddr = print_pci_addr("ahci$controller", $bridges);
3287 push @$devices, '-device', "ahci,id=ahci$controller,multifunction=on$pciaddr" if !$ahcicontroller->{$controller};
26ee04b6
DA
3288 $ahcicontroller->{$controller}=1;
3289 }
46f58b5f 3290
6470743f
DC
3291 if ($drive->{interface} eq 'efidisk') {
3292 # this will be added somewhere else
3293 return;
3294 }
3295
15b21acc
MR
3296 my $drive_cmd = print_drive_full($storecfg, $vmid, $drive);
3297 push @$devices, '-drive',$drive_cmd;
46f58b5f 3298 push @$devices, '-device', print_drivedevice_full($storecfg, $conf, $vmid, $drive, $bridges);
1e3baf05
DM
3299 });
3300
cc4d6182 3301 for (my $i = 0; $i < $MAX_NETS; $i++) {
5f0c4c32 3302 next if !$conf->{"net$i"};
cc4d6182
DA
3303 my $d = parse_net($conf->{"net$i"});
3304 next if !$d;
1e3baf05 3305
cc4d6182 3306 $use_virtio = 1 if $d->{model} eq 'virtio';
1e3baf05 3307
cc4d6182
DA
3308 if ($bootindex_hash->{n}) {
3309 $d->{bootindex} = $bootindex_hash->{n};
3310 $bootindex_hash->{n} += 1;
3311 }
1e3baf05 3312
cc4d6182 3313 my $netdevfull = print_netdev_full($vmid,$conf,$d,"net$i");
5bdcf937
AD
3314 push @$devices, '-netdev', $netdevfull;
3315
ba9e1000 3316 my $netdevicefull = print_netdevice_full($vmid, $conf, $d, "net$i", $bridges, $use_old_bios_files);
5bdcf937
AD
3317 push @$devices, '-device', $netdevicefull;
3318 }
1e3baf05 3319
db656e5f
DM
3320 if (!$q35) {
3321 # add pci bridges
fc79e813
AD
3322 if (qemu_machine_feature_enabled ($machine_type, $kvmver, 2, 3)) {
3323 $bridges->{1} = 1;
3324 $bridges->{2} = 1;
3325 }
3326
6731a4cf
AD
3327 $bridges->{3} = 1 if $scsihw =~ m/^virtio-scsi-single/;
3328
f8e83f05
AD
3329 while (my ($k, $v) = each %$bridges) {
3330 $pciaddr = print_pci_addr("pci.$k");
3331 unshift @$devices, '-device', "pci-bridge,id=pci.$k,chassis_nr=$k$pciaddr" if $k > 0;
3332 }
19672434
DM
3333 }
3334
1e3baf05
DM
3335 # add custom args
3336 if ($conf->{args}) {
3ada46c9 3337 my $aa = PVE::Tools::split_args($conf->{args});
1e3baf05
DM
3338 push @$cmd, @$aa;
3339 }
3340
5bdcf937 3341 push @$cmd, @$devices;
be190583 3342 push @$cmd, '-rtc', join(',', @$rtcFlags)
8c559505 3343 if scalar(@$rtcFlags);
be190583 3344 push @$cmd, '-machine', join(',', @$machineFlags)
8c559505
DM
3345 if scalar(@$machineFlags);
3346 push @$cmd, '-global', join(',', @$globalFlags)
3347 if scalar(@$globalFlags);
3348
1d794448 3349 return wantarray ? ($cmd, $vollist, $spice_port) : $cmd;
1e3baf05 3350}
19672434 3351
1e3baf05
DM
# Return the path of the VNC unix socket for VM $vmid, located in the
# directory named by the file-level $var_run_tmpdir.
sub vnc_socket {
    my ($vmid) = @_;

    return $var_run_tmpdir . "/$vmid.vnc";
}
3356
# Ask the running VM for its SPICE port.
#
# Runs the 'query-spice' monitor command through vm_mon_cmd() and returns
# the 'tls-port' entry of the answer when it is true, otherwise the 'port'
# entry. Dies with "no spice port" when neither is set.
sub spice_port {
    my ($vmid) = @_;

    my $info = vm_mon_cmd($vmid, 'query-spice');

    my $port = $info->{'tls-port'} || $info->{'port'};
    die "no spice port\n" if !$port;

    return $port;
}
3364
# Return the path of a monitor socket for VM $vmid below $var_run_tmpdir.
#
# With a true $qga the path ends in '.qga', otherwise in '.qmp'.
sub qmp_socket {
    my ($vmid, $qga) = @_;

    my $suffix = 'qmp';
    $suffix = 'qga' if $qga;

    return "${var_run_tmpdir}/$vmid.$suffix";
}
3370
1e3baf05
DM
# Return the path of the pid file for VM $vmid below $var_run_tmpdir.
sub pidfile_name {
    my ($vmid) = @_;

    return $var_run_tmpdir . "/$vmid.pid";
}
3375
86fdcfb2
DA
# Collect the ids of the devices currently known to the running VM.
#
# Four monitor queries are issued through vm_mon_cmd(), in this order:
# 'query-pci', 'query-block', 'query-mice' and 'qom-list' on
# '/machine/peripheral'.
#
# Returns a hash reference keyed by device id. Values are 1, except for a
# PCI bridge, whose value is 1 plus the number of devices with a qdev_id
# found behind it.
sub vm_devices_list {
    my ($vmid) = @_;

    my $pci_buses = vm_mon_cmd($vmid, 'query-pci');
    my $devices = {};

    foreach my $bus (@$pci_buses) {
        foreach my $pci_dev (@{$bus->{devices}}) {
            my $id = $pci_dev->{'qdev_id'};
            next if !$id;

            $devices->{$id} = 1;
            next if !$pci_dev->{'pci_bridge'};

            # a bridge is counted once, plus once per identified child device
            foreach my $child (@{$pci_dev->{'pci_bridge'}->{devices}}) {
                my $child_id = $child->{'qdev_id'};
                next if !$child_id;

                $devices->{$child_id} = 1;
                $devices->{$id}++;
            }
        }
    }

    # block devices are reported as 'drive-<id>'; record the bare id
    my $blocks = vm_mon_cmd($vmid, 'query-block');
    foreach my $block (@$blocks) {
        if ($block->{device} =~ m/^drive-(\S+)/) {
            my $drive_id = $1;
            $devices->{$drive_id} = 1;
        }
    }

    # the tablet is only visible through the mouse list
    my $mice = vm_mon_cmd($vmid, 'query-mice');
    foreach my $mouse (@$mice) {
        next if $mouse->{name} ne 'QEMU HID Tablet';

        $devices->{tablet} = 1;
        last;
    }

    # for usb devices there is no query-usb
    # but we can iterate over the entries in
    # qom-list path=/machine/peripheral
    my $peripherals = vm_mon_cmd($vmid, 'qom-list', path => '/machine/peripheral');
    foreach my $entry (@$peripherals) {
        $devices->{$entry->{name}} = 1 if $entry->{name} =~ m/^usb\d+$/;
    }

    return $devices;
}
3424
# Hot-plug one device into the running VM.
#
# Parameters:
#   $storecfg - storage configuration, handed through to the drive helpers
#   $conf     - VM configuration hash
#   $vmid     - id of the VM
#   $deviceid - id of the device to add: 'tablet', 'usbN', 'virtioN',
#               'virtioscsiN', 'scsihwN', 'scsiN', 'netN' or 'pci.N'
#   $device   - device description; not read for 'tablet' and 'pci.N'
#
# Returns 1 when the device was added or is already listed by
# vm_devices_list(), and undef when qemu_netdevadd() returns false.
# Dies for usb devices, for unknown device ids, and whenever one of the
# helpers dies.
sub vm_deviceplug {
    my ($storecfg, $conf, $vmid, $deviceid, $device) = @_;

    my $q35 = machine_type_is_q35($conf);

    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$deviceid});

    # add PCI bridge if we need it for the device
    qemu_add_pci_bridge($storecfg, $conf, $vmid, $deviceid);

    if ($deviceid eq 'tablet') {

        qemu_deviceadd($vmid, print_tabletdevice_full($conf));

    } elsif ($deviceid =~ m/^usb\d+$/) {

        # since we can't reliably hot unplug all added usb devices
        # and usb passthrough disables live migration
        # we disable usb hotplugging for now
        die "usb hotplug currently not reliable\n";

    } elsif ($deviceid =~ m/^virtio\d+$/) {

        qemu_iothread_add($vmid, $deviceid, $device);
        qemu_driveadd($storecfg, $vmid, $device);

        my $device_str = print_drivedevice_full($storecfg, $conf, $vmid, $device);
        qemu_deviceadd($vmid, $device_str);

        eval { qemu_deviceaddverify($vmid, $deviceid); };
        if (my $err = $@) {
            # remove the drive again; a cleanup failure is only warned about
            # so that the original error is the one that propagates
            eval { qemu_drivedel($vmid, $deviceid); };
            warn $@ if $@;
            die $err;
        }

    } elsif ($deviceid =~ m/^(?:virtioscsi|scsihw)\d+$/) {

        my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : "lsi";
        my $pciaddr = print_pci_addr($deviceid);
        my $scsihw_type = $scsihw eq 'virtio-scsi-single' ? "virtio-scsi-pci" : $scsihw;

        my $device_str = "$scsihw_type,id=$deviceid$pciaddr";

        # iothread and num_queues are only applied to 'virtioscsiN' ids
        my $is_virtioscsi = $deviceid =~ m/^virtioscsi\d+$/;

        if ($is_virtioscsi && $device->{iothread}) {
            qemu_iothread_add($vmid, $deviceid, $device);
            $device_str .= ",iothread=iothread-$deviceid";
        }

        if ($is_virtioscsi && $device->{queues}) {
            $device_str .= ",num_queues=$device->{queues}";
        }

        qemu_deviceadd($vmid, $device_str);
        qemu_deviceaddverify($vmid, $deviceid);

    } elsif ($deviceid =~ m/^scsi\d+$/) {

        qemu_findorcreatescsihw($storecfg,$conf, $vmid, $device);
        qemu_driveadd($storecfg, $vmid, $device);

        my $device_str = print_drivedevice_full($storecfg, $conf, $vmid, $device);
        eval { qemu_deviceadd($vmid, $device_str); };
        if (my $err = $@) {
            # same rollback as for virtio drives
            eval { qemu_drivedel($vmid, $deviceid); };
            warn $@ if $@;
            die $err;
        }

    } elsif ($deviceid =~ m/^net\d+$/) {

        return undef if !qemu_netdevadd($vmid, $conf, $device, $deviceid);

        my $machine_type = PVE::QemuServer::qemu_machine_pxe($vmid, $conf);
        my $use_old_bios_files = undef;
        ($use_old_bios_files, $machine_type) = qemu_use_old_bios_files($machine_type);

        my $netdevice_str = print_netdevice_full($vmid, $conf, $device, $deviceid, undef, $use_old_bios_files);
        qemu_deviceadd($vmid, $netdevice_str);

        eval { qemu_deviceaddverify($vmid, $deviceid); };
        if (my $err = $@) {
            # drop the netdev backend again when the device did not show up
            eval { qemu_netdevdel($vmid, $deviceid); };
            warn $@ if $@;
            die $err;
        }

    } elsif (!$q35 && $deviceid =~ m/^pci\.(\d+)$/) {

        my $bridgeid = $1;
        my $pciaddr = print_pci_addr($deviceid);

        qemu_deviceadd($vmid, "pci-bridge,id=pci.$bridgeid,chassis_nr=$bridgeid$pciaddr");
        qemu_deviceaddverify($vmid, $deviceid);

    } else {
        die "can't hotplug device '$deviceid'\n";
    }

    return 1;
}
3528
3eec5767 3529# fixme: this should raise exceptions on error!
# Hot-unplug one device from the running VM.
#
# Parameters:
#   $vmid     - id of the VM
#   $conf     - VM configuration hash
#   $deviceid - id of the device to remove
#
# Returns 1 when the device was removed or is not listed by
# vm_devices_list() in the first place. Dies when $deviceid is the
# configured bootdisk, for usb devices, for scsi drives that have iothread
# set, for unknown device ids, and whenever one of the helpers dies.
sub vm_deviceunplug {
    my ($vmid, $conf, $deviceid) = @_;

    my $present = vm_devices_list($vmid);
    return 1 if !defined($present->{$deviceid});

    die "can't unplug bootdisk" if $conf->{bootdisk} && $conf->{bootdisk} eq $deviceid;

    if ($deviceid eq 'tablet') {
        qemu_devicedel($vmid, $deviceid);
        return 1;
    }

    if ($deviceid =~ m/^usb\d+$/) {
        # when unplugging usb devices this way,
        # there may be remaining usb controllers/hubs
        # so we disable it for now
        die "usb hotplug currently not reliable\n";
    }

    if ($deviceid =~ m/^virtio\d+$/) {
        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);
        qemu_drivedel($vmid, $deviceid);
        qemu_iothread_del($conf, $vmid, $deviceid);
        return 1;
    }

    if ($deviceid =~ m/^(?:virtioscsi|scsihw)\d+$/) {
        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);
        qemu_iothread_del($conf, $vmid, $deviceid);
        return 1;
    }

    if ($deviceid =~ m/^scsi\d+$/) {
        #qemu 2.3 segfault on drive_del with virtioscsi + iothread
        my $drive = parse_drive($deviceid, $conf->{$deviceid});
        die "virtioscsi with iothread is not hot-unplugglable currently" if $drive->{iothread};

        qemu_devicedel($vmid, $deviceid);
        qemu_drivedel($vmid, $deviceid);
        qemu_deletescsihw($conf, $vmid, $deviceid);
        return 1;
    }

    if ($deviceid =~ m/^net\d+$/) {
        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);
        qemu_netdevdel($vmid, $deviceid);
        return 1;
    }

    die "can't unplug device '$deviceid'\n";
}
3586
# Issue a 'device_add' monitor command for a device description string.
#
# $devicefull has the form "<driver>,key=value,...". It is prefixed with
# "driver=" and split on '=' and ',' into the option hash passed to
# vm_mon_cmd(); the split is purely textual, so a value containing either
# separator is broken up as well.
sub qemu_deviceadd {
    my ($vmid, $devicefull) = @_;

    my %options = split(/[=,]/, "driver=" . $devicefull);

    return vm_mon_cmd($vmid, "device_add" , %options);
}
afdb31d5 3595
# Issue a 'device_del' monitor command for $deviceid and return the
# result of vm_mon_cmd().
sub qemu_devicedel {
    my ($vmid, $deviceid) = @_;

    my $result = vm_mon_cmd($vmid, "device_del", id => $deviceid);

    return $result;
}
3601
22de899a
AD
# Create the iothread object "iothread-$deviceid" for a device that has
# iothread set, unless vm_iothreads_list() already reports it.
# Does nothing when $device->{iothread} is false.
sub qemu_iothread_add {
    my($vmid, $deviceid, $device) = @_;

    if ($device->{iothread}) {
        my $object_id = "iothread-$deviceid";
        my $existing = vm_iothreads_list($vmid);

        qemu_objectadd($vmid, $object_id, "iothread") if !$existing->{$object_id};
    }
}
3610
# Remove the iothread object "iothread-$deviceid" when the drive configured
# under $deviceid has iothread set and vm_iothreads_list() reports the
# object.
#
# NOTE(review): the drive is looked up as $conf->{$deviceid}; for controller
# ids such as 'virtioscsiN' there is presumably no such config entry, so
# nothing would be removed - confirm against parse_drive().
sub qemu_iothread_del {
    my($conf, $vmid, $deviceid) = @_;

    my $drive = parse_drive($deviceid, $conf->{$deviceid});

    if ($drive->{iothread}) {
        my $object_id = "iothread-$deviceid";
        my $existing = vm_iothreads_list($vmid);

        qemu_objectdel($vmid, $object_id) if $existing->{$object_id};
    }
}
3620
4d3f29ed
AD
# Issue an 'object-add' monitor command creating object $objectid of QOM
# type $qomtype. Always returns 1.
sub qemu_objectadd {
    my($vmid, $objectid, $qomtype) = @_;

    my @params = (id => $objectid, "qom-type" => $qomtype);
    vm_mon_cmd($vmid, "object-add", @params);

    return 1;
}
3628
# Issue an 'object-del' monitor command for object $objectid.
# Always returns 1.
sub qemu_objectdel {
    my($vmid, $objectid) = @_;

    my @params = (id => $objectid);
    vm_mon_cmd($vmid, "object-del", @params);

    return 1;
}
3636
# Add a drive to the running VM with the human monitor 'drive_add' command.
#
# The drive string comes from print_drive_full(); backslashes in it are
# doubled before it is placed between double quotes on the command line.
# Returns 1 when the monitor output contains "OK", otherwise dies with
# that output.
sub qemu_driveadd {
    my ($storecfg, $vmid, $device) = @_;

    my $drive_str = print_drive_full($storecfg, $vmid, $device);
    $drive_str =~ s/\\/\\\\/g;

    my $output = vm_human_monitor_command($vmid, "drive_add auto \"$drive_str\"");

    # If the command succeeds qemu prints: "OK"
    if ($output =~ m/OK/s) {
        return 1;
    }

    die "adding drive failed: $output\n";
}
afdb31d5 3649
5e5dcb73
DA
# Remove the drive "drive-$deviceid" with the human monitor 'drive_del'
# command.
#
# Returns 1 when the output is empty after stripping leading whitespace,
# or when it reports the device as not found. Dies with the monitor
# output otherwise.
sub qemu_drivedel {
    my($vmid, $deviceid) = @_;

    my $output = vm_human_monitor_command($vmid, "drive_del drive-$deviceid");
    $output =~ s/^\s+//;

    if ($output eq "") {
        return 1;
    }

    # NB: device not found errors mean the drive was auto-deleted and we ignore the error
    if ($output =~ m/Device \'.*?\' not found/s) {
        return 1;
    }

    die "deleting drive $deviceid failed : $output\n";
}
f19d1c47 3663
# Wait until $deviceid shows up in vm_devices_list().
#
# The list is checked up to six times with a one second sleep after each
# unsuccessful check. Returns 1 as soon as the device is listed, dies
# otherwise.
sub qemu_deviceaddverify {
    my ($vmid, $deviceid) = @_;

    foreach my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if defined($present->{$deviceid});

        sleep 1;
    }

    die "error on hotplug device '$deviceid'\n";
}
afdb31d5 3675
5e5dcb73
DA
3676
# Wait until $deviceid has disappeared from vm_devices_list().
#
# The list is checked up to six times with a one second sleep after each
# unsuccessful check. Returns 1 as soon as the device is gone, dies
# otherwise.
sub qemu_devicedelverify {
    my ($vmid, $deviceid) = @_;

    # need to verify that the device is correctly removed as device_del
    # is async and empty return is not reliable

    foreach my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if !defined($present->{$deviceid});

        sleep 1;
    }

    die "error on hot-unplugging device '$deviceid'\n";
}
3691
# Make sure the SCSI controller needed by drive $device exists in the VM.
#
# The controller id is the prefix and controller number returned by
# scsihw_infos(), concatenated. When vm_devices_list() does not contain
# that id, the controller is hot-plugged through vm_deviceplug().
# Always returns 1.
sub qemu_findorcreatescsihw {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my ($maxdev, $controller, $controller_prefix) = scsihw_infos($conf, $device);
    my $controller_id = $controller_prefix . $controller;

    my $present = vm_devices_list($vmid);

    vm_deviceplug($storecfg, $conf, $vmid, $controller_id, $device)
        if !defined($present->{$controller_id});

    return 1;
}
3706
8ce30dde
AD
# Unplug the SCSI controller that belongs to the drive configured under
# $opt, unless it is still needed.
#
# With scsihw 'virtio-scsi-single' the controller "virtioscsi<index>" of
# the drive is unplugged directly. Otherwise the controller
# "scsihw<controller>" is kept when vm_devices_list() still contains a
# scsi drive whose index passes the check below, and unplugged when no
# such drive is found. Always returns 1.
sub qemu_deletescsihw {
    my ($conf, $vmid, $opt) = @_;

    my $device = parse_drive($opt, $conf->{$opt});

    my $single = $conf->{scsihw} && ($conf->{scsihw} eq 'virtio-scsi-single');
    if ($single) {
        vm_deviceunplug($vmid, $conf, "virtioscsi$device->{index}");
        return 1;
    }

    my ($maxdev, $controller, $controller_prefix) = scsihw_infos($conf, $device);

    my $present = vm_devices_list($vmid);
    foreach my $name (keys %{$present}) {
        next if !PVE::QemuServer::is_valid_drivename($name);

        my $drive = PVE::QemuServer::parse_drive($name, $conf->{$name});

        # another scsi drive still uses the controller - keep it
        return 1
            if $drive->{interface} eq 'scsi' && $drive->{index} < (($maxdev-1)*($controller+1));
    }

    vm_deviceunplug($vmid, $conf, "scsihw$controller");

    return 1;
}
3735
# Hot-plug the PCI bridge that device id $device needs, if any.
#
# print_pci_addr() is called only to fill a scratch bridge hash for
# $device. The last key of that hash, in hash iteration order, is taken as
# the bridge number. Nothing is done when there is no key or the number is
# below 1; otherwise "pci.<n>" is plugged through vm_deviceplug() unless
# vm_devices_list() already contains it. Always returns 1.
sub qemu_add_pci_bridge {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $bridges = {};
    print_pci_addr($device, $bridges);

    my $bridgeid;
    foreach my $key (keys %$bridges) {
        $bridgeid = $key;
    }

    return 1 if !defined($bridgeid) || $bridgeid < 1;

    my $bridge = "pci.$bridgeid";
    my $present = vm_devices_list($vmid);

    vm_deviceplug($storecfg, $conf, $vmid, $bridge) if !defined($present->{$bridge});

    return 1;
}
3759
25088687
DM
# Send the monitor command "set_link" for network device $device; a true
# $up is sent as JSON true, anything else as JSON false.
sub qemu_set_link_status {
    my ($vmid, $device, $up) = @_;

    my $link_state = $up ? JSON::true : JSON::false;

    vm_mon_cmd($vmid, "set_link", name => $device, up => $link_state);
}
3766
2630d2a9
DA
# Add a network backend to the running VM.
#
# The netdev description produced by print_netdev_full() is a string of
# "key=value" pairs separated by commas; it is split into a hash and passed
# to the monitor command "netdev_add". Returns 1.
sub qemu_netdevadd {
    my ($vmid, $conf, $device, $deviceid) = @_;

    my $netdev = print_netdev_full($vmid, $conf, $device, $deviceid, 1);
    my %netdev_args = split(/[=,]/, $netdev);

    vm_mon_cmd($vmid, "netdev_add", %netdev_args);

    return 1;
}
3776
# Remove the network backend with id $deviceid via the monitor command
# "netdev_del"; the result of vm_mon_cmd() is passed through.
sub qemu_netdevdel {
    my ($vmid, $deviceid) = @_;

    return vm_mon_cmd($vmid, "netdev_del", id => $deviceid);
}
3782
16521d63
DC
# Replace the USB device $deviceid of a running VM with the one described
# by $device (a hash with at least 'host', optionally 'usb3').
#
# Does nothing when $device is false. Otherwise the existing device is
# unplugged first, an xhci controller is added when a usb3 device is
# requested and no 'xhci' device is listed yet, and finally the new device
# is plugged.
sub qemu_usb_hotplug {
    my ($storecfg, $conf, $vmid, $deviceid, $device) = @_;

    return if !$device;

    # remove the old one first
    vm_deviceunplug($vmid, $conf, $deviceid);

    # usb3 devices need an xhci controller - add it if it is not there yet
    if ($device->{usb3}) {
        my $present = vm_devices_list($vmid);
        qemu_deviceadd($vmid, "nec-usb-xhci,id=xhci" . print_pci_addr("xhci"))
            if !$present->{xhci};
    }

    my $usbdev = parse_usb_device($device->{host});
    $usbdev->{usb3} = $device->{usb3};

    # add the new one
    vm_deviceplug($storecfg, $conf, $vmid, $deviceid, $usbdev);
}
3807
# Bring the number of vCPUs of a running VM to $vcpus.
#
# $vcpus defaults to the maximum (sockets * cores) when false and may not
# exceed it. Lowering the count unplugs "cpu<N>" devices one by one and
# requires the machine feature level 2.7; raising it either plugs cpu
# devices (feature level 2.7) or falls back to the "cpu-add" monitor
# command. On the device based paths $conf->{vcpus} is updated and written
# after every single successful step.
sub qemu_cpu_hotplug {
    my ($vmid, $conf, $vcpus) = @_;

    my $machine_type = PVE::QemuServer::get_current_qemu_machine($vmid);

    # 'sockets' takes precedence over the old style 'smp' setting
    my $sockets = $conf->{sockets} || $conf->{smp} || 1;
    my $cores = $conf->{cores} || 1;
    my $maxcpus = $sockets * $cores;

    $vcpus = $maxcpus if !$vcpus;

    die "you can't add more vcpus than maxcpus\n"
        if $vcpus > $maxcpus;

    my $currentvcpus = $conf->{vcpus} || $maxcpus;

    # Poll "query-cpus" once per second until it reports $expected cpus;
    # raises a parameter exception once more than $max_retries retries were
    # needed. Returns the last query result.
    my $wait_for_vcpu_count = sub {
        my ($expected, $max_retries, $errmsg) = @_;

        my $running;
        for (my $retry = 0; ; $retry++) {
            $running = vm_mon_cmd($vmid, "query-cpus");
            last if scalar(@{$running}) == $expected;
            raise_param_exc({ vcpus => $errmsg }) if $retry > $max_retries;
            sleep 1;
        }
        return $running;
    };

    if ($vcpus < $currentvcpus) {
        die "cpu hot-unplugging requires qemu version 2.7 or higher\n"
            if !qemu_machine_feature_enabled($machine_type, undef, 2, 7);

        for (my $i = $currentvcpus; $i > $vcpus; $i--) {
            qemu_devicedel($vmid, "cpu$i");
            my $running = $wait_for_vcpu_count->($i - 1, 5, "error unplugging cpu$i");

            # update conf after each successful cpu unplug
            $conf->{vcpus} = scalar(@{$running});
            PVE::QemuConfig->write_config($vmid, $conf);
        }

        return;
    }

    my $currentrunningvcpus = vm_mon_cmd($vmid, "query-cpus");
    die "vcpus in running vm does not match its configuration\n"
        if scalar(@{$currentrunningvcpus}) != $currentvcpus;

    if (qemu_machine_feature_enabled($machine_type, undef, 2, 7)) {

        for (my $i = $currentvcpus+1; $i <= $vcpus; $i++) {
            qemu_deviceadd($vmid, print_cpu_device($conf, $i));
            my $running = $wait_for_vcpu_count->($i, 10, "error hotplugging cpu$i");

            # update conf after each successful cpu hotplug
            $conf->{vcpus} = scalar(@{$running});
            PVE::QemuConfig->write_config($vmid, $conf);
        }
    } else {

        for (my $i = $currentvcpus; $i < $vcpus; $i++) {
            vm_mon_cmd($vmid, "cpu-add", id => int($i));
        }
    }
}
3882
# Apply I/O throttling limits to block device $deviceid of a running VM.
#
# After $vmid and $deviceid the caller passes 18 positional limits, in the
# order listed in @limit_names below. Each value is converted with int()
# and sent under that name with the monitor command
# "block_set_io_throttle". Returns early (nothing sent) when the VM is not
# running.
sub qemu_block_set_io_throttle {
    my ($vmid, $deviceid, @limits) = @_;

    return if !check_running($vmid);

    # monitor argument names, in the positional order of @limits
    my @limit_names = qw(
        bps bps_rd bps_wr
        iops iops_rd iops_wr
        bps_max bps_rd_max bps_wr_max
        iops_max iops_rd_max iops_wr_max
        bps_max_length bps_rd_max_length bps_wr_max_length
        iops_max_length iops_rd_max_length iops_wr_max_length
    );

    my @throttle_args = map {
        ($limit_names[$_], int($limits[$_]))
    } 0 .. $#limit_names;

    vm_mon_cmd($vmid, "block_set_io_throttle", device => $deviceid, @throttle_args);
}
3914
# old code, only used to shutdown old VM after update
#
# Read monitor output from $fh until the human monitor prompt "(qemu) "
# terminates the collected data or the peer closes the connection.
#
# Parameters:
#   $fh      - handle to read from (must work with IO::Select and sysread)
#   $timeout - seconds to wait for each chunk of data
#
# Returns the collected output with the trailing prompt removed.
# Dies with the system error on a read error, and with
# "monitor read timeout" when no data arrives within $timeout.
sub __read_avail {
    my ($fh, $timeout) = @_;

    my $sel = IO::Select->new();
    $sel->add($fh);

    my $res = '';
    my $buf;

    my @ready;
    while (scalar (@ready = $sel->can_read($timeout))) {
        my $count = $fh->sysread($buf, 8192);
        die "$!\n" if !defined($count);
        last if !$count; # EOF

        $res .= $buf;

        # Check everything collected so far, not only the latest chunk:
        # the prompt may arrive split across two reads.
        last if $res =~ s/\(qemu\) \n?\z//;
    }

    die "monitor read timeout\n" if !scalar(@ready);

    return $res;
}
3947
# old code, only used to shutdown old VM after update
#
# Send $cmdstr to the human monitor socket "<var_run_tmpdir>/<vmid>.mon"
# and return its output (command echo removed, lines joined with "\n").
# For 'q' and 'quit' no answer is read and undef is returned. Any failure
# is written to syslog and re-thrown.
sub vm_monitor_command {
    my ($vmid, $cmdstr, $nocheck) = @_;

    my $res;

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);

        my $sname = "${var_run_tmpdir}/$vmid.mon";

        my $sock = IO::Socket::UNIX->new( Peer => $sname ) ||
            die "unable to connect to VM $vmid socket - $!\n";

        # hack: migrate sometime blocks the monitor (when migrate_downtime
        # is set)
        my $is_migrate_cmd = $cmdstr =~ m/^(info\s+migrate|migrate\s)/;

        my $timeout = $is_migrate_cmd ? 60*60 : 3; # 1 hour for migrate

        # read banner
        my $banner = __read_avail($sock, $timeout);
        die "got unexpected qemu monitor banner\n"
            if $banner !~ m/^QEMU\s+(\S+)\s+monitor\s/;

        my $sel = IO::Select->new();
        $sel->add($sock);

        if (!scalar(my @ready = $sel->can_write($timeout))) {
            die "monitor write error - timeout";
        }

        my $fullcmd = "$cmdstr\r";

        # syslog('info', "VM $vmid monitor command: $cmdstr");

        my $written = $sock->syswrite($fullcmd);
        if (!$written || ($written != length($fullcmd))) {
            die "monitor write error - $!";
        }

        return if ($cmdstr eq 'q') || ($cmdstr eq 'quit');

        if ($is_migrate_cmd) {
            $timeout = 60*60; # 1 hour
        } elsif ($cmdstr =~ m/^(eject|change)/) {
            $timeout = 60; # note: cdrom mount command is slow
        } else {
            $timeout = 20;
        }

        if ($res = __read_avail($sock, $timeout)) {

            my @lines = split("\r?\n", $res);

            shift @lines if $lines[0] !~ m/^unknown command/; # skip echo

            $res = join("\n", @lines) . "\n";
        }
    };

    if (my $err = $@) {
        syslog("err", "VM $vmid monitor command failed - $err");
        die $err;
    }

    return $res;
}
4022
c1175c92
AD
# Resize volume $volid to $size through the storage layer and, if the VM
# is running, send the monitor command "block_resize" for $deviceid.
#
# When PVE::Storage::volume_resize() returns a false value the size sent
# to the monitor is 0 instead of $size.
sub qemu_block_resize {
    my ($vmid, $deviceid, $storecfg, $volid, $size) = @_;

    my $running = check_running($vmid);

    my $resized = PVE::Storage::volume_resize($storecfg, $volid, $size, $running);

    return if !$running;

    vm_mon_cmd($vmid, "block_resize", device => $deviceid, size => $resized ? int($size) : 0);
}
4035
1ab0057c
AD
# Create snapshot $snap of volume $volid.
#
# Uses the monitor command "snapshot-drive" when the VM is running and
# do_snapshots_with_qemu() is true for the volume; otherwise the snapshot
# is taken by the storage layer.
sub qemu_volume_snapshot {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    if (check_running($vmid) && do_snapshots_with_qemu($storecfg, $volid)) {
        return vm_mon_cmd($vmid, "snapshot-drive", device => $deviceid, name => $snap);
    }

    return PVE::Storage::volume_snapshot($storecfg, $volid, $snap);
}
4047
fc46aff9
AD
# Delete snapshot $snap of volume $volid.
#
# Uses the monitor command "delete-drive-snapshot" when the VM is running
# and do_snapshots_with_qemu() is true for the volume; otherwise the
# storage layer removes the snapshot (and is told whether the VM runs).
sub qemu_volume_snapshot_delete {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $running = check_running($vmid);

    if ($running && do_snapshots_with_qemu($storecfg, $volid)) {
        return vm_mon_cmd($vmid, "delete-drive-snapshot", device => $deviceid, name => $snap);
    }

    return PVE::Storage::volume_snapshot_delete($storecfg, $volid, $snap, $running);
}
4059
264e519f
DM
# Set the migration capabilities of VM $vmid.
#
# Every capability reported by "query-migrate-capabilities" is sent back
# with "migrate-set-capabilities": enabled if it has a true entry in the
# table below, disabled otherwise (including capabilities not listed).
sub set_migration_caps {
    my ($vmid) = @_;

    my $enabled_cap = {
        "auto-converge" => 1,
        "xbzrle" => 1,
        "x-rdma-pin-all" => 0,
        "zero-blocks" => 0,
        "compress" => 0
    };

    my $supported_capabilities = vm_mon_cmd_nocheck($vmid, "query-migrate-capabilities");

    my @cap_states;
    for my $supported (@$supported_capabilities) {
        my $name = $supported->{capability};
        push @cap_states, {
            capability => $name,
            state => $enabled_cap->{$name} ? JSON::true : JSON::false,
        };
    }

    vm_mon_cmd_nocheck($vmid, "migrate-set-capabilities", capabilities => \@cap_states);
}
a89fded1 4084
# Options which vmconfig_hotplug_pending() copies from the pending section
# straight into the config, without touching the running VM.
my $fast_plug_option = {
    map { $_ => 1 } qw(
        lock
        name
        onboot
        shares
        startup
        description
        protection
    )
};
4094
3a11fadb
DM
# hotplug changes in [PENDING]
#
# Applies pending changes of $conf to the running VM, in three steps:
#   1. options listed in $fast_plug_option are committed unconditionally
#   2. pending deletions are processed
#   3. pending additions/changes are processed
# After each successfully applied option the config is written and
# reloaded. An option whose handler dies with "skip\n" simply stays
# pending; any other error is recorded in $errors.
#
# $selection hash can be used to only apply specified options, for
# example: { cores => 1 } (only apply changed 'cores')
# $errors ref is used to return error messages
sub vmconfig_hotplug_pending {
    my ($vmid, $conf, $storecfg, $selection, $errors) = @_;

    my $defaults = load_defaults();

    my $add_error = sub {
        my ($opt, $msg) = @_;
        $errors->{$opt} = "hotplug problem - $msg";
    };

    # commit values which do not have any impact on running VM first
    # Note: those options cannot raise errors, so we do not care about
    # $selection and always apply them.
    my @fast_opts = grep { $fast_plug_option->{$_} } keys %{$conf->{pending}};
    for my $opt (@fast_opts) {
        $conf->{$opt} = delete $conf->{pending}->{$opt};
    }

    if (@fast_opts) {
        PVE::QemuConfig->write_config($vmid, $conf);
        $conf = PVE::QemuConfig->load_config($vmid); # update/reload
    }

    my $hotplug_features = parse_hotplug_features(defined($conf->{hotplug}) ? $conf->{hotplug} : '1');

    # --- pending deletions ---
    my $pending_delete_hash = split_flagged_list($conf->{pending}->{delete});
    while (my ($opt, $force) = each %$pending_delete_hash) {
        next if $selection && !$selection->{$opt};

        eval {
            if ($opt eq 'hotplug') {
                die "skip\n" if ($conf->{hotplug} =~ /memory/);
            } elsif ($opt eq 'tablet') {
                die "skip\n" if !$hotplug_features->{usb};
                # deleting the option falls back to the default setting
                if ($defaults->{tablet}) {
                    vm_deviceplug($storecfg, $conf, $vmid, $opt);
                } else {
                    vm_deviceunplug($vmid, $conf, $opt);
                }
            } elsif ($opt =~ m/^usb\d+/) {
                # since we cannot reliably hot unplug usb devices
                # we are disabling it
                die "skip\n";
                # (currently unreachable) former hot-unplug code:
                die "skip\n" if !$hotplug_features->{usb} || $conf->{$opt} =~ m/spice/i;
                vm_deviceunplug($vmid, $conf, $opt);
            } elsif ($opt eq 'vcpus') {
                die "skip\n" if !$hotplug_features->{cpu};
                qemu_cpu_hotplug($vmid, $conf, undef);
            } elsif ($opt eq 'balloon') {
                # enable balloon device is not hotpluggable
                die "skip\n" if !defined($conf->{balloon}) || $conf->{balloon};
            } elsif ($fast_plug_option->{$opt}) {
                # do nothing
            } elsif ($opt =~ m/^net(\d+)$/) {
                die "skip\n" if !$hotplug_features->{network};
                vm_deviceunplug($vmid, $conf, $opt);
            } elsif (is_valid_drivename($opt)) {
                die "skip\n" if !$hotplug_features->{disk} || $opt =~ m/(ide|sata)(\d+)/;
                vm_deviceunplug($vmid, $conf, $opt);
                vmconfig_delete_or_detach_drive($vmid, $storecfg, $conf, $opt, $force);
            } elsif ($opt =~ m/^memory$/) {
                die "skip\n" if !$hotplug_features->{memory};
                PVE::QemuServer::Memory::qemu_memory_hotplug($vmid, $conf, $defaults, $opt);
            } elsif ($opt eq 'cpuunits') {
                cgroups_write("cpu", $vmid, "cpu.shares", $defaults->{cpuunits});
            } elsif ($opt eq 'cpulimit') {
                cgroups_write("cpu", $vmid, "cpu.cfs_quota_us", -1);
            } else {
                die "skip\n";
            }
        };

        if (my $err = $@) {
            $add_error->($opt, $err) if $err ne "skip\n";
        } else {
            # save new config if hotplug was successful
            delete $conf->{$opt};
            vmconfig_undelete_pending_option($conf, $opt);
            PVE::QemuConfig->write_config($vmid, $conf);
            $conf = PVE::QemuConfig->load_config($vmid); # update/reload
        }
    }

    # --- pending additions / changes ---
    for my $opt (keys %{$conf->{pending}}) {
        next if $selection && !$selection->{$opt};

        my $value = $conf->{pending}->{$opt};

        eval {
            if ($opt eq 'hotplug') {
                die "skip\n" if ($value =~ /memory/) || ($value !~ /memory/ && $conf->{hotplug} =~ /memory/);
            } elsif ($opt eq 'tablet') {
                die "skip\n" if !$hotplug_features->{usb};
                if ($value == 1) {
                    vm_deviceplug($storecfg, $conf, $vmid, $opt);
                } elsif ($value == 0) {
                    vm_deviceunplug($vmid, $conf, $opt);
                }
            } elsif ($opt =~ m/^usb\d+$/) {
                # since we cannot reliably hot unplug usb devices
                # we are disabling it
                die "skip\n";
                # (currently unreachable) former hotplug code:
                die "skip\n" if !$hotplug_features->{usb} || $value =~ m/spice/i;
                my $d = eval { PVE::JSONSchema::parse_property_string($usbdesc->{format}, $value) };
                die "skip\n" if !$d;
                qemu_usb_hotplug($storecfg, $conf, $vmid, $opt, $d);
            } elsif ($opt eq 'vcpus') {
                die "skip\n" if !$hotplug_features->{cpu};
                qemu_cpu_hotplug($vmid, $conf, $value);
            } elsif ($opt eq 'balloon') {
                # enable/disable ballooning device is not hotpluggable
                my $old_balloon_enabled = !!(!defined($conf->{balloon}) || $conf->{balloon});
                my $new_balloon_enabled = !!(!defined($conf->{pending}->{balloon}) || $conf->{pending}->{balloon});
                die "skip\n" if $old_balloon_enabled != $new_balloon_enabled;

                # allow manual ballooning if shares is set to zero
                if ((defined($conf->{shares}) && ($conf->{shares} == 0))) {
                    my $balloon = $conf->{pending}->{balloon} || $conf->{memory} || $defaults->{memory};
                    vm_mon_cmd($vmid, "balloon", value => $balloon*1024*1024);
                }
            } elsif ($opt =~ m/^net(\d+)$/) {
                # some changes can be done without hotplug
                vmconfig_update_net($storecfg, $conf, $hotplug_features->{network},
                                    $vmid, $opt, $value);
            } elsif (is_valid_drivename($opt)) {
                # some changes can be done without hotplug
                vmconfig_update_disk($storecfg, $conf, $hotplug_features->{disk},
                                     $vmid, $opt, $value, 1);
            } elsif ($opt =~ m/^memory$/) { #dimms
                die "skip\n" if !$hotplug_features->{memory};
                # the value stored in the config is whatever the memory hotplug returns
                $value = PVE::QemuServer::Memory::qemu_memory_hotplug($vmid, $conf, $defaults, $opt, $value);
            } elsif ($opt eq 'cpuunits') {
                cgroups_write("cpu", $vmid, "cpu.shares", $conf->{pending}->{$opt});
            } elsif ($opt eq 'cpulimit') {
                # a limit of 0 is written as -1, everything else scaled by 100000
                my $cpulimit = $conf->{pending}->{$opt} == 0 ? -1 : int($conf->{pending}->{$opt} * 100000);
                cgroups_write("cpu", $vmid, "cpu.cfs_quota_us", $cpulimit);
            } else {
                die "skip\n"; # skip non-hot-pluggable options
            }
        };

        if (my $err = $@) {
            $add_error->($opt, $err) if $err ne "skip\n";
        } else {
            # save new config if hotplug was successful
            $conf->{$opt} = $value;
            delete $conf->{pending}->{$opt};
            PVE::QemuConfig->write_config($vmid, $conf);
            $conf = PVE::QemuConfig->load_config($vmid); # update/reload
        }
    }
}
055d554d 4251
3dc38fbb
WB
# Try to free the volume behind $drive (config key $key).
#
# Only acts when $force is set or $key is an 'unused' entry, and the drive
# is not a cdrom; otherwise returns undef. If the VM owns the volume, the
# caller's 'Datastore.AllocateSpace' permission on the storage is checked,
# the volume must not be in use anymore, and it is freed. Returns 1 in
# both the owner and the non-owner case.
sub try_deallocate_drive {
    my ($storecfg, $vmid, $conf, $key, $drive, $rpcenv, $authuser, $force) = @_;

    return undef if !($force || $key =~ /^unused/);
    return undef if drive_is_cdrom($drive, 1);

    my $volid = $drive->{file};

    if (vm_is_volid_owner($storecfg, $vmid, $volid)) {
        my $sid = PVE::Storage::parse_volume_id($volid);
        $rpcenv->check($authuser, "/storage/$sid", ['Datastore.AllocateSpace']);

        # check if the disk is really unused
        die "unable to delete '$volid' - volume is still in use (snapshot?)\n"
            if is_volume_in_use($storecfg, $conf, $key, $volid);

        PVE::Storage::vdisk_free($storecfg, $volid);
    }

    # If vm is not owner of this disk it is only removed from the config
    return 1;
}
4274
# Handle removal of drive option $opt: without $force the drive is
# registered as unused; with $force the 'VM.Config.Disk' permission is
# checked and try_deallocate_drive() is called for it.
sub vmconfig_delete_or_detach_drive {
    my ($vmid, $storecfg, $conf, $opt, $force) = @_;

    my $drive = parse_drive($opt, $conf->{$opt});

    my $rpcenv = PVE::RPCEnvironment::get();
    my $authuser = $rpcenv->get_user();

    # detach only
    return vmconfig_register_unused_drive($storecfg, $vmid, $conf, $drive)
        if !$force;

    $rpcenv->check_vm_perm($authuser, $vmid, undef, ['VM.Config.Disk']);
    try_deallocate_drive($storecfg, $vmid, $conf, $opt, $drive, $rpcenv, $authuser, $force);
}
4290
# Apply all pending changes to the stored configuration (cold plug).
#
# Pending deletions are handled first, then pending additions/changes. The
# config is reloaded before and written after every single option. Drives
# that get deleted go through vmconfig_delete_or_detach_drive(); drives
# that get replaced are registered as unused.
sub vmconfig_apply_pending {
    my ($vmid, $conf, $storecfg) = @_;

    # cold plug

    my $pending_delete_hash = split_flagged_list($conf->{pending}->{delete});
    while (my ($opt, $force) = each %$pending_delete_hash) {
        die "internal error" if $opt =~ m/^unused/;
        $conf = PVE::QemuConfig->load_config($vmid); # update/reload

        if (defined($conf->{$opt})) {
            vmconfig_delete_or_detach_drive($vmid, $storecfg, $conf, $opt, $force)
                if is_valid_drivename($opt);
            vmconfig_undelete_pending_option($conf, $opt);
            delete $conf->{$opt};
        } else {
            # option is not set - only drop it from the pending delete list
            vmconfig_undelete_pending_option($conf, $opt);
        }

        PVE::QemuConfig->write_config($vmid, $conf);
    }

    $conf = PVE::QemuConfig->load_config($vmid); # update/reload

    for my $opt (keys %{$conf->{pending}}) { # add/change
        $conf = PVE::QemuConfig->load_config($vmid); # update/reload

        my $unchanged = defined($conf->{$opt}) && ($conf->{$opt} eq $conf->{pending}->{$opt});

        if (!$unchanged) {
            # a replaced drive is kept as unused
            vmconfig_register_unused_drive($storecfg, $vmid, $conf, parse_drive($opt, $conf->{$opt}))
                if is_valid_drivename($opt) && defined($conf->{$opt});

            $conf->{$opt} = $conf->{pending}->{$opt};
        }

        delete $conf->{pending}->{$opt};
        PVE::QemuConfig->write_config($vmid, $conf);
    }
}
4334
3eec5767
DM
# Numeric "not equal" which tolerates undef: two undefined values are equal
# (returns 0), exactly one undefined value is unequal (returns 1), and two
# defined values are compared with '!='.
my $safe_num_ne = sub {
    my ($lhs, $rhs) = @_;

    return $lhs != $rhs if defined($lhs) && defined($rhs);

    return (defined($lhs) || defined($rhs)) ? 1 : 0;
};
4344
# String "not equal" which tolerates undef: two undefined values are equal
# (returns 0), exactly one undefined value is unequal (returns 1), and two
# defined values are compared with 'ne'.
my $safe_string_ne = sub {
    my ($lhs, $rhs) = @_;

    return $lhs ne $rhs if defined($lhs) && defined($rhs);

    return (defined($lhs) || defined($rhs)) ? 1 : 0;
};
4354
# Apply a changed network option $opt (new value $value) to a running VM.
#
# If the device exists and only bridge, tag, trunks, firewall, rate or
# link state differ, the change is applied online on the tap interface /
# via set_link and 1 is returned. A change of model, macaddr, queues, or a
# switch between bridged and non-bridged mode needs a hot-unplug followed
# by a hotplug of the new device. Dies with "skip\n" when that is required
# but $hotplug is not enabled.
sub vmconfig_update_net {
    my ($storecfg, $conf, $hotplug, $vmid, $opt, $value) = @_;

    my $newnet = parse_net($value);

    if ($conf->{$opt}) {
        my $oldnet = parse_net($conf->{$opt});

        my $needs_replug =
            $safe_string_ne->($oldnet->{model}, $newnet->{model}) ||
            $safe_string_ne->($oldnet->{macaddr}, $newnet->{macaddr}) ||
            $safe_num_ne->($oldnet->{queues}, $newnet->{queues}) ||
            !($newnet->{bridge} && $oldnet->{bridge}); # bridge/nat mode change

        if (!$needs_replug) {

            die "internal error" if $opt !~ m/net(\d+)/;
            my $iface = "tap${vmid}i$1";

            my $replug_tap =
                $safe_string_ne->($oldnet->{bridge}, $newnet->{bridge}) ||
                $safe_num_ne->($oldnet->{tag}, $newnet->{tag}) ||
                $safe_string_ne->($oldnet->{trunks}, $newnet->{trunks}) ||
                $safe_num_ne->($oldnet->{firewall}, $newnet->{firewall});

            if ($replug_tap) {
                PVE::Network::tap_unplug($iface);
                PVE::Network::tap_plug($iface, $newnet->{bridge}, $newnet->{tag}, $newnet->{firewall}, $newnet->{trunks}, $newnet->{rate});
            } elsif ($safe_num_ne->($oldnet->{rate}, $newnet->{rate})) {
                # Rate can be applied on its own but any change above needs to
                # include the rate in tap_plug since OVS resets everything.
                PVE::Network::tap_rate_limit($iface, $newnet->{rate});
            }

            if ($safe_string_ne->($oldnet->{link_down}, $newnet->{link_down})) {
                qemu_set_link_status($vmid, $opt, !$newnet->{link_down});
            }

            return 1;
        }

        # for non online change, we try to hot-unplug
        die "skip\n" if !$hotplug;
        vm_deviceunplug($vmid, $conf, $opt);
    }

    die "skip\n" if !$hotplug;

    vm_deviceplug($storecfg, $conf, $vmid, $opt, $newnet);
}
4402
# Apply a changed drive option $opt (new value $value) to a running VM.
#
# For an existing drive:
#  - changing the media type is refused
#  - cdrom: the medium is ejected and, unless the new file is 'none', the
#    new image is inserted; returns 1
#  - disk with the same volume: dies with "skip\n" if discard, iothread,
#    queues or cache differ; otherwise changed throttle limits are applied
#    online; returns 1
#  - disk with a different volume: the old one is unplugged and registered
#    as unused, then the new one is hot-plugged
# New drives are hot-plugged. Dies with "skip\n" when hotplug would be
# needed but $hotplug is off, or the option name matches ide/sata.
sub vmconfig_update_disk {
    my ($storecfg, $conf, $hotplug, $vmid, $opt, $value, $force) = @_;

    # fixme: do we need force?

    my $drive = parse_drive($opt, $value);

    my $old_drive = $conf->{$opt} ? parse_drive($opt, $conf->{$opt}) : undef;

    if ($old_drive) {

        my $media = $drive->{media} || 'disk';
        my $oldmedia = $old_drive->{media} || 'disk';
        die "unable to change media type\n" if $media ne $oldmedia;

        if (drive_is_cdrom($old_drive)) {

            if ($drive->{file} eq 'none') {
                vm_mon_cmd($vmid, "eject",force => JSON::true,device => "drive-$opt");
            } else {
                my $path = get_iso_path($storecfg, $vmid, $drive->{file});
                vm_mon_cmd($vmid, "eject", force => JSON::true,device => "drive-$opt"); # force eject if locked
                vm_mon_cmd($vmid, "change", device => "drive-$opt",target => "$path") if $path;
            }

            return 1;
        }

        if ($drive->{file} eq $old_drive->{file}) {
            # update existing disk

            # skip non hotpluggable value
            if ($safe_string_ne->($drive->{discard}, $old_drive->{discard}) ||
                $safe_string_ne->($drive->{iothread}, $old_drive->{iothread}) ||
                $safe_string_ne->($drive->{queues}, $old_drive->{queues}) ||
                $safe_string_ne->($drive->{cache}, $old_drive->{cache})) {
                die "skip\n";
            }

            # throttle settings, grouped by how they are passed to the monitor
            my @mbps_keys = qw(mbps mbps_rd mbps_wr);
            my @iops_keys = qw(iops iops_rd iops_wr);
            my @mbps_max_keys = qw(mbps_max mbps_rd_max mbps_wr_max);
            my @iops_max_keys = qw(iops_max iops_rd_max iops_wr_max);
            my @length_keys = qw(
                bps_max_length bps_rd_max_length bps_wr_max_length
                iops_max_length iops_rd_max_length iops_wr_max_length
            );

            my $throttle_changed = 0;
            for my $key (@mbps_keys, @iops_keys, @mbps_max_keys, @iops_max_keys, @length_keys) {
                next if !$safe_num_ne->($drive->{$key}, $old_drive->{$key});
                $throttle_changed = 1;
                last;
            }

            # apply throttle
            if ($throttle_changed) {
                qemu_block_set_io_throttle($vmid,"drive-$opt",
                    (map { ($drive->{$_} || 0)*1024*1024 } @mbps_keys),
                    (map { $drive->{$_} || 0 } @iops_keys),
                    (map { ($drive->{$_} || 0)*1024*1024 } @mbps_max_keys),
                    (map { $drive->{$_} || 0 } @iops_max_keys),
                    (map { $drive->{$_} || 1 } @length_keys));
            }

            return 1;
        }

        # different volume: needs hotplug
        die "skip\n" if !$hotplug;

        # unplug and register as unused
        vm_deviceunplug($vmid, $conf, $opt);
        vmconfig_register_unused_drive($storecfg, $vmid, $conf, $old_drive);
    }

    die "skip\n" if !$hotplug || $opt =~ m/(ide|sata)(\d+)/;

    # hotplug new disks
    PVE::Storage::activate_volumes($storecfg, [$drive->{file}]) if $drive->{file} !~ m|^/dev/.+|;
    vm_deviceplug($storecfg, $conf, $vmid, $opt, $drive);
}
4504
1e3baf05 4505sub vm_start {
ba9e1000 4506 my ($storecfg, $vmid, $statefile, $skiplock, $migratedfrom, $paused,
2189246c 4507 $forcemachine, $spice_ticket, $migration_network, $migration_type, $targetstorage) = @_;
1e3baf05 4508
ffda963f
FG
4509 PVE::QemuConfig->lock_config($vmid, sub {
4510 my $conf = PVE::QemuConfig->load_config($vmid, $migratedfrom);
1e3baf05 4511
ffda963f 4512 die "you can't start a vm if it's a template\n" if PVE::QemuConfig->is_template($conf);
3dcb98d5 4513
ffda963f 4514 PVE::QemuConfig->check_lock($conf) if !$skiplock;
1e3baf05 4515
7e8dcf2c 4516 die "VM $vmid already running\n" if check_running($vmid, undef, $migratedfrom);
1e3baf05 4517
055d554d 4518 if (!$statefile && scalar(keys %{$conf->{pending}})) {
3a11fadb 4519 vmconfig_apply_pending($vmid, $conf, $storecfg);
ffda963f 4520 $conf = PVE::QemuConfig->load_config($vmid); # update/reload
055d554d
DM
4521 }
4522
6c47d546
DM
4523 my $defaults = load_defaults();
4524
4525 # set environment variable useful inside network script
4526 $ENV{PVE_MIGRATED_FROM} = $migratedfrom if $migratedfrom;
4527
2189246c
AD
4528 my $local_volumes = {};
4529
3b4cf0f0 4530 if ($targetstorage) {
2189246c
AD
4531 foreach_drive($conf, sub {
4532 my ($ds, $drive) = @_;
4533
4534 return if drive_is_cdrom($drive);
4535
4536 my $volid = $drive->{file};
4537
4538 return if !$volid;
4539
4540 my ($storeid, $volname) = PVE::Storage::parse_volume_id($volid);
4541
4542 my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
4543 return if $scfg->{shared};
4544 $local_volumes->{$ds} = [$volid, $storeid, $volname];
4545 });
4546
4547 my $format = undef;
4548
4549 foreach my $opt (sort keys %$local_volumes) {
4550
4551 my ($volid, $storeid, $volname) = @{$local_volumes->{$opt}};
4552 my $drive = parse_drive($opt, $conf->{$opt});
4553
4554 #if remote storage is specified, use default format
4555 if ($targetstorage && $targetstorage ne "1") {
4556 $storeid = $targetstorage;
4557 my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($storecfg, $storeid);
4558 $format = $defFormat;
4559 } else {
4560 #else we use same format than original
4561 my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
4562 $format = qemu_img_format($scfg, $volid);
4563 }
4564
4565 my $newvolid = PVE::Storage::vdisk_alloc($storecfg, $storeid, $vmid, $format, undef, ($drive->{size}/1024));
4566 my $newdrive = $drive;
4567 $newdrive->{format} = $format;
4568 $newdrive->{file} = $newvolid;
4569 my $drivestr = PVE::QemuServer::print_drive($vmid, $newdrive);
4570 $local_volumes->{$opt} = $drivestr;
4571 #pass drive to conf for command line
4572 $conf->{$opt} = $drivestr;
4573 }
4574 }
4575
67812f9c 4576 my ($cmd, $vollist, $spice_port) = config_to_command($storecfg, $vmid, $conf, $defaults, $forcemachine);
6c47d546 4577
1e3baf05 4578 my $migrate_port = 0;
5bc1e039 4579 my $migrate_uri;
1e3baf05
DM
4580 if ($statefile) {
4581 if ($statefile eq 'tcp') {
5bc1e039
SP
4582 my $localip = "localhost";
4583 my $datacenterconf = PVE::Cluster::cfs_read_file('datacenter.cfg');
af0eba7e 4584 my $nodename = PVE::INotify::nodename();
2de2d6f7 4585
b7a5a225
TL
4586 if (!defined($migration_type)) {
4587 if (defined($datacenterconf->{migration}->{type})) {
4588 $migration_type = $datacenterconf->{migration}->{type};
4589 } else {
4590 $migration_type = 'secure';
4591 }
4592 }
4593
2de2d6f7
TL
4594 if ($migration_type eq 'insecure') {
4595 my $migrate_network_addr = PVE::Cluster::get_local_migration_ip($migration_network);
4596 if ($migrate_network_addr) {
4597 $localip = $migrate_network_addr;
4598 } else {
5bc1e039 4599 $localip = PVE::Cluster::remote_node_ip($nodename, 1);
2de2d6f7
TL
4600 }
4601
4602 $localip = "[$localip]" if Net::IP::ip_is_ipv6($localip);
5bc1e039 4603 }
2de2d6f7 4604
af0eba7e
WB
4605 my $pfamily = PVE::Tools::get_host_address_family($nodename);
4606 $migrate_port = PVE::Tools::next_migrate_port($pfamily);
407e0b8b 4607 $migrate_uri = "tcp:${localip}:${migrate_port}";
6c47d546
DM
4608 push @$cmd, '-incoming', $migrate_uri;
4609 push @$cmd, '-S';
1c9d54bf
TL
4610
4611 } elsif ($statefile eq 'unix') {
4612 # should be default for secure migrations as a ssh TCP forward
4613 # tunnel is not deterministic reliable ready and fails regurarly
4614 # to set up in time, so use UNIX socket forwards
54323eed
TL
4615 my $socket_addr = "/run/qemu-server/$vmid.migrate";
4616 unlink $socket_addr;
4617
4618 $migrate_uri = "unix:$socket_addr";
1c9d54bf
TL
4619
4620 push @$cmd, '-incoming', $migrate_uri;
4621 push @$cmd, '-S';
4622
1e3baf05 4623 } else {
6c47d546 4624 push @$cmd, '-loadstate', $statefile;
1e3baf05 4625 }
91bd6c90
DM
4626 } elsif ($paused) {
4627 push @$cmd, '-S';
1e3baf05
DM
4628 }
4629
1e3baf05 4630 # host pci devices
040b06b7
DA
4631 for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
4632 my $d = parse_hostpci($conf->{"hostpci$i"});
4633 next if !$d;
b1f72af6
AD
4634 my $pcidevices = $d->{pciid};
4635 foreach my $pcidevice (@$pcidevices) {
4636 my $pciid = $pcidevice->{id}.".".$pcidevice->{function};
000fc0a2 4637
b1f72af6
AD
4638 my $info = pci_device_info("0000:$pciid");
4639 die "IOMMU not present\n" if !check_iommu_support();
4640 die "no pci device info for device '$pciid'\n" if !$info;
6ea8cd3b 4641 die "can't unbind/bind pci group to vfio '$pciid'\n" if !pci_dev_group_bind_to_vfio($pciid);
8f3e88af 4642 die "can't reset pci device '$pciid'\n" if $info->{has_fl_reset} and !pci_dev_reset($info);
b1f72af6 4643 }
040b06b7 4644 }
1e3baf05
DM
4645
4646 PVE::Storage::activate_volumes($storecfg, $vollist);
4647
2b401189
AD
4648 if (!check_running($vmid, 1) && -d "/sys/fs/cgroup/systemd/qemu.slice/$vmid.scope") {
4649 my $cmd = [];
4650 push @$cmd, '/bin/systemctl', 'stop', "$vmid.scope";
4651 eval { run_command($cmd); };
4652 }
4653
8e59d952
WB
4654 my $cpuunits = defined($conf->{cpuunits}) ? $conf->{cpuunits}
4655 : $defaults->{cpuunits};
4656
7023f3ea
AD
4657 my %run_params = (timeout => $statefile ? undef : 30, umask => 0077);
4658
4659 my %properties = (
4660 Slice => 'qemu.slice',
4661 KillMode => 'none',
4662 CPUShares => $cpuunits
4663 );
4664
4665 if (my $cpulimit = $conf->{cpulimit}) {
4666 $properties{CPUQuota} = int($cpulimit * 100);
4667 }
4668 $properties{timeout} = 10 if $statefile; # setting up the scope shoul be quick
4669
4670 if ($conf->{hugepages}) {
4671
4672 my $code = sub {
4673 my $hugepages_topology = PVE::QemuServer::Memory::hugepages_topology($conf);
4674 my $hugepages_host_topology = PVE::QemuServer::Memory::hugepages_host_topology();
4675
4676 PVE::QemuServer::Memory::hugepages_mount();
4677 PVE::QemuServer::Memory::hugepages_allocate($hugepages_topology, $hugepages_host_topology);
4678
4679 eval {
4680 PVE::Tools::enter_systemd_scope($vmid, "Proxmox VE VM $vmid", %properties);
4681 run_command($cmd, %run_params);
4682 };
4683
4684 if (my $err = $@) {
4685 PVE::QemuServer::Memory::hugepages_reset($hugepages_host_topology);
4686 die $err;
4687 }
4688
4689 PVE::QemuServer::Memory::hugepages_pre_deallocate($hugepages_topology);
4690 };
4691 eval { PVE::QemuServer::Memory::hugepages_update_locked($code); };
4692
4693 } else {
4694 eval {
4695 PVE::Tools::enter_systemd_scope($vmid, "Proxmox VE VM $vmid", %properties);
4696 run_command($cmd, %run_params);
4697 };
4698 }
77cde36b
DC
4699
4700 if (my $err = $@) {
4701 # deactivate volumes if start fails
4702 eval { PVE::Storage::deactivate_volumes($storecfg, $vollist); };
4703 die "start failed: $err";
4704 }
1e3baf05 4705
5bc1e039 4706 print "migration listens on $migrate_uri\n" if $migrate_uri;
afdb31d5 4707
b37ecfe6 4708 if ($statefile && $statefile ne 'tcp' && $statefile ne 'unix') {
95381ce0 4709 eval { vm_mon_cmd_nocheck($vmid, "cont"); };
8c609afd 4710 warn $@ if $@;
62de2cbd
DM
4711 }
4712
2189246c
AD
4713 #start nbd server for storage migration
4714 if ($targetstorage) {
2189246c
AD
4715 my $nodename = PVE::INotify::nodename();
4716 my $migrate_network_addr = PVE::Cluster::get_local_migration_ip($migration_network);
4717 my $localip = $migrate_network_addr ? $migrate_network_addr : PVE::Cluster::remote_node_ip($nodename, 1);
4718 my $pfamily = PVE::Tools::get_host_address_family($nodename);
4719 $migrate_port = PVE::Tools::next_migrate_port($pfamily);
4720
4721 vm_mon_cmd_nocheck($vmid, "nbd-server-start", addr => { type => 'inet', data => { host => "${localip}", port => "${migrate_port}" } } );
4722
4723 $localip = "[$localip]" if Net::IP::ip_is_ipv6($localip);
4724
4725 foreach my $opt (sort keys %$local_volumes) {
4726 my $volid = $local_volumes->{$opt};
4727 vm_mon_cmd_nocheck($vmid, "nbd-server-add", device => "drive-$opt", writable => JSON::true );
4728 my $migrate_storage_uri = "nbd:${localip}:${migrate_port}:exportname=drive-$opt";
4729 print "storage migration listens on $migrate_storage_uri volume:$volid\n";
4730 }
4731 }
4732
1d794448 4733 if ($migratedfrom) {
a89fded1 4734 eval {
8e90138a 4735 set_migration_caps($vmid);
a89fded1 4736 };
1d794448 4737 warn $@ if $@;
a89fded1 4738
1d794448
DM
4739 if ($spice_port) {
4740 print "spice listens on port $spice_port\n";
4741 if ($spice_ticket) {
8e90138a
DM
4742 vm_mon_cmd_nocheck($vmid, "set_password", protocol => 'spice', password => $spice_ticket);
4743 vm_mon_cmd_nocheck($vmid, "expire_password", protocol => 'spice', time => "+30");
95a4b4a9
AD
4744 }
4745 }
4746
1d794448 4747 } else {
15b1fc93 4748 if (!$statefile && (!defined($conf->{balloon}) || $conf->{balloon})) {
be190583 4749 vm_mon_cmd_nocheck($vmid, "balloon", value => $conf->{balloon}*1024*1024)
4ec05c4c 4750 if $conf->{balloon};
4ec05c4c 4751 }
25088687
DM
4752
4753 foreach my $opt (keys %$conf) {
4754 next if $opt !~ m/^net\d+$/;
4755 my $nicconf = parse_net($conf->{$opt});
4756 qemu_set_link_status($vmid, $opt, 0) if $nicconf->{link_down};
4757 }
e18b0b99 4758 }
a1b7d579 4759
eb065317
AD
4760 vm_mon_cmd_nocheck($vmid, 'qom-set',
4761 path => "machine/peripheral/balloon0",
4762 property => "guest-stats-polling-interval",
4763 value => 2) if (!defined($conf->{balloon}) || $conf->{balloon});
4764
1e3baf05
DM
4765 });
4766}
4767
0eedc444
AD
# Run the QMP command $execute on VM $vmid, passing %params as its
# arguments. Delegates to vm_qmp_command() without the $nocheck flag.
sub vm_mon_cmd {
    my ($vmid, $execute, %params) = @_;

    return vm_qmp_command($vmid, { execute => $execute, arguments => \%params });
}
4774
# Same as vm_mon_cmd(), but calls vm_qmp_command() with $nocheck set to 1.
sub vm_mon_cmd_nocheck {
    my ($vmid, $execute, %params) = @_;

    return vm_qmp_command($vmid, { execute => $execute, arguments => \%params }, 1);
}
4781
# Send the QMP command hash $cmd ({ execute => ..., arguments => {...} })
# to VM $vmid.
#
# A true 'timeout' entry inside $cmd->{arguments} is removed from that hash
# and handed to the QMP client as timeout instead of being sent along.
# $nocheck is passed through to check_running() and vm_monitor_command().
#
# Errors are written to syslog and re-thrown. Returns the result of the QMP
# client; the old-monitor fallback path leaves the result undefined.
sub vm_qmp_command {
    my ($vmid, $cmd, $nocheck) = @_;

    my $res;

    my $timeout;
    if ($cmd->{arguments} && $cmd->{arguments}->{timeout}) {
        $timeout = delete $cmd->{arguments}->{timeout};
    }

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);
        my $sname = qmp_socket($vmid);
        if (-e $sname) { # test if VM is reasonably new and supports qmp/qga
            my $qmpclient = PVE::QMPClient->new();

            $res = $qmpclient->cmd($vmid, $cmd, $timeout);
        } elsif (-e "${var_run_tmpdir}/$vmid.mon") {
            # commands may come without an 'arguments' key at all (vm_stop
            # sends e.g. { execute => "quit" }), so only dereference it when
            # it is there - %{undef} would die under strict
            die "can't execute complex command on old monitor - stop/start your vm to fix the problem\n"
                if $cmd->{arguments} && scalar(%{$cmd->{arguments}});
            vm_monitor_command($vmid, $cmd->{execute}, $nocheck);
        } else {
            die "unable to open monitor socket\n";
        }
    };
    if (my $err = $@) {
        syslog("err", "VM $vmid qmp command failed - $err");
        die $err;
    }

    return $res;
}
4815
9df5cbcc
DM
# Execute the human monitor (HMP) command line $cmdline on VM $vmid by
# wrapping it into the QMP 'human-monitor-command' command.
# Returns whatever vm_qmp_command() returns.
sub vm_human_monitor_command {
    my ($vmid, $cmdline) = @_;

    my $cmd = {
        execute => 'human-monitor-command',
        arguments => { 'command-line' => $cmdline },
    };

    return vm_qmp_command($vmid, $cmd);
}
4828
1e3baf05
DM
# Build the command line for VM $vmid from its current configuration and
# return it as a single string (via PVE::Tools::cmd2string).
sub vm_commandline {
    my ($storecfg, $vmid) = @_;

    my $conf = PVE::QemuConfig->load_config($vmid);

    my $defaults = load_defaults();

    # config_to_command() is used in list context elsewhere in this file,
    # where the command array is the first returned element; take exactly
    # that element instead of depending on its scalar-context behaviour
    my ($cmd) = config_to_command($storecfg, $vmid, $conf, $defaults);

    return PVE::Tools::cmd2string($cmd);
}
4840
# Send 'system_reset' to VM $vmid while holding the config lock.
# The config lock check is skipped when $skiplock is true.
sub vm_reset {
    my ($vmid, $skiplock) = @_;

    my $reset_locked = sub {
        my $conf = PVE::QemuConfig->load_config($vmid);

        PVE::QemuConfig->check_lock($conf) unless $skiplock;

        vm_mon_cmd($vmid, "system_reset");
    };

    PVE::QemuConfig->lock_config($vmid, $reset_locked);
}
4853
# Return an array reference with all volume IDs referenced by $conf (as
# visited by foreach_volid) that parse as storage volume IDs.
sub get_vm_volumes {
    my ($conf) = @_;

    my @volids;

    my $collect = sub {
        my ($volid) = @_;

        # skip volids that are absolute paths
        return if $volid =~ m|^/|;

        # skip everything that does not parse as a storage volume ID
        my ($storeid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        push @volids, $volid;
    };

    foreach_volid($conf, $collect);

    return \@volids;
}
4871
# Clean up after a VM has stopped: deactivate its volumes (unless
# $keepActive), remove its runtime files below /var/run/qemu-server and,
# if $apply_pending_changes is set, apply pending config changes.
# Errors are only reported as warnings.
sub vm_stop_cleanup {
    my ($storecfg, $vmid, $conf, $keepActive, $apply_pending_changes) = @_;

    eval {
        unless ($keepActive) {
            my $volids = get_vm_volumes($conf);
            PVE::Storage::deactivate_volumes($storecfg, $volids);
        }

        for my $suffix (qw(mon qmp pid vnc qga)) {
            unlink "/var/run/qemu-server/${vmid}.$suffix";
        }

        if ($apply_pending_changes) {
            vmconfig_apply_pending($vmid, $conf, $storecfg);
        }
    };
    warn $@ if $@; # avoid errors - just warn
}
4890
# Note: use $nocheck to skip tests if VM configuration file exists.
# We need that when migrating VMs to other nodes (files already moved)
# Note: we set $keepActive in vzdump stop mode - volumes need to stay active
#
# Stop VM $vmid: with $shutdown ask the guest to power down, otherwise send
# 'quit'. If that fails or times out and $force is set, escalate to SIGTERM
# and finally to SIGKILL. $force defaults to 1 for a plain stop.
sub vm_stop {
    my ($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive, $migratedfrom) = @_;

    $force = 1 if !defined($force) && !$shutdown;

    if ($migratedfrom) {
        my $pid = check_running($vmid, $nocheck, $migratedfrom);
        kill 15, $pid if $pid;
        my $conf = PVE::QemuConfig->load_config($vmid, $migratedfrom);
        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive, 0);
        return;
    }

    # poll once per second while the VM is still running, at most $limit
    # times; returns the number of polls that were needed
    my $wait_for_exit = sub {
        my ($limit) = @_;

        my $polls = 0;
        while (($polls < $limit) && check_running($vmid, $nocheck)) {
            $polls++;
            sleep 1;
        }

        return $polls;
    };

    PVE::QemuConfig->lock_config($vmid, sub {

        my $pid = check_running($vmid, $nocheck);
        return if !$pid;

        my $conf;
        if (!$nocheck) {
            $conf = PVE::QemuConfig->load_config($vmid);
            PVE::QemuConfig->check_lock($conf) if !$skiplock;
            if (!defined($timeout) && $shutdown && $conf->{startup}) {
                my $opts = PVE::JSONSchema::pve_parse_startup_order($conf->{startup});
                $timeout = $opts->{down} if $opts->{down};
            }
        }

        $timeout = 60 if !defined($timeout);

        my $qmp_cmd = !$shutdown                            ? "quit"
                    : (defined($conf) && $conf->{agent})    ? "guest-shutdown"
                    :                                         "system_powerdown";

        eval { vm_qmp_command($vmid, { execute => $qmp_cmd }, $nocheck); };
        my $err = $@;

        if ($err) {
            die "VM quit/powerdown failed\n" if !$force;
            warn "VM quit/powerdown failed - terminating now with SIGTERM\n";
            kill 15, $pid;
        } elsif ($wait_for_exit->($timeout) >= $timeout) {
            die "VM quit/powerdown failed - got timeout\n" if !$force;
            warn "VM still running - terminating now with SIGTERM\n";
            kill 15, $pid;
        } else {
            vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive, 1) if $conf;
            return;
        }

        # wait again
        $timeout = 10;

        if ($wait_for_exit->($timeout) >= $timeout) {
            warn "VM still running - terminating now with SIGKILL\n";
            kill 9, $pid;
            sleep 1;
        }

        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive, 1) if $conf;
    });
}
4982
# Send 'stop' to VM $vmid while holding the config lock.
# check_lock() is skipped when $skiplock is set or when has_lock() reports
# a 'backup' lock on the config.
sub vm_suspend {
    my ($vmid, $skiplock) = @_;

    my $suspend_locked = sub {
        my $conf = PVE::QemuConfig->load_config($vmid);

        if (!$skiplock && !PVE::QemuConfig->has_lock($conf, 'backup')) {
            PVE::QemuConfig->check_lock($conf);
        }

        vm_mon_cmd($vmid, "stop");
    };

    PVE::QemuConfig->lock_config($vmid, $suspend_locked);
}
4996
# Send 'cont' to VM $vmid while holding the config lock.
# With $nocheck the config is not loaded and the nocheck monitor variant is
# used. Otherwise check_lock() runs unless $skiplock is set or has_lock()
# reports a 'backup' lock.
sub vm_resume {
    my ($vmid, $skiplock, $nocheck) = @_;

    my $resume_locked = sub {
        return vm_mon_cmd_nocheck($vmid, "cont") if $nocheck;

        my $conf = PVE::QemuConfig->load_config($vmid);

        if (!$skiplock && !PVE::QemuConfig->has_lock($conf, 'backup')) {
            PVE::QemuConfig->check_lock($conf);
        }

        vm_mon_cmd($vmid, "cont");
    };

    PVE::QemuConfig->lock_config($vmid, $resume_locked);
}
5016
5fdbe4f0
DM
# Send the key (or key combination) $key to VM $vmid while holding the
# config lock. $skiplock is accepted but not used here.
sub vm_sendkey {
    my ($vmid, $skiplock, $key) = @_;

    my $sendkey_locked = sub {
        # the result is not used; the call is kept so the config is still
        # loaded before the key is sent
        my $conf = PVE::QemuConfig->load_config($vmid);

        # there is no qmp command, so we use the human monitor command
        vm_human_monitor_command($vmid, "sendkey $key");
    };

    PVE::QemuConfig->lock_config($vmid, $sendkey_locked);
}
5028
# Destroy VM $vmid via destroy_vm() while holding the config lock.
# Dies if the VM is still running.
sub vm_destroy {
    my ($storecfg, $vmid, $skiplock) = @_;

    my $destroy_locked = sub {
        # the result is not used; the call is kept so the config is still
        # loaded before anything is destroyed
        my $conf = PVE::QemuConfig->load_config($vmid);

        die "VM $vmid is running - destroy failed\n" if check_running($vmid);

        destroy_vm($storecfg, $vmid, undef, $skiplock);
    };

    PVE::QemuConfig->lock_config($vmid, $destroy_locked);
}
5043
1e3baf05
DM
5044# pci helpers
5045
# Write $buf to $filename (opened in "w" mode).
# Returns undef if the file cannot be opened, otherwise the result of the
# print call. The result of close() is not checked.
sub file_write {
    my ($filename, $buf) = @_;

    my $fh = IO::File->new($filename, "w") or return undef;

    my $printed = print {$fh} $buf;

    $fh->close();

    return $printed;
}
5058
# Collect information about the PCI device $name (full address of the form
# dddd:bb:ss.f, lower-case hex) from sysfs.
# Returns undef if the name is malformed or if the irq, vendor or device
# entries are missing or not in the expected format. Otherwise returns a
# hash ref with name, vendor and product (without the '0x' prefix), the
# address parts, the irq and whether a 'reset' file exists.
sub pci_device_info {
    my ($name) = @_;

    my @addr = $name =~ m/^([a-f0-9]{4}):([a-f0-9]{2}):([a-f0-9]{2})\.([a-f0-9])$/;
    return undef if !@addr;
    my ($domain, $bus, $slot, $func) = @addr;

    my $devdir = "$pcisysfs/devices/$name";

    my $irq = file_read_firstline("$devdir/irq");
    return undef unless defined($irq) && $irq =~ m/^\d+$/;

    # the substitutions strip the '0x' prefix and double as format check
    my $vendor = file_read_firstline("$devdir/vendor");
    return undef unless defined($vendor) && $vendor =~ s/^0x//;

    my $product = file_read_firstline("$devdir/device");
    return undef unless defined($product) && $product =~ s/^0x//;

    return {
        name => $name,
        vendor => $vendor,
        product => $product,
        domain => $domain,
        bus => $bus,
        slot => $slot,
        func => $func,
        irq => $irq,
        has_fl_reset => (-f "$devdir/reset") || 0,
    };
}
5090
# Reset the PCI device described by $dev (as returned by pci_device_info)
# by writing "1" to its sysfs 'reset' file. Returns the file_write() result.
sub pci_dev_reset {
    my ($dev) = @_;

    return file_write("$pcisysfs/devices/$dev->{name}/reset", "1");
}
5100
000fc0a2
SP
# Bind the PCI device described by $dev (as returned by pci_device_info)
# to the vfio-pci driver. Tries to load the module if its sysfs directory
# is missing and dies if it is still missing afterwards.
# Returns true if the device shows up below the vfio-pci driver directory,
# undef if one of the required sysfs writes fails.
sub pci_dev_bind_to_vfio {
    my ($dev) = @_;

    my $name = $dev->{name};
    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null") if !-d $vfio_basedir;
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    # nothing to do if the device is already listed below vfio-pci
    my $bound_dir = "$vfio_basedir/$name";
    return 1 if -d $bound_dir;

    file_write("$vfio_basedir/new_id", "$dev->{vendor} $dev->{product}")
        or return undef;

    # a failed unbind only counts as error if the unbind file exists
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    if (!-d $bound_dir) {
        file_write("$vfio_basedir/bind", $name) or return undef;
    }

    return -d $bound_dir;
}
5131
# Bind all devices in the IOMMU group of PCI device $pciid (address without
# the '0000:' domain prefix) to vfio-pci. Entries with a 'pci_bus'
# subdirectory are skipped. Dies on any failure, returns 1 otherwise.
sub pci_dev_group_bind_to_vfio {
    my ($pciid) = @_;

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null") if !-d $vfio_basedir;
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    # get IOMMU group devices
    my $groupdir = "$pcisysfs/devices/0000:$pciid/iommu_group/devices/";
    opendir(my $dh, $groupdir) || die "Cannot open iommu_group: $!\n";
    my @members = grep { /^0000:/ } readdir($dh);
    closedir($dh);

    foreach my $member (@members) {
        my ($checked_id) = $member =~ m/^([:\.\da-f]+)$/
            or die "PCI ID $member not valid!\n";

        # pci bridges, switches or root ports are not supported
        # they have a pci_bus subdirectory so skip them
        next if -e "$pcisysfs/devices/$member/pci_bus";

        my $info = pci_device_info($checked_id);
        pci_dev_bind_to_vfio($info) || die "Cannot bind $member to vfio\n";
    }

    return 1;
}
5160
3e16d5fc
DM
5161# vzdump restore implementaion
5162
# Return the name of the first entry listed by 'tar tf' for $archive.
# Dies if the archive does not exist, if tar cannot be started or if no
# entry is listed.
sub tar_archive_read_firstfile {
    my ($archive) = @_;

    -f $archive or die "ERROR: file '$archive' does not exist\n";

    # try to detect archive type first
    my $pid = open(my $listing, '-|', 'tar', 'tf', $archive)
        or die "unable to open file '$archive'\n";

    # only the first line is needed, so terminate tar right after reading it
    my $first = <$listing>;
    kill 15, $pid;
    close $listing;

    die "ERROR: archive contaions no data\n" if !$first;
    chomp $first;

    return $first;
}
5180
ed221350
DM
# Remove the temporary volumes recorded in $statfile after a failed tar
# restore. Lines are expected to end in 'vzdump:<name>:<volid>'. A volid
# that is an absolute path is unlinked, anything else is freed through
# PVE::Storage::vdisk_free. Progress and problems are reported on STDERR;
# a failure for one volume does not stop the cleanup of the others.
# Nothing is done if $statfile cannot be opened.
sub tar_restore_cleanup {
    my ($storecfg, $statfile) = @_;

    print STDERR "starting cleanup\n";

    if (my $fd = IO::File->new($statfile, "r")) {
        while (defined(my $line = <$fd>)) {
            if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                my $volid = $2;
                eval {
                    if ($volid =~ m|^/|) {
                        # 'or' (not '||') so that the die is tied to the
                        # result of unlink and not to the value of $volid
                        unlink($volid) or die "unlink failed - $!\n";
                    } else {
                        PVE::Storage::vdisk_free($storecfg, $volid);
                    }
                    print STDERR "temporary volume '$volid' sucessfuly removed\n";
                };
                print STDERR "unable to cleanup '$volid' - $@" if $@;
            } else {
                print STDERR "unable to parse line in statfile - $line";
            }
        }
        $fd->close();
    }
}
5206
# Restore VM $vmid from $archive on behalf of $user.
# Format ('tar' or 'vma') and compression ('gzip' or 'lzop') are derived
# from the archive file name; $opts->{format} overrides the detected
# format. Archives with an unknown suffix are treated as uncompressed vma.
# Dispatches to restore_tar_archive() or restore_vma_archive() and returns
# their result.
sub restore_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    my $format = $opts->{format};
    my $comp;

    if ($archive =~ m/\.tgz$/ || $archive =~ m/\.tar\.gz$/) {
        $format = 'tar' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.tar$/) {
        $format = 'tar' if !$format;
    } elsif ($archive =~ m/\.tar\.lzo$/) { # dots escaped like in all other suffix checks
        $format = 'tar' if !$format;
        $comp = 'lzop';
    } elsif ($archive =~ m/\.vma$/) {
        $format = 'vma' if !$format;
    } elsif ($archive =~ m/\.vma\.gz$/) {
        $format = 'vma' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.vma\.lzo$/) {
        $format = 'vma' if !$format;
        $comp = 'lzop';
    } else {
        $format = 'vma' if !$format; # default
    }

    # try to detect archive format
    if ($format eq 'tar') {
        return restore_tar_archive($archive, $vmid, $user, $opts);
    } else {
        return restore_vma_archive($archive, $vmid, $user, $opts, $comp);
    }
}
5240
# Process one $line of a backed-up VM config and write the result to
# $outfd:
#  - qmdump/vzdump comments, lock, unusedN, parent and template lines are
#    dropped
#  - old 'vlanN' lines are converted to 'netN' entries, numbered through
#    $cookie->{netcount}
#  - with $unique, an existing MAC address of a 'netN' line is replaced by
#    a random one
#  - drive lines are commented out if excluded from backup, or rewritten
#    to the newly allocated volume from $map
#  - everything else is copied unchanged
sub restore_update_config_line {
    my ($outfd, $cookie, $vmid, $map, $line, $unique) = @_;

    my @dropped = (
        qr/^\#qmdump\#/,
        qr/^\#vzdump\#/,
        qr/^lock:/,
        qr/^unused\d+:/,
        qr/^parent:/,
        qr/^template:/, # restored VM is never a template
    );
    foreach my $re (@dropped) {
        return if $line =~ $re;
    }

    my $dc = PVE::Cluster::cfs_read_file('datacenter.cfg');

    if (($line =~ m/^(vlan(\d+)):\s*(\S+)\s*$/)) {
        # try to convert old 1.X settings
        my ($ind, $ethcfg) = ($2, $3);
        foreach my $devconfig (PVE::Tools::split_list($ethcfg)) {
            my ($model, $macaddr) = split(/\=/, $devconfig);
            if (!$macaddr || $unique) {
                $macaddr = PVE::Tools::random_ether_addr($dc->{mac_prefix});
            }
            my $netstr = print_net({
                model => $model,
                bridge => "vmbr$ind",
                macaddr => $macaddr,
            });

            print $outfd "net$cookie->{netcount}: $netstr\n";
            $cookie->{netcount}++;
        }
    } elsif (($line =~ m/^(net\d+):\s*(\S+)\s*$/) && $unique) {
        my ($id, $netstr) = ($1, $2);
        my $net = parse_net($netstr);
        if ($net->{macaddr}) {
            $net->{macaddr} = PVE::Tools::random_ether_addr($dc->{mac_prefix});
        }
        $netstr = print_net($net);
        print $outfd "$id: $netstr\n";
    } elsif ($line =~ m/^((ide|scsi|virtio|sata|efidisk)\d+):\s*(\S+)\s*$/) {
        my ($virtdev, $value) = ($1, $3);
        my $di = parse_drive($virtdev, $value);
        if (defined($di->{backup}) && !$di->{backup}) {
            print $outfd "#$line";
        } elsif ($map->{$virtdev}) {
            delete $di->{format}; # format can change on restore
            $di->{file} = $map->{$virtdev};
            $value = print_drive($vmid, $di);
            print $outfd "$virtdev: $value\n";
        } else {
            print $outfd $line;
        }
    } else {
        print $outfd $line;
    }
}
5292
# List the volumes PVE::Storage::vdisk_list() reports for $vmid and return
# them as hash ref keyed by volume ID. Entries without volid or size are
# skipped; each kept entry additionally gets its 'path' set.
sub scan_volids {
    my ($cfg, $vmid) = @_;

    my $info = PVE::Storage::vdisk_list($cfg, undef, $vmid);

    my %by_volid;
    foreach my $storeid (keys %$info) {
        foreach my $image (@{$info->{$storeid}}) {
            next unless $image->{volid} && $image->{size};

            $image->{path} = PVE::Storage::path($cfg, $image->{volid});
            $by_volid{$image->{volid}} = $image;
        }
    }

    return \%by_volid;
}
5309
77019edf
WB
# Return 1 if $volid is referenced by a non-cdrom drive of $conf or of one
# of its snapshots, 0 otherwise. Drives are compared by volume ID and by
# resolved path. The drive named $skip_drive is ignored in the current
# config, but not in the snapshots.
sub is_volume_in_use {
    my ($storecfg, $conf, $skip_drive, $volid) = @_;

    my $path = PVE::Storage::path($storecfg, $volid);

    my $scan_config = sub {
        my ($cref, $snapname) = @_;

        foreach my $key (keys %$cref) {
            next if !is_valid_drivename($key);
            next if $skip_drive && $key eq $skip_drive;

            my $drive = parse_drive($key, $cref->{$key});
            next if !$drive || !$drive->{file} || drive_is_cdrom($drive);

            my $file = $drive->{file};
            return 1 if $volid eq $file;

            if ($file =~ m!^/!) {
                return 1 if $file eq $path;
                next;
            }

            my ($storeid) = PVE::Storage::parse_volume_id($file, 1);
            next if !$storeid;
            next if !PVE::Storage::storage_config($storecfg, $storeid, 1);

            return 1 if $path eq PVE::Storage::path($storecfg, $file, $snapname);
        }

        return 0;
    };

    return 1 if $scan_config->($conf);

    # snapshots are scanned without skipping any drive
    undef $skip_drive;

    foreach my $snapname (keys %{$conf->{snapshots}}) {
        return 1 if $scan_config->($conf->{snapshots}->{$snapname}, $snapname);
    }

    return 0;
}
5350
91bd6c90
DM
# Synchronize $conf of VM $vmid with the volumes found on the storages
# ($volid_hash, as returned by scan_volids):
#  - refresh the 'size' of every non-cdrom drive that has a known volume
#  - drop 'unusedN' entries whose volume is used by a drive
#  - add volumes that are not referenced at all as unused volumes
#    (vm-$vmid-state-* volumes are left alone)
# $conf is modified in place. Returns 1 if anything changed, undef
# otherwise.
sub update_disksize {
    my ($vmid, $conf, $volid_hash) = @_;

    my $changes;

    my $used = {};

    # Note: it is allowed to define multiple storages with same path (alias), so
    # we need to check both 'volid' and real 'path' (two different volid can point
    # to the same path).

    my $usedpath = {};

    # update size info
    foreach my $opt (keys %$conf) {
        if (is_valid_drivename($opt)) {
            my $drive = parse_drive($opt, $conf->{$opt});
            my $volid = $drive->{file};
            next if !$volid;

            $used->{$volid} = 1;
            if ($volid_hash->{$volid} &&
                (my $path = $volid_hash->{$volid}->{path})) {
                $usedpath->{$path} = 1;
            }

            next if drive_is_cdrom($drive);
            next if !$volid_hash->{$volid};

            $drive->{size} = $volid_hash->{$volid}->{size};
            my $new = print_drive($vmid, $drive);
            if ($new ne $conf->{$opt}) {
                $changes = 1;
                $conf->{$opt} = $new;
            }
        }
    }

    # remove 'unusedX' entry if volume is used
    foreach my $opt (keys %$conf) {
        next if $opt !~ m/^unused\d+$/;
        my $volid = $conf->{$opt};
        # plain conditional expression instead of 'my ... if ...', whose
        # behaviour is documented as undefined
        my $path = $volid_hash->{$volid} ? $volid_hash->{$volid}->{path} : undef;
        if ($used->{$volid} || ($path && $usedpath->{$path})) {
            $changes = 1;
            delete $conf->{$opt};
        }
    }

    foreach my $volid (sort keys %$volid_hash) {
        next if $volid =~ m/vm-$vmid-state-/;
        next if $used->{$volid};
        my $path = $volid_hash->{$volid}->{path};
        next if !$path; # just to be sure
        next if $usedpath->{$path};
        $changes = 1;
        PVE::QemuConfig->add_unused_volume($conf, $volid);
        $usedpath->{$path} = 1; # avoid to add more than once (aliases)
    }

    return $changes;
}
5413
# Rescan the storages and update the config of VM $vmid - or of all VMs
# returned by config_list() if $vmid is undefined - through
# update_disksize(). Each config is updated under its config lock unless
# $nolock is set, and is only written back if something changed.
sub rescan {
    my ($vmid, $nolock) = @_;

    my $cfg = PVE::Storage::config();

    my $volid_hash = scan_volids($cfg, $vmid);

    my $updatefn = sub {
        my ($vmid) = @_;

        my $conf = PVE::QemuConfig->load_config($vmid);

        PVE::QemuConfig->check_lock($conf);

        # only pass on the volumes whose 'vmid' matches this VM
        my %vm_volids =
            map { ($_ => $volid_hash->{$_}) }
            grep { $volid_hash->{$_}->{vmid} && $volid_hash->{$_}->{vmid} == $vmid }
            keys %$volid_hash;

        my $changes = update_disksize($vmid, $conf, \%vm_volids);

        PVE::QemuConfig->write_config($vmid, $conf) if $changes;
    };

    my @vmids;
    if (defined($vmid)) {
        @vmids = ($vmid);
    } else {
        my $vmlist = config_list();
        @vmids = keys %$vmlist;
    }

    foreach my $id (@vmids) {
        if ($nolock) {
            $updatefn->($id);
        } else {
            PVE::QemuConfig->lock_config($id, $updatefn, $id);
        }
    }
}
5456
5457sub restore_vma_archive {
5458 my ($archive, $vmid, $user, $opts, $comp) = @_;
5459
5460 my $input = $archive eq '-' ? "<&STDIN" : undef;
5461 my $readfrom = $archive;
5462
5463 my $uncomp = '';
5464 if ($comp) {
5465 $readfrom = '-';
5466 my $qarchive = PVE::Tools::shellquote($archive);
5467 if ($comp eq 'gzip') {
5468 $uncomp = "zcat $qarchive|";
5469 } elsif ($comp eq 'lzop') {
5470 $uncomp = "lzop -d -c $qarchive|";
5471 } else {
5472 die "unknown compression method '$comp'\n";
5473 }
be190583 5474
91bd6c90
DM
5475 }
5476
5477 my $tmpdir = "/var/tmp/vzdumptmp$$";
5478 rmtree $tmpdir;
5479
5480 # disable interrupts (always do cleanups)
5481 local $SIG{INT} = $SIG{TERM} = $SIG{QUIT} = $SIG{HUP} = sub {
5482 warn "got interrupt - ignored\n";
5483 };
5484
5485 my $mapfifo = "/var/tmp/vzdumptmp$$.fifo";
5486 POSIX::mkfifo($mapfifo, 0600);
5487 my $fifofh;
5488
5489 my $openfifo = sub {
5490 open($fifofh, '>', $mapfifo) || die $!;
5491 };
5492
5493 my $cmd = "${uncomp}vma extract -v -r $mapfifo $readfrom $tmpdir";
5494
5495 my $oldtimeout;
5496 my $timeout = 5;
5497
5498 my $devinfo = {};
5499
5500 my $rpcenv = PVE::RPCEnvironment::get();
5501
ffda963f 5502 my $conffile = PVE::QemuConfig->config_file($vmid);
91bd6c90
DM
5503 my $tmpfn = "$conffile.$$.tmp";
5504
ed221350 5505 # Note: $oldconf is undef if VM does not exists
ffda963f
FG
5506 my $cfs_path = PVE::QemuConfig->cfs_config_path($vmid);
5507 my $oldconf = PVE::Cluster::cfs_read_file($cfs_path);
ed221350 5508
91bd6c90
DM
5509 my $print_devmap = sub {
5510 my $virtdev_hash = {};
5511
5512 my $cfgfn = "$tmpdir/qemu-server.conf";
5513
5514 # we can read the config - that is already extracted
5515 my $fh = IO::File->new($cfgfn, "r") ||
5516 "unable to read qemu-server.conf - $!\n";
5517
6738ab9c 5518 my $fwcfgfn = "$tmpdir/qemu-server.fw";
3457d090
WL
5519 if (-f $fwcfgfn) {
5520 my $pve_firewall_dir = '/etc/pve/firewall';
5521 mkdir $pve_firewall_dir; # make sure the dir exists
5522 PVE::Tools::file_copy($fwcfgfn, "${pve_firewall_dir}/$vmid.fw");
5523 }
6738ab9c 5524
91bd6c90
DM
5525 while (defined(my $line = <$fh>)) {
5526 if ($line =~ m/^\#qmdump\#map:(\S+):(\S+):(\S*):(\S*):$/) {
5527 my ($virtdev, $devname, $storeid, $format) = ($1, $2, $3, $4);
5528 die "archive does not contain data for drive '$virtdev'\n"
5529 if !$devinfo->{$devname};
5530 if (defined($opts->{storage})) {
5531 $storeid = $opts->{storage} || 'local';
5532 } elsif (!$storeid) {
5533 $storeid = 'local';
5534 }
5535 $format = 'raw' if !$format;
5536 $devinfo->{$devname}->{devname} = $devname;
5537 $devinfo->{$devname}->{virtdev} = $virtdev;
5538 $devinfo->{$devname}->{format} = $format;
5539 $devinfo->{$devname}->{storeid} = $storeid;
5540
be190583 5541 # check permission on storage
91bd6c90
DM
5542 my $pool = $opts->{pool}; # todo: do we need that?
5543 if ($user ne 'root@pam') {
5544 $rpcenv->check($user, "/storage/$storeid", ['Datastore.AllocateSpace']);
5545 }
5546
5547 $virtdev_hash->{$virtdev} = $devinfo->{$devname};
5548 }
5549 }
5550
5551 foreach my $devname (keys %$devinfo) {
be190583
DM
5552 die "found no device mapping information for device '$devname'\n"
5553 if !$devinfo->{$devname}->{virtdev};
91bd6c90
DM
5554 }
5555
20519efc 5556 my $cfg = PVE::Storage::config();
ed221350
DM
5557
5558 # create empty/temp config
be190583 5559 if ($oldconf) {
ed221350
DM
5560 PVE::Tools::file_set_contents($conffile, "memory: 128\n");
5561 foreach_drive($oldconf, sub {
5562 my ($ds, $drive) = @_;
5563
5564 return if drive_is_cdrom($drive);
5565
5566 my $volid = $drive->{file};
5567
5568 return if !$volid || $volid =~ m|^/|;
5569
5570 my ($path, $owner) = PVE::Storage::path($cfg, $volid);
5571 return if !$path || !$owner || ($owner != $vmid);
5572
5573 # Note: only delete disk we want to restore
5574 # other volumes will become unused
5575 if ($virtdev_hash->{$ds}) {
6b72854b
FG
5576 eval { PVE::Storage::vdisk_free($cfg, $volid); };
5577 if (my $err = $@) {
5578 warn $err;
5579 }
ed221350
DM
5580 }
5581 });
381b8fae
DC
5582
5583 # delete vmstate files
5584 # since after the restore we have no snapshots anymore
5585 foreach my $snapname (keys %{$oldconf->{snapshots}}) {
5586 my $snap = $oldconf->{snapshots}->{$snapname};
5587 if ($snap->{vmstate}) {
5588 eval { PVE::Storage::vdisk_free($cfg, $snap->{vmstate}); };
5589 if (my $err = $@) {
5590 warn $err;
5591 }
5592 }
5593 }
ed221350
DM
5594 }
5595
5596 my $map = {};
91bd6c90
DM
5597 foreach my $virtdev (sort keys %$virtdev_hash) {
5598 my $d = $virtdev_hash->{$virtdev};
5599 my $alloc_size = int(($d->{size} + 1024 - 1)/1024);
5600 my $scfg = PVE::Storage::storage_config($cfg, $d->{storeid});
8fd57431
DM
5601
5602 # test if requested format is supported
5603 my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($cfg, $d->{storeid});
5604 my $supported = grep { $_ eq $d->{format} } @$validFormats;
5605 $d->{format} = $defFormat if !$supported;
5606
91bd6c90
DM
5607 my $volid = PVE::Storage::vdisk_alloc($cfg, $d->{storeid}, $vmid,
5608 $d->{format}, undef, $alloc_size);
5609 print STDERR "new volume ID is '$volid'\n";
5610 $d->{volid} = $volid;
5611 my $path = PVE::Storage::path($cfg, $volid);
5612
5f96f4df
WL
5613 PVE::Storage::activate_volumes($cfg,[$volid]);
5614
91bd6c90 5615 my $write_zeros = 1;
88240a83 5616 if (PVE::Storage::volume_has_feature($cfg, 'sparseinit', $volid)) {
91bd6c90
DM
5617 $write_zeros = 0;
5618 }
5619
3c525055 5620 print $fifofh "format=$d->{format}:${write_zeros}:$d->{devname}=$path\n";
91bd6c90
DM
5621
5622 print "map '$d->{devname}' to '$path' (write zeros = ${write_zeros})\n";
5623 $map->{$virtdev} = $volid;
5624 }
5625
5626 $fh->seek(0, 0) || die "seek failed - $!\n";
5627
5628 my $outfd = new IO::File ($tmpfn, "w") ||
5629 die "unable to write config for VM $vmid\n";
5630
5631 my $cookie = { netcount => 0 };
5632 while (defined(my $line = <$fh>)) {
be190583 5633 restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
91bd6c90
DM
5634 }
5635
5636 $fh->close();
5637 $outfd->close();
5638 };
5639
5640 eval {
5641 # enable interrupts
5642 local $SIG{INT} = $SIG{TERM} = $SIG{QUIT} = $SIG{HUP} = $SIG{PIPE} = sub {
5643 die "interrupted by signal\n";
5644 };
5645 local $SIG{ALRM} = sub { die "got timeout\n"; };
5646
5647 $oldtimeout = alarm($timeout);
5648
5649 my $parser = sub {
5650 my $line = shift;
5651
5652 print "$line\n";
5653
5654 if ($line =~ m/^DEV:\sdev_id=(\d+)\ssize:\s(\d+)\sdevname:\s(\S+)$/) {
5655 my ($dev_id, $size, $devname) = ($1, $2, $3);
5656 $devinfo->{$devname} = { size => $size, dev_id => $dev_id };
5657 } elsif ($line =~ m/^CTIME: /) {
46f58b5f 5658 # we correctly received the vma config, so we can disable
3cf90d7a
DM
5659 # the timeout now for disk allocation (set to 10 minutes, so
5660 # that we always timeout if something goes wrong)
5661 alarm(600);
91bd6c90
DM
5662 &$print_devmap();
5663 print $fifofh "done\n";
5664 my $tmp = $oldtimeout || 0;
5665 $oldtimeout = undef;
5666 alarm($tmp);
5667 close($fifofh);
5668 }
5669 };
be190583 5670
91bd6c90
DM
5671 print "restore vma archive: $cmd\n";
5672 run_command($cmd, input => $input, outfunc => $parser, afterfork => $openfifo);
5673 };
5674 my $err = $@;
5675
5676 alarm($oldtimeout) if $oldtimeout;
5677
5f96f4df
WL
5678 my $vollist = [];
5679 foreach my $devname (keys %$devinfo) {
5680 my $volid = $devinfo->{$devname}->{volid};
5681 push @$vollist, $volid if $volid;
5682 }
5683
20519efc 5684 my $cfg = PVE::Storage::config();
5f96f4df
WL
5685 PVE::Storage::deactivate_volumes($cfg, $vollist);
5686
91bd6c90
DM
5687 unlink $mapfifo;
5688
5689 if ($err) {
5690 rmtree $tmpdir;
5691 unlink $tmpfn;
5692
91bd6c90
DM
5693 foreach my $devname (keys %$devinfo) {
5694 my $volid = $devinfo->{$devname}->{volid};
5695 next if !$volid;
5696 eval {
5697 if ($volid =~ m|^/|) {
5698 unlink $volid || die 'unlink failed\n';
5699 } else {
5700 PVE::Storage::vdisk_free($cfg, $volid);
5701 }
5702 print STDERR "temporary volume '$volid' sucessfuly removed\n";
5703 };
5704 print STDERR "unable to cleanup '$volid' - $@" if $@;
5705 }
5706 die $err;
5707 }
5708
5709 rmtree $tmpdir;
ed221350
DM
5710
5711 rename($tmpfn, $conffile) ||
91bd6c90
DM
5712 die "unable to commit configuration file '$conffile'\n";
5713
ed221350
DM
5714 PVE::Cluster::cfs_update(); # make sure we read new file
5715
91bd6c90
DM
5716 eval { rescan($vmid, 1); };
5717 warn $@ if $@;
5718}
5719
# Restore a VM from a tar based vzdump archive.
#
# Parameters:
#   $archive - path of the archive, or '-' to read the archive from STDIN
#   $vmid    - ID of the VM to restore
#   $user    - exported to the extraction helper as VZDUMP_USER
#   $opts    - hash ref; the keys read here are storage, pool, prealloc,
#              info and unique
#
# The archive is unpacked through "tar --to-command=qmextract". The volume
# mapping written by the helper to "$tmpdir/qmrestore.stat" is then used to
# rewrite the archived qemu-server.conf into the final VM config.
#
# Dies if extraction, config rewriting or the final config commit fails.
sub restore_tar_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    if ($archive ne '-') {
        my $firstfile = tar_archive_read_firstfile($archive);
        die "ERROR: file '$archive' dos not lock like a QemuServer vzdump backup\n"
            if $firstfile ne 'qemu-server.conf';
    }

    my $storecfg = PVE::Storage::config();

    # destroy existing data - keep empty config
    my $vmcfgfn = PVE::QemuConfig->config_file($vmid);
    destroy_vm($storecfg, $vmid, 1) if -f $vmcfgfn;

    my $tocmd = "/usr/lib/qemu-server/qmextract";

    $tocmd .= " --storage " . PVE::Tools::shellquote($opts->{storage}) if $opts->{storage};
    $tocmd .= " --pool " . PVE::Tools::shellquote($opts->{pool}) if $opts->{pool};
    $tocmd .= ' --prealloc' if $opts->{prealloc};
    $tocmd .= ' --info' if $opts->{info};

    # tar option "xf" does not autodetect compression when read from STDIN,
    # so we pipe to zcat
    my $cmd = "zcat -f|tar xf " . PVE::Tools::shellquote($archive) . " " .
        PVE::Tools::shellquote("--to-command=$tocmd");

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    mkpath $tmpdir;

    local $ENV{VZDUMP_TMPDIR} = $tmpdir;
    local $ENV{VZDUMP_VMID} = $vmid;
    local $ENV{VZDUMP_USER} = $user;

    my $conffile = PVE::QemuConfig->config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # disable interrupts (always do cleanups)
    # NOTE(review): 'local' only applies to $SIG{INT} in this chained
    # assignment; the other handlers stay installed after we return.
    local $SIG{INT} = $SIG{TERM} = $SIG{QUIT} = $SIG{HUP} = sub {
        print STDERR "got interrupt - ignored\n";
    };

    eval {
        # enable interrupts
        local $SIG{INT} = $SIG{TERM} = $SIG{QUIT} = $SIG{HUP} = $SIG{PIPE} = sub {
            die "interrupted by signal\n";
        };

        if ($archive eq '-') {
            print "extracting archive from STDIN\n";
            run_command($cmd, input => "<&STDIN");
        } else {
            print "extracting archive '$archive'\n";
            run_command($cmd);
        }

        return if $opts->{info};

        # read new mapping
        my $map = {};
        my $statfile = "$tmpdir/qmrestore.stat";
        if (my $fd = IO::File->new($statfile, "r")) {
            while (defined (my $line = <$fd>)) {
                if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                    $map->{$1} = $2 if $1;
                } else {
                    print STDERR "unable to parse line in statfile - $line\n";
                }
            }
            $fd->close();
        }

        my $confsrc = "$tmpdir/qemu-server.conf";

        my $srcfd = IO::File->new($confsrc, "r") ||
            die "unable to open file '$confsrc'\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined (my $line = <$srcfd>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $srcfd->close();
        $outfd->close();
    };
    my $err = $@;

    if ($err) {

        unlink $tmpfn;

        tar_restore_cleanup($storecfg, "$tmpdir/qmrestore.stat") if !$opts->{info};

        die $err;
    }

    rmtree $tmpdir;

    # An 'info' run leaves the eval before $tmpfn is written, so there is
    # nothing to commit in that case. The parentheses are required: without
    # them '||' binds to $conffile and a failed rename goes unnoticed.
    if (!$opts->{info}) {
        rename($tmpfn, $conffile) ||
            die "unable to commit configuration file '$conffile'\n";
    }

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
5829
18bfb361
DM
# Call $func->($storage_id) once for every storage that backs a
# non-cdrom drive of $conf, in sorted storage ID order.
sub foreach_writable_storage {
    my ($conf, $func) = @_;

    my $seen_sid = {};

    foreach my $key (keys %$conf) {
        next unless is_valid_drivename($key);

        my $drive = parse_drive($key, $conf->{$key});
        next if !$drive || drive_is_cdrom($drive);

        # second argument set: volumes without a storage part are skipped below
        my ($sid, $volname) = PVE::Storage::parse_volume_id($drive->{file}, 1);
        next if !$sid;

        $seen_sid->{$sid} = $sid;
    }

    $func->($_) for sort keys %$seen_sid;
}
5852
e5eaa028
WL
# Decide whether snapshots of $volid are taken by qemu itself.
#
# Returns 1 when the storage type is listed in $qemu_snap_storage and the
# storage does not have 'krbd' set, or when the volume name ends in
# .qcow2/.qed; returns undef otherwise.
sub do_snapshots_with_qemu {
    my ($storecfg, $volid) = @_;

    my $sid = PVE::Storage::parse_volume_id($volid);

    my $qemu_snapshot_storage =
        $qemu_snap_storage->{$storecfg->{ids}->{$sid}->{type}}
        && !$storecfg->{ids}->{$sid}->{krbd};

    return 1 if $qemu_snapshot_storage;

    return 1 if $volid =~ m/\.(qcow2|qed)$/;

    return undef;
}
5869
4dcc780c
WL
# Ping the guest agent of VM $vmid (3 second timeout).
# Returns 1 if the ping succeeded, otherwise warns and returns 0.
sub qga_check_running {
    my ($vmid) = @_;

    eval { vm_mon_cmd($vmid, "guest-ping", timeout => 3); };
    return 1 if !$@;

    warn "Qemu Guest Agent are not running - $@";
    return 0;
}
5880
04a69bb4
AD
# Convert the disks of a VM into base volumes.
#
# Every non-cdrom drive (or only drive $disk, if given) whose volume has
# the 'template' feature is turned into a base volume; the config entry is
# updated and the config is written after each converted drive.
sub template_create {
    my ($vmid, $conf, $disk) = @_;

    my $storecfg = PVE::Storage::config();

    my $convert_drive = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);
        return if $disk && $ds ne $disk;

        my $volid = $drive->{file};
        return if !PVE::Storage::volume_has_feature($storecfg, 'template', $volid);

        $drive->{file} = PVE::Storage::vdisk_create_base($storecfg, $volid);
        $conf->{$ds} = print_drive($vmid, $drive);
        PVE::QemuConfig->write_config($vmid, $conf);
    };

    foreach_drive($conf, $convert_drive);
}
5901
# Copy volume $src_volid (optionally at snapshot $snapname) onto the
# existing volume $dst_volid using 'qemu-img convert'.
#
# $size is only used for the progress output. If $is_zero_initialized is
# set, the target is passed to qemu-img with a "zeroinit:" prefix.
# Nothing is done unless both volume IDs contain a storage ID.
# Dies with "copy failed: ..." if qemu-img fails.
sub qemu_img_convert {
    my ($src_volid, $dst_volid, $size, $snapname, $is_zero_initialized) = @_;

    my $storecfg = PVE::Storage::config();
    my ($src_storeid, $src_volname) = PVE::Storage::parse_volume_id($src_volid, 1);
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid, 1);

    return if !($src_storeid && $dst_storeid);

    PVE::Storage::activate_volumes($storecfg, [$src_volid], $snapname);

    my $src_scfg = PVE::Storage::storage_config($storecfg, $src_storeid);
    my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

    my $src_format = qemu_img_format($src_scfg, $src_volname);
    my $dst_format = qemu_img_format($dst_scfg, $dst_volname);

    my $src_path = PVE::Storage::path($storecfg, $src_volid, $snapname);
    my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

    # '-n': the target volume already exists, do not create it
    my $cmd = ['/usr/bin/qemu-img', 'convert', '-p', '-n'];
    push @$cmd, '-s', $snapname if($snapname && $src_format eq "qcow2");
    push @$cmd, '-f', $src_format, '-O', $dst_format, $src_path;
    push @$cmd, $is_zero_initialized ? "zeroinit:$dst_path" : $dst_path;

    # translate the percentage output of 'qemu-img -p' into byte counts
    my $report_progress = sub {
        my ($line) = @_;

        return if $line !~ m/\((\S+)\/100\%\)/;

        my $percent = $1;
        my $transferred = int($size * $percent / 100);
        my $remaining = $size - $transferred;

        print "transferred: $transferred bytes remaining: $remaining bytes total: $size bytes progression: $percent %\n";
    };

    eval { run_command($cmd, timeout => undef, outfunc => $report_progress); };
    if (my $err = $@) {
        die "copy failed: $err";
    }
}
5949
# Return the image format to use for $volname on the storage described by
# $scfg: the file extension if the storage has a 'path' and the extension
# is one of the known formats, "raw" in every other case.
sub qemu_img_format {
    my ($scfg, $volname) = @_;

    return "raw" if !$scfg->{path};

    return $volname =~ m/\.(raw|cow|qcow|qcow2|qed|vmdk|cloop)$/ ? $1 : "raw";
}
5959
# Start a 'drive-mirror' block job for drive $drive of VM $vmid and then
# hand over to qemu_drive_mirror_monitor().
#
# $dst_volid is either a volume ID or an "nbd:<host>:<port>:exportname=<name>"
# target. For an NBD target a socat helper is forked which forwards a local
# unix socket to the remote TCP endpoint; its PID is stored in
# $jobs->{"drive-$drive"}->{pid}.
#
# Dies with "mirroring error: ..." if the job cannot be started; the jobs
# listed in $jobs are cancelled first in that case.
sub qemu_drive_mirror {
    my ($vmid, $drive, $dst_volid, $vmiddst, $is_zero_initialized, $jobs, $skipcomplete, $qga) = @_;

    $jobs ||= {};
    $jobs->{"drive-$drive"} = {};

    my ($qemu_target, $format);

    if ($dst_volid =~ /^nbd:(localhost|[\d\.]+|\[[\d\.:a-fA-F]+\]):(\d+):exportname=(\S+)/) {
        my ($server, $port, $exportname) = ($1, $2, $3);

        $format = "nbd";
        my $unixsocket = "/run/qemu-server/$vmid.mirror-drive-$drive";
        $qemu_target = "nbd+unix:///$exportname?socket=$unixsocket";
        my $cmd = ['socat', '-T30', "UNIX-LISTEN:$unixsocket,fork", "TCP:$server:$port,connect-timeout=5"];

        my $pid = fork();
        die "forking socat tunnel failed\n" if !defined($pid);

        if ($pid == 0) {
            # child: only reached past exec() if exec itself failed
            exec(@$cmd);
            warn "exec failed: $!\n";
            POSIX::_exit(-1);
        }
        $jobs->{"drive-$drive"}->{pid} = $pid;

        # wait for the helper to create its listening socket
        my $timeout = 0;
        until (-S $unixsocket) {
            die "nbd connection helper timed out\n"
                if $timeout++ > 5;
            sleep 1;
        }
    } else {
        my $storecfg = PVE::Storage::config();
        my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid);

        my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

        $format = qemu_img_format($dst_scfg, $dst_volname);

        my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

        $qemu_target = "zeroinit:$dst_path";
        $qemu_target = $dst_path if !$is_zero_initialized;
    }

    my $opts = {
        timeout => 10,
        device => "drive-$drive",
        mode => "existing",
        sync => "full",
        target => $qemu_target,
    };
    $opts->{format} = $format if $format;

    print "drive mirror is starting for drive-$drive\n";

    # fails if a job is already running for this device
    eval { vm_mon_cmd($vmid, "drive-mirror", %$opts); };

    if (my $err = $@) {
        eval { PVE::QemuServer::qemu_blockjobs_cancel($vmid, $jobs) };
        die "mirroring error: $err";
    }

    qemu_drive_mirror_monitor ($vmid, $vmiddst, $jobs, $skipcomplete, $qga);
}
6022
# Poll the mirror block jobs listed in $jobs once per second until they are
# finished.
#
# When all jobs report 'ready':
#   - with $skipcomplete set, return and leave completion to the caller
#   - when mirroring for another VM ($vmiddst differs from $vmid), freeze the
#     guest filesystem (if $qga) or suspend the VM, cancel the jobs, then
#     thaw/resume again
#   - otherwise send 'block-job-complete' for each job
#
# On any error all jobs in $jobs are cancelled and the sub dies with
# "mirroring error: ...".
sub qemu_drive_mirror_monitor {
    my ($vmid, $vmiddst, $jobs, $skipcomplete, $qga) = @_;

    eval {
        my $err_complete = 0;

        while (1) {
            die "storage migration timed out\n" if $err_complete > 300;

            my $stats = vm_mon_cmd($vmid, "query-block-jobs");

            # index the running mirror jobs by device name
            my $mirror_stat = {};
            $mirror_stat->{$_->{device}} = $_
                for grep { $_->{type} eq 'mirror' } @$stats;

            my $readycounter = 0;

            foreach my $job (keys %$jobs) {
                my $is_running = defined($mirror_stat->{$job});

                if (defined($jobs->{$job}->{complete}) && !$is_running) {
                    print "$job : finished\n";
                    delete $jobs->{$job};
                    next;
                }

                die "$job: mirroring has been cancelled\n" if !$is_running;

                my $stat = $mirror_stat->{$job};
                my $busy = $stat->{busy};
                my $ready = $stat->{ready};
                if (my $total = $stat->{len}) {
                    my $transferred = $stat->{offset} || 0;
                    my $remaining = $total - $transferred;
                    my $percent = sprintf "%.2f", ($transferred * 100 / $total);

                    print "$job: transferred: $transferred bytes remaining: $remaining bytes total: $total bytes progression: $percent % busy: $busy ready: $ready \n";
                }

                $readycounter++ if $stat->{ready};
            }

            last if scalar(keys %$jobs) == 0;

            if ($readycounter == scalar(keys %$jobs)) {
                print "all mirroring jobs are ready \n";
                last if $skipcomplete; #do the complete later

                if ($vmiddst && $vmiddst != $vmid) {
                    if ($qga) {
                        print "freeze filesystem\n";
                        eval { PVE::QemuServer::vm_mon_cmd($vmid, "guest-fsfreeze-freeze"); };
                    } else {
                        print "suspend vm\n";
                        eval { PVE::QemuServer::vm_suspend($vmid, 1); };
                    }

                    # if we clone a disk for a new target vm, we don't switch the disk
                    PVE::QemuServer::qemu_blockjobs_cancel($vmid, $jobs);

                    if ($qga) {
                        print "unfreeze filesystem\n";
                        eval { PVE::QemuServer::vm_mon_cmd($vmid, "guest-fsfreeze-thaw"); };
                    } else {
                        print "resume vm\n";
                        eval { PVE::QemuServer::vm_resume($vmid, 1, 1); };
                    }

                    last;
                }

                # try to switch the disk if source and destination are on the same guest
                foreach my $job (keys %$jobs) {
                    print "$job: Completing block job...\n";

                    eval { vm_mon_cmd($vmid, "block-job-complete", device => $job) };
                    if ($@ =~ m/cannot be completed/) {
                        print "$job: Block job cannot be completed, try again.\n";
                        $err_complete++;
                        next;
                    }

                    print "$job: Completed successfully.\n";
                    $jobs->{$job}->{complete} = 1;
                    eval { qemu_blockjobs_finish_tunnel($vmid, $job, $jobs->{$job}->{pid}) } ;
                }
            }
            sleep 1;
        }
    };

    if (my $err = $@) {
        eval { PVE::QemuServer::qemu_blockjobs_cancel($vmid, $jobs) };
        die "mirroring error: $err";
    }
}
6121
# Cancel all block jobs listed in $jobs and wait until qemu no longer
# reports them.
#
# Each entry is removed from $jobs (and its tunnel helper, if any, is
# finished) as soon as the job has disappeared from 'query-block-jobs'.
sub qemu_blockjobs_cancel {
    my ($vmid, $jobs) = @_;

    foreach my $job (keys %$jobs) {
        print "$job: Cancelling block job\n";
        eval { vm_mon_cmd($vmid, "block-job-cancel", device => $job); };
        $jobs->{$job}->{cancel} = 1;
    }

    while (1) {
        my $stats = vm_mon_cmd($vmid, "query-block-jobs");

        my $still_running = {};
        $still_running->{$_->{device}} = $_ for @$stats;

        foreach my $job (keys %$jobs) {
            next if !defined($jobs->{$job}->{cancel});
            next if defined($still_running->{$job});

            print "$job: Done.\n";
            eval { qemu_blockjobs_finish_tunnel($vmid, $job, $jobs->{$job}->{pid}) } ;
            delete $jobs->{$job};
        }

        last if scalar(keys %$jobs) == 0;

        sleep 1;
    }
}
6153
35e4ab04
AD
# Reap the tunnel helper process $cpid belonging to block job $job and
# remove its unix socket.
#
# Polls once per second for up to 19 rounds; signal 15 is sent in round 10
# and signal 9 in every round from 15 on. Does nothing if $cpid is not set.
sub qemu_blockjobs_finish_tunnel {
    my ($vmid, $job, $cpid) = @_;

    return if !$cpid;

    foreach my $round (1 .. 19) {
        my $reaped = waitpid($cpid, WNOHANG);
        last if (defined($reaped) && ($reaped == $cpid));

        if ($round == 10) {
            kill(15, $cpid);
        } elsif ($round >= 15) {
            kill(9, $cpid);
        }
        sleep (1);
    }

    unlink "/run/qemu-server/$vmid.mirror-$job";
}
6172
# Clone one drive of VM $vmid for VM $newvmid.
#
# Without $full a linked clone is created. With $full a new volume is
# allocated (on $storage if given, else on the source storage) and filled
# either with qemu-img (VM not running, or cloning from a snapshot) or with
# a drive-mirror block job (running VM).
#
# The new volume ID is pushed onto @$newvollist. The passed $drive hash is
# updated in place (format reset, file and size set) and returned.
sub clone_disk {
    my ($storecfg, $vmid, $running, $drivename, $drive, $snapname,
        $newvmid, $storage, $format, $full, $newvollist, $jobs, $skipcomplete, $qga) = @_;

    my $newvolid;

    if ($full) {
        my ($storeid, $volname) = PVE::Storage::parse_volume_id($drive->{file});
        $storeid = $storage if $storage;

        my $dst_format = resolve_dst_disk_format($storecfg, $storeid, $volname, $format);
        my ($size) = PVE::Storage::volume_size_info($storecfg, $drive->{file}, 3);

        print "create full clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_alloc($storecfg, $storeid, $newvmid, $dst_format, undef, ($size/1024));
        push @$newvollist, $newvolid;

        PVE::Storage::activate_volumes($storecfg, [$newvolid]);

        my $sparseinit = PVE::Storage::volume_has_feature($storecfg, 'sparseinit', $newvolid);

        if ($running && !$snapname) {
            my $kvmver = get_running_qemu_version ($vmid);
            if (!qemu_machine_feature_enabled (undef, $kvmver, 2, 7)) {
                die "drive-mirror with iothread requires qemu version 2.7 or higher\n"
                    if $drive->{iothread};
            }

            qemu_drive_mirror($vmid, $drivename, $newvolid, $newvmid, $sparseinit, $jobs, $skipcomplete, $qga);
        } else {
            qemu_img_convert($drive->{file}, $newvolid, $size, $snapname, $sparseinit);
        }
    } else {
        print "create linked clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_clone($storecfg, $drive->{file}, $newvmid, $snapname);
        push @$newvollist, $newvolid;
    }

    my ($size) = PVE::Storage::volume_size_info($storecfg, $newvolid, 3);

    # $disk refers to the same hash as $drive, so the caller's drive is modified
    my $disk = $drive;
    @$disk{qw(format file size)} = (undef, $newvolid, $size);

    return $disk;
}
6221
ff556cf2
DM
# this only works if VM is running
#
# Query the machine types via QMP and return the name of the one flagged
# 'is-current'; falls back to the one flagged 'is-default', then to 'pc'.
sub get_current_qemu_machine {
    my ($vmid) = @_;

    my $machines = vm_qmp_command($vmid, { execute => 'query-machines', arguments => {} });

    my ($current, $default);
    foreach my $entry (@$machines) {
        if ($entry->{'is-default'}) {
            $default = $entry->{name};
        }
        if ($entry->{'is-current'}) {
            $current = $entry->{name};
        }
    }

    # fallback to the default machine if current is not supported by qemu
    return $current || $default || 'pc';
}
6238
98cfd8b6
AD
# Return the version of the qemu process running VM $vmid as
# "<major>.<minor>", as reported by the QMP 'query-version' command.
sub get_running_qemu_version {
    my ($vmid) = @_;

    my $res = vm_qmp_command($vmid, { execute => 'query-version', arguments => {} });
    my $qemu = $res->{qemu};

    return join('.', $qemu->{major}, $qemu->{minor});
}
6245
23f73120
AD
# Check whether the effective qemu version is at least
# $version_major.$version_minor.
#
# The version is taken from $machine if it is a versioned pc machine type
# (pc-X.Y, pc-i440fx-X.Y or pc-q35-X.Y), otherwise from $kvmver ("X.Y...").
#
# Returns 1 if the version is high enough, 0 otherwise (also when no
# version can be determined).
sub qemu_machine_feature_enabled {
    my ($machine, $kvmver, $version_major, $version_minor) = @_;

    my ($current_major, $current_minor);

    if ($machine && $machine =~ m/^(pc(-i440fx|-q35)?-(\d+)\.(\d+))/) {
        ($current_major, $current_minor) = ($3, $4);
    } elsif (defined($kvmver) && $kvmver =~ m/^(\d+)\.(\d+)/) {
        ($current_major, $current_minor) = ($1, $2);
    }

    return 0 if !defined($current_major);

    # Compare as a (major, minor) pair: a newer major version satisfies the
    # requirement regardless of its minor number (e.g. 3.0 >= 2.4).
    return 1 if $current_major > $version_major;
    return 1 if $current_major == $version_major && $current_minor >= $version_minor;

    return 0;
}
6267
42dbd2ee
AD
# Return the machine type of VM $vmid, with ".pxe" appended if the romfile
# of the first usable network device (in hash key order) contains "pxe".
#
# $machine defaults to the machine type reported by the running VM.
sub qemu_machine_pxe {
    my ($vmid, $conf, $machine) = @_;

    $machine ||= PVE::QemuServer::get_current_qemu_machine($vmid);

    foreach my $netid (keys %$conf) {
        next unless $netid =~ m/^net(\d+)$/;
        next unless PVE::QemuServer::parse_net($conf->{$netid});

        my $romfile = PVE::QemuServer::vm_mon_cmd_nocheck(
            $vmid, 'qom-get', path => $netid, property => 'romfile');
        return $machine.".pxe" if $romfile =~ m/pxe/;

        # only the first parsable net device is checked
        last;
    }

    return $machine;
}
6284
249c4a6c
AD
# Decide whether the old (non-efi) bios/pxe rom files have to be used.
#
# Returns the list ($use_old_bios_files, $machine_type); a trailing ".pxe"
# is stripped from the returned machine type. Returns nothing if
# $machine_type is not set.
sub qemu_use_old_bios_files {
    my ($machine_type) = @_;

    return if !$machine_type;

    # an explicit ".pxe" suffix always selects the old files
    if ($machine_type =~ m/^(\S+)\.pxe$/) {
        return (1, $1);
    }

    # Note: kvm version < 2.4 use non-efi pxe files, and have problems when we
    # load new efi bios files on migration. So this hack is required to allow
    # live migration from qemu-2.2 to qemu-2.4, which is sometimes used when
    # upgrading from proxmox-ve-3.X to proxmox-ve 4.0
    my $kvmver = kvm_user_version();
    my $use_old_bios_files = !qemu_machine_feature_enabled ($machine_type, $kvmver, 2, 4);

    return ($use_old_bios_files, $machine_type);
}
6306
4543ecf0
AD
# List the PCI devices found below "$pcisysfs/devices".
#
# Returns a hash ref mapping "<bus>:<slot>" to an array ref of
# { id => ..., function => ... } entries, sorted numerically by function.
sub lspci {

    my $devices = {};

    my $collect = sub {
        my (undef, $id, $function) = @_;
        push @{$devices->{$id}}, { id => $id, function => $function};
    };
    dir_glob_foreach("$pcisysfs/devices", '[a-f0-9]{4}:([a-f0-9]{2}:[a-f0-9]{2})\.([0-9])', $collect);

    # Entries should be sorted by functions.
    foreach my $id (keys %$devices) {
        my @by_function = sort { $a->{function} <=> $b->{function} } @{$devices->{$id}};
        $devices->{$id} = \@by_function;
    }

    return $devices;
}
6325
22de899a
AD
# Return a hash ref mapping the ID of every iothread of VM $vmid to its
# "thread-id", as reported by the 'query-iothreads' monitor command.
sub vm_iothreads_list {
    my ($vmid) = @_;

    my $res = vm_mon_cmd($vmid, 'query-iothreads');

    my %thread_id_of = map { $_->{id} => $_->{"thread-id"} } @$res;

    return \%thread_id_of;
}
6338
ee034f5c
AD
# Compute the SCSI controller a drive is attached to.
#
# Returns the list ($maxdev, $controller, $controller_prefix):
#   $maxdev            - devices per controller: 7 for lsi* or unset
#                        scsihw, 1 for 'virtio-scsi-single', 256 otherwise
#   $controller        - int($drive->{index} / $maxdev)
#   $controller_prefix - "virtioscsi" for 'virtio-scsi-single',
#                        "scsihw" otherwise
sub scsihw_infos {
    my ($conf, $drive) = @_;

    my $scsihw = $conf->{scsihw};
    my $is_single = $scsihw && $scsihw eq 'virtio-scsi-single';

    my $maxdev = 256;
    if (!$scsihw || $scsihw =~ m/^lsi/) {
        $maxdev = 7;
    } elsif ($is_single) {
        $maxdev = 1;
    }

    my $controller = int($drive->{index} / $maxdev);
    my $controller_prefix = $is_single ? "virtioscsi" : "scsihw";

    return ($maxdev, $controller, $controller_prefix);
}
a1511b3c 6357
4317f69f
AD
# Append Hyper-V enlightenment CPU flags to @$cpuFlags.
#
# Nothing is added if $nokvm is set, if $winversion is below 6, or if the
# bios is 'ovmf' and $winversion is below 8. Which flags are added depends
# on the machine/qemu version (2.3 and 2.6 thresholds), on $winversion and
# on $gpu_passthrough.
sub add_hyperv_enlighments {
    my ($cpuFlags, $winversion, $machine_type, $kvmver, $nokvm, $bios, $gpu_passthrough) = @_;

    return if $nokvm;
    return if $winversion < 6;
    return if $bios && $bios eq 'ovmf' && $winversion < 8;

    if ($gpu_passthrough) {
        push @$cpuFlags, 'hv_vendor_id=proxmox';
    }

    if (qemu_machine_feature_enabled ($machine_type, $kvmver, 2, 3)) {
        push @$cpuFlags, 'hv_spinlocks=0x1fff', 'hv_vapic', 'hv_time';
    } else {
        push @$cpuFlags, 'hv_spinlocks=0xffff';
    }

    if (qemu_machine_feature_enabled ($machine_type, $kvmver, 2, 6)) {
        push @$cpuFlags, 'hv_reset', 'hv_vpindex', 'hv_runtime';
    }

    if ($winversion >= 7) {
        push @$cpuFlags, 'hv_relaxed';
    }
}
6385
# Map an 'ostype' config value to a Windows major version number.
#
# w2k, w2k3 and wxp map to 5, w2k8 and wvista to 6, "win<N>" to N.
# Anything else, including an unset ostype, yields 0.
sub windows_version {
    my ($ostype) = @_;

    return 0 if !$ostype;

    my %legacy_version = (
        w2k    => 5,
        w2k3   => 5,
        wxp    => 5,
        w2k8   => 6,
        wvista => 6,
    );

    return $legacy_version{$ostype} if exists $legacy_version{$ostype};
    return $1 if $ostype =~ m/^win(\d+)$/;

    return 0;
}
6403
44549149
EK
# Determine the image format for a new volume on storage $storeid.
#
# Uses $format if given; otherwise the format derived from $src_volname,
# or the storage default if there is no source volume name. A format the
# storage does not list as valid is replaced by the storage default.
sub resolve_dst_disk_format {
    my ($storecfg, $storeid, $src_volname, $format) = @_;
    my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($storecfg, $storeid);

    if (!$format) {
        return $defFormat if !$src_volname;

        # if no target format is specified, use the source disk format as hint
        my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
        $format = qemu_img_format($scfg, $src_volname);
    }

    # test if requested format is supported - else use default
    my $is_supported = grep { $_ eq $format } @$validFormats;

    return $is_supported ? $format : $defFormat;
}
6423
65e866e5
DM
6424# bash completion helper
6425
# Completion helper: return an array ref with the volume IDs of all backup
# files whose format is vma.gz or vma.lzo.
#
# If $cvalue starts with "<storeid>:", only that storage is listed.
sub complete_backup_archives {
    my ($cmdname, $pname, $cvalue) = @_;

    my $cfg = PVE::Storage::config();

    # stays undef if $cvalue has no "<storeid>:" prefix
    my ($storeid) = $cvalue =~ m/^([^:]+):/;

    my $data = PVE::Storage::template_list($cfg, $storeid, 'backup');

    my $res = [];
    foreach my $id (keys %$data) {
        foreach my $item (@{$data->{$id}}) {
            next unless $item->{format} =~ m/^vma\.(gz|lzo)$/;
            next unless defined($item->{volid});
            push @$res, $item->{volid};
        }
    }

    return $res;
}
6449
# Return an array ref of VM IDs taken from vmstatus().
#
# $running undefined: all IDs. Otherwise templates are left out and only
# VMs whose status matches are kept: 'running' for a true $running,
# anything else for a false one.
my $complete_vmid_full = sub {
    my ($running) = @_;

    my $idlist = vmstatus();

    my $res = [];

    foreach my $id (keys %$idlist) {
        my $d = $idlist->{$id};

        if (defined($running)) {
            next if $d->{template};

            my $is_running = $d->{status} eq 'running';
            next if $running ? !$is_running : $is_running;
        }

        push @$res, $id;
    }

    return $res;
};
6469
# Completion helper: IDs of all VMs, without any status filter.
sub complete_vmid {
    return $complete_vmid_full->();
}
6473
# Completion helper: IDs of all non-template VMs that are not running.
sub complete_vmid_stopped {
    return $complete_vmid_full->(0);
}
6477
# Completion helper: IDs of all non-template VMs that are running.
sub complete_vmid_running {
    return $complete_vmid_full->(1);
}
6481
335af808
DM
# Completion helper: return an array ref with the IDs of all storages that
# pass storage_check_enabled() and have the 'images' content type set.
sub complete_storage {

    my $cfg = PVE::Storage::config();
    my $ids = $cfg->{ids};

    my @usable = grep {
        PVE::Storage::storage_check_enabled($cfg, $_, undef, 1)
            && $ids->{$_}->{content}->{images}
    } keys %$ids;

    return \@usable;
}
6496
63a09370
AD
# Send the 'nbd-server-stop' monitor command to VM $vmid.
sub nbd_stop {
    my ($vmid) = @_;

    my $command = 'nbd-server-stop';
    vm_mon_cmd($vmid, $command);
}
6502
1e3baf05 65031;