]> git.proxmox.com Git - qemu-server.git/blame - PVE/QemuServer.pm
get_replicatable_volumes: use PVE::QemuServer::foreach_volid
[qemu-server.git] / PVE / QemuServer.pm
CommitLineData
1e3baf05
DM
1package PVE::QemuServer;
2
3use strict;
990fc5e2 4use warnings;
1e3baf05
DM
5use POSIX;
6use IO::Handle;
7use IO::Select;
8use IO::File;
9use IO::Dir;
10use IO::Socket::UNIX;
11use File::Basename;
12use File::Path;
13use File::stat;
14use Getopt::Long;
fc1ddcdc 15use Digest::SHA;
1e3baf05
DM
16use Fcntl ':flock';
17use Cwd 'abs_path';
18use IPC::Open3;
c971c4f2 19use JSON;
1e3baf05
DM
20use Fcntl;
21use PVE::SafeSyslog;
22use Storable qw(dclone);
23use PVE::Exception qw(raise raise_param_exc);
24use PVE::Storage;
4543ecf0 25use PVE::Tools qw(run_command lock_file lock_file_full file_read_firstline dir_glob_foreach);
b7ba6b79 26use PVE::JSONSchema qw(get_standard_option);
1e3baf05
DM
27use PVE::Cluster qw(cfs_register_file cfs_read_file cfs_write_file cfs_lock_file);
28use PVE::INotify;
29use PVE::ProcFSTools;
ffda963f 30use PVE::QemuConfig;
26f11676 31use PVE::QMPClient;
91bd6c90 32use PVE::RPCEnvironment;
de9768f0 33use PVE::QemuServer::PCI qw(print_pci_addr print_pcie_addr);
3f669af2 34use PVE::QemuServer::Memory;
d40e5e18 35use PVE::QemuServer::USB qw(parse_usb_device);
6b64503e 36use Time::HiRes qw(gettimeofday);
a783c78e 37use File::Copy qw(copy);
46630a5f 38use URI::Escape;
1e3baf05 39
2ddc0a5c
DC
# Paths of the OVMF firmware images below /usr/share/kvm.
my ($OVMF_CODE, $OVMF_VARS, $OVMF_IMG) = (
    '/usr/share/kvm/OVMF_CODE-pure-efi.fd',
    '/usr/share/kvm/OVMF_VARS-pure-efi.fd',
    '/usr/share/kvm/OVMF-pure-efi.fd',
);

# Set of storage types, keyed by type name.
# NOTE(review): presumably the storages whose snapshots are handled by qemu
# itself - confirm against the users of this table.
my $qemu_snap_storage = { map { ($_ => 1) } qw(rbd sheepdog) };

# Result of PVE::ProcFSTools::read_cpuinfo(), fetched once at module load.
my $cpuinfo = PVE::ProcFSTools::read_cpuinfo();
1e3baf05 47
# Note about locking: we use flock on the config file to protect
# against concurrent actions.
# Additionally, we have a 'lock' setting in the config file. This
# can be set to 'migrate', 'backup', 'snapshot' or 'rollback'. Most actions are not
# allowed when such a lock is set. But you can ignore this kind of
# lock with the --skiplock flag.
54
# Register the VM config parser and writer for files below '/qemu-server/'.
cfs_register_file(
    '/qemu-server/',
    \&parse_vm_config,
    \&write_vm_config,
);

# Location used by commands that save or restore VM state.
PVE::JSONSchema::register_standard_option(
    'pve-qm-stateuri',
    {
        type        => 'string',
        description => "Some command save/restore state from this location.",
        maxLength   => 128,
        optional    => 1,
    },
);

# Snapshot names are config IDs of at most 40 characters.
PVE::JSONSchema::register_standard_option(
    'pve-snapshot-name',
    {
        type        => 'string',
        format      => 'pve-configid',
        description => "The name of the snapshot.",
        maxLength   => 40,
    },
);

# Image formats accepted for a drive's backing file.
PVE::JSONSchema::register_standard_option(
    'pve-qm-image-format',
    {
        type        => 'string',
        enum        => [qw(raw cow qcow qed qcow2 vmdk cloop)],
        description => "The drive's backing file's data format.",
        optional    => 1,
    },
);
78
1e3baf05
DM
79#no warnings 'redefine';
80
c8effec3
AD
# Write $value to the cgroup attribute $option of a VM.
#
# The target file is
#   /sys/fs/cgroup/$controller/qemu.slice/$vmid.scope/$option
# and the actual write is delegated to PVE::ProcFSTools::write_proc_entry(),
# whose result is passed back to the caller.
sub cgroups_write {
    my ($controller, $vmid, $option, $value) = @_;

    return PVE::ProcFSTools::write_proc_entry(
        "/sys/fs/cgroup/$controller/qemu.slice/$vmid.scope/$option",
        $value,
    );
}
88
1e3baf05
DM
my $nodename = PVE::INotify::nodename();

# Per-node config directory plus runtime and lock directories.
my $confdir        = "/etc/pve/nodes/$nodename/qemu-server";
my $var_run_tmpdir = "/var/run/qemu-server";
my $lock_dir       = "/var/lock/qemu-server";

# Create the directories at load time. The result of mkdir is deliberately
# not checked, so an already existing directory is not an error.
mkdir $_ for ("/etc/pve/nodes/$nodename", $confdir, $var_run_tmpdir, $lock_dir);

my $pcisysfs = "/sys/bus/pci";
102
8930da74
DM
# Maps each known CPU model name to a vendor string. The value 'default'
# marks the generic models.
my $cpu_vendor_list = {
    # Intel CPUs
    (map { ($_ => 'GenuineIntel') } qw(
        486 pentium pentium2 pentium3 coreduo core2duo
        Conroe Penryn Nehalem Westmere SandyBridge IvyBridge
        Haswell Haswell-noTSX Broadwell Broadwell-noTSX Skylake-Client
    )),

    # AMD CPUs
    (map { ($_ => 'AuthenticAMD') } qw(
        athlon phenom Opteron_G1 Opteron_G2 Opteron_G3 Opteron_G4 Opteron_G5
    )),

    # generic types, use vendor from host node
    (map { ($_ => 'default') } qw(host kvm32 kvm64 qemu32 qemu64)),
};
139
# Property-string format of the 'cpu' option.
my $cpu_fmt = {
    cputype => {
        type        => 'string',
        description => "Emulated CPU type.",
        # every known model, ordered case-insensitively
        enum        => [ sort { lc($a) cmp lc($b) } keys %$cpu_vendor_list ],
        default     => 'kvm64',
        default_key => 1,
    },
    hidden => {
        type        => 'boolean',
        description => "Do not identify as a KVM virtual machine.",
        optional    => 1,
        default     => 0,
    },
};
155
ec3582b5
WB
# Property-string format of the 'watchdog' option, registered by name as
# 'pve-qm-watchdog'.
my $watchdog_fmt = {
    model => {
        type        => 'string',
        enum        => [qw(i6300esb ib700)],
        description => "Watchdog type to emulate.",
        default     => 'i6300esb',
        default_key => 1,
        optional    => 1,
    },
    action => {
        type        => 'string',
        enum        => [qw(reset shutdown poweroff pause debug none)],
        description => "The action to perform if after activation the guest fails to poll the watchdog in time.",
        optional    => 1,
    },
};

PVE::JSONSchema::register_format('pve-qm-watchdog', $watchdog_fmt);
173
1e3baf05
DM
# Schema of the plain (non-indexed) VM configuration options. Each key is an
# option name and each value its JSON-schema style definition. Indexed
# options such as netN and numaN are added to this hash further down.
my $confdesc = {
    onboot => {
        optional => 1,
        type => 'boolean',
        description => "Specifies whether a VM will be started during system bootup.",
        default => 0,
    },
    autostart => {
        optional => 1,
        type => 'boolean',
        description => "Automatic restart after crash (currently ignored).",
        default => 0,
    },
    hotplug => {
        optional => 1,
        type => 'string', format => 'pve-hotplug-features',
        description => "Selectively enable hotplug features. This is a comma separated list of hotplug features: 'network', 'disk', 'cpu', 'memory' and 'usb'. Use '0' to disable hotplug completely. Value '1' is an alias for the default 'network,disk,usb'.",
        default => 'network,disk,usb',
    },
    reboot => {
        optional => 1,
        type => 'boolean',
        description => "Allow reboot. If set to '0' the VM exit on reboot.",
        default => 1,
    },
    lock => {
        optional => 1,
        type => 'string',
        description => "Lock/unlock the VM.",
        enum => [qw(migrate backup snapshot rollback)],
    },
    cpulimit => {
        optional => 1,
        type => 'number',
        description => "Limit of CPU usage.",
        verbose_description => "Limit of CPU usage.\n\nNOTE: If the computer has 2 CPUs, it has total of '2' CPU time. Value '0' indicates no CPU limit.",
        minimum => 0,
        maximum => 128,
        default => 0,
    },
    cpuunits => {
        optional => 1,
        type => 'integer',
        description => "CPU weight for a VM.",
        verbose_description => "CPU weight for a VM. Argument is used in the kernel fair scheduler. The larger the number is, the more CPU time this VM gets. Number is relative to weights of all the other running VMs.\n\nNOTE: You can disable fair-scheduler configuration by setting this to 0.",
        minimum => 0,
        maximum => 500000,
        default => 1024,
    },
    memory => {
        optional => 1,
        type => 'integer',
        description => "Amount of RAM for the VM in MB. This is the maximum available memory when you use the balloon device.",
        minimum => 16,
        default => 512,
    },
    balloon => {
        optional => 1,
        type => 'integer',
        description => "Amount of target RAM for the VM in MB. Using zero disables the balloon driver.",
        minimum => 0,
    },
    shares => {
        optional => 1,
        type => 'integer',
        description => "Amount of memory shares for auto-ballooning. The larger the number is, the more memory this VM gets. Number is relative to weights of all other running VMs. Using zero disables auto-ballooning",
        minimum => 0,
        maximum => 50000,
        default => 1000,
    },
    keyboard => {
        optional => 1,
        type => 'string',
        description => "Keyboard layout for vnc server. Default is read from the '/etc/pve/datacenter.conf' configuration file.",
        enum => PVE::Tools::kvmkeymaplist(),
        default => 'en-us',
    },
    name => {
        optional => 1,
        type => 'string', format => 'dns-name',
        description => "Set a name for the VM. Only used on the configuration web interface.",
    },
    scsihw => {
        optional => 1,
        type => 'string',
        description => "SCSI controller model",
        enum => [qw(lsi lsi53c810 virtio-scsi-pci virtio-scsi-single megasas pvscsi)],
        default => 'lsi',
    },
    description => {
        optional => 1,
        type => 'string',
        description => "Description for the VM. Only used on the configuration web interface. This is saved as comment inside the configuration file.",
    },
    ostype => {
        optional => 1,
        type => 'string',
        enum => [qw(other wxp w2k w2k3 w2k8 wvista win7 win8 win10 l24 l26 solaris)],
        description => "Specify guest operating system.",
        # keep this list in sync with the enum above
        verbose_description => <<EODESC,
Specify guest operating system. This is used to enable special
optimization/features for specific operating systems:

[horizontal]
other;; unspecified OS
wxp;; Microsoft Windows XP
w2k;; Microsoft Windows 2000
w2k3;; Microsoft Windows 2003
w2k8;; Microsoft Windows 2008
wvista;; Microsoft Windows Vista
win7;; Microsoft Windows 7
win8;; Microsoft Windows 8/2012
win10;; Microsoft Windows 10/2016
l24;; Linux 2.4 Kernel
l26;; Linux 2.6/3.X Kernel
solaris;; Solaris/OpenSolaris/OpenIndiana kernel
EODESC
    },
    boot => {
        optional => 1,
        type => 'string',
        description => "Boot on floppy (a), hard disk (c), CD-ROM (d), or network (n).",
        pattern => '[acdn]{1,4}',
        default => 'cdn',
    },
    bootdisk => {
        optional => 1,
        type => 'string', format => 'pve-qm-bootdisk',
        description => "Enable booting from specified disk.",
        pattern => '(ide|sata|scsi|virtio)\d+',
    },
    smp => {
        optional => 1,
        type => 'integer',
        description => "The number of CPUs. Please use option -sockets instead.",
        minimum => 1,
        default => 1,
    },
    sockets => {
        optional => 1,
        type => 'integer',
        description => "The number of CPU sockets.",
        minimum => 1,
        default => 1,
    },
    cores => {
        optional => 1,
        type => 'integer',
        description => "The number of cores per socket.",
        minimum => 1,
        default => 1,
    },
    numa => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable NUMA.",
        default => 0,
    },
    hugepages => {
        optional => 1,
        type => 'string',
        description => "Enable/disable hugepages memory.",
        enum => [qw(any 2 1024)],
    },
    vcpus => {
        optional => 1,
        type => 'integer',
        description => "Number of hotplugged vcpus.",
        minimum => 1,
        # NOTE(review): the default lies below 'minimum'; presumably 0 means
        # "not set" - confirm before changing either value.
        default => 0,
    },
    acpi => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable ACPI.",
        default => 1,
    },
    agent => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable Qemu GuestAgent.",
        default => 0,
    },
    kvm => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable KVM hardware virtualization.",
        default => 1,
    },
    tdf => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable time drift fix.",
        default => 0,
    },
    localtime => {
        optional => 1,
        type => 'boolean',
        description => "Set the real time clock to local time. This is enabled by default if ostype indicates a Microsoft OS.",
    },
    freeze => {
        optional => 1,
        type => 'boolean',
        description => "Freeze CPU at startup (use 'c' monitor command to start execution).",
    },
    vga => {
        optional => 1,
        type => 'string',
        description => "Select the VGA type.",
        verbose_description => "Select the VGA type. If you want to use high resolution" .
            " modes (>= 1280x1024x16) then you should use the options " .
            "'std' or 'vmware'. Default is 'std' for win8/win7/w2k8, and " .
            "'cirrus' for other OS types. The 'qxl' option enables the SPICE " .
            "display server. For win* OS you can select how many independent " .
            "displays you want, Linux guests can add displays themselves. " .
            "You can also run without any graphic card, using a serial device" .
            " as terminal.",
        enum => [qw(std cirrus vmware qxl serial0 serial1 serial2 serial3 qxl2 qxl3 qxl4)],
    },
    watchdog => {
        optional => 1,
        type => 'string', format => 'pve-qm-watchdog',
        description => "Create a virtual hardware watchdog device.",
        verbose_description => "Create a virtual hardware watchdog device. Once enabled" .
            " (by a guest action), the watchdog must be periodically polled " .
            "by an agent inside the guest or else the watchdog will reset " .
            "the guest (or execute the respective action specified)",
    },
    startdate => {
        optional => 1,
        type => 'string',
        typetext => "(now | YYYY-MM-DD | YYYY-MM-DDTHH:MM:SS)",
        description => "Set the initial date of the real time clock. Valid format for date are: 'now' or '2006-06-17T16:01:21' or '2006-06-17'.",
        pattern => '(now|\d{4}-\d{1,2}-\d{1,2}(T\d{1,2}:\d{1,2}:\d{1,2})?)',
        default => 'now',
    },
    startup => get_standard_option('pve-startup-order'),
    template => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable Template.",
        default => 0,
    },
    args => {
        optional => 1,
        type => 'string',
        description => "Arbitrary arguments passed to kvm.",
        verbose_description => <<EODESCR,
Arbitrary arguments passed to kvm, for example:

args: -no-reboot -no-hpet

NOTE: this option is for experts only.
EODESCR
    },
    tablet => {
        optional => 1,
        type => 'boolean',
        default => 1,
        description => "Enable/disable the USB tablet device.",
        verbose_description => "Enable/disable the USB tablet device. This device is " .
            "usually needed to allow absolute mouse positioning with VNC. " .
            "Else the mouse runs out of sync with normal VNC clients. " .
            "If you're running lots of console-only guests on one host, " .
            "you may consider disabling this to save some context switches. " .
            "This is turned off by default if you use spice (-vga=qxl).",
    },
    migrate_speed => {
        optional => 1,
        type => 'integer',
        description => "Set maximum speed (in MB/s) for migrations. Value 0 is no limit.",
        minimum => 0,
        default => 0,
    },
    migrate_downtime => {
        optional => 1,
        type => 'number',
        description => "Set maximum tolerated downtime (in seconds) for migrations.",
        minimum => 0,
        default => 0.1,
    },
    cdrom => {
        optional => 1,
        type => 'string', format => 'pve-qm-ide',
        typetext => '<volume>',
        description => "This is an alias for option -ide2",
    },
    cpu => {
        optional => 1,
        description => "Emulated CPU type.",
        type => 'string',
        format => $cpu_fmt,
    },
    parent => get_standard_option('pve-snapshot-name', {
        optional => 1,
        description => "Parent snapshot name. This is used internally, and should not be modified.",
    }),
    snaptime => {
        optional => 1,
        description => "Timestamp for snapshots.",
        type => 'integer',
        minimum => 0,
    },
    vmstate => {
        optional => 1,
        type => 'string', format => 'pve-volume-id',
        description => "Reference to a volume which stores the VM state. This is used internally for snapshots.",
    },
    machine => {
        description => "Specify the Qemu machine type.",
        type => 'string',
        pattern => '(pc|pc(-i440fx)?-\d+\.\d+(\.pxe)?|q35|pc-q35-\d+\.\d+(\.pxe)?)',
        maxLength => 40,
        optional => 1,
    },
    smbios1 => {
        description => "Specify SMBIOS type 1 fields.",
        type => 'string', format => 'pve-qm-smbios1',
        maxLength => 256,
        optional => 1,
    },
    protection => {
        optional => 1,
        type => 'boolean',
        description => "Sets the protection flag of the VM. This will disable the remove VM and remove disk operations.",
        default => 0,
    },
    bios => {
        optional => 1,
        type => 'string',
        enum => [ qw(seabios ovmf) ],
        description => "Select BIOS implementation.",
        default => 'seabios',
    },
};
508
509# what about other qemu settings ?
510#cpu => 'string',
511#machine => 'string',
512#fda => 'file',
513#fdb => 'file',
514#mtdblock => 'file',
515#sd => 'file',
516#pflash => 'file',
517#snapshot => 'bool',
518#bootp => 'file',
519##tftp => 'dir',
520##smb => 'dir',
521#kernel => 'file',
522#append => 'string',
523#initrd => 'file',
524##soundhw => 'string',
525
# Publish every option defined so far as standard option "pve-qm-<name>".
for my $opt (keys %$confdesc) {
    PVE::JSONSchema::register_standard_option("pve-qm-$opt", $confdesc->{$opt});
}
529
# Number of slots per indexed option family; valid indices run from 0 to
# limit - 1 (see the loops and descriptions that use these values).

# drives
my $MAX_IDE_DISKS    = 4;
my $MAX_SCSI_DISKS   = 14;
my $MAX_VIRTIO_DISKS = 16;
my $MAX_SATA_DISKS   = 6;
my $MAX_UNUSED_DISKS = 8;

# other devices
my $MAX_USB_DEVICES     = 5;
my $MAX_NETS            = 32;
my $MAX_HOSTPCI_DEVICES = 4;
my $MAX_SERIAL_PORTS    = 4;
my $MAX_PARALLEL_PORTS  = 3;
my $MAX_NUMA            = 8;
541
ffc0d8c7
WB
# Property-string format of a single numaN entry.
my $numa_fmt = {
    cpus => {
        type               => "string",
        pattern            => qr/\d+(?:-\d+)?(?:;\d+(?:-\d+)?)*/,
        description        => "CPUs accessing this NUMA node.",
        format_description => "id[-id];...",
    },
    memory => {
        type        => "number",
        description => "Amount of memory this NUMA node provides.",
        optional    => 1,
    },
    hostnodes => {
        type               => "string",
        pattern            => qr/\d+(?:-\d+)?(?:;\d+(?:-\d+)?)*/,
        description        => "Host NUMA nodes to use.",
        format_description => "id[-id];...",
        optional           => 1,
    },
    policy => {
        type        => 'string',
        enum        => [qw(preferred bind interleave)],
        description => "NUMA allocation policy.",
        optional    => 1,
    },
};
PVE::JSONSchema::register_format('pve-qm-numanode', $numa_fmt);

# Option definition shared by all numaN keys.
my $numadesc = {
    optional    => 1,
    type        => 'string',
    format      => $numa_fmt,
    description => "NUMA topology.",
};
PVE::JSONSchema::register_standard_option("pve-qm-numanode", $numadesc);

# numa0 .. numa<$MAX_NUMA - 1> all point at the same definition
$confdesc->{"numa$_"} = $numadesc for 0 .. $MAX_NUMA - 1;
1e3baf05
DM
579
# Network card models accepted by the netN options.
my $nic_model_list = [qw(
    rtl8139 ne2k_pci e1000 pcnet virtio
    ne2k_isa i82551 i82557b i82559er vmxnet3
    e1000-82540em e1000-82544gc e1000-82545em
)];

# The same models as one space separated, sorted string.
my $nic_model_list_txt = join(' ', sort @$nic_model_list);
1e3baf05 584
52261945
DM
# Description of the 'bridge' property of a network device. It is kept in a
# here-document because the address table has to be emitted line by line.
my $net_fmt_bridge_descr = <<__EOD__;
Bridge to attach the network device to. The Proxmox VE standard bridge
is called 'vmbr0'.

If you do not specify a bridge, we create a kvm user (NATed) network
device, which provides DHCP and DNS services. The following addresses
are used:

 10.0.2.2 Gateway
 10.0.2.3 DNS Server
 10.0.2.4 SMB Server

The DHCP server assigns addresses to the guest starting from 10.0.2.15.
__EOD__
599
cd9c34d1
WB
# Property-string format of a netN entry.
my $net_fmt = {
    macaddr => {
        type => 'string',
        pattern => qr/[0-9a-f]{2}(?::[0-9a-f]{2}){5}/i,
        description => "MAC address. That address must be unique within your network. This is automatically generated if not specified.",
        format_description => "XX:XX:XX:XX:XX:XX",
        optional => 1,
    },
    model => {
        type => 'string',
        description => "Network Card Model. The 'virtio' model provides the best performance with very low CPU overhead. If your guest does not support this driver, it is usually best to use 'e1000'.",
        enum => $nic_model_list,
        default_key => 1,
    },
    # Every model name is also accepted as a key that aliases 'model', with
    # its value aliased to 'macaddr'. The inner parentheses make sure Perl
    # parses the braces as a block and not as an anonymous hash.
    (map { ($_ => { keyAlias => 'model', alias => 'macaddr' }) } @$nic_model_list),
    bridge => {
        type => 'string',
        description => $net_fmt_bridge_descr,
        format_description => 'bridge',
        optional => 1,
    },
    queues => {
        type => 'integer',
        minimum => 0, maximum => 16,
        description => 'Number of packet queues to be used on the device.',
        optional => 1,
    },
    rate => {
        type => 'number',
        minimum => 0,
        description => "Rate limit in mbps (megabytes per second) as floating point number.",
        optional => 1,
    },
    tag => {
        type => 'integer',
        minimum => 1, maximum => 4094,
        description => 'VLAN tag to apply to packets on this interface.',
        optional => 1,
    },
    trunks => {
        type => 'string',
        pattern => qr/\d+(?:-\d+)?(?:;\d+(?:-\d+)?)*/,
        description => 'VLAN trunks to pass through this interface.',
        format_description => 'vlanid[;vlanid...]',
        optional => 1,
    },
    firewall => {
        type => 'boolean',
        description => 'Whether this interface should be protected by the firewall.',
        optional => 1,
    },
    link_down => {
        type => 'boolean',
        description => 'Whether this interface should be disconnected (like pulling the plug).',
        optional => 1,
    },
};
52261945 657
1e3baf05
DM
# Option definition shared by all netN keys.
my $netdesc = {
    optional    => 1,
    type        => 'string',
    format      => $net_fmt,
    description => "Specify network devices.",
};

PVE::JSONSchema::register_standard_option("pve-qm-net", $netdesc);

# net0 .. net<$MAX_NETS - 1> all point at the same definition
$confdesc->{"net$_"} = $netdesc for 0 .. $MAX_NETS - 1;

# Format checker for values that are either a volume ID or a path.
PVE::JSONSchema::register_format(
    'pve-volume-id-or-qm-path',
    \&verify_volume_id_or_qm_path,
);
# Format checker for 'pve-volume-id-or-qm-path'.
#
# Accepts the literal values 'none' and 'cdrom' and anything starting with
# '/' unchanged. Every other value is handed to the 'pve-volume-id' format
# check.
#
# Parameters:
#   $volid - value to check
#   $noerr - if true, return undef on a failed check instead of dying
#
# Returns the value as returned by the check, or $volid itself for the
# special values and paths.
sub verify_volume_id_or_qm_path {
    my ($volid, $noerr) = @_;

    # special keywords and absolute paths need no further validation
    return $volid
        if $volid eq 'none' || $volid eq 'cdrom' || $volid =~ m{^/};

    # everything else has to be a valid volume ID
    my $checked = eval { PVE::JSONSchema::check_format('pve-volume-id', $volid, '') };
    if (my $err = $@) {
        die $err if !$noerr;
        return undef;
    }

    return $checked;
}
686
my $drivename_hash;

# Properties common to all drive types (ide, scsi, sata, virtio). The
# throttling properties are added to this hash further down.
my %drivedesc_base = (
    volume => { alias => 'file' },
    file => {
        type => 'string',
        format => 'pve-volume-id-or-qm-path',
        default_key => 1,
        format_description => 'volume',
        description => "The drive's backing volume.",
    },
    media => {
        type => 'string',
        enum => [qw(cdrom disk)],
        description => "The drive's media type.",
        default => 'disk',
        optional => 1
    },
    cyls => {
        type => 'integer',
        description => "Force the drive's physical geometry to have a specific cylinder count.",
        optional => 1
    },
    heads => {
        type => 'integer',
        description => "Force the drive's physical geometry to have a specific head count.",
        optional => 1
    },
    secs => {
        type => 'integer',
        description => "Force the drive's physical geometry to have a specific sector count.",
        optional => 1
    },
    trans => {
        type => 'string',
        enum => [qw(none lba auto)],
        description => "Force disk geometry bios translation mode.",
        optional => 1,
    },
    snapshot => {
        type => 'boolean',
        description => "Whether the drive should be included when making snapshots.",
        optional => 1,
    },
    cache => {
        type => 'string',
        enum => [qw(none writethrough writeback unsafe directsync)],
        description => "The drive's cache mode",
        optional => 1,
    },
    format => get_standard_option('pve-qm-image-format'),
    size => {
        type => 'string',
        format => 'disk-size',
        format_description => 'DiskSize',
        description => "Disk size. This is purely informational and has no effect.",
        optional => 1,
    },
    backup => {
        type => 'boolean',
        description => "Whether the drive should be included when making backups.",
        optional => 1,
    },
    replicate => {
        type => 'boolean',
        description => 'Whether the drive should be considered for replication jobs.',
        optional => 1,
        default => 1,
    },
    rerror => {
        type => 'string',
        enum => [qw(ignore report stop)],
        description => 'Read error action.',
        optional => 1,
    },
    werror => {
        type => 'string',
        enum => [qw(enospc ignore report stop)],
        description => 'Write error action.',
        optional => 1,
    },
    aio => {
        type => 'string',
        enum => [qw(native threads)],
        description => 'AIO type to use.',
        optional => 1,
    },
    discard => {
        type => 'string',
        enum => [qw(ignore on)],
        description => 'Controls whether to pass discard/trim requests to the underlying storage.',
        optional => 1,
    },
    detect_zeroes => {
        type => 'boolean',
        description => 'Controls whether to detect and try to optimize writes of zeroes.',
        optional => 1,
    },
    serial => {
        type => 'string',
        format => 'urlencoded',
        format_description => 'serial',
        maxLength => 20*3, # *3 since it's %xx url encoded
        description => "The drive's reported serial number, url-encoded, up to 20 bytes long.",
        optional => 1,
    }
);
794
0541eeb8
WB
# Optional property groups that get mixed into the per-bus drive formats.

# dedicated iothread for the drive
my %iothread_fmt = (
    iothread => {
        type        => 'boolean',
        description => "Whether to use iothreads for this drive",
        optional    => 1,
    },
);

# model name reported by the drive
my %model_fmt = (
    model => {
        type               => 'string',
        format             => 'urlencoded',
        format_description => 'model',
        # each of the 40 bytes may need three characters (%xx) when encoded
        maxLength          => 40*3,
        description        => "The drive's reported model name, url-encoded, up to 40 bytes long.",
        optional           => 1,
    },
);

# number of queues
my %queues_fmt = (
    queues => {
        type        => 'integer',
        description => "Number of queues.",
        minimum     => 2,
        optional    => 1,
    },
);

# full passthrough via scsi-block
my %scsiblock_fmt = (
    scsiblock => {
        type        => 'boolean',
        description => "whether to use scsi-block for full passthrough of host block device\n\nWARNING: can lead to I/O errors in combination with low memory or high memory fragmentation on host",
        optional    => 1,
        default     => 0,
    },
);
829
# Add one throttling property to %drivedesc_base.
#
# Parameters:
#   $key      - property name
#   $type     - schema type of the value
#   $what     - what is limited; inserted into the description
#   $unit     - short unit, used as format description
#   $longunit - spelled-out unit; inserted into the description
#   $minimum  - optional lower bound; only set when defined
my $add_throttle_desc = sub {
    my ($key, $type, $what, $unit, $longunit, $minimum) = @_;

    my %desc = (
        type               => $type,
        format_description => $unit,
        description        => "Maximum $what in $longunit.",
        optional           => 1,
    );
    $desc{minimum} = $minimum if defined($minimum);

    $drivedesc_base{$key} = \%desc;
};
# Throttling properties, registered in table order. Each row holds the
# arguments of $add_throttle_desc: key, type, what, unit, long unit and an
# optional minimum.
for my $spec (
    # throughput: (leaky bucket)
    ['bps', 'integer', 'r/w speed', 'bps', 'bytes per second'],
    ['bps_rd', 'integer', 'read speed', 'bps', 'bytes per second'],
    ['bps_wr', 'integer', 'write speed', 'bps', 'bytes per second'],
    ['mbps', 'number', 'r/w speed', 'mbps', 'megabytes per second'],
    ['mbps_rd', 'number', 'read speed', 'mbps', 'megabytes per second'],
    ['mbps_wr', 'number', 'write speed', 'mbps', 'megabytes per second'],
    ['iops', 'integer', 'r/w I/O', 'iops', 'operations per second'],
    ['iops_rd', 'integer', 'read I/O', 'iops', 'operations per second'],
    ['iops_wr', 'integer', 'write I/O', 'iops', 'operations per second'],

    # pools: (pool of IO before throttling starts taking effect)
    ['mbps_max', 'number', 'unthrottled r/w pool', 'mbps', 'megabytes per second'],
    ['mbps_rd_max', 'number', 'unthrottled read pool', 'mbps', 'megabytes per second'],
    ['mbps_wr_max', 'number', 'unthrottled write pool', 'mbps', 'megabytes per second'],
    ['iops_max', 'integer', 'unthrottled r/w I/O pool', 'iops', 'operations per second'],
    ['iops_rd_max', 'integer', 'unthrottled read I/O pool', 'iops', 'operations per second'],
    ['iops_wr_max', 'integer', 'unthrottled write I/O pool', 'iops', 'operations per second'],

    # burst lengths
    ['bps_max_length', 'integer', 'length of I/O bursts', 'seconds', 'seconds', 1],
    ['bps_rd_max_length', 'integer', 'length of read I/O bursts', 'seconds', 'seconds', 1],
    ['bps_wr_max_length', 'integer', 'length of write I/O bursts', 'seconds', 'seconds', 1],
    ['iops_max_length', 'integer', 'length of I/O bursts', 'seconds', 'seconds', 1],
    ['iops_rd_max_length', 'integer', 'length of read I/O bursts', 'seconds', 'seconds', 1],
    ['iops_wr_max_length', 'integer', 'length of write I/O bursts', 'seconds', 'seconds', 1],
) {
    $add_throttle_desc->(@$spec);
}

# legacy support: old '<x>_length' keys alias the '<x>_max_length' ones
for my $prefix (qw(bps_rd bps_wr iops_rd iops_wr)) {
    $drivedesc_base{"${prefix}_length"} = { alias => "${prefix}_max_length" };
}
0541eeb8
WB
873
# Per-bus drive formats: the common drive properties plus the extras each
# bus type accepts, followed by the matching option definition.

# IDE: common properties + model
my $ide_fmt = { %drivedesc_base, %model_fmt };
PVE::JSONSchema::register_format("pve-qm-ide", $ide_fmt);

my $idedesc = {
    optional    => 1,
    type        => 'string',
    format      => $ide_fmt,
    description => "Use volume as IDE hard disk or CD-ROM (n is 0 to " .($MAX_IDE_DISKS -1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-ide", $idedesc);

# SCSI: common properties + iothread, queues, scsiblock
my $scsi_fmt = { %drivedesc_base, %iothread_fmt, %queues_fmt, %scsiblock_fmt };

my $scsidesc = {
    optional    => 1,
    type        => 'string',
    format      => $scsi_fmt,
    description => "Use volume as SCSI hard disk or CD-ROM (n is 0 to " . ($MAX_SCSI_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-scsi", $scsidesc);

# SATA: common properties only
my $sata_fmt = { %drivedesc_base };

my $satadesc = {
    optional    => 1,
    type        => 'string',
    format      => $sata_fmt,
    description => "Use volume as SATA hard disk or CD-ROM (n is 0 to " . ($MAX_SATA_DISKS - 1). ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-sata", $satadesc);

# VirtIO: common properties + iothread
my $virtio_fmt = { %drivedesc_base, %iothread_fmt };

my $virtiodesc = {
    optional    => 1,
    type        => 'string',
    format      => $virtio_fmt,
    description => "Use volume as VIRTIO hard disk (n is 0 to " . ($MAX_VIRTIO_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-virtio", $virtiodesc);

# Union of the properties of all drive types.
my $alldrive_fmt = {
    %drivedesc_base,
    %iothread_fmt,
    %model_fmt,
    %queues_fmt,
    %scsiblock_fmt,
};
928
6470743f
DC
# Property-string format of the 'efidisk0' option: a backing volume
# (default key 'file', with 'volume' as alias), an image format and an
# informational size.
my $efidisk_fmt = {
    file => {
        type => 'string',
        format => 'pve-volume-id-or-qm-path',
        default_key => 1,
        format_description => 'volume',
        description => "The drive's backing volume.",
    },
    volume => { alias => 'file' },
    format => get_standard_option('pve-qm-image-format'),
    size => {
        type => 'string',
        format => 'disk-size',
        format_description => 'DiskSize',
        description => "Disk size. This is purely informational and has no effect.",
        optional => 1,
    },
};

my $efidisk_desc = {
    optional => 1,
    type => 'string',
    format => $efidisk_fmt,
    description => "Configure a Disk for storing EFI vars",
};

PVE::JSONSchema::register_standard_option("pve-qm-efidisk", $efidisk_desc);
955
# Property-string format of the 'usbN' options: the host device (or the
# literal 'spice') as default key, plus an optional 'usb3' flag.
my $usb_fmt = {
    host => {
        default_key => 1,
        type => 'string', format => 'pve-qm-usb-device',
        format_description => 'HOSTUSBDEVICE|spice',
        description => <<EODESCR,
The Host USB device or port or the value 'spice'. HOSTUSBDEVICE syntax is:

 'bus-port(.port)*' (decimal numbers) or
 'vendor_id:product_id' (hexadecimal numbers) or
 'spice'

You can use the 'lsusb -t' command to list existing usb devices.

NOTE: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

The value 'spice' can be used to add a usb redirection device for spice.
EODESCR
    },
    usb3 => {
        optional => 1,
        type => 'boolean',
        description => "Specifies whether the given host option is a USB3 device or port (this does currently not work reliably with spice redirection and is then ignored).",
        default => 0,
    },
};

my $usbdesc = {
    optional => 1,
    type => 'string', format => $usb_fmt,
    description => "Configure a USB device (n is 0 to 4).",
};
PVE::JSONSchema::register_standard_option("pve-qm-usb", $usbdesc);
989
1f4f447b
WB
# NOTE: the match-groups of this regex are used in parse_hostpci
# ($1 = 'bus:dev', $2 = optional function digit)
my $PCIRE = qr/([a-f0-9]{2}:[a-f0-9]{2})(?:\.([a-f0-9]))?/;

# Property-string format of the 'hostpciN' options.
my $hostpci_fmt = {
    host => {
        default_key => 1,
        type => 'string',
        pattern => qr/$PCIRE(;$PCIRE)*/,
        format_description => 'HOSTPCIID[;HOSTPCIID2...]',
        description => <<EODESCR,
Host PCI device pass through. The PCI ID of a host's PCI device or a list
of PCI virtual functions of the host. HOSTPCIID syntax is:

'bus:dev.func' (hexadecimal numbers)

You can use the 'lspci' command to list existing PCI devices.
EODESCR
    },
    rombar => {
        type => 'boolean',
        description => "Specify whether or not the device's ROM will be visible in the guest's memory map.",
        optional => 1,
        default => 1,
    },
    romfile => {
        type => 'string',
        pattern => '[^,;]+',
        format_description => 'string',
        description => "Custom pci device rom filename (must be located in /usr/share/kvm/).",
        optional => 1,
    },
    pcie => {
        type => 'boolean',
        description => "Choose the PCI-express bus (needs the 'q35' machine model).",
        optional => 1,
        default => 0,
    },
    'x-vga' => {
        type => 'boolean',
        description => "Enable vfio-vga device support.",
        optional => 1,
        default => 0,
    },
};
PVE::JSONSchema::register_format('pve-qm-hostpci', $hostpci_fmt);

my $hostpcidesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-hostpci',
    description => "Map host PCI devices into guest.",
    verbose_description => <<EODESCR,
Map host PCI devices into guest.

NOTE: This option allows direct access to host hardware. So it is no longer
possible to migrate such machines - use with special care.

CAUTION: Experimental! User reported problems with this option.
EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-hostpci", $hostpcidesc);
1049
bae179aa
DA
# Descriptor shared by all 'serialN' options.
my $serialdesc = {
    optional => 1,
    type => 'string',
    pattern => '(/dev/.+|socket)',
    description => "Create a serial device inside the VM (n is 0 to 3)",
    verbose_description => <<EODESCR,
Create a serial device inside the VM (n is 0 to 3), and pass through a
host serial device (i.e. /dev/ttyS0), or create a unix socket on the
host side (use 'qm terminal' to open a terminal connection).

NOTE: If you pass through a host serial device, it is no longer possible to migrate such machines - use with special care.

CAUTION: Experimental! User reported problems with this option.
EODESCR
};

# Descriptor shared by all 'parallelN' options.
my $paralleldesc= {
    optional => 1,
    type => 'string',
    pattern => '/dev/parport\d+|/dev/usb/lp\d+',
    description => "Map host parallel devices (n is 0 to 2).",
    verbose_description => <<EODESCR,
Map host parallel devices (n is 0 to 2).

NOTE: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

CAUTION: Experimental! User reported problems with this option.
EODESCR
};

# Register the numbered pass-through options (<prefix>0 .. <prefix>N-1);
# every slot of a kind shares the same descriptor hash.
for my $slot_kind (
    [ parallel => $MAX_PARALLEL_PORTS,  $paralleldesc ],
    [ serial   => $MAX_SERIAL_PORTS,    $serialdesc ],
    [ hostpci  => $MAX_HOSTPCI_DEVICES, $hostpcidesc ],
) {
    my ($prefix, $count, $desc) = @$slot_kind;
    $confdesc->{"$prefix$_"} = $desc for (0 .. $count - 1);
}

# Drive slots are additionally recorded in $drivename_hash, which is what
# is_valid_drivename() consults.
for my $bus (
    [ ide    => $MAX_IDE_DISKS,    $idedesc ],
    [ sata   => $MAX_SATA_DISKS,   $satadesc ],
    [ scsi   => $MAX_SCSI_DISKS,   $scsidesc ],
    [ virtio => $MAX_VIRTIO_DISKS, $virtiodesc ],
) {
    my ($prefix, $count, $desc) = @$bus;
    for my $n (0 .. $count - 1) {
        $drivename_hash->{"$prefix$n"} = 1;
        $confdesc->{"$prefix$n"} = $desc;
    }
}

# there is exactly one EFI disk slot
$drivename_hash->{efidisk0} = 1;
$confdesc->{efidisk0} = $efidisk_desc;

$confdesc->{"usb$_"} = $usbdesc for (0 .. $MAX_USB_DEVICES - 1);

my $unuseddesc = {
    optional => 1,
    type => 'string', format => 'pve-volume-id',
    description => "Reference to unused volumes. This is used internally, and should not be modified manually.",
};

$confdesc->{"unused$_"} = $unuseddesc for (0 .. $MAX_UNUSED_DISKS - 1);
1128
# cached result of the KVM_GET_API_VERSION ioctl (0 = not known yet)
my $kvm_api_version = 0;

# Return the KVM API version reported by /dev/kvm.
# Returns 0 when /dev/kvm cannot be opened; when the ioctl yields a false
# value the cache stays at 0 and that 0 is returned. A non-zero result is
# cached for later calls.
sub kvm_version {

    if (!$kvm_api_version) {
        my $kvm_dev = IO::File->new("</dev/kvm");
        return 0 if !$kvm_dev;

        my $api = $kvm_dev->ioctl(KVM_GET_API_VERSION(), 0);
        $kvm_api_version = $api if $api;

        $kvm_dev->close();
    }

    return $kvm_api_version;
}
1146
# cached version string of the 'kvm' binary
my $kvm_user_version;

# Return the version printed by 'kvm -version' (e.g. "2.9.0"), or the
# string 'unknown' if no version line could be parsed. The result,
# including 'unknown', is cached after the first call.
sub kvm_user_version {

    return $kvm_user_version if $kvm_user_version;

    $kvm_user_version = 'unknown';

    # called for each output line of the command
    my $parse_line = sub {
        my ($out) = @_;
        return if $out !~ m/^QEMU( PC)? emulator version (\d+\.\d+(\.\d+)?)(\.\d+)?[,\s]/;
        $kvm_user_version = $2;
    };

    # a failing command only produces a warning; we then report 'unknown'
    eval { run_command("kvm -version", outfunc => $parse_line); };
    warn $@ if $@;

    return $kvm_user_version;
}
1168
1169my $kernel_has_vhost_net = -c '/dev/vhost-net';
1170
# Return the list of all valid drive option names:
# ide0.., scsi0.., virtio0.., sata0.. and finally 'efidisk0'.
sub valid_drive_names {
    # order is important - used to autoselect boot disk
    my @buses = (
        [ ide    => $MAX_IDE_DISKS ],
        [ scsi   => $MAX_SCSI_DISKS ],
        [ virtio => $MAX_VIRTIO_DISKS ],
        [ sata   => $MAX_SATA_DISKS ],
    );

    return (
        (map {
            my ($bus, $count) = @$_;
            map { "$bus$_" } (0 .. ($count - 1));
        } @buses),
        'efidisk0',
    );
}
1179
# True if $dev (e.g. 'ide0', 'efidisk0') is registered in $drivename_hash.
sub is_valid_drivename {
    my ($dev) = @_;

    my $registered = $drivename_hash->{$dev};
    return defined($registered);
}
1185
# True if $key is a known VM config option (has an entry in $confdesc).
sub option_exists {
    my ($key) = @_;

    my $desc = $confdesc->{$key};
    return defined($desc);
}
1e3baf05
DM
1190
# Accessor for the file-level $nic_model_list; the value is returned
# as-is, not copied.
sub nic_models {
    return $nic_model_list;
}
1194
# Return a hash reference mapping OS type identifiers (e.g. 'win10', 'l26')
# to human readable names. A fresh hash is built on every call.
sub os_list_description {

    return {
        other => 'Other',
        wxp => 'Windows XP',
        w2k => 'Windows 2000',
        w2k3 => 'Windows 2003',
        w2k8 => 'Windows 2008',
        wvista => 'Windows Vista',
        win7 => 'Windows 7',
        win8 => 'Windows 8/2012',
        win10 => 'Windows 10/2016',
        l24 => 'Linux 2.4',
        l26 => 'Linux 2.6',
    };
}
1211
1e3baf05
DM
# cached path of the host CD-ROM device symlink
my $cdrom_path;

# Return the first of /dev/cdrom, /dev/cdrom1, /dev/cdrom2 that is a
# symbolic link, caching a successful result. Returns undef when none of
# them is a symlink (previously the sub fell off its end and implicitly
# returned the false result of the last file test).
sub get_cdrom_path {

    return $cdrom_path if $cdrom_path;

    foreach my $candidate ("/dev/cdrom", "/dev/cdrom1", "/dev/cdrom2") {
        return $cdrom_path = $candidate if -l $candidate;
    }

    return undef;
}
1222
# Resolve the 'file' value of a CD-ROM drive to a path:
#   'cdrom'        -> host CD-ROM device (see get_cdrom_path)
#   'none'         -> empty string
#   absolute path  -> returned unchanged
#   anything else  -> resolved through PVE::Storage::path
sub get_iso_path {
    my ($storecfg, $vmid, $cdrom) = @_;

    return get_cdrom_path() if $cdrom eq 'cdrom';
    return '' if $cdrom eq 'none';
    return $cdrom if $cdrom =~ m|^/|;

    return PVE::Storage::path($storecfg, $cdrom);
}
1236
# try to convert old style file names to volume IDs
#
# 'none', 'cdrom', /dev/... paths and anything that already looks like
# 'storage:volume' are returned unchanged. A remaining name that contains
# a slash yields undef; a bare file name is mapped onto the 'local'
# storage ('local:iso/<file>' for cdrom media, else 'local:<vmid>/<file>').
sub filename_to_volume_id {
    my ($vmid, $file, $media) = @_;

    return $file if $file eq 'none' || $file eq 'cdrom';
    return $file if $file =~ m|^/dev/.+| || $file =~ m/^([^:]+):(.+)$/;

    return undef if $file =~ m|/|;

    my $subdir = ($media && $media eq 'cdrom') ? 'iso' : $vmid;

    return "local:$subdir/$file";
}
1255
# Check that the volume type $vtype fits the drive's media setting:
# media 'disk' expects 'images', media 'cdrom' expects 'iso'.
# Does nothing when $media is false; dies with "internal error" for any
# other media value and raises a parameter exception on $opt on mismatch.
sub verify_media_type {
    my ($opt, $vtype, $media) = @_;

    return if !$media;

    my %expected_for = (
        disk => 'images',
        cdrom => 'iso',
    );

    my $etype = $expected_for{$media};
    die "internal error" if !defined($etype);

    return if ($vtype eq $etype);

    raise_param_exc({ $opt => "unexpected media type ($vtype != $etype)" });
}
1274
# Normalize $drive->{file} and $drive->{media} in place.
# A plain filesystem path (not 'cdrom'/'none', not /dev/..., not already
# 'storage:volume', not purely numeric) is translated to a volume ID via
# PVE::Storage::path_to_volume_id; a parameter exception on $opt is raised
# if no storage matches. Media defaults to 'cdrom' for ISO volumes and for
# the special files 'cdrom' and 'none'.
sub cleanup_drive_path {
    my ($opt, $storecfg, $drive) = @_;

    my $file = $drive->{file};

    # try to convert filesystem paths to volume IDs
    my $needs_lookup = !(
        $file =~ m/^(cdrom|none)$/ ||
        $file =~ m|^/dev/.+| ||
        $file =~ m/^([^:]+):(.+)$/ ||
        $file =~ m/^\d+$/
    );

    if ($needs_lookup) {
        my ($vtype, $volid) = PVE::Storage::path_to_volume_id($storecfg, $drive->{file});
        raise_param_exc({ $opt => "unable to associate path '$drive->{file}' to any storage"}) if !$vtype;
        $drive->{media} = 'cdrom' if !$drive->{media} && $vtype eq 'iso';
        verify_media_type($opt, $vtype, $drive->{media});
        $drive->{file} = $volid;
    }

    $drive->{media} = 'cdrom' if !$drive->{media} && $drive->{file} =~ m/^(cdrom|none)$/;
}
1293
b3c2bdd1
DM
# Parse the value of the 'hotplug' option into a hash reference whose keys
# are the enabled features (network, disk, cpu, memory, usb).
# '0' yields an empty hash, '1' selects the schema default list.
# Dies on an unknown feature name.
sub parse_hotplug_features {
    my ($data) = @_;

    return {} if $data eq '0';

    $data = $confdesc->{hotplug}->{default} if $data eq '1';

    my %enabled;
    for my $feature (PVE::Tools::split_list($data)) {
        if ($feature =~ m/^(network|disk|cpu|memory|usb)$/) {
            $enabled{$1} = 1;
            next;
        }
        die "invalid hotplug feature '$feature'\n";
    }

    return \%enabled;
}
1312
PVE::JSONSchema::register_format('pve-hotplug-features', \&pve_verify_hotplug_features);

# Format verifier for 'pve-hotplug-features'.
# Returns $value when it parses. On a parse failure it returns undef if
# $noerr is set, otherwise it dies with the parser's own message.
#
# parse_hotplug_features() dies on invalid input, so it has to be wrapped
# in eval - otherwise the $noerr branch could never be reached.
sub pve_verify_hotplug_features {
    my ($value, $noerr) = @_;

    my $parsed = eval { parse_hotplug_features($value) };
    my $err = $@;

    return $value if $parsed;

    return undef if $noerr;

    die $err if $err;
    die "unable to parse hotplug option\n";
}
1323
1e3baf05
DM
1324# ideX = [volume=]volume-id[,media=d][,cyls=c,heads=h,secs=s[,trans=t]]
1325# [,snapshot=on|off][,cache=on|off][,format=f][,backup=yes|no]
036e0e2b 1326# [,rerror=ignore|report|stop][,werror=enospc|ignore|report|stop]
6e47c3b4
WB
1327# [,aio=native|threads][,discard=ignore|on][,detect_zeroes=on|off]
1328# [,iothread=on][,serial=serial][,model=model]
1e3baf05
DM
1329
# Parse a drive property string into a hash reference.
#
#   $key   config key such as 'ide0' or 'unused3'; it is split into the
#          'interface' and 'index' entries of the result
#   $data  the property string
#
# Returns undef (in some cases after a warning) when the key or the string
# is invalid or the options are inconsistent.
sub parse_drive {
    my ($key, $data) = @_;

    my ($interface, $index);

    if ($key =~ m/^([^\d]+)(\d+)$/) {
        $interface = $1;
        $index = $2;
    } else {
        return undef;
    }

    # unusedN entries have no bus specific format, so accept all options
    my $desc = $key =~ /^unused\d+$/ ? $alldrive_fmt
                                     : $confdesc->{$key}->{format};
    if (!$desc) {
        warn "invalid drive key: $key\n";
        return undef;
    }
    my $res = eval { PVE::JSONSchema::parse_property_string($desc, $data) };
    return undef if !$res;
    $res->{interface} = $interface;
    $res->{index} = $index;

    # convert the legacy bps* values (bytes/s) to their mbps* counterparts
    my $error = 0;
    foreach my $opt (qw(bps bps_rd bps_wr)) {
        # keep the deleted value itself; taking defined() of it here would
        # store a boolean and turn every limit into "0.000"
        my $bps = delete $res->{$opt};
        next if !defined($bps);

        if (defined($res->{"m$opt"})) {
            warn "both $opt and m$opt specified\n";
            ++$error;
            next;
        }
        $res->{"m$opt"} = sprintf("%.3f", $bps / (1024*1024.0));
    }

    # can't use the schema's 'requires' because of the mbps* => bps* "transforming aliases"
    for my $requirement (
        [mbps_max => 'mbps'],
        [mbps_rd_max => 'mbps_rd'],
        [mbps_wr_max => 'mbps_wr'],
        [miops_max => 'miops'],
        [miops_rd_max => 'miops_rd'],
        [miops_wr_max => 'miops_wr'],
        [bps_max_length => 'mbps_max'],
        [bps_rd_max_length => 'mbps_rd_max'],
        [bps_wr_max_length => 'mbps_wr_max'],
        [iops_max_length => 'iops_max'],
        [iops_rd_max_length => 'iops_rd_max'],
        [iops_wr_max_length => 'iops_wr_max']) {
        my ($option, $requires) = @$requirement;
        if ($res->{$option} && !$res->{$requires}) {
            warn "$option requires $requires\n";
            ++$error;
        }
    }

    return undef if $error;

    # a total limit cannot be combined with a separate read or write limit
    return undef if $res->{mbps_rd} && $res->{mbps};
    return undef if $res->{mbps_wr} && $res->{mbps};
    return undef if $res->{iops_rd} && $res->{iops};
    return undef if $res->{iops_wr} && $res->{iops};

    # options that are rejected for CD-ROM drives
    if ($res->{media} && ($res->{media} eq 'cdrom')) {
        return undef if $res->{snapshot} || $res->{trans} || $res->{format};
        return undef if $res->{heads} || $res->{secs} || $res->{cyls};
        return undef if $res->{interface} eq 'virtio';
    }

    # replace the size string by the result of parse_size
    if (my $size = $res->{size}) {
        return undef if !defined($res->{size} = PVE::JSONSchema::parse_size($size));
    }

    return $res;
}
1405
1e3baf05
DM
# Serialize a drive hash (as produced by parse_drive) back into a property
# string. The 'index' and 'interface' entries are left out; the caller's
# hash is not modified. $vmid is not used.
sub print_drive {
    my ($vmid, $drive) = @_;

    my %props = %$drive;
    delete @props{qw(index interface)};

    return PVE::JSONSchema::print_property_string(\%props, $alldrive_fmt);
}
1412
28ef82d3
DM
# Send a SCSI INQUIRY to the device behind file handle $fh using the Linux
# SCSI generic (sg) ioctl interface.
#
# Returns a hash reference with the keys vendor, product, revision,
# removable (0/1) and type (low 5 bits of the first response byte).
# On failure it dies, or returns undef when $noerr is set.
sub scsi_inquiry {
    my($fh, $noerr) = @_;

    my $SG_IO = 0x2285;
    my $SG_GET_VERSION_NUM = 0x2282;

    my $versionbuf = "\x00" x 8;
    my $ret = ioctl($fh, $SG_GET_VERSION_NUM, $versionbuf);
    if (!$ret) {
        die "scsi ioctl SG_GET_VERSION_NUM failed - $!\n" if !$noerr;
        return undef;
    }
    my $version = unpack("I", $versionbuf);
    if ($version < 30000) {
        die "scsi generic interface too old\n" if !$noerr;
        return undef;
    }

    my $buf = "\x00" x 36;
    my $sensebuf = "\x00" x 8;
    # 6 byte command block: opcode 0x12 (INQUIRY), allocation length 36
    my $cmd = pack("C x3 C x1", 0x12, 36);

    # see /usr/include/scsi/sg.h
    my $sg_io_hdr_t = "i i C C s I P P P I I i P C C C C S S i I I";

    # -3 is the data transfer direction, 6000 the timeout; the remaining
    # header fields are left to pack's defaults
    my $packet = pack($sg_io_hdr_t, ord('S'), -3, length($cmd),
                      length($sensebuf), 0, length($buf), $buf,
                      $cmd, $sensebuf, 6000);

    $ret = ioctl($fh, $SG_IO, $packet);
    if (!$ret) {
        die "scsi ioctl SG_IO failed - $!\n" if !$noerr;
        return undef;
    }

    # header fields 17 and 18 must both be zero for a successful command
    my @res = unpack($sg_io_hdr_t, $packet);
    if ($res[17] || $res[18]) {
        die "scsi ioctl SG_IO status error - $!\n" if !$noerr;
        return undef;
    }

    my $res = {};
    (my $byte0, my $byte1, $res->{vendor},
     $res->{product}, $res->{revision}) = unpack("C C x6 A8 A16 A4", $buf);

    $res->{removable} = $byte1 & 128 ? 1 : 0;
    $res->{type} = $byte0 & 31;

    return $res;
}
1463
# Open $path read/write and run a SCSI inquiry on it.
# Returns the inquiry result (see scsi_inquiry), or undef if the path
# cannot be opened or the inquiry fails.
sub path_is_scsi {
    my ($path) = @_;

    my $fh = IO::File->new("+<$path");
    return undef if !$fh;

    my $info = scsi_inquiry($fh, 1);
    close($fh);

    return $info;
}
1473
db656e5f
DM
# Return 1 if the 'machine' setting of $conf contains 'q35', else 0.
sub machine_type_is_q35 {
    my ($conf) = @_;

    my $machine = $conf->{machine};

    return 1 if $machine && ($machine =~ m/q35/);
    return 0;
}
1479
# Build the QEMU device string for the USB tablet: on port 1 of the
# 'ehci' bus for q35 machines, of the 'uhci' bus otherwise.
sub print_tabletdevice_full {
    my ($conf) = @_;

    # we use uhci for old VMs because tablet driver was buggy in older qemu
    my $usbbus = machine_type_is_q35($conf) ? "ehci" : "uhci";

    return "usb-tablet,id=tablet,bus=$usbbus.0,port=1";
}
1490
# Build the QEMU '-device' string for a drive, depending on its interface
# (virtio, scsi, ide or sata). Dies for any other interface.
# ",bootindex=N" is appended when the drive has a bootindex.
sub print_drivedevice_full {
    my ($storecfg, $conf, $vmid, $drive, $bridges) = @_;

    my $iface = $drive->{interface};
    # used both as device id and, prefixed with 'drive-', as drive id
    my $drive_id = "$drive->{interface}$drive->{index}";
    my $device = '';

    if ($iface eq 'virtio') {
        my $pciaddr = print_pci_addr($drive_id, $bridges);
        $device = "virtio-blk-pci,drive=drive-$drive_id,id=$drive_id$pciaddr";
        $device .= ",iothread=iothread-$drive_id" if $drive->{iothread};
    } elsif ($iface eq 'scsi') {

        my ($maxdev, $controller, $controller_prefix) = scsihw_infos($conf, $drive);
        my $unit = $drive->{index} % $maxdev;

        # pick the scsi-<type> device: cd, hd, block or generic
        my $devicetype = 'hd';
        if (drive_is_cdrom($drive)) {
            $devicetype = 'cd';
        } else {
            my $path = '';
            if ($drive->{file} =~ m|^/|) {
                $path = $drive->{file};
                if (my $info = path_is_scsi($path)) {
                    if ($info->{type} == 0 && $drive->{scsiblock}) {
                        $devicetype = 'block';
                    } elsif ($info->{type} == 1) { # tape
                        $devicetype = 'generic';
                    }
                }
            } else {
                $path = PVE::Storage::path($storecfg, $drive->{file});
            }

            if ($path =~ m/^iscsi\:\/\//) {
                $devicetype = 'generic';
            }
        }

        my $bus = "$controller_prefix$controller.0";
        if (!$conf->{scsihw} || ($conf->{scsihw} =~ m/^lsi/)) {
            $device = "scsi-$devicetype,bus=$bus,scsi-id=$unit,drive=drive-$drive_id,id=$drive_id";
        } else {
            $device = "scsi-$devicetype,bus=$bus,channel=0,scsi-id=0,lun=$drive->{index},drive=drive-$drive_id,id=$drive_id";
        }

    } elsif ($iface eq 'ide') {
        # two units per IDE controller
        my $units_per_controller = 2;
        my $controller = int($drive->{index} / $units_per_controller);
        my $unit = $drive->{index} % $units_per_controller;
        my $devicetype = ($drive->{media} && $drive->{media} eq 'cdrom') ? "cd" : "hd";

        $device = "ide-$devicetype,bus=ide.$controller,unit=$unit,drive=drive-$drive_id,id=$drive_id";
        if ($devicetype eq 'hd' && (my $model = $drive->{model})) {
            $model = URI::Escape::uri_unescape($model);
            $device .= ",model=$model";
        }
    } elsif ($iface eq 'sata') {
        my $controller = int($drive->{index} / $MAX_SATA_DISKS);
        my $unit = $drive->{index} % $MAX_SATA_DISKS;
        $device = "ide-drive,bus=ahci$controller.$unit,drive=drive-$drive_id,id=$drive_id";
    } elsif ($iface eq 'usb') {
        die "implement me";
        # -device ide-drive,bus=ide.1,unit=0,drive=drive-ide0-1-0,id=ide0-1-0
    } else {
        die "unsupported interface type";
    }

    $device .= ",bootindex=$drive->{bootindex}" if $drive->{bootindex};

    return $device;
}
1560
# Return the value of the first 'InitiatorName=' line found in
# /etc/iscsi/initiatorname.iscsi, or undef if the file cannot be opened or
# contains no such line.
sub get_initiator_name {
    my $fh = IO::File->new('/etc/iscsi/initiatorname.iscsi');
    return undef if !$fh;

    my $initiator;
    while (defined(my $line = <$fh>)) {
        if ($line =~ m/^\s*InitiatorName\s*=\s*([\.\-:\w]+)/) {
            $initiator = $1;
            last;
        }
    }
    $fh->close();

    return $initiator;
}
1574
1e3baf05
DM
# Build the value of a QEMU '-drive' option for $drive:
# "file=<path>,if=none,id=drive-<interface><index><options...>".
# The options carry the plain drive settings, I/O throttling limits, the
# serial number, image format, cache/aio mode and detect-zeroes.
sub print_drive_full {
    my ($storecfg, $vmid, $drive) = @_;

    my $path;
    my $volid = $drive->{file};
    my $format;

    if (drive_is_cdrom($drive)) {
        $path = get_iso_path($storecfg, $vmid, $volid);
    } else {
        my ($storeid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        if ($storeid) {
            $path = PVE::Storage::path($storecfg, $volid);
            my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
            $format = qemu_img_format($scfg, $volname);
        } else {
            # not a storage volume: use the value as path, treated as raw
            $path = $volid;
            $format = "raw";
        }
    }

    my $opts = '';
    my @qemu_drive_options = qw(heads secs cyls trans media format cache snapshot rerror werror aio discard);
    foreach my $o (@qemu_drive_options) {
        $opts .= ",$o=$drive->{$o}" if $drive->{$o};
    }

    # throttling: total, read and write variants of every limit. The
    # option names have the form throttling.{bps,iops}-<dir>[-max[-length]]
    foreach my $type (['', '-total'], [_rd => '-read'], [_wr => '-write']) {
        my ($dir, $qmpname) = @$type;
        if (my $v = $drive->{"mbps$dir"}) {
            $opts .= ",throttling.bps$qmpname=".int($v*1024*1024);
        }
        if (my $v = $drive->{"mbps${dir}_max"}) {
            $opts .= ",throttling.bps$qmpname-max=".int($v*1024*1024);
        }
        if (my $v = $drive->{"bps${dir}_max_length"}) {
            $opts .= ",throttling.bps$qmpname-max-length=$v";
        }
        if (my $v = $drive->{"iops${dir}"}) {
            $opts .= ",throttling.iops$qmpname=$v";
        }
        if (my $v = $drive->{"iops${dir}_max"}) {
            $opts .= ",throttling.iops$qmpname-max=$v";
        }
        if (my $v = $drive->{"iops${dir}_max_length"}) {
            $opts .= ",throttling.iops$qmpname-max-length=$v";
        }
    }

    # the serial is stored URI-escaped in the drive hash
    if (my $serial = $drive->{serial}) {
        $serial = URI::Escape::uri_unescape($serial);
        $opts .= ",serial=$serial";
    }

    # only add the detected format if the drive has no explicit one
    $opts .= ",format=$format" if $format && !$drive->{format};

    my $cache_direct = 0;

    if (my $cache = $drive->{cache}) {
        $cache_direct = $cache =~ /^(?:off|none|directsync)$/;
    } elsif (!drive_is_cdrom($drive)) {
        $opts .= ",cache=none";
        $cache_direct = 1;
    }

    # aio native works only with O_DIRECT
    if (!$drive->{aio}) {
        if ($cache_direct) {
            $opts .= ",aio=native";
        } else {
            $opts .= ",aio=threads";
        }
    }

    if (!drive_is_cdrom($drive)) {
        my $detectzeroes;
        if (defined($drive->{detect_zeroes}) && !$drive->{detect_zeroes}) {
            $detectzeroes = 'off';
        } elsif ($drive->{discard}) {
            $detectzeroes = $drive->{discard} eq 'on' ? 'unmap' : 'on';
        } else {
            # This used to be our default with discard not being specified:
            $detectzeroes = 'on';
        }
        $opts .= ",detect-zeroes=$detectzeroes" if $detectzeroes;
    }

    my $pathinfo = $path ? "file=$path," : '';

    return "${pathinfo}if=none,id=drive-$drive->{interface}$drive->{index}$opts";
}
1665
# Build the QEMU '-device' string for network device $netid.
# The model 'virtio' is mapped to the 'virtio-net-pci' device. For
# multiqueue virtio NICs ",vectors=N,mq=on" is added, and with
# $use_old_bios_files a matching PXE rom file is selected for the known
# models. $vmid and $conf are not used.
sub print_netdevice_full {
    my ($vmid, $conf, $net, $netid, $bridges, $use_old_bios_files) = @_;

    my $device = $net->{model};
    if ($net->{model} eq 'virtio') {
        $device = 'virtio-net-pci';
    }

    my $pciaddr = print_pci_addr("$netid", $bridges);
    my $tmpstr = "$device,mac=$net->{macaddr},netdev=$netid$pciaddr,id=$netid";
    if ($net->{queues} && $net->{queues} > 1 && $net->{model} eq 'virtio') {
        #Consider we have N queues, the number of vectors needed is 2*N + 2 (plus one config interrupt and control vq)
        my $vectors = $net->{queues} * 2 + 2;
        $tmpstr .= ",vectors=$vectors,mq=on";
    }
    $tmpstr .= ",bootindex=$net->{bootindex}" if $net->{bootindex};

    if ($use_old_bios_files) {
        my %romfile_for = (
            'virtio-net-pci' => 'pxe-virtio.rom',
            'e1000' => 'pxe-e1000.rom',
            'ne2k' => 'pxe-ne2k_pci.rom',
            'pcnet' => 'pxe-pcnet.rom',
            'rtl8139' => 'pxe-rtl8139.rom',
        );
        my $romfile = $romfile_for{$device};
        $tmpstr .= ",romfile=$romfile" if $romfile;
    }

    return $tmpstr;
}
1703
# Build the QEMU '-netdev' string for network device $netid ('netN').
# With a bridge configured a tap device named tap<vmid>i<N> is used,
# otherwise user mode networking. Dies if N is not below $MAX_NETS or the
# interface name is too long.
sub print_netdev_full {
    my ($vmid, $conf, $net, $netid, $hotplug) = @_;

    my $i = ($netid =~ m/^net(\d+)$/) ? int($1) : '';

    die "got strange net id '$i'\n" if $i >= ${MAX_NETS};

    my $ifname = "tap${vmid}i$i";

    # kvm uses TUNSETIFF ioctl, and that limits ifname length
    die "interface name '$ifname' is too long (max 15 character)\n"
        if length($ifname) >= 16;

    # vhost is only requested for virtio NICs when /dev/vhost-net exists
    my $vhostparam = ($kernel_has_vhost_net && $net->{model} eq 'virtio') ? ',vhost=on' : '';

    my $vmname = $conf->{name} || "vm$vmid";

    my $script = $hotplug ? "pve-bridge-hotplug" : "pve-bridge";

    my $netdev = $net->{bridge}
        ? "type=tap,id=$netid,ifname=${ifname},script=/var/lib/qemu-server/$script,downscript=/var/lib/qemu-server/pve-bridgedown$vhostparam"
        : "type=user,id=$netid,hostname=$vmname";

    $netdev .= ",queues=$net->{queues}" if ($net->{queues} && $net->{model} eq 'virtio');

    return $netdev;
}
1e3baf05 1738
0efb537e
AD
1739
# Build the QEMU device string for CPU number $id (counted from 1).
# The CPU model comes from the 'cpu' option, falling back to 'kvm64'
# ('qemu64' when kvm is explicitly set to 0). Socket and core id are
# derived from $id and the 'cores' setting (default 1).
sub print_cpu_device {
    my ($conf, $id) = @_;

    my $kvm_disabled = (defined($conf->{kvm}) && $conf->{kvm} == 0) ? 1 : 0;

    my $cpu = "kvm64";
    $cpu = "qemu64" if $kvm_disabled;

    if (my $cputype = $conf->{cpu}) {
        my $cpuconf = PVE::JSONSchema::parse_property_string($cpu_fmt, $cputype)
            or die "Cannot parse cpu description: $cputype\n";
        $cpu = $cpuconf->{cputype};
    }

    my $cores = $conf->{cores} || 1;

    my $zero_based_id = $id - 1;
    my $current_core = $zero_based_id % $cores;
    my $current_socket = int(($zero_based_id - $current_core)/$cores);

    return "$cpu-x86_64-cpu,id=cpu$id,socket-id=$current_socket,core-id=$current_core,thread-id=0";
}
1758
1e3baf05
DM
# True if $drive is set and its media is 'cdrom'. For a missing drive or
# media the (false) value itself is returned.
sub drive_is_cdrom {
    my ($drive) = @_;

    return $drive if !$drive;

    my $media = $drive->{media};
    return $media if !$media;

    return ($media eq 'cdrom');
}
1765
ffc0d8c7
WB
# Parse a ';' separated list of numbers and ranges, e.g. "0-3;5".
# Returns an array reference of [start, end] pairs; 'end' is undef for a
# single number. Dies on malformed parts and on ranges with end < start.
sub parse_number_sets {
    my ($set) = @_;

    my @ranges;
    for my $part (split(/;/, $set)) {
        my ($from, $to) = $part =~ /^\s*(\d+)(?:-(\d+))?\s*$/
            or die "invalid range: $part\n";
        die "invalid range: $part ($to < $from)\n" if defined($to) && $to < $from;
        push @ranges, [ $from, $to ];
    }

    return \@ranges;
}
2ed5d572 1779
ffc0d8c7
WB
# Parse a numa property string. When present, the 'cpus' and 'hostnodes'
# values are replaced by the range lists parse_number_sets() returns.
sub parse_numa {
    my ($data) = @_;

    my $numa = PVE::JSONSchema::parse_property_string($numa_fmt, $data);

    for my $set_key (qw(cpus hostnodes)) {
        next if !defined($numa->{$set_key});
        $numa->{$set_key} = parse_number_sets($numa->{$set_key});
    }

    return $numa;
}
1788
040b06b7
DA
# Parse a hostpci property string. The 'host' entry is removed from the
# result and its ';' separated IDs are resolved into 'pciid':
#   'bus:dev.func' -> { id => 'bus:dev', function => 'func' } is appended
#   'bus:dev'      -> 'pciid' is set to the lspci() entry for that device
# Returns undef for a false $value.
sub parse_hostpci {
    my ($value) = @_;

    return undef if !$value;

    my $res = PVE::JSONSchema::parse_property_string($hostpci_fmt, $value);

    my @idlist = split(/;/, $res->{host});
    delete $res->{host};

    foreach my $id (@idlist) {
        # should have been caught by parse_property_string already
        die "failed to parse PCI id: $id\n" if $id !~ /^$PCIRE$/;

        my ($slot, $function) = ($1, $2);
        if (defined($function)) {
            push @{$res->{pciid}}, { id => $slot, function => $function };
        } else {
            my $pcidevices = lspci($slot);
            $res->{pciid} = $pcidevices->{$slot};
        }
    }

    return $res;
}
1813
1e3baf05
DM
# netX: e1000=XX:XX:XX:XX:XX:XX,bridge=vmbr0,rate=<mbps>
#
# Parse a net property string. On a parse error the error is printed as
# a warning and undef is returned. If no MAC address was given, a random
# one is generated using the 'mac_prefix' from datacenter.cfg.
sub parse_net {
    my ($data) = @_;

    my $net = eval { PVE::JSONSchema::parse_property_string($net_fmt, $data) };
    if (my $err = $@) {
        warn $err;
        return undef;
    }

    return $net if defined($net->{macaddr});

    my $dc = PVE::Cluster::cfs_read_file('datacenter.cfg');
    $net->{macaddr} = PVE::Tools::random_ether_addr($dc->{mac_prefix});

    return $net;
}
1829
# Serialize a parsed net hash back into its property string.
sub print_net {
    my ($net) = @_;

    return PVE::JSONSchema::print_property_string($net, $net_fmt);
}
1835
# Rewrite every 'netN' entry of $settings in place by parsing and
# re-printing it, so entries without MAC address get the random one
# assigned by parse_net(). Entries that fail to parse are left untouched.
sub add_random_macs {
    my ($settings) = @_;

    for my $opt (grep { m/^net(\d+)$/ } keys %$settings) {
        my $net = parse_net($settings->{$opt}) or next;
        $settings->{$opt} = print_net($net);
    }
}
1846
055d554d
DM
# Return 1 if the owner that PVE::Storage::path() reports for $volid is
# $vmid. Returns undef otherwise, including for absolute paths and when
# the lookup fails (errors are ignored).
sub vm_is_volid_owner {
    my ($storecfg, $vmid, $volid) = @_;

    return undef if $volid =~ m|^/|;

    my ($path, $owner) = eval { PVE::Storage::path($storecfg, $volid) };

    return 1 if $owner && ($owner == $vmid);

    return undef;
}
1860
3dc38fbb
WB
# Split a list separated by commas, semicolons or whitespace into a hash
# reference name => flag, where flag is '!' if the entry was written as
# '!name' and '' otherwise. An undefined/empty text gives an empty hash.
sub split_flagged_list {
    my $text = $_[0] || '';

    # all separators become blanks, then split on runs of whitespace
    $text =~ tr/,;/  /;

    my %flag_of;
    for my $entry (split(' ', $text)) {
        my ($flag, $name) = $entry =~ /^(!?)(.*)$/;
        $flag_of{$name} = $flag;
    }

    return \%flag_of;
}
1867
# Inverse of split_flagged_list: join the entries of the name => flag hash
# $lst with separator $how, each name prefixed by its flag. The order
# follows the hash's key order.
sub join_flagged_list {
    my ($how, $lst) = @_;

    my @entries;
    for my $name (keys %$lst) {
        push @entries, $lst->{$name} . $name;
    }

    return join($how, @entries);
}
1872
# Mark option $key for deletion in the pending section of $conf: a pending
# value for it is dropped and the key is added to the pending 'delete'
# list, flagged with '!' when $force is set.
sub vmconfig_delete_pending_option {
    my ($conf, $key, $force) = @_;

    delete $conf->{pending}->{$key};

    my $to_delete = split_flagged_list($conf->{pending}->{delete});
    $to_delete->{$key} = $force ? '!' : '';

    $conf->{pending}->{delete} = join_flagged_list(',', $to_delete);
}
1881
# Remove option $key from the pending 'delete' list of $conf. The 'delete'
# entry itself is removed once the list becomes empty.
sub vmconfig_undelete_pending_option {
    my ($conf, $key) = @_;

    my $to_delete = split_flagged_list($conf->{pending}->{delete});
    delete $to_delete->{$key};

    if (!%$to_delete) {
        delete $conf->{pending}->{delete};
    } else {
        $conf->{pending}->{delete} = join_flagged_list(',', $to_delete);
    }
}
1894
# Record the volume behind $drive as an unused volume in $conf, but only if
# the drive is not a cdrom and vm_is_volid_owner() confirms the volume is
# owned by $vmid.
sub vmconfig_register_unused_drive {
    my ($storecfg, $vmid, $conf, $drive) = @_;

    return if drive_is_cdrom($drive);

    my $volid = $drive->{file};
    return if !vm_is_volid_owner($storecfg, $vmid, $volid);

    PVE::QemuConfig->add_unused_volume($conf, $volid, $vmid);
}
1905
c750e90a
DM
# Remove pending entries that would not change anything:
#  - pending values that are string-equal to the current value, and
#  - pending deletions of options that are not set in the current config.
# Returns 1 if anything was removed, undef otherwise.
sub vmconfig_cleanup_pending {
    my ($conf) = @_;

    my $changes;

    # remove pending changes when nothing changed
    for my $opt (keys %{$conf->{pending}}) {
        next if !defined($conf->{$opt});
        next if $conf->{pending}->{$opt} ne $conf->{$opt};

        delete $conf->{pending}->{$opt};
        $changes = 1;
    }

    # keep only deletions that refer to an option which is actually set
    my $requested = split_flagged_list($conf->{pending}->{delete});
    my $still_needed = {};
    for my $opt (keys %$requested) {
        if (defined($conf->{$opt})) {
            $still_needed->{$opt} = $requested->{$opt};
        } else {
            $changes = 1;
        }
    }

    if (!%$still_needed) {
        delete $conf->{pending}->{delete};
    } else {
        $conf->{pending}->{delete} = join_flagged_list(',', $still_needed);
    }

    return $changes;
}
1936
# smbios: [manufacturer=str][,product=str][,version=str][,serial=str][,uuid=uuid][,sku=str][,family=str]
#
# Property-string schema for the 'smbios1' option. All fields are optional;
# every field except 'uuid' is a whitespace-free string.
my $smbios1_fmt = do {
    # schema shared by all free-form string fields; only the description differs
    my $string_field = sub {
        my ($description) = @_;
        return {
            type => 'string',
            pattern => '\S+',
            format_description => 'string',
            description => $description,
            optional => 1,
        };
    };

    +{
        uuid => {
            type => 'string',
            pattern => '[a-fA-F0-9]{8}(?:-[a-fA-F0-9]{4}){3}-[a-fA-F0-9]{12}',
            format_description => 'UUID',
            description => "Set SMBIOS1 UUID.",
            optional => 1,
        },
        version => $string_field->("Set SMBIOS1 version."),
        serial => $string_field->("Set SMBIOS1 serial number."),
        manufacturer => $string_field->("Set SMBIOS1 manufacturer."),
        product => $string_field->("Set SMBIOS1 product ID."),
        sku => $string_field->("Set SMBIOS1 SKU string."),
        family => $string_field->("Set SMBIOS1 family string."),
    };
};
1989
2796e7d5
DM
# Parse an 'smbios1' property string using $smbios1_fmt. A parser error is
# emitted as a warning; in that case the returned value is undef.
sub parse_smbios1 {
    my ($data) = @_;

    my $parsed = eval { PVE::JSONSchema::parse_property_string($smbios1_fmt, $data) };
    if ($@) {
        warn $@;
    }

    return $parsed;
}
1997
cd11416f
DM
# Serialize a parsed smbios1 hash into its property-string form.
sub print_smbios1 {
    my ($smbios1) = @_;

    my $text = PVE::JSONSchema::print_property_string($smbios1, $smbios1_fmt);
    return $text;
}

# make the smbios1 schema available under the format name 'pve-qm-smbios1'
PVE::JSONSchema::register_format('pve-qm-smbios1', $smbios1_fmt);
2796e7d5 2004
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-bootdisk', \&verify_bootdisk);

# Format verifier for 'pve-qm-bootdisk': returns $value when it is a valid
# drive name. Otherwise returns undef if $noerr is set, or dies.
sub verify_bootdisk {
    my ($value, $noerr) = @_;

    if (!is_valid_drivename($value)) {
        return undef if $noerr;
        die "invalid boot disk '$value'\n";
    }

    return $value;
}
2015
0ea9541d
DM
# Parse a 'watchdog' property string using $watchdog_fmt. Returns undef for a
# false (empty/undefined) value. A parser error is emitted as a warning; in
# that case the returned value is undef as well.
sub parse_watchdog {
    my ($value) = @_;

    return undef if !$value;

    my $parsed = eval { PVE::JSONSchema::parse_property_string($watchdog_fmt, $value) };
    if ($@) {
        warn $@;
    }

    return $parsed;
}
2025
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-usb-device', \&verify_usb_device);

# Format verifier for 'pve-qm-usb-device': returns $value when
# parse_usb_device() accepts it. Otherwise returns undef if $noerr is set,
# or dies.
sub verify_usb_device {
    my ($value, $noerr) = @_;

    if (!parse_usb_device($value)) {
        return undef if $noerr;
        die "unable to parse usb device\n";
    }

    return $value;
}
2036
1e3baf05
DM
# add JSON properties for create and set function
#
# Copies every entry of $confdesc into $prop, except the 'parent',
# 'snaptime' and 'vmstate' keys, and returns $prop.
sub json_config_properties {
    my ($prop) = @_;

    my %skip = map { $_ => 1 } qw(parent snaptime vmstate);

    for my $opt (grep { !$skip{$_} } keys %$confdesc) {
        $prop->{$opt} = $confdesc->{$opt};
    }

    return $prop;
}
2048
# Validate $value against the type declared for $key in $confdesc and return
# the normalized value:
#   boolean - 1 or 0 (accepts 1/on/yes/true and 0/off/no/false)
#   integer - int() of an all-digit string
#   number  - the value unchanged if it is digits with an optional fraction
#   string  - the value after PVE::JSONSchema::check_format() when a format
#             is declared; otherwise the value with one pair of enclosing
#             double quotes removed
# Dies on unknown keys, undefined values, embedded CR/LF, or type mismatch.
sub check_type {
    my ($key, $value) = @_;

    my $desc = $confdesc->{$key};
    die "unknown setting '$key'\n" if !$desc;

    my $type = $desc->{type};

    die "got undefined value\n" if !defined($value);
    die "property contains a line feed\n" if $value =~ m/[\n\r]/;

    if ($type eq 'boolean') {
        return 1 if ($value eq '1') || ($value =~ m/^(on|yes|true)$/i);
        return 0 if ($value eq '0') || ($value =~ m/^(off|no|false)$/i);
        die "type check ('boolean') failed - got '$value'\n";
    }

    if ($type eq 'integer') {
        return int($1) if $value =~ m/^(\d+)$/;
        die "type check ('integer') failed - got '$value'\n";
    }

    if ($type eq 'number') {
        return $value if $value =~ m/^(\d+)(\.\d+)?$/;
        die "type check ('number') failed - got '$value'\n";
    }

    if ($type eq 'string') {
        my $fmt = $desc->{format};
        if ($fmt) {
            PVE::JSONSchema::check_format($fmt, $value);
            return $value;
        }
        $value =~ s/^\"(.*)\"$/$1/;
        return $value;
    }

    die "internal error"
}
2085
040b06b7
DA
# Report whether IOMMU support is available. Currently a stub that always
# returns 1.
sub check_iommu_support {
    # FIXME: need to check IOMMU support
    # http://www.linux-kvm.org/page/How_to_assign_devices_with_VT-d_in_KVM

    return 1;
}
2094
1e3baf05
DM
# Set access and modification time of the config file of $vmid to "now".
sub touch_config {
    my ($vmid) = @_;

    my $path = PVE::QemuConfig->config_file($vmid);
    utime(undef, undef, $path);
}
2101
# Destroy VM $vmid: free all disks referenced by the config that are owned by
# the VM, remove the config file (or replace it with a minimal one when
# $keep_empty_config is set), then free every remaining volume that
# PVE::Storage::vdisk_list() reports for this VMID.
#
# The config lock is checked unless $skiplock is set. Failures to free an
# individual volume are reported as warnings and do not stop the removal of
# the remaining volumes.
sub destroy_vm {
    my ($storecfg, $vmid, $keep_empty_config, $skiplock) = @_;

    my $conffile = PVE::QemuConfig->config_file($vmid);

    my $conf = PVE::QemuConfig->load_config($vmid);

    PVE::QemuConfig->check_lock($conf) if !$skiplock;

    # only remove disks owned by this VM
    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};

        return if !$volid || $volid =~ m|^/|;

        my ($path, $owner) = PVE::Storage::path($storecfg, $volid);
        return if !$path || !$owner || ($owner != $vmid);

        eval {
            PVE::Storage::vdisk_free($storecfg, $volid);
        };
        warn "Could not remove disk '$volid', check manually: $@" if $@;
    });

    if ($keep_empty_config) {
        PVE::Tools::file_set_contents($conffile, "memory: 128\n");
    } else {
        unlink $conffile;
    }

    # also remove unused disk
    eval {
        my $dl = PVE::Storage::vdisk_list($storecfg, undef, $vmid);

        PVE::Storage::foreach_volid($dl, sub {
            my ($volid, $sid, $volname, $d) = @_;

            # one eval per volume, so a single failure does not abort the
            # removal of the volumes that follow
            eval { PVE::Storage::vdisk_free($storecfg, $volid); };
            warn $@ if $@;
        });
    };
    warn $@ if $@;
}
2152
1e3baf05
DM
# Parse the raw text of a VM config file.
#
# $filename must end in '/qemu-server/<vmid>.conf' (dies otherwise); $raw is
# the file content. Returns undef when $raw is undefined, else a hash
# reference holding the options of the main section plus:
#   digest    - SHA1 hex digest of $raw
#   pending   - options from the [PENDING] section
#   snapshots - { name => options } for every other [section]
# Lines starting with '#' are collected as the 'description' of the section
# they appear in. Values that fail check_type() are skipped with a warning.
sub parse_vm_config {
    my ($filename, $raw) = @_;

    return undef if !defined($raw);

    my $res = {
        digest => Digest::SHA::sha1_hex($raw),
        snapshots => {},
        pending => {},
    };

    $filename =~ m|/qemu-server/(\d+)\.conf$|
        || die "got strange filename '$filename'";

    my $vmid = $1;

    my $conf = $res; # section currently being filled
    my $descr;
    my $section = '';

    my @lines = split(/\n/, $raw);
    foreach my $line (@lines) {
        next if $line =~ m/^\s*$/;

        if ($line =~ m/^\[PENDING\]\s*$/i) {
            $section = 'pending';
            # store the description collected for the section we are leaving
            if (defined($descr)) {
                $descr =~ s/\s+$//;
                $conf->{description} = $descr;
            }
            $descr = undef;
            $conf = $res->{$section} = {};
            next;

        } elsif ($line =~ m/^\[([a-z][a-z0-9_\-]+)\]\s*$/i) {
            $section = $1;
            if (defined($descr)) {
                $descr =~ s/\s+$//;
                $conf->{description} = $descr;
            }
            $descr = undef;
            $conf = $res->{snapshots}->{$section} = {};
            next;
        }

        if ($line =~ m/^\#(.*)\s*$/) {
            $descr = '' if !defined($descr);
            $descr .= PVE::Tools::decode_text($1) . "\n";
            next;
        }

        if ($line =~ m/^(description):\s*(.*\S)\s*$/) {
            $descr = '' if !defined($descr);
            $descr .= PVE::Tools::decode_text($2);
        } elsif ($line =~ m/^snapstate:\s*(prepare|delete)\s*$/) {
            # anchored at line start, so that other options whose value
            # merely ends in "snapstate: ..." (e.g. an 'args:' line) are not
            # mistaken for a snapstate entry
            $conf->{snapstate} = $1;
        } elsif ($line =~ m/^(args):\s*(.*\S)\s*$/) {
            my $key = $1;
            my $value = $2;
            $conf->{$key} = $value;
        } elsif ($line =~ m/^delete:\s*(.*\S)\s*$/) {
            my $value = $1;
            if ($section eq 'pending') {
                $conf->{delete} = $value; # we parse this later
            } else {
                warn "vm $vmid - propertry 'delete' is only allowed in [PENDING]\n";
            }
        } elsif ($line =~ m/^([a-z][a-z_]*\d*):\s*(\S+)\s*$/) {
            my $key = $1;
            my $value = $2;
            eval { $value = check_type($key, $value); };
            if ($@) {
                warn "vm $vmid - unable to parse value of '$key' - $@";
            } else {
                $key = 'ide2' if $key eq 'cdrom';
                my $fmt = $confdesc->{$key}->{format};
                if ($fmt && $fmt =~ /^pve-qm-(?:ide|scsi|virtio|sata)$/) {
                    # drive entries: rewrite the file name as a volume ID
                    my $v = parse_drive($key, $value);
                    if (my $volid = filename_to_volume_id($vmid, $v->{file}, $v->{media})) {
                        $v->{file} = $volid;
                        $value = print_drive($vmid, $v);
                    } else {
                        warn "vm $vmid - unable to parse value of '$key'\n";
                        next;
                    }
                }

                $conf->{$key} = $value;
            }
        }
    }

    # store the description of the last section
    if (defined($descr)) {
        $descr =~ s/\s+$//;
        $conf->{description} = $descr;
    }
    delete $res->{snapstate}; # just to be sure

    return $res;
}
2253
1858638f
DM
# Serialize the config hash $conf into raw config file text and return it.
#
# $conf is normalized in place first: 'snapstate' is dropped from the main
# section, 'cdrom' is stored as 'ide2', 'smp' is converted to 'sockets',
# every value is passed through check_type(), and 'unusedN' entries whose
# volume is referenced by a drive of the main or pending section are removed.
# Dies if a value fails check_type(), if 'cdrom' and 'ide2' are both set, or
# if a 'delete' key appears outside the pending section.
#
# Output layout: main section, then "[PENDING]" (only if non-empty), then one
# "[name]" section per snapshot in sorted order. Descriptions are written as
# '#' comment lines at the top of their section.
sub write_vm_config {
    my ($filename, $conf) = @_;

    delete $conf->{snapstate}; # just to be sure

    if ($conf->{cdrom}) {
        die "option ide2 conflicts with cdrom\n" if $conf->{ide2};
        $conf->{ide2} = $conf->{cdrom};
        delete $conf->{cdrom};
    }

    # we do not use 'smp' any longer
    if ($conf->{sockets}) {
        delete $conf->{smp};
    } elsif ($conf->{smp}) {
        $conf->{sockets} = $conf->{smp};
        delete $conf->{cores};
        delete $conf->{smp};
    }

    my $used_volids = {};

    my $cleanup_config = sub {
        my ($cref, $pending, $snapname) = @_;

        foreach my $key (keys %$cref) {
            next if $key eq 'digest' || $key eq 'description' || $key eq 'snapshots' ||
                $key eq 'snapstate' || $key eq 'pending';
            my $value = $cref->{$key};
            if ($key eq 'delete') {
                die "propertry 'delete' is only allowed in [PENDING]\n"
                    if !$pending;
                # fixme: check syntax?
                next;
            }
            eval { $value = check_type($key, $value); };
            die "unable to parse value of '$key' - $@" if $@;

            $cref->{$key} = $value;

            # volumes referenced by snapshots do not count as "in use"
            if (!$snapname && is_valid_drivename($key)) {
                my $drive = parse_drive($key, $value);
                $used_volids->{$drive->{file}} = 1 if $drive && $drive->{file};
            }
        }
    };

    $cleanup_config->($conf);

    $cleanup_config->($conf->{pending}, 1);

    foreach my $snapname (keys %{$conf->{snapshots}}) {
        die "internal error" if $snapname eq 'pending';
        $cleanup_config->($conf->{snapshots}->{$snapname}, undef, $snapname);
    }

    # remove 'unusedX' settings if we re-add a volume
    foreach my $key (keys %$conf) {
        my $value = $conf->{$key};
        if ($key =~ m/^unused/ && $used_volids->{$value}) {
            delete $conf->{$key};
        }
    }

    my $generate_raw_config = sub {
        my ($conf, $pending) = @_;

        my $raw = '';

        # add description as comment to top of file
        if (defined(my $descr = $conf->{description})) {
            # compare against '' rather than testing truthiness, so that a
            # description consisting of "0" is written out as well
            if ($descr ne '') {
                foreach my $cl (split(/\n/, $descr)) {
                    $raw .= '#' . PVE::Tools::encode_text($cl) . "\n";
                }
            } else {
                $raw .= "#\n" if $pending;
            }
        }

        foreach my $key (sort keys %$conf) {
            next if $key eq 'digest' || $key eq 'description' || $key eq 'pending' || $key eq 'snapshots';
            $raw .= "$key: $conf->{$key}\n";
        }
        return $raw;
    };

    my $raw = $generate_raw_config->($conf);

    if (scalar(keys %{$conf->{pending}})){
        $raw .= "\n[PENDING]\n";
        $raw .= $generate_raw_config->($conf->{pending}, 1);
    }

    foreach my $snapname (sort keys %{$conf->{snapshots}}) {
        $raw .= "\n[$snapname]\n";
        $raw .= $generate_raw_config->($conf->{snapshots}->{$snapname});
    }

    return $raw;
}
1e3baf05 2355
# Build a hash of default option values: every 'default' declared in
# $confdesc, plus the 'keyboard' setting from datacenter.cfg when one is set.
sub load_defaults {

    my $defaults = {};

    # we use static defaults from our JSON schema configuration
    for my $key (keys %$confdesc) {
        my $default = $confdesc->{$key}->{default};
        next if !defined($default);
        $defaults->{$key} = $default;
    }

    my $dc_conf = PVE::Cluster::cfs_read_file('datacenter.cfg');
    if ($dc_conf->{keyboard}) {
        $defaults->{keyboard} = $dc_conf->{keyboard};
    }

    return $defaults;
}
2372
# Return { vmid => { exists => 1 } } for every entry of the cluster VM list
# whose node equals $nodename and whose type is 'qemu'.
sub config_list {
    my $vmlist = PVE::Cluster::get_vmlist();

    my $found = {};
    return $found if !$vmlist || !$vmlist->{ids};

    my $ids = $vmlist->{ids};

    for my $vmid (keys %$ids) {
        my $entry = $ids->{$vmid};

        my $is_local = $entry->{node} && $entry->{node} eq $nodename;
        next if !$is_local;

        my $is_qemu = $entry->{type} && $entry->{type} eq 'qemu';
        next if !$is_qemu;

        $found->{$vmid}->{exists} = 1;
    }

    return $found;
}
2387
64e13401
DM
# test if VM uses local resources (to prevent migration)
#
# Returns 1 if $conf contains 'hostusb'/'hostpci' (old syntax) or any
# usbN/hostpciN/serialN/parallelN entry, except usb entries set to 'spice'
# and serial entries set to 'socket'; returns 0 otherwise.
# Dies instead of returning 1 unless $noerr is set.
sub check_local_resources {
    my ($conf, $noerr) = @_;

    # old syntax
    my $loc_res = ($conf->{hostusb} || $conf->{hostpci}) ? 1 : 0;

    for my $k (keys %$conf) {
        if ($k =~ m/^usb/) {
            next if $conf->{$k} eq 'spice';
        }
        # sockets are safe: they will be recreated on the target side post-migrate
        if ($k =~ m/^serial/) {
            next if $conf->{$k} eq 'socket';
        }
        next if $k !~ m/^(usb|hostpci|serial|parallel)\d+$/;

        $loc_res = 1;
    }

    die "VM uses local resources\n" if $loc_res && !$noerr;

    return $loc_res;
}
2408
# check if used storages are available on all nodes (used by migrate)
#
# For every drive of $conf whose file parses as a storage volume ID,
# PVE::Storage::storage_check_node() is called once without a node argument
# and once for $node.
sub check_storage_availability {
    my ($storecfg, $conf, $node) = @_;

    my $check_drive = sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($sid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        # check if storage is available on both nodes
        PVE::Storage::storage_check_node($storecfg, $sid);
        PVE::Storage::storage_check_node($storecfg, $sid, $node);
    };

    foreach_drive($conf, $check_drive);
}
2427
719893a9
DM
# list nodes where all VM images are available (used by has_feature API)
#
# Starts with all cluster nodes and narrows the set per drive storage:
#   disabled storage    -> no node at all
#   'nodes' restriction -> only the listed nodes remain
#   non-shared storage  -> only the local node remains
# Returns a hash reference { node => 1 }.
sub shared_nodes {
    my ($conf, $storecfg) = @_;

    my $nodelist = PVE::Cluster::get_nodelist();
    my $nodehash = { map { $_ => 1 } @$nodelist };
    my $nodename = PVE::INotify::nodename();

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($storeid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        my $scfg = PVE::Storage::storage_config($storecfg, $storeid);

        if ($scfg->{disable}) {
            $nodehash = {};
            return;
        }

        if (my $avail = $scfg->{nodes}) {
            my @unavailable = grep { !$avail->{$_} } keys %$nodehash;
            delete @{$nodehash}{@unavailable};
            return;
        }

        if (!$scfg->{shared}) {
            my @remote = grep { $_ ne $nodename } keys %$nodehash;
            delete @{$nodehash}{@remote};
        }
    });

    return $nodehash
}
2461
1e3baf05
DM
# Check that process $pid looks like a kvm/qemu process started with the
# given $pidfile: the first element of /proc/$pid/cmdline must end in 'kvm'
# or 'qemu-system-x86_64', and the argument following the first
# '-pidfile'/'--pidfile' must equal $pidfile.
# Returns 1 on match and a false value otherwise.
sub check_cmdline {
    my ($pidfile, $pid) = @_;

    my $fh = IO::File->new("/proc/$pid/cmdline", "r");
    return undef if !defined($fh);

    my $line = <$fh>;
    $fh->close;
    return undef if !$line;

    # arguments are NUL separated
    my @param = split(/\0/, $line);

    my $cmd = $param[0];
    return if !$cmd || ($cmd !~ m|kvm$| && $cmd !~ m|qemu-system-x86_64$|);

    for my $i (0 .. $#param) {
        my $arg = $param[$i];
        next if !$arg;
        next if ($arg ne '-pidfile') && ($arg ne '--pidfile');

        # only the first pidfile option is considered
        my $candidate = $param[$i+1];
        return 1 if $candidate && ($candidate eq $pidfile);
        return undef;
    }

    return undef;
}
2487
# Return the PID of the running process of VM $vmid, or undef if the VM is
# not running.
#
# Dies if the config file of the VM (looked up on $node) does not exist,
# unless $nocheck is set. The PID is read from the pidfile and is only
# trusted if check_cmdline() and
# PVE::ProcFSTools::check_process_running() both confirm it.
sub check_running {
    my ($vmid, $nocheck, $node) = @_;

    my $filename = PVE::QemuConfig->config_file($vmid, $node);

    die "unable to find configuration file for VM $vmid - no such machine\n"
        if !$nocheck && ! -f $filename;

    my $pidfile = pidfile_name($vmid);

    # explicit read mode instead of a "<name" string, so that the file name
    # can never be interpreted as part of the open mode
    my $fd = IO::File->new($pidfile, 'r');
    return undef if !$fd;

    my $st = stat($fd);
    my $line = <$fd>;
    close($fd);

    # the timestamp checked here belongs to the pidfile, so report that file
    my $mtime = $st->mtime;
    if ($mtime > time()) {
        warn "file '$pidfile' modified in future\n";
    }

    # an empty pidfile yields an undefined line
    if (defined($line) && $line =~ m/^(\d+)$/) {
        my $pid = $1;
        if (check_cmdline($pidfile, $pid)) {
            return $pid if PVE::ProcFSTools::check_process_running($pid);
        }
    }

    return undef;
}
2520
# Return the hash built by config_list(), with a 'pid' entry added for every
# listed VM that has a '<vmid>.pid' file in $var_run_tmpdir and for which
# check_running() returns a PID. If the directory cannot be opened, the
# plain config_list() result is returned.
sub vzlist {

    my $vzlist = config_list();

    my $dir = IO::Dir->new($var_run_tmpdir) || return $vzlist;

    while (defined(my $entry = $dir->read)) {
        next if $entry !~ m/^(\d+)\.pid$/;
        my $vmid = $1;

        next if !defined($vzlist->{$vmid});

        my $pid = check_running($vmid) or next;
        $vzlist->{$vmid}->{pid} = $pid;
    }

    return $vzlist;
}
2538
1e3baf05
DM
# Return the 'size' property of the boot disk configured in $conf, or undef
# if there is no valid boot disk entry, it cannot be parsed, it is a cdrom,
# or it has no file. $storecfg is accepted but not used here.
sub disksize {
    my ($storecfg, $conf) = @_;

    my $bootdisk = $conf->{bootdisk};
    return undef
        if !$bootdisk || !is_valid_drivename($bootdisk) || !$conf->{$bootdisk};

    my $drive = parse_drive($bootdisk, $conf->{$bootdisk});
    return undef
        if !defined($drive) || drive_is_cdrom($drive) || !$drive->{file};

    return $drive->{size};
}
2558
# per-PID sample (time, used CPU ticks, last computed cpu value) kept between
# vmstatus() calls to compute CPU usage deltas
my $last_proc_pid_stat;

# get VM status information
# This must be fast and should not block ($full == false)
# We only query KVM using QMP if $full == true (this can be slow)
#
# Returns { vmid => status hash } for the VMs listed by vzlist(), restricted
# to $opt_vmid when given.
sub vmstatus {
    my ($opt_vmid, $full) = @_;

    my $res = {};

    my $storecfg = PVE::Storage::config();

    my $list = vzlist();
    my ($uptime) = PVE::ProcFSTools::read_proc_uptime(1);

    my $cpucount = $cpuinfo->{cpus} || 1;
    my $mib = 1024*1024;

    # pass 1: values derived from the configuration
    for my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);

        my $cfspath = PVE::QemuConfig->cfs_config_path($vmid);
        my $conf = PVE::Cluster::cfs_read_file($cfspath) || {};

        my $pid = $list->{$vmid}->{pid};
        my $size = disksize($storecfg, $conf);

        my $cpus = ($conf->{sockets} || 1) * ($conf->{cores} || 1);
        $cpus = $cpucount if $cpus > $cpucount;
        $cpus = $conf->{vcpus} if $conf->{vcpus};

        my $d = {
            pid => $pid,
            status => $pid ? 'running' : 'stopped', # fixme: better status?
            disk => 0, # no info available
            maxdisk => defined($size) ? $size : 0,
            cpus => $cpus,
            name => $conf->{name} || "VM $vmid",
            maxmem => $conf->{memory} ? $conf->{memory}*$mib : 0,
            uptime => 0,
            cpu => 0,
            mem => 0,
            netout => 0,
            netin => 0,
            diskread => 0,
            diskwrite => 0,
        };

        if ($conf->{balloon}) {
            $d->{balloon_min} = $conf->{balloon}*$mib;
            $d->{shares} = $conf->{shares} // 1000;
        }

        # assigned separately to keep the call in scalar context
        $d->{template} = PVE::QemuConfig->is_template($conf);

        $res->{$vmid} = $d;
    }

    # pass 2: network counters of the tap devices; the host side 'receive'
    # counter is accounted as the VM's 'netout' and 'transmit' as 'netin'
    my $netdev = PVE::ProcFSTools::read_proc_net_dev();
    for my $dev (keys %$netdev) {
        my ($vmid) = $dev =~ m/^tap([1-9]\d*)i/ or next;

        my $d = $res->{$vmid};
        next if !$d;

        my $counters = $netdev->{$dev};
        $d->{netout} += $counters->{receive};
        $d->{netin} += $counters->{transmit};

        if ($full) {
            $d->{nics}->{$dev}->{netout} = $counters->{receive};
            $d->{nics}->{$dev}->{netin} = $counters->{transmit};
        }
    }

    # pass 3: uptime, memory and cpu usage from /proc/<pid>/stat
    my $ctime = gettimeofday;

    for my $vmid (keys %$list) {

        my $d = $res->{$vmid};
        my $pid = $d->{pid};
        next if !$pid;

        my $pstat = PVE::ProcFSTools::read_proc_pid_stat($pid);
        next if !$pstat; # not running

        my $used = $pstat->{utime} + $pstat->{stime};

        $d->{uptime} = int(($uptime - $pstat->{starttime})/$cpuinfo->{user_hz});

        if ($pstat->{vsize}) {
            $d->{mem} = int(($pstat->{rss}/$pstat->{vsize})*$d->{maxmem});
        }

        my $prev = $last_proc_pid_stat->{$pid};
        if (!$prev) {
            # first sample for this PID: nothing to compare against yet
            $last_proc_pid_stat->{$pid} = {
                time => $ctime,
                used => $used,
                cpu => 0,
            };
            next;
        }

        my $dtime = ($ctime - $prev->{time}) * $cpucount * $cpuinfo->{user_hz};

        if ($dtime <= 1000) {
            # interval too short, reuse the previously computed value
            $d->{cpu} = $prev->{cpu};
            next;
        }

        my $dutime = $used - $prev->{used};

        $d->{cpu} = (($dutime/$dtime)* $cpucount) / $d->{cpus};
        $last_proc_pid_stat->{$pid} = {
            time => $ctime,
            used => $used,
            cpu => $d->{cpu},
        };
    }

    return $res if !$full;

    # $full: additionally query the running VMs via QMP

    my $qmpclient = PVE::QMPClient->new();

    my $ballooncb = sub {
        my ($vmid, $resp) = @_;

        my $info = $resp->{'return'};
        return if !$info->{max_mem};

        my $d = $res->{$vmid};

        # use memory assigned to VM
        $d->{maxmem} = $info->{max_mem};
        $d->{balloon} = $info->{actual};

        if (defined($info->{total_mem}) && defined($info->{free_mem})) {
            $d->{mem} = $info->{total_mem} - $info->{free_mem};
            $d->{freemem} = $info->{free_mem};
        }

        $d->{ballooninfo} = $info;
    };

    my $blockstatscb = sub {
        my ($vmid, $resp) = @_;

        my $data = $resp->{'return'} || [];
        my $totalrdbytes = 0;
        my $totalwrbytes = 0;

        for my $blockstat (@$data) {
            $totalrdbytes += $blockstat->{stats}->{rd_bytes};
            $totalwrbytes += $blockstat->{stats}->{wr_bytes};

            $blockstat->{device} =~ s/drive-//;
            $res->{$vmid}->{blockstat}->{$blockstat->{device}} = $blockstat->{stats};
        }
        $res->{$vmid}->{diskread} = $totalrdbytes;
        $res->{$vmid}->{diskwrite} = $totalwrbytes;
    };

    my $statuscb = sub {
        my ($vmid, $resp) = @_;

        $qmpclient->queue_cmd($vmid, $blockstatscb, 'query-blockstats');
        # this fails if the balloon driver is not loaded, so this must be
        # the last command (following commands are aborted if this fails).
        $qmpclient->queue_cmd($vmid, $ballooncb, 'query-balloon');

        my $status = $resp->{'return'}->{status};
        if (!defined($status)) {
            warn "unable to get VM status\n";
            return;
        }

        $res->{$vmid}->{qmpstatus} = $status;
    };

    for my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        next if !$res->{$vmid}->{pid}; # not running
        $qmpclient->queue_cmd($vmid, $statuscb, 'query-status');
    }

    $qmpclient->queue_execute(undef, 2);

    # fall back to the pid based status where QMP gave no answer
    for my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        $res->{$vmid}->{qmpstatus} ||= $res->{$vmid}->{status};
    }

    return $res;
}
2759
# Call $func->($ds, $drive, @param) for every valid drive name $ds that is
# defined in $conf and whose value parse_drive() can parse; $drive is the
# parsed drive.
sub foreach_drive {
    my ($conf, $func, @param) = @_;

    for my $ds (valid_drive_names()) {
        my $raw = $conf->{$ds};
        next if !defined($raw);

        my $drive = parse_drive($ds, $raw) or next;

        $func->($ds, $drive, @param);
    }
}
2772
# Call $func->($volid, $attr, @param) once for every distinct volume
# referenced by the drives of $conf, by the drives of its snapshots, and by
# snapshot 'vmstate' entries. $attr is a hash with:
#   cdrom     - 1 only if every reference to the volume is a cdrom drive
#   replicate - 1 if at least one reference has replication enabled
#               (a drive without 'replicate' setting counts as enabled)
sub foreach_volid {
    my ($conf, $func, @param) = @_;

    my $volhash = {};

    my $test_volid = sub {
        my ($volid, $is_cdrom, $replicate) = @_;

        return if !$volid;

        my $attr = ($volhash->{$volid} //= {});

        $attr->{cdrom} //= 1;
        $attr->{cdrom} = 0 if !$is_cdrom;

        $attr->{replicate} //= 0;
        $attr->{replicate} = 1 if $replicate;
    };

    my $scan_drive = sub {
        my ($ds, $drive) = @_;
        $test_volid->($drive->{file}, drive_is_cdrom($drive), $drive->{replicate} // 1);
    };

    foreach_drive($conf, $scan_drive);

    for my $snapname (keys %{$conf->{snapshots}}) {
        my $snap = $conf->{snapshots}->{$snapname};
        $test_volid->($snap->{vmstate}, 0, 1);
        foreach_drive($snap, $scan_drive);
    }

    for my $volid (keys %$volhash) {
        $func->($volid, $volhash->{$volid}, @param);
    }
}
2808
86b8228b
DM
# Return 0 unless $vga is 'qxl', 'qxl2', 'qxl3' or 'qxl4'. Otherwise return
# the trailing digit, or 1 for plain 'qxl'.
sub vga_conf_has_spice {
    my ($vga) = @_;

    if ($vga && $vga =~ m/^qxl([234])?$/) {
        return $1 || 1;
    }

    return 0;
}
2816
1e3baf05 2817sub config_to_command {
67812f9c 2818 my ($storecfg, $vmid, $conf, $defaults, $forcemachine) = @_;
1e3baf05
DM
2819
2820 my $cmd = [];
8c559505
DM
2821 my $globalFlags = [];
2822 my $machineFlags = [];
2823 my $rtcFlags = [];
519ed28c 2824 my $cpuFlags = [];
5bdcf937 2825 my $devices = [];
b78ebef7 2826 my $pciaddr = '';
5bdcf937 2827 my $bridges = {};
1e3baf05
DM
2828 my $kvmver = kvm_user_version();
2829 my $vernum = 0; # unknown
b42d3cf9 2830 my $ostype = $conf->{ostype};
4317f69f
AD
2831 my $winversion = windows_version($ostype);
2832
a3c52213
DM
2833 if ($kvmver =~ m/^(\d+)\.(\d+)$/) {
2834 $vernum = $1*1000000+$2*1000;
2835 } elsif ($kvmver =~ m/^(\d+)\.(\d+)\.(\d+)$/) {
1e3baf05
DM
2836 $vernum = $1*1000000+$2*1000+$3;
2837 }
2838
a3c52213 2839 die "detected old qemu-kvm binary ($kvmver)\n" if $vernum < 15000;
1e3baf05
DM
2840
2841 my $have_ovz = -f '/proc/vz/vestat';
2842
db656e5f 2843 my $q35 = machine_type_is_q35($conf);
4d3f29ed 2844 my $hotplug_features = parse_hotplug_features(defined($conf->{hotplug}) ? $conf->{hotplug} : '1');
23f73120 2845 my $machine_type = $forcemachine || $conf->{machine};
249c4a6c
AD
2846 my $use_old_bios_files = undef;
2847 ($use_old_bios_files, $machine_type) = qemu_use_old_bios_files($machine_type);
db656e5f 2848
f08e17c7
AD
2849 my $cpuunits = defined($conf->{cpuunits}) ?
2850 $conf->{cpuunits} : $defaults->{cpuunits};
2851
1e3baf05
DM
2852 push @$cmd, '/usr/bin/kvm';
2853
2854 push @$cmd, '-id', $vmid;
2855
2856 my $use_virtio = 0;
2857
c971c4f2
AD
2858 my $qmpsocket = qmp_socket($vmid);
2859 push @$cmd, '-chardev', "socket,id=qmp,path=$qmpsocket,server,nowait";
2860 push @$cmd, '-mon', "chardev=qmp,mode=control";
2861
1e3baf05 2862
6b64503e 2863 push @$cmd, '-pidfile' , pidfile_name($vmid);
19672434 2864
1e3baf05
DM
2865 push @$cmd, '-daemonize';
2866
2796e7d5
DM
2867 if ($conf->{smbios1}) {
2868 push @$cmd, '-smbios', "type=1,$conf->{smbios1}";
2869 }
2870
3edb45e7 2871 if ($conf->{bios} && $conf->{bios} eq 'ovmf') {
2ddc0a5c
DC
2872 my $ovmfbase;
2873
2874 # prefer the OVMF_CODE variant
2875 if (-f $OVMF_CODE) {
2876 $ovmfbase = $OVMF_CODE;
2877 } elsif (-f $OVMF_IMG) {
2878 $ovmfbase = $OVMF_IMG;
2879 }
2880
2881 die "no uefi base img found\n" if !$ovmfbase;
2882 push @$cmd, '-drive', "if=pflash,unit=0,format=raw,readonly,file=$ovmfbase";
4a5cf64a
WL
2883
2884 if (defined($conf->{efidisk0}) && ($ovmfbase eq $OVMF_CODE)) {
2885 my $d = PVE::JSONSchema::parse_property_string($efidisk_fmt, $conf->{efidisk0});
2ddc0a5c
DC
2886 my $format = $d->{format} // 'raw';
2887 my $path;
2888 my ($storeid, $volname) = PVE::Storage::parse_volume_id($d->{file}, 1);
2889 if ($storeid) {
2890 $path = PVE::Storage::path($storecfg, $d->{file});
2891 my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
2892 $format = qemu_img_format($scfg, $volname);
2893 } else {
2894 $path = $d->{file};
2895 $format = "raw";
2896 }
2897 push @$cmd, '-drive', "if=pflash,unit=1,id=drive-efidisk0,format=$format,file=$path";
2898 } elsif ($ovmfbase eq $OVMF_CODE) {
2899 warn "using uefi without permanent efivars disk\n";
2900 my $ovmfvar_dst = "/tmp/$vmid-ovmf.fd";
2901 PVE::Tools::file_copy($OVMF_VARS, $ovmfvar_dst, 256*1024);
2902 push @$cmd, '-drive', "if=pflash,unit=1,format=raw,file=$ovmfvar_dst";
2903 } else {
2904 # if the base img is not OVMF_CODE, we do not have to bother
2905 # to create/use a vars image, since it will not be used anyway
2906 # this can only happen if someone manually deletes the OVMF_CODE image
2907 # or has an old pve-qemu-kvm version installed.
2908 # both should not happen, but we ignore it here
2909 }
a783c78e
AD
2910 }
2911
da8b4189 2912
d40e5e18
DC
2913 # add usb controllers
2914 my @usbcontrollers = PVE::QemuServer::USB::get_usb_controllers($conf, $bridges, $q35, $usbdesc->{format}, $MAX_USB_DEVICES);
2915 push @$devices, @usbcontrollers if @usbcontrollers;
5acbfe9e 2916 my $vga = $conf->{vga};
2fa3151e 2917
590e698c
DM
2918 my $qxlnum = vga_conf_has_spice($vga);
2919 $vga = 'qxl' if $qxlnum;
2fa3151e 2920
5acbfe9e 2921 if (!$vga) {
4317f69f 2922 $vga = $winversion >= 6 ? 'std' : 'cirrus';
5acbfe9e
DM
2923 }
2924
1e3baf05 2925 # enable absolute mouse coordinates (needed by vnc)
5acbfe9e
DM
2926 my $tablet;
2927 if (defined($conf->{tablet})) {
2928 $tablet = $conf->{tablet};
2929 } else {
2930 $tablet = $defaults->{tablet};
590e698c 2931 $tablet = 0 if $qxlnum; # disable for spice because it is not needed
ef5e2be2 2932 $tablet = 0 if $vga =~ m/^serial\d+$/; # disable if we use serial terminal (no vga card)
5acbfe9e
DM
2933 }
2934
db656e5f 2935 push @$devices, '-device', print_tabletdevice_full($conf) if $tablet;
b467f79a 2936
16a91d65 2937 my $kvm_off = 0;
4317f69f
AD
2938 my $gpu_passthrough;
2939
1e3baf05 2940 # host pci devices
040b06b7 2941 for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
2e3b7e2a
AD
2942 my $d = parse_hostpci($conf->{"hostpci$i"});
2943 next if !$d;
2944
2945 my $pcie = $d->{pcie};
2946 if($pcie){
2947 die "q35 machine model is not enabled" if !$q35;
2948 $pciaddr = print_pcie_addr("hostpci$i");
2949 }else{
2950 $pciaddr = print_pci_addr("hostpci$i", $bridges);
2951 }
2952
1f4f447b 2953 my $rombar = defined($d->{rombar}) && !$d->{rombar} ? ',rombar=0' : '';
9009150b 2954 my $romfile = $d->{romfile};
456a6fec 2955
1f4f447b
WB
2956 my $xvga = '';
2957 if ($d->{'x-vga'}) {
2958 $xvga = ',x-vga=on';
16a91d65 2959 $kvm_off = 1;
137483c0 2960 $vga = 'none';
4317f69f
AD
2961 $gpu_passthrough = 1;
2962
230a4382
AD
2963 if ($conf->{bios} && $conf->{bios} eq 'ovmf') {
2964 $xvga = "";
2965 }
137483c0 2966 }
4543ecf0
AD
2967 my $pcidevices = $d->{pciid};
2968 my $multifunction = 1 if @$pcidevices > 1;
2e3b7e2a 2969
4543ecf0
AD
2970 my $j=0;
2971 foreach my $pcidevice (@$pcidevices) {
2e3b7e2a 2972
4543ecf0
AD
2973 my $id = "hostpci$i";
2974 $id .= ".$j" if $multifunction;
2975 my $addr = $pciaddr;
2976 $addr .= ".$j" if $multifunction;
6ea8cd3b 2977 my $devicestr = "vfio-pci,host=$pcidevice->{id}.$pcidevice->{function},id=$id$addr";
4543ecf0
AD
2978
2979 if($j == 0){
2980 $devicestr .= "$rombar$xvga";
2981 $devicestr .= ",multifunction=on" if $multifunction;
456a6fec 2982 $devicestr .= ",romfile=/usr/share/kvm/$romfile" if $romfile;
4543ecf0
AD
2983 }
2984
2985 push @$devices, '-device', $devicestr;
2986 $j++;
2987 }
1e3baf05
DM
2988 }
2989
2990 # usb devices
d40e5e18
DC
2991 my @usbdevices = PVE::QemuServer::USB::get_usb_devices($conf, $usbdesc->{format}, $MAX_USB_DEVICES);
2992 push @$devices, @usbdevices if @usbdevices;
1e3baf05 2993 # serial devices
bae179aa 2994 for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
34978be3 2995 if (my $path = $conf->{"serial$i"}) {
9f9d2fb2
DM
2996 if ($path eq 'socket') {
2997 my $socket = "/var/run/qemu-server/${vmid}.serial$i";
2998 push @$devices, '-chardev', "socket,id=serial$i,path=$socket,server,nowait";
2999 push @$devices, '-device', "isa-serial,chardev=serial$i";
3000 } else {
3001 die "no such serial device\n" if ! -c $path;
3002 push @$devices, '-chardev', "tty,id=serial$i,path=$path";
3003 push @$devices, '-device', "isa-serial,chardev=serial$i";
3004 }
34978be3 3005 }
1e3baf05
DM
3006 }
3007
3008 # parallel devices
1989a89c 3009 for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
34978be3 3010 if (my $path = $conf->{"parallel$i"}) {
19672434 3011 die "no such parallel device\n" if ! -c $path;
32e69805 3012 my $devtype = $path =~ m!^/dev/usb/lp! ? 'tty' : 'parport';
4c5dbaf6 3013 push @$devices, '-chardev', "$devtype,id=parallel$i,path=$path";
5bdcf937 3014 push @$devices, '-device', "isa-parallel,chardev=parallel$i";
34978be3 3015 }
1e3baf05
DM
3016 }
3017
3018 my $vmname = $conf->{name} || "vm$vmid";
3019
3020 push @$cmd, '-name', $vmname;
19672434 3021
1e3baf05
DM
3022 my $sockets = 1;
3023 $sockets = $conf->{smp} if $conf->{smp}; # old style - no longer iused
3024 $sockets = $conf->{sockets} if $conf->{sockets};
3025
3026 my $cores = $conf->{cores} || 1;
3bd18e48 3027
de9d1e55 3028 my $maxcpus = $sockets * $cores;
76267728 3029
de9d1e55 3030 my $vcpus = $conf->{vcpus} ? $conf->{vcpus} : $maxcpus;
76267728 3031
de9d1e55
AD
3032 my $allowed_vcpus = $cpuinfo->{cpus};
3033
6965d5d1 3034 die "MAX $allowed_vcpus vcpus allowed per VM on this node\n"
de9d1e55
AD
3035 if ($allowed_vcpus < $maxcpus);
3036
69c81430 3037 if($hotplug_features->{cpu} && qemu_machine_feature_enabled ($machine_type, $kvmver, 2, 7)) {
1e3baf05 3038
69c81430
AD
3039 push @$cmd, '-smp', "1,sockets=$sockets,cores=$cores,maxcpus=$maxcpus";
3040 for (my $i = 2; $i <= $vcpus; $i++) {
3041 my $cpustr = print_cpu_device($conf,$i);
3042 push @$cmd, '-device', $cpustr;
3043 }
3044
3045 } else {
3046
3047 push @$cmd, '-smp', "$vcpus,sockets=$sockets,cores=$cores,maxcpus=$maxcpus";
3048 }
1e3baf05
DM
3049 push @$cmd, '-nodefaults';
3050
32baffb4 3051 my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};
3b408e82 3052
0888fdce
DM
3053 my $bootindex_hash = {};
3054 my $i = 1;
3055 foreach my $o (split(//, $bootorder)) {
3056 $bootindex_hash->{$o} = $i*100;
3057 $i++;
afdb31d5 3058 }
3b408e82 3059
dbea4415 3060 push @$cmd, '-boot', "menu=on,strict=on,reboot-timeout=1000,splash=/usr/share/qemu-server/bootsplash.jpg";
1e3baf05 3061
6b64503e 3062 push @$cmd, '-no-acpi' if defined($conf->{acpi}) && $conf->{acpi} == 0;
1e3baf05 3063
6b64503e 3064 push @$cmd, '-no-reboot' if defined($conf->{reboot}) && $conf->{reboot} == 0;
1e3baf05 3065
ef5e2be2 3066 push @$cmd, '-vga', $vga if $vga && $vga !~ m/^serial\d+$/; # for kvm 77 and later
1e3baf05 3067
b7be4ba9
AD
3068 if ($vga && $vga !~ m/^serial\d+$/ && $vga ne 'none'){
3069 my $socket = vnc_socket($vmid);
3070 push @$cmd, '-vnc', "unix:$socket,x509,password";
3071 } else {
3072 push @$cmd, '-nographic';
3073 }
3074
1e3baf05 3075 # time drift fix
6b64503e 3076 my $tdf = defined($conf->{tdf}) ? $conf->{tdf} : $defaults->{tdf};
1e3baf05 3077
6b64503e 3078 my $nokvm = defined($conf->{kvm}) && $conf->{kvm} == 0 ? 1 : 0;
8c559505 3079 my $useLocaltime = $conf->{localtime};
1e3baf05 3080
4317f69f
AD
3081 if ($winversion >= 5) { # windows
3082 $useLocaltime = 1 if !defined($conf->{localtime});
7a131888 3083
4317f69f
AD
3084 # use time drift fix when acpi is enabled
3085 if (!(defined($conf->{acpi}) && $conf->{acpi} == 0)) {
3086 $tdf = 1 if !defined($conf->{tdf});
462e8d19 3087 }
4317f69f 3088 }
462e8d19 3089
4317f69f
AD
3090 if ($winversion >= 6) {
3091 push @$globalFlags, 'kvm-pit.lost_tick_policy=discard';
3092 push @$cmd, '-no-hpet';
1e3baf05
DM
3093 }
3094
8c559505
DM
3095 push @$rtcFlags, 'driftfix=slew' if $tdf;
3096
7f0b5beb 3097 if ($nokvm) {
8c559505 3098 push @$machineFlags, 'accel=tcg';
7f0b5beb
DM
3099 } else {
3100 die "No accelerator found!\n" if !$cpuinfo->{hvm};
3101 }
1e3baf05 3102
952958bc
DM
3103 if ($machine_type) {
3104 push @$machineFlags, "type=${machine_type}";
3bafc510
DM
3105 }
3106
8c559505
DM
3107 if ($conf->{startdate}) {
3108 push @$rtcFlags, "base=$conf->{startdate}";
3109 } elsif ($useLocaltime) {
3110 push @$rtcFlags, 'base=localtime';
3111 }
1e3baf05 3112
519ed28c 3113 my $cpu = $nokvm ? "qemu64" : "kvm64";
16a91d65 3114 if (my $cputype = $conf->{cpu}) {
ff6ffe20 3115 my $cpuconf = PVE::JSONSchema::parse_property_string($cpu_fmt, $cputype)
16a91d65
WB
3116 or die "Cannot parse cpu description: $cputype\n";
3117 $cpu = $cpuconf->{cputype};
3118 $kvm_off = 1 if $cpuconf->{hidden};
3119 }
519ed28c 3120
4dc339e7
AD
3121 push @$cpuFlags , '+lahf_lm' if $cpu eq 'kvm64';
3122
d853f40a
DM
3123 push @$cpuFlags , '-x2apic'
3124 if $conf->{ostype} && $conf->{ostype} eq 'solaris';
519ed28c 3125
2e1a5389
AD
3126 push @$cpuFlags, '+sep' if $cpu eq 'kvm64' || $cpu eq 'kvm32';
3127
0dc48c3d
AD
3128 push @$cpuFlags, '-rdtscp' if $cpu =~ m/^Opteron/;
3129
117a0414
AD
3130 if (qemu_machine_feature_enabled ($machine_type, $kvmver, 2, 3)) {
3131
3132 push @$cpuFlags , '+kvm_pv_unhalt' if !$nokvm;
0da5a08c 3133 push @$cpuFlags , '+kvm_pv_eoi' if !$nokvm;
117a0414
AD
3134 }
3135
4317f69f
AD
3136 add_hyperv_enlighments($cpuFlags, $winversion, $machine_type, $kvmver, $nokvm, $conf->{bios}, $gpu_passthrough);
3137
f1f7ea88 3138 push @$cpuFlags, 'enforce' if $cpu ne 'host' && !$nokvm;
dac7c619 3139
16a91d65
WB
3140 push @$cpuFlags, 'kvm=off' if $kvm_off;
3141
8930da74
DM
3142 my $cpu_vendor = $cpu_vendor_list->{$cpu} ||
3143 die "internal error"; # should not happen
3144
3145 push @$cpuFlags, "vendor=${cpu_vendor}"
3146 if $cpu_vendor ne 'default';
3147
be190583 3148 $cpu .= "," . join(',', @$cpuFlags) if scalar(@$cpuFlags);
519ed28c 3149
dac7c619 3150 push @$cmd, '-cpu', $cpu;
519ed28c 3151
0567a4d5
AD
3152 PVE::QemuServer::Memory::config($conf, $vmid, $sockets, $cores, $defaults, $hotplug_features, $cmd);
3153
1e3baf05
DM
3154 push @$cmd, '-S' if $conf->{freeze};
3155
3156 # set keyboard layout
3157 my $kb = $conf->{keyboard} || $defaults->{keyboard};
3158 push @$cmd, '-k', $kb if $kb;
3159
3160 # enable sound
3161 #my $soundhw = $conf->{soundhw} || $defaults->{soundhw};
3162 #push @$cmd, '-soundhw', 'es1370';
3163 #push @$cmd, '-soundhw', $soundhw if $soundhw;
ab6a046f 3164
bc84dcca 3165 if($conf->{agent}) {
7a6c2150 3166 my $qgasocket = qmp_socket($vmid, 1);
ab6a046f
AD
3167 my $pciaddr = print_pci_addr("qga0", $bridges);
3168 push @$devices, '-chardev', "socket,path=$qgasocket,server,nowait,id=qga0";
3169 push @$devices, '-device', "virtio-serial,id=qga0$pciaddr";
3170 push @$devices, '-device', 'virtserialport,chardev=qga0,name=org.qemu.guest_agent.0';
3171 }
3172
1d794448 3173 my $spice_port;
2fa3151e 3174
590e698c
DM
3175 if ($qxlnum) {
3176 if ($qxlnum > 1) {
ac087616 3177 if ($winversion){
590e698c
DM
3178 for(my $i = 1; $i < $qxlnum; $i++){
3179 my $pciaddr = print_pci_addr("vga$i", $bridges);
3180 push @$cmd, '-device', "qxl,id=vga$i,ram_size=67108864,vram_size=33554432$pciaddr";
3181 }
3182 } else {
3183 # assume other OS works like Linux
3184 push @$cmd, '-global', 'qxl-vga.ram_size=134217728';
3185 push @$cmd, '-global', 'qxl-vga.vram_size=67108864';
2fa3151e
AD
3186 }
3187 }
3188
1011b570 3189 my $pciaddr = print_pci_addr("spice", $bridges);
95a4b4a9 3190
af0eba7e
WB
3191 my $nodename = PVE::INotify::nodename();
3192 my $pfamily = PVE::Tools::get_host_address_family($nodename);
91152441
WB
3193 my @nodeaddrs = PVE::Tools::getaddrinfo_all('localhost', family => $pfamily);
3194 die "failed to get an ip address of type $pfamily for 'localhost'\n" if !@nodeaddrs;
3195 my $localhost = PVE::Network::addr_to_ip($nodeaddrs[0]->{addr});
3196 $spice_port = PVE::Tools::next_spice_port($pfamily, $localhost);
943340a6 3197
91152441 3198 push @$devices, '-spice', "tls-port=${spice_port},addr=$localhost,tls-ciphers=HIGH,seamless-migration=on";
1011b570 3199
d2da6d9b
AD
3200 push @$devices, '-device', "virtio-serial,id=spice$pciaddr";
3201 push @$devices, '-chardev', "spicevmc,id=vdagent,name=vdagent";
3202 push @$devices, '-device', "virtserialport,chardev=vdagent,name=com.redhat.spice.0";
1011b570
DM
3203 }
3204
8d9ae0d2
DM
3205 # enable balloon by default, unless explicitly disabled
3206 if (!defined($conf->{balloon}) || $conf->{balloon}) {
3207 $pciaddr = print_pci_addr("balloon0", $bridges);
3208 push @$devices, '-device', "virtio-balloon-pci,id=balloon0$pciaddr";
3209 }
1e3baf05 3210
0ea9541d
DM
3211 if ($conf->{watchdog}) {
3212 my $wdopts = parse_watchdog($conf->{watchdog});
5bdcf937 3213 $pciaddr = print_pci_addr("watchdog", $bridges);
0a40e8ea 3214 my $watchdog = $wdopts->{model} || 'i6300esb';
5bdcf937
AD
3215 push @$devices, '-device', "$watchdog$pciaddr";
3216 push @$devices, '-watchdog-action', $wdopts->{action} if $wdopts->{action};
0ea9541d
DM
3217 }
3218
1e3baf05 3219 my $vollist = [];
941e0c42 3220 my $scsicontroller = {};
26ee04b6 3221 my $ahcicontroller = {};
cdd20088 3222 my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : $defaults->{scsihw};
1e3baf05 3223
5881b913
DM
3224 # Add iscsi initiator name if available
3225 if (my $initiator = get_initiator_name()) {
3226 push @$devices, '-iscsi', "initiator-name=$initiator";
3227 }
3228
1e3baf05
DM
3229 foreach_drive($conf, sub {
3230 my ($ds, $drive) = @_;
3231
ff1a2432 3232 if (PVE::Storage::parse_volume_id($drive->{file}, 1)) {
1e3baf05 3233 push @$vollist, $drive->{file};
ff1a2432 3234 }
afdb31d5 3235
1e3baf05 3236 $use_virtio = 1 if $ds =~ m/^virtio/;
3b408e82
DM
3237
3238 if (drive_is_cdrom ($drive)) {
3239 if ($bootindex_hash->{d}) {
3240 $drive->{bootindex} = $bootindex_hash->{d};
3241 $bootindex_hash->{d} += 1;
3242 }
3243 } else {
3244 if ($bootindex_hash->{c}) {
3245 $drive->{bootindex} = $bootindex_hash->{c} if $conf->{bootdisk} && ($conf->{bootdisk} eq $ds);
3246 $bootindex_hash->{c} += 1;
3247 }
3248 }
3249
51f492cd
AD
3250 if($drive->{interface} eq 'virtio'){
3251 push @$cmd, '-object', "iothread,id=iothread-$ds" if $drive->{iothread};
3252 }
3253
941e0c42 3254 if ($drive->{interface} eq 'scsi') {
cdd20088 3255
ee034f5c 3256 my ($maxdev, $controller, $controller_prefix) = scsihw_infos($conf, $drive);
6731a4cf 3257
6731a4cf 3258 $pciaddr = print_pci_addr("$controller_prefix$controller", $bridges);
a1b7d579 3259 my $scsihw_type = $scsihw =~ m/^virtio-scsi-single/ ? "virtio-scsi-pci" : $scsihw;
fc8b40fd
AD
3260
3261 my $iothread = '';
3262 if($conf->{scsihw} && $conf->{scsihw} eq "virtio-scsi-single" && $drive->{iothread}){
3263 $iothread .= ",iothread=iothread-$controller_prefix$controller";
3264 push @$cmd, '-object', "iothread,id=iothread-$controller_prefix$controller";
e7a5104d
DC
3265 } elsif ($drive->{iothread}) {
3266 warn "iothread is only valid with virtio disk or virtio-scsi-single controller, ignoring\n";
fc8b40fd
AD
3267 }
3268
6e11f143
AD
3269 my $queues = '';
3270 if($conf->{scsihw} && $conf->{scsihw} eq "virtio-scsi-single" && $drive->{queues}){
3271 $queues = ",num_queues=$drive->{queues}";
3272 }
3273
3274 push @$devices, '-device', "$scsihw_type,id=$controller_prefix$controller$pciaddr$iothread$queues" if !$scsicontroller->{$controller};
cdd20088 3275 $scsicontroller->{$controller}=1;
941e0c42 3276 }
3b408e82 3277
26ee04b6
DA
3278 if ($drive->{interface} eq 'sata') {
3279 my $controller = int($drive->{index} / $MAX_SATA_DISKS);
5bdcf937
AD
3280 $pciaddr = print_pci_addr("ahci$controller", $bridges);
3281 push @$devices, '-device', "ahci,id=ahci$controller,multifunction=on$pciaddr" if !$ahcicontroller->{$controller};
26ee04b6
DA
3282 $ahcicontroller->{$controller}=1;
3283 }
46f58b5f 3284
6470743f
DC
3285 if ($drive->{interface} eq 'efidisk') {
3286 # this will be added somewhere else
3287 return;
3288 }
3289
15b21acc
MR
3290 my $drive_cmd = print_drive_full($storecfg, $vmid, $drive);
3291 push @$devices, '-drive',$drive_cmd;
46f58b5f 3292 push @$devices, '-device', print_drivedevice_full($storecfg, $conf, $vmid, $drive, $bridges);
1e3baf05
DM
3293 });
3294
cc4d6182 3295 for (my $i = 0; $i < $MAX_NETS; $i++) {
5f0c4c32 3296 next if !$conf->{"net$i"};
cc4d6182
DA
3297 my $d = parse_net($conf->{"net$i"});
3298 next if !$d;
1e3baf05 3299
cc4d6182 3300 $use_virtio = 1 if $d->{model} eq 'virtio';
1e3baf05 3301
cc4d6182
DA
3302 if ($bootindex_hash->{n}) {
3303 $d->{bootindex} = $bootindex_hash->{n};
3304 $bootindex_hash->{n} += 1;
3305 }
1e3baf05 3306
cc4d6182 3307 my $netdevfull = print_netdev_full($vmid,$conf,$d,"net$i");
5bdcf937
AD
3308 push @$devices, '-netdev', $netdevfull;
3309
ba9e1000 3310 my $netdevicefull = print_netdevice_full($vmid, $conf, $d, "net$i", $bridges, $use_old_bios_files);
5bdcf937
AD
3311 push @$devices, '-device', $netdevicefull;
3312 }
1e3baf05 3313
db656e5f
DM
3314 if (!$q35) {
3315 # add pci bridges
fc79e813
AD
3316 if (qemu_machine_feature_enabled ($machine_type, $kvmver, 2, 3)) {
3317 $bridges->{1} = 1;
3318 $bridges->{2} = 1;
3319 }
3320
6731a4cf
AD
3321 $bridges->{3} = 1 if $scsihw =~ m/^virtio-scsi-single/;
3322
f8e83f05
AD
3323 while (my ($k, $v) = each %$bridges) {
3324 $pciaddr = print_pci_addr("pci.$k");
3325 unshift @$devices, '-device', "pci-bridge,id=pci.$k,chassis_nr=$k$pciaddr" if $k > 0;
3326 }
19672434
DM
3327 }
3328
1e3baf05
DM
3329 # add custom args
3330 if ($conf->{args}) {
3ada46c9 3331 my $aa = PVE::Tools::split_args($conf->{args});
1e3baf05
DM
3332 push @$cmd, @$aa;
3333 }
3334
5bdcf937 3335 push @$cmd, @$devices;
be190583 3336 push @$cmd, '-rtc', join(',', @$rtcFlags)
8c559505 3337 if scalar(@$rtcFlags);
be190583 3338 push @$cmd, '-machine', join(',', @$machineFlags)
8c559505
DM
3339 if scalar(@$machineFlags);
3340 push @$cmd, '-global', join(',', @$globalFlags)
3341 if scalar(@$globalFlags);
3342
1d794448 3343 return wantarray ? ($cmd, $vollist, $spice_port) : $cmd;
1e3baf05 3344}
19672434 3345
1e3baf05
DM
# Return the path of the unix socket used for the VNC display of VM $vmid
# (a file named "<vmid>.vnc" below $var_run_tmpdir).
sub vnc_socket {
    my ($vmid) = @_;

    return join('/', $var_run_tmpdir, "$vmid.vnc");
}
3350
# Query the running VM $vmid (monitor command 'query-spice') for its SPICE
# port.
#
# Returns the 'tls-port' if one is reported, otherwise the plain 'port'.
# Dies with "no spice port" when neither value is set.
sub spice_port {
    my ($vmid) = @_;

    my $info = vm_mon_cmd($vmid, 'query-spice');

    foreach my $key ('tls-port', 'port') {
        return $info->{$key} if $info->{$key};
    }

    die "no spice port\n";
}
3358
# Return the path of a monitor socket of VM $vmid below $var_run_tmpdir.
#
# With a true $qga the guest agent socket ("<vmid>.qga") is returned,
# otherwise the QMP control socket ("<vmid>.qmp").
sub qmp_socket {
    my ($vmid, $qga) = @_;

    my $sockettype = 'qmp';
    $sockettype = 'qga' if $qga;

    return "${var_run_tmpdir}/$vmid.$sockettype";
}
3364
1e3baf05
DM
# Return the path of the pid file of VM $vmid ("<vmid>.pid" below
# $var_run_tmpdir).
sub pidfile_name {
    my ($vmid) = @_;

    return join('/', $var_run_tmpdir, "$vmid.pid");
}
3369
86fdcfb2
DA
# Collect the ids of the devices currently present in the running VM $vmid.
#
# Four monitor queries are combined into one hash reference keyed by
# device id:
#   * query-pci:  every PCI device that has a 'qdev_id'. For a PCI bridge
#                 the value is 1 plus the number of devices behind it that
#                 have a 'qdev_id'; those devices are listed as well.
#   * query-block: block devices named 'drive-<id>' are listed as '<id>'.
#   * query-mice: 'tablet' is set when a 'QEMU HID Tablet' is reported.
#   * qom-list on /machine/peripheral: entries named 'usb<N>' (there is no
#                 query-usb command).
# All values other than the bridge counter are 1.
sub vm_devices_list {
    my ($vmid) = @_;

    my $pci_buses = vm_mon_cmd($vmid, 'query-pci');
    my $devices = {};

    foreach my $bus (@$pci_buses) {
        foreach my $pcidev (@{$bus->{devices}}) {
            my $id = $pcidev->{'qdev_id'};
            next if !$id;

            $devices->{$id} = 1;
            next if !$pcidev->{'pci_bridge'};

            # count the identified devices sitting behind this bridge
            foreach my $child (@{$pcidev->{'pci_bridge'}->{devices}}) {
                my $child_id = $child->{'qdev_id'};
                next if !$child_id;
                $devices->{$child_id} = 1;
                $devices->{$id}++;
            }
        }
    }

    my $blockdevs = vm_mon_cmd($vmid, 'query-block');
    foreach my $blockdev (@$blockdevs) {
        $devices->{$1} = 1 if $blockdev->{device} =~ m/^drive-(\S+)/;
    }

    my $mice = vm_mon_cmd($vmid, 'query-mice');
    foreach my $mouse (@$mice) {
        next if $mouse->{name} ne 'QEMU HID Tablet';
        $devices->{tablet} = 1;
        last;
    }

    # for usb devices there is no query-usb
    # but we can iterate over the entries in
    # qom-list path=/machine/peripheral
    my $peripherals = vm_mon_cmd($vmid, 'qom-list', path => '/machine/peripheral');
    foreach my $peripheral (@$peripherals) {
        my $name = $peripheral->{name};
        $devices->{$name} = 1 if $name =~ m/^usb\d+$/;
    }

    return $devices;
}
3418
# Hot-plug the device $deviceid into the running VM $vmid.
#
# Parameters:
#   $storecfg - storage configuration, passed on to the drive helpers
#   $conf     - VM configuration hash
#   $vmid     - id of the running VM
#   $deviceid - id of the device to add: 'tablet', 'usbN', 'virtioN',
#               'virtioscsiN'/'scsihwN', 'scsiN', 'netN' or 'pci.N'
#   $device   - parsed device settings (used by the usb, drive, scsi
#               controller and net branches)
#
# Returns 1 if the device is already present or was added. Returns undef
# if qemu_netdevadd reports failure. Dies on any other error; in that case
# a drive or netdev backend that was already added for the device is
# removed again before the error is re-thrown.
sub vm_deviceplug {
    my ($storecfg, $conf, $vmid, $deviceid, $device) = @_;

    my $q35 = machine_type_is_q35($conf);

    # nothing to do when the guest already has this device
    my $devices_list = vm_devices_list($vmid);
    return 1 if defined($devices_list->{$deviceid});

    qemu_add_pci_bridge($storecfg, $conf, $vmid, $deviceid); # add PCI bridge if we need it for the device

    if ($deviceid eq 'tablet') {

        qemu_deviceadd($vmid, print_tabletdevice_full($conf));

    } elsif ($deviceid =~ m/^usb(\d+)$/) {

        die "usb hotplug currently not reliable\n";
        # since we can't reliably hot unplug all added usb devices
        # and usb passthrough disables live migration
        # we disable usb hotplugging for now
        qemu_deviceadd($vmid, PVE::QemuServer::USB::print_usbdevice_full($conf, $deviceid, $device));

    } elsif ($deviceid =~ m/^(virtio)(\d+)$/) {

        qemu_iothread_add($vmid, $deviceid, $device);

        qemu_driveadd($storecfg, $vmid, $device);
        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);

        # device_add itself may fail as well; keep it inside the eval so
        # that the drive added above does not stay behind in that case
        eval {
            qemu_deviceadd($vmid, $devicefull);
            qemu_deviceaddverify($vmid, $deviceid);
        };
        if (my $err = $@) {
            eval { qemu_drivedel($vmid, $deviceid); };
            warn $@ if $@;
            die $err;
        }

    } elsif ($deviceid =~ m/^(virtioscsi|scsihw)(\d+)$/) {

        my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : "lsi";
        my $pciaddr = print_pci_addr($deviceid);
        my $scsihw_type = $scsihw eq 'virtio-scsi-single' ? "virtio-scsi-pci" : $scsihw;

        my $devicefull = "$scsihw_type,id=$deviceid$pciaddr";

        # iothread and num_queues are only set on 'virtioscsiN' controllers
        if($deviceid =~ m/^virtioscsi(\d+)$/ && $device->{iothread}) {
            qemu_iothread_add($vmid, $deviceid, $device);
            $devicefull .= ",iothread=iothread-$deviceid";
        }

        if($deviceid =~ m/^virtioscsi(\d+)$/ && $device->{queues}) {
            $devicefull .= ",num_queues=$device->{queues}";
        }

        qemu_deviceadd($vmid, $devicefull);
        qemu_deviceaddverify($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        # make sure the controller exists before the drive is attached
        qemu_findorcreatescsihw($storecfg,$conf, $vmid, $device);
        qemu_driveadd($storecfg, $vmid, $device);

        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);
        eval { qemu_deviceadd($vmid, $devicefull); };
        if (my $err = $@) {
            eval { qemu_drivedel($vmid, $deviceid); };
            warn $@ if $@;
            die $err;
        }

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        return undef if !qemu_netdevadd($vmid, $conf, $device, $deviceid);

        # everything after netdev_add runs inside the eval, so the backend
        # is removed again whichever later step fails
        eval {
            my $machine_type = PVE::QemuServer::qemu_machine_pxe($vmid, $conf);
            my $use_old_bios_files = undef;
            ($use_old_bios_files, $machine_type) = qemu_use_old_bios_files($machine_type);

            my $netdevicefull = print_netdevice_full($vmid, $conf, $device, $deviceid, undef, $use_old_bios_files);
            qemu_deviceadd($vmid, $netdevicefull);
            qemu_deviceaddverify($vmid, $deviceid);
        };
        if (my $err = $@) {
            eval { qemu_netdevdel($vmid, $deviceid); };
            warn $@ if $@;
            die $err;
        }

    } elsif (!$q35 && $deviceid =~ m/^(pci\.)(\d+)$/) {

        my $bridgeid = $2;
        my $pciaddr = print_pci_addr($deviceid);
        my $devicefull = "pci-bridge,id=pci.$bridgeid,chassis_nr=$bridgeid$pciaddr";

        qemu_deviceadd($vmid, $devicefull);
        qemu_deviceaddverify($vmid, $deviceid);

    } else {
        die "can't hotplug device '$deviceid'\n";
    }

    return 1;
}
3522
3eec5767 3523# fixme: this should raise exceptions on error!
# Hot-unplug the device $deviceid from the running VM $vmid.
#
# Returns 1 when the device is not present (any more). Dies when the
# device is the configured boot disk, when the device type cannot be
# unplugged, or when one of the monitor helpers fails.
sub vm_deviceunplug {
    my ($vmid, $conf, $deviceid) = @_;

    my $plugged = vm_devices_list($vmid);
    return 1 unless defined($plugged->{$deviceid});

    die "can't unplug bootdisk" if $conf->{bootdisk} && $conf->{bootdisk} eq $deviceid;

    if ($deviceid eq 'tablet') {

        qemu_devicedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^usb\d+$/) {

        die "usb hotplug currently not reliable\n";
        # when unplugging usb devices this way,
        # there may be remaining usb controllers/hubs
        # so we disable it for now
        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);

    } elsif ($deviceid =~ m/^virtio\d+$/) {

        # guest device first, then its backing drive and iothread object
        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);
        qemu_drivedel($vmid, $deviceid);
        qemu_iothread_del($conf, $vmid, $deviceid);

    } elsif ($deviceid =~ m/^(?:virtioscsi|scsihw)\d+$/) {

        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);
        qemu_iothread_del($conf, $vmid, $deviceid);

    } elsif ($deviceid =~ m/^scsi\d+$/) {

        #qemu 2.3 segfault on drive_del with virtioscsi + iothread
        my $drive = parse_drive($deviceid, $conf->{$deviceid});
        die "virtioscsi with iothread is not hot-unplugglable currently" if $drive->{iothread};

        qemu_devicedel($vmid, $deviceid);
        qemu_drivedel($vmid, $deviceid);
        qemu_deletescsihw($conf, $vmid, $deviceid);

    } elsif ($deviceid =~ m/^net\d+$/) {

        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);
        qemu_netdevdel($vmid, $deviceid);

    } else {
        die "can't unplug device '$deviceid'\n";
    }

    return 1;
}
3580
# Add a device to the running VM $vmid with the monitor command
# 'device_add'.
#
# $devicefull is a device description of the form
# "<driver>,key=value,key=value,..."; the driver name is passed as the
# 'driver' option, every other pair as an option of its own.
# Returns whatever vm_mon_cmd returns.
sub qemu_deviceadd {
    my ($vmid, $devicefull) = @_;

    my %options;
    foreach my $pair (split(/,/, "driver=$devicefull")) {
        next if $pair eq '';
        # split at the first '=' only: a value that itself contains '='
        # must not shift the following keys and values against each other
        my ($key, $value) = split(/=/, $pair, 2);
        $options{$key} = $value;
    }

    vm_mon_cmd($vmid, "device_add" , %options);
}
afdb31d5 3589
# Request removal of device $deviceid from the running VM $vmid (monitor
# command 'device_del') and return the monitor's answer.
sub qemu_devicedel {
    my ($vmid, $deviceid) = @_;

    return scalar(vm_mon_cmd($vmid, "device_del", id => $deviceid));
}
3595
22de899a
AD
# Create the iothread object "iothread-<deviceid>" in the running VM $vmid
# if $device has 'iothread' set and the object does not exist yet.
sub qemu_iothread_add {
    my ($vmid, $deviceid, $device) = @_;

    if ($device->{iothread}) {
        my $objectid = "iothread-$deviceid";
        my $existing = vm_iothreads_list($vmid);
        qemu_objectadd($vmid, $objectid, "iothread") if !$existing->{$objectid};
    }
}
3604
# Remove the iothread object "iothread-<deviceid>" from the running VM
# $vmid, if the device was configured with an iothread and the object
# still exists.
#
# $deviceid is either a drive id ('virtioN') or a controller id
# ('virtioscsiN'). A 'virtioscsiN' controller is created for the drive
# 'scsiN', and it is that drive's configuration which carries the
# iothread flag, so the flag is looked up there.
# NOTE(review): assumes controller ids never appear as config keys
# themselves - confirm against the config schema.
sub qemu_iothread_del {
    my($conf, $vmid, $deviceid) = @_;

    my $confid = $deviceid;
    if ($deviceid =~ m/^virtioscsi(\d+)$/) {
        $confid = "scsi$1";
    }

    # no config entry (e.g. 'scsihwN' controllers): nothing to look up
    return if !defined($conf->{$confid});

    my $device = parse_drive($confid, $conf->{$confid});
    return if !$device || !$device->{iothread};

    my $iothreads = vm_iothreads_list($vmid);
    qemu_objectdel($vmid, "iothread-$deviceid") if $iothreads->{"iothread-$deviceid"};
}
3614
4d3f29ed
AD
# Create an object of type $qomtype with id $objectid in the running VM
# $vmid (monitor command 'object-add'). Returns 1.
sub qemu_objectadd {
    my ($vmid, $objectid, $qomtype) = @_;

    my @params = (id => $objectid, "qom-type" => $qomtype);
    vm_mon_cmd($vmid, "object-add", @params);

    return 1;
}
3622
# Delete the object with id $objectid from the running VM $vmid (monitor
# command 'object-del'). Returns 1.
sub qemu_objectdel {
    my ($vmid, $objectid) = @_;

    my @params = (id => $objectid);
    vm_mon_cmd($vmid, "object-del", @params);

    return 1;
}
3630
# Add the drive described by $device to the running VM $vmid using the
# human monitor command 'drive_add'.
#
# Returns 1 on success; dies with the monitor output otherwise.
sub qemu_driveadd {
    my ($storecfg, $vmid, $device) = @_;

    # every backslash is doubled before the string is embedded in the
    # quoted monitor argument
    (my $drive = print_drive_full($storecfg, $vmid, $device)) =~ s/\\/\\\\/g;

    my $ret = vm_human_monitor_command($vmid, "drive_add auto \"$drive\"");

    # If the command succeeds qemu prints: "OK"
    die "adding drive failed: $ret\n" if $ret !~ m/OK/s;

    return 1;
}
afdb31d5 3643
5e5dcb73
DA
# Delete the drive "drive-<deviceid>" from the running VM $vmid using the
# human monitor command 'drive_del'.
#
# Returns 1 when the monitor prints nothing (ignoring leading whitespace)
# or reports that the device was not found; dies with the monitor output
# otherwise.
sub qemu_drivedel {
    my ($vmid, $deviceid) = @_;

    my $ret = vm_human_monitor_command($vmid, "drive_del drive-$deviceid");
    $ret =~ s/^\s+//;

    # NB: device not found errors mean the drive was auto-deleted and we ignore the error
    if ($ret eq "" || $ret =~ m/Device \'.*?\' not found/s) {
        return 1;
    }

    die "deleting drive $deviceid failed : $ret\n";
}
f19d1c47 3657
# Wait until device $deviceid shows up in the device list of VM $vmid.
#
# The list is checked up to six times with a one second pause after each
# unsuccessful check. Returns 1 as soon as the device is listed; dies if
# it never appears.
sub qemu_deviceaddverify {
    my ($vmid, $deviceid) = @_;

    foreach my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if defined($present->{$deviceid});
        sleep 1;
    }

    die "error on hotplug device '$deviceid'\n";
}
afdb31d5 3669
5e5dcb73
DA
3670
# Wait until device $deviceid has disappeared from the device list of VM
# $vmid.
#
# device_del is asynchronous and its empty return value is not a reliable
# indication of success, so the device list is polled instead: up to six
# checks with a one second pause after each unsuccessful one. Returns 1
# once the device is gone; dies if it is still listed afterwards.
sub qemu_devicedelverify {
    my ($vmid, $deviceid) = @_;

    foreach my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 unless defined($present->{$deviceid});
        sleep 1;
    }

    die "error on hot-unplugging device '$deviceid'\n";
}
3685
# Make sure the SCSI controller needed by the drive $device exists in the
# running VM $vmid, hot-plugging it when it is missing.
#
# The controller id is built from the prefix and controller number that
# scsihw_infos returns for the drive. Always returns 1.
sub qemu_findorcreatescsihw {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my ($maxdev, $controller, $controller_prefix) = scsihw_infos($conf, $device);
    my $scsihwid = $controller_prefix . $controller;

    my $present = vm_devices_list($vmid);
    vm_deviceplug($storecfg, $conf, $vmid, $scsihwid, $device)
        unless defined($present->{$scsihwid});

    return 1;
}
3700
8ce30dde
AD
# Remove the SCSI controller that served the drive $opt from the running
# VM $vmid, unless another plugged SCSI drive is found that still needs it.
#
# With scsihw 'virtio-scsi-single' the controller "virtioscsi<index>" of
# the drive is unplugged unconditionally. Otherwise "scsihw<controller>"
# is unplugged only if no other plugged SCSI drive falls below the index
# bound computed from scsihw_infos. Always returns 1.
sub qemu_deletescsihw {
    my ($conf, $vmid, $opt) = @_;

    my $device = parse_drive($opt, $conf->{$opt});

    my $scsihw = $conf->{scsihw};
    if ($scsihw && $scsihw eq 'virtio-scsi-single') {
        vm_deviceunplug($vmid, $conf, "virtioscsi$device->{index}");
        return 1;
    }

    my ($maxdev, $controller, $controller_prefix) = scsihw_infos($conf, $device);

    my $devices_list = vm_devices_list($vmid);
    foreach my $devid (keys %{$devices_list}) {
        next if !PVE::QemuServer::is_valid_drivename($devid);

        my $drive = PVE::QemuServer::parse_drive($devid, $conf->{$devid});
        # NOTE(review): this bound does not obviously select only the
        # drives attached to $controller - confirm against scsihw_infos
        return 1
            if $drive->{interface} eq 'scsi' && $drive->{index} < (($maxdev-1)*($controller+1));
    }

    vm_deviceunplug($vmid, $conf, "scsihw$controller");

    return 1;
}
3729
# Hot-plug the PCI bridge that the device id $device is placed on, if the
# bridge is not present in the running VM $vmid yet.
#
# print_pci_addr records the bridge it uses for the device in the hash
# passed to it; bridge ids below 1 (or no bridge at all) need no action.
# Always returns 1.
sub qemu_add_pci_bridge {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $bridges = {};
    print_pci_addr($device, $bridges);

    # same pick as iterating with each(): the last key in hash order
    my ($bridgeid) = (keys %$bridges)[-1];
    return 1 if !defined($bridgeid) || $bridgeid < 1;

    my $bridge = "pci.$bridgeid";
    my $present = vm_devices_list($vmid);

    vm_deviceplug($storecfg, $conf, $vmid, $bridge)
        unless defined($present->{$bridge});

    return 1;
}
3753
25088687
DM
# Set the link state of the network device $device in the running VM
# $vmid (monitor command 'set_link'); a true $up brings the link up, a
# false value takes it down.
sub qemu_set_link_status {
    my ($vmid, $device, $up) = @_;

    my $state = $up ? JSON::true : JSON::false;

    vm_mon_cmd($vmid, "set_link", name => $device, up => $state);
}
3760
2630d2a9
DA
# Add the network backend for $deviceid to the running VM $vmid with the
# monitor command 'netdev_add'.
#
# The backend description comes from print_netdev_full as a comma
# separated list of key=value pairs; each pair is passed to the monitor as
# an option of its own. Always returns 1 (errors are raised by
# vm_mon_cmd).
sub qemu_netdevadd {
    my ($vmid, $conf, $device, $deviceid) = @_;

    my $netdev = print_netdev_full($vmid, $conf, $device, $deviceid, 1);

    my %options;
    foreach my $pair (split(/,/, $netdev)) {
        next if $pair eq '';
        # split at the first '=' only: a value that itself contains '='
        # must not shift the following keys and values against each other
        my ($key, $value) = split(/=/, $pair, 2);
        $options{$key} = $value;
    }

    vm_mon_cmd($vmid, "netdev_add", %options);
    return 1;
}
3770
# Remove the network backend $deviceid from the running VM using the
# "netdev_del" monitor command. Returns whatever vm_mon_cmd() returns.
sub qemu_netdevdel {
    my ($vmid, $deviceid) = @_;

    return vm_mon_cmd($vmid, "netdev_del", id => $deviceid);
}
3776
16521d63
DC
# Replace the USB device $deviceid of a running VM.
#
# $device is the parsed USB option; the function returns immediately when
# it is false. The currently plugged device is unplugged first. For a usb3
# device an xhci controller ("nec-usb-xhci") is added if the device list
# of the VM has none. Finally the new device is plugged.
#
# Returns whatever vm_deviceplug() returns.
sub qemu_usb_hotplug {
    my ($storecfg, $conf, $vmid, $deviceid, $device) = @_;

    return if !$device;

    # the old device has to go before the new one can take its id
    vm_deviceunplug($vmid, $conf, $deviceid);

    # usb3 devices need an xhci controller - add it when it is missing
    if ($device->{usb3} && !vm_devices_list($vmid)->{xhci}) {
        my $pciaddr = print_pci_addr("xhci");
        qemu_deviceadd($vmid, "nec-usb-xhci,id=xhci$pciaddr");
    }

    my $usbdev = parse_usb_device($device->{host});
    $usbdev->{usb3} = $device->{usb3};

    # plug the replacement
    return vm_deviceplug($storecfg, $conf, $vmid, $deviceid, $usbdev);
}
3801
# Change the number of vcpus of a running VM to $vcpus.
#
# The maximum is sockets * cores from $conf; a false $vcpus means "all of
# them". Dies when more vcpus than that maximum are requested.
#
# Unplugging requires the machine feature level 2.7 and removes the
# devices "cpu<N>" one by one, highest number first. Plugging uses cpu
# devices on 2.7+ machines and the "cpu-add" monitor command otherwise.
# On the device based paths the 'vcpus' setting is written to the config
# after every single successful step.
sub qemu_cpu_hotplug {
    my ($vmid, $conf, $vcpus) = @_;

    my $machine_type = PVE::QemuServer::get_current_qemu_machine($vmid);

    # 'smp' is the old style setting (no longer used); 'sockets' wins
    my $sockets = $conf->{sockets} || $conf->{smp} || 1;
    my $cores = $conf->{cores} || 1;
    my $maxcpus = $sockets * $cores;

    $vcpus ||= $maxcpus;

    die "you can't add more vcpus than maxcpus\n"
        if $vcpus > $maxcpus;

    my $currentvcpus = $conf->{vcpus} || $maxcpus;

    # Poll "query-cpus" once per second until the VM reports $expected
    # cpus and return that list. Raises a parameter exception for 'vcpus'
    # once more than $max_retries unsuccessful polls have been made.
    my $wait_for_vcpu_count = sub {
        my ($expected, $max_retries, $errmsg) = @_;

        my $attempts = 0;
        while (1) {
            my $running = vm_mon_cmd($vmid, "query-cpus");
            return $running if scalar(@{$running}) == $expected;
            raise_param_exc({ vcpus => $errmsg }) if $attempts > $max_retries;
            $attempts++;
            sleep 1;
        }
    };

    if ($vcpus < $currentvcpus) {

        die "cpu hot-unplugging requires qemu version 2.7 or higher\n"
            if !qemu_machine_feature_enabled($machine_type, undef, 2, 7);

        for (my $i = $currentvcpus; $i > $vcpus; $i--) {
            qemu_devicedel($vmid, "cpu$i");
            my $running = $wait_for_vcpu_count->($i - 1, 5, "error unplugging cpu$i");

            # update conf after each successful cpu unplug
            $conf->{vcpus} = scalar(@{$running});
            PVE::QemuConfig->write_config($vmid, $conf);
        }

        return;
    }

    my $currentrunningvcpus = vm_mon_cmd($vmid, "query-cpus");
    die "vcpus in running vm does not match its configuration\n"
        if scalar(@{$currentrunningvcpus}) != $currentvcpus;

    if (qemu_machine_feature_enabled($machine_type, undef, 2, 7)) {

        for (my $i = $currentvcpus + 1; $i <= $vcpus; $i++) {
            qemu_deviceadd($vmid, print_cpu_device($conf, $i));
            my $running = $wait_for_vcpu_count->($i, 10, "error hotplugging cpu$i");

            # update conf after each successful cpu hotplug
            $conf->{vcpus} = scalar(@{$running});
            PVE::QemuConfig->write_config($vmid, $conf);
        }
    } else {

        for (my $i = $currentvcpus; $i < $vcpus; $i++) {
            vm_mon_cmd($vmid, "cpu-add", id => int($i));
        }
    }
}
3876
# Apply I/O throttling limits to block device $deviceid of a running VM.
#
# Positional arguments after $deviceid, in this order:
#   bps, bps_rd, bps_wr, iops, iops_rd, iops_wr,
#   bps_max, bps_rd_max, bps_wr_max, iops_max, iops_rd_max, iops_wr_max,
#   bps_max_length, bps_rd_max_length, bps_wr_max_length,
#   iops_max_length, iops_rd_max_length, iops_wr_max_length
#
# Every value is converted with int() and sent under its own name with
# the "block_set_io_throttle" monitor command. Does nothing (empty
# return) when the VM is not running.
sub qemu_block_set_io_throttle {
    my ($vmid, $deviceid, @limits) = @_;

    return if !check_running($vmid);

    # names in the order in which the caller passes the values
    my @limit_names = qw(
        bps bps_rd bps_wr iops iops_rd iops_wr
        bps_max bps_rd_max bps_wr_max iops_max iops_rd_max iops_wr_max
        bps_max_length bps_rd_max_length bps_wr_max_length
        iops_max_length iops_rd_max_length iops_wr_max_length
    );

    my @throttle_args = map {
        ($limit_names[$_] => int($limits[$_]))
    } (0 .. $#limit_names);

    return vm_mon_cmd($vmid, "block_set_io_throttle", device => $deviceid, @throttle_args);
}
3908
f5eb281a 3909# old code, only used to shutdown old VM after update
dab36e1e
DM
# Read from $fh until the collected output ends with the QEMU human
# monitor prompt "(qemu) ", until EOF, or until nothing becomes readable
# within $timeout seconds.
#
# Returns the collected text without the trailing prompt.
# Dies with the system error text when sysread fails and with
# "monitor read timeout\n" when waiting for data times out.
sub __read_avail {
    my ($fh, $timeout) = @_;

    my $sel = IO::Select->new();
    $sel->add($fh);

    my $res = '';
    my $buf;

    my @ready;
    while (scalar(@ready = $sel->can_read($timeout))) {
        my $count = $fh->sysread($buf, 8192);
        die "$!\n" if !defined($count);
        last if !$count; # EOF

        # Look for the prompt in everything collected so far and not only
        # in the current chunk: the prompt can arrive split across two
        # reads, and checking chunks one by one would then miss it and
        # end in a bogus read timeout.
        $res .= $buf;
        if ($res =~ /^(.*)\(qemu\) $/s) {
            $res = $1;
            last;
        }
    }

    die "monitor read timeout\n" if !scalar(@ready);

    return $res;
}
3941
f5eb281a 3942# old code, only used to shutdown old VM after update
dab36e1e
DM
# Run the human monitor command $cmdstr over the "<vmid>.mon" unix socket
# below $var_run_tmpdir and return its output.
#
# The banner is read first and has to look like a QEMU monitor banner.
# The command is then written followed by "\r". For 'q' / 'quit' no
# answer is read. Otherwise the answer is read, its first line is dropped
# (command echo) unless it starts with "unknown command", and the
# remaining lines are returned joined with "\n" plus a final "\n".
#
# Any failure is written to syslog and then re-thrown.
sub vm_monitor_command {
    my ($vmid, $cmdstr, $nocheck) = @_;

    my $res;

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);

        my $sname = "${var_run_tmpdir}/$vmid.mon";

        my $sock = IO::Socket::UNIX->new(Peer => $sname)
            || die "unable to connect to VM $vmid socket - $!\n";

        # hack: migrate sometime blocks the monitor (when migrate_downtime
        # is set), so allow one hour for those commands
        my $is_migrate_cmd = $cmdstr =~ m/^(info\s+migrate|migrate\s)/;
        my $timeout = $is_migrate_cmd ? 60*60 : 3;

        # read banner;
        my $banner = __read_avail($sock, $timeout);
        die "got unexpected qemu monitor banner\n"
            if $banner !~ m/^QEMU\s+(\S+)\s+monitor\s/;

        my $sel = IO::Select->new();
        $sel->add($sock);

        my @writable = $sel->can_write($timeout);
        die "monitor write error - timeout" if !scalar(@writable);

        my $fullcmd = "$cmdstr\r";

        # syslog('info', "VM $vmid monitor command: $cmdstr");

        my $written = $sock->syswrite($fullcmd);
        die "monitor write error - $!"
            if !$written || ($written != length($fullcmd));

        # leaves the eval block only - there is no answer to wait for
        return if ($cmdstr eq 'q') || ($cmdstr eq 'quit');

        if ($is_migrate_cmd) {
            $timeout = 60*60; # 1 hour
        } elsif ($cmdstr =~ m/^(eject|change)/) {
            $timeout = 60; # note: cdrom mount command is slow
        } else {
            $timeout = 20;
        }

        if ($res = __read_avail($sock, $timeout)) {
            my @lines = split("\r?\n", $res);

            shift @lines if $lines[0] !~ m/^unknown command/; # skip echo

            $res = join("\n", @lines) . "\n";
        }
    };

    if (my $err = $@) {
        syslog("err", "VM $vmid monitor command failed - $err");
        die $err;
    }

    return $res;
}
4016
c1175c92
AD
# Resize volume $volid to $size and tell a running VM about it.
#
# The storage layer is asked first; when PVE::Storage::volume_resize()
# returns false, size 0 is used for the monitor command instead of $size.
# The "block_resize" monitor command is only sent if the VM is running;
# otherwise the function returns empty.
sub qemu_block_resize {
    my ($vmid, $deviceid, $storecfg, $volid, $size) = @_;

    my $running = check_running($vmid);

    my $resized = PVE::Storage::volume_resize($storecfg, $volid, $size, $running);
    $size = 0 if !$resized;

    return if !$running;

    return vm_mon_cmd($vmid, "block_resize", device => $deviceid, size => int($size));
}
4029
1ab0057c
AD
# Create snapshot $snap of volume $volid.
#
# If the VM is running and do_snapshots_with_qemu() is true for the
# volume, the "snapshot-drive" monitor command is used; in every other
# case the snapshot is created by PVE::Storage::volume_snapshot().
sub qemu_volume_snapshot {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $running = check_running($vmid);

    return vm_mon_cmd($vmid, "snapshot-drive", device => $deviceid, name => $snap)
        if $running && do_snapshots_with_qemu($storecfg, $volid);

    return PVE::Storage::volume_snapshot($storecfg, $volid, $snap);
}
4041
fc46aff9
AD
# Delete snapshot $snap of volume $volid.
#
# If the VM is running and do_snapshots_with_qemu() is true for the
# volume, the "delete-drive-snapshot" monitor command is used; in every
# other case PVE::Storage::volume_snapshot_delete() does the work and is
# told whether the VM is running.
sub qemu_volume_snapshot_delete {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $running = check_running($vmid);

    return vm_mon_cmd($vmid, "delete-drive-snapshot", device => $deviceid, name => $snap)
        if $running && do_snapshots_with_qemu($storecfg, $volid);

    return PVE::Storage::volume_snapshot_delete($storecfg, $volid, $snap, $running);
}
4053
264e519f
DM
# Set the migration capabilities of VM $vmid.
#
# Every capability reported by "query-migrate-capabilities" is sent back
# with "migrate-set-capabilities": switched on when it has a true entry
# in the table below, switched off otherwise (including capabilities that
# are not listed at all).
sub set_migration_caps {
    my ($vmid) = @_;

    my $enabled_cap = {
        "auto-converge" => 1,
        "xbzrle" => 1,
        "x-rdma-pin-all" => 0,
        "zero-blocks" => 0,
        "compress" => 0
    };

    my $supported_capabilities = vm_mon_cmd_nocheck($vmid, "query-migrate-capabilities");

    my $cap_ref = [
        map {
            my $name = $_->{capability};
            +{
                capability => $name,
                state => $enabled_cap->{$name} ? JSON::true : JSON::false,
            };
        } @$supported_capabilities
    ];

    return vm_mon_cmd_nocheck($vmid, "migrate-set-capabilities", capabilities => $cap_ref);
}
a89fded1 4078
# Options that vmconfig_hotplug_pending() commits straight from the
# pending section to the configuration, without any hotplug action.
my $fast_plug_option = {
    map { $_ => 1 } qw(
        lock
        name
        onboot
        shares
        startup
        description
        protection
    )
};
4088
3a11fadb
DM
4089# hotplug changes in [PENDING]
4090# $selection hash can be used to only apply specified options, for
4091# example: { cores => 1 } (only apply changed 'cores')
4092# $errors ref is used to return error messages
# Try to apply the pending changes of $conf to the running VM.
#
# $selection - optional hash; when given, only options with a true entry
#              are considered for hotplug, e.g. { cores => 1 }
# $errors    - hash ref receiving "hotplug problem - <message>" for every
#              option whose hotplug failed
#
# Options listed in $fast_plug_option are committed first and without
# looking at $selection. Pending deletions are handled next, pending
# changes last. An option that cannot be hot-plugged raises "skip\n"
# internally and is left untouched in the pending section. After every
# successful step the configuration is written and loaded again.
sub vmconfig_hotplug_pending {
    my ($vmid, $conf, $storecfg, $selection, $errors) = @_;

    my $defaults = load_defaults();

    # commit values which do not have any impact on running VM first
    # Note: those options cannot raise errors, so we do not care about
    # $selection and always apply them.

    my $add_error = sub {
        my ($opt, $msg) = @_;
        $errors->{$opt} = "hotplug problem - $msg";
    };

    my @fast_opts = grep { $fast_plug_option->{$_} } keys %{$conf->{pending}}; # add/change
    foreach my $opt (@fast_opts) {
        $conf->{$opt} = delete $conf->{pending}->{$opt};
    }

    if (@fast_opts) {
        PVE::QemuConfig->write_config($vmid, $conf);
        $conf = PVE::QemuConfig->load_config($vmid); # update/reload
    }

    my $hotplug_features = parse_hotplug_features(defined($conf->{hotplug}) ? $conf->{hotplug} : '1');

    my $pending_delete_hash = split_flagged_list($conf->{pending}->{delete});
    while (my ($opt, $force) = each %$pending_delete_hash) {
        next if $selection && !$selection->{$opt};

        eval {
            if ($opt eq 'hotplug') {
                die "skip\n" if ($conf->{hotplug} =~ /memory/);
            } elsif ($opt eq 'tablet') {
                die "skip\n" if !$hotplug_features->{usb};
                if ($defaults->{tablet}) {
                    vm_deviceplug($storecfg, $conf, $vmid, $opt);
                } else {
                    vm_deviceunplug($vmid, $conf, $opt);
                }
            } elsif ($opt =~ m/^usb\d+/) {
                die "skip\n";
                # since we cannot reliably hot unplug usb devices
                # we are disabling it (the code below is never reached)
                die "skip\n" if !$hotplug_features->{usb} || $conf->{$opt} =~ m/spice/i;
                vm_deviceunplug($vmid, $conf, $opt);
            } elsif ($opt eq 'vcpus') {
                die "skip\n" if !$hotplug_features->{cpu};
                qemu_cpu_hotplug($vmid, $conf, undef);
            } elsif ($opt eq 'balloon') {
                # enable balloon device is not hotpluggable
                die "skip\n" if !defined($conf->{balloon}) || $conf->{balloon};
            } elsif ($fast_plug_option->{$opt}) {
                # do nothing
            } elsif ($opt =~ m/^net(\d+)$/) {
                die "skip\n" if !$hotplug_features->{network};
                vm_deviceunplug($vmid, $conf, $opt);
            } elsif (is_valid_drivename($opt)) {
                die "skip\n" if !$hotplug_features->{disk} || $opt =~ m/(ide|sata)(\d+)/;
                vm_deviceunplug($vmid, $conf, $opt);
                vmconfig_delete_or_detach_drive($vmid, $storecfg, $conf, $opt, $force);
            } elsif ($opt =~ m/^memory$/) {
                die "skip\n" if !$hotplug_features->{memory};
                PVE::QemuServer::Memory::qemu_memory_hotplug($vmid, $conf, $defaults, $opt);
            } elsif ($opt eq 'cpuunits') {
                cgroups_write("cpu", $vmid, "cpu.shares", $defaults->{cpuunits});
            } elsif ($opt eq 'cpulimit') {
                cgroups_write("cpu", $vmid, "cpu.cfs_quota_us", -1);
            } else {
                die "skip\n";
            }
        };
        if (my $err = $@) {
            $add_error->($opt, $err) if $err ne "skip\n";
        } else {
            # save new config if hotplug was successful
            delete $conf->{$opt};
            vmconfig_undelete_pending_option($conf, $opt);
            PVE::QemuConfig->write_config($vmid, $conf);
            $conf = PVE::QemuConfig->load_config($vmid); # update/reload
        }
    }

    foreach my $opt (keys %{$conf->{pending}}) {
        next if $selection && !$selection->{$opt};

        my $value = $conf->{pending}->{$opt};

        eval {
            if ($opt eq 'hotplug') {
                die "skip\n" if ($value =~ /memory/) || ($value !~ /memory/ && $conf->{hotplug} =~ /memory/);
            } elsif ($opt eq 'tablet') {
                die "skip\n" if !$hotplug_features->{usb};
                if ($value == 1) {
                    vm_deviceplug($storecfg, $conf, $vmid, $opt);
                } elsif ($value == 0) {
                    vm_deviceunplug($vmid, $conf, $opt);
                }
            } elsif ($opt =~ m/^usb\d+$/) {
                die "skip\n";
                # since we cannot reliably hot unplug usb devices
                # we are disabling it (the code below is never reached)
                die "skip\n" if !$hotplug_features->{usb} || $value =~ m/spice/i;
                my $d = eval { PVE::JSONSchema::parse_property_string($usbdesc->{format}, $value) };
                die "skip\n" if !$d;
                qemu_usb_hotplug($storecfg, $conf, $vmid, $opt, $d);
            } elsif ($opt eq 'vcpus') {
                die "skip\n" if !$hotplug_features->{cpu};
                qemu_cpu_hotplug($vmid, $conf, $value);
            } elsif ($opt eq 'balloon') {
                # enable/disable ballooning device is not hotpluggable
                my $old_balloon_enabled = !!(!defined($conf->{balloon}) || $conf->{balloon});
                my $new_balloon_enabled = !!(!defined($conf->{pending}->{balloon}) || $conf->{pending}->{balloon});
                die "skip\n" if $old_balloon_enabled != $new_balloon_enabled;

                # allow manual ballooning if shares is set to zero
                if ((defined($conf->{shares}) && ($conf->{shares} == 0))) {
                    my $balloon = $conf->{pending}->{balloon} || $conf->{memory} || $defaults->{memory};
                    vm_mon_cmd($vmid, "balloon", value => $balloon*1024*1024);
                }
            } elsif ($opt =~ m/^net(\d+)$/) {
                # some changes can be done without hotplug
                vmconfig_update_net($storecfg, $conf, $hotplug_features->{network},
                    $vmid, $opt, $value);
            } elsif (is_valid_drivename($opt)) {
                # some changes can be done without hotplug
                vmconfig_update_disk($storecfg, $conf, $hotplug_features->{disk},
                    $vmid, $opt, $value, 1);
            } elsif ($opt =~ m/^memory$/) { #dimms
                die "skip\n" if !$hotplug_features->{memory};
                $value = PVE::QemuServer::Memory::qemu_memory_hotplug($vmid, $conf, $defaults, $opt, $value);
            } elsif ($opt eq 'cpuunits') {
                cgroups_write("cpu", $vmid, "cpu.shares", $conf->{pending}->{$opt});
            } elsif ($opt eq 'cpulimit') {
                my $cpulimit = $conf->{pending}->{$opt} == 0 ? -1 : int($conf->{pending}->{$opt} * 100000);
                cgroups_write("cpu", $vmid, "cpu.cfs_quota_us", $cpulimit);
            } else {
                die "skip\n"; # skip non-hot-pluggable options
            }
        };
        if (my $err = $@) {
            $add_error->($opt, $err) if $err ne "skip\n";
        } else {
            # save new config if hotplug was successful
            $conf->{$opt} = $value;
            delete $conf->{pending}->{$opt};
            PVE::QemuConfig->write_config($vmid, $conf);
            $conf = PVE::QemuConfig->load_config($vmid); # update/reload
        }
    }
}
055d554d 4245
3dc38fbb
WB
# Free the volume behind $drive if that is allowed.
#
# Only acts when $force is set or $key starts with "unused", and the
# drive is not a cdrom. If the VM owns the volume, the caller needs
# 'Datastore.AllocateSpace' on the storage and the volume must not be in
# use any more (dies otherwise); it is then freed.
#
# Returns 1 when the volume was freed or is not owned by this VM (so the
# entry can simply be dropped from the config), undef when the drive was
# not eligible.
sub try_deallocate_drive {
    my ($storecfg, $vmid, $conf, $key, $drive, $rpcenv, $authuser, $force) = @_;

    return undef if !($force || $key =~ /^unused/);
    return undef if drive_is_cdrom($drive, 1);

    my $volid = $drive->{file};

    # If vm is not owner of this disk remove from config
    return 1 if !vm_is_volid_owner($storecfg, $vmid, $volid);

    my $sid = PVE::Storage::parse_volume_id($volid);
    $rpcenv->check($authuser, "/storage/$sid", ['Datastore.AllocateSpace']);

    # check if the disk is really unused
    if (is_volume_in_use($storecfg, $conf, $key, $volid)) {
        die "unable to delete '$volid' - volume is still in use (snapshot?)\n";
    }

    PVE::Storage::vdisk_free($storecfg, $volid);

    return 1;
}
4268
# Handle the removal of drive option $opt from the configuration.
#
# With $force the current user needs 'VM.Config.Disk' on the VM and the
# volume is handed to try_deallocate_drive(). Without $force the volume
# is registered as unused drive instead.
sub vmconfig_delete_or_detach_drive {
    my ($vmid, $storecfg, $conf, $opt, $force) = @_;

    my $drive = parse_drive($opt, $conf->{$opt});

    my $rpcenv = PVE::RPCEnvironment::get();
    my $authuser = $rpcenv->get_user();

    return vmconfig_register_unused_drive($storecfg, $vmid, $conf, $drive)
        if !$force;

    $rpcenv->check_vm_perm($authuser, $vmid, undef, ['VM.Config.Disk']);

    return try_deallocate_drive($storecfg, $vmid, $conf, $opt, $drive, $rpcenv, $authuser, $force);
}
4284
# Apply all pending changes to the configuration of a VM (cold plug).
#
# Pending deletions are processed first: drives go through
# vmconfig_delete_or_detach_drive(), every option is removed from the
# pending delete list and from the configuration. Pending values are then
# copied into the configuration; a drive that gets replaced is registered
# as unused. The configuration is reloaded before and written after each
# single option.
sub vmconfig_apply_pending {
    my ($vmid, $conf, $storecfg) = @_;

    # cold plug

    my $pending_delete_hash = split_flagged_list($conf->{pending}->{delete});
    while (my ($opt, $force) = each %$pending_delete_hash) {
        die "internal error" if $opt =~ m/^unused/;
        $conf = PVE::QemuConfig->load_config($vmid); # update/reload

        if (defined($conf->{$opt})) {
            vmconfig_delete_or_detach_drive($vmid, $storecfg, $conf, $opt, $force)
                if is_valid_drivename($opt);
            vmconfig_undelete_pending_option($conf, $opt);
            delete $conf->{$opt};
        } else {
            # nothing to remove, just forget about the pending deletion
            vmconfig_undelete_pending_option($conf, $opt);
        }

        PVE::QemuConfig->write_config($vmid, $conf);
    }

    $conf = PVE::QemuConfig->load_config($vmid); # update/reload

    foreach my $opt (keys %{$conf->{pending}}) { # add/change
        $conf = PVE::QemuConfig->load_config($vmid); # update/reload

        my $unchanged = defined($conf->{$opt}) && ($conf->{$opt} eq $conf->{pending}->{$opt});

        if (!$unchanged) {
            # keep the replaced volume around as unused drive
            if (is_valid_drivename($opt) && defined($conf->{$opt})) {
                vmconfig_register_unused_drive($storecfg, $vmid, $conf, parse_drive($opt, $conf->{$opt}));
            }
            $conf->{$opt} = $conf->{pending}->{$opt};
        }

        delete $conf->{pending}->{$opt};
        PVE::QemuConfig->write_config($vmid, $conf);
    }
}
4328
3eec5767
DM
# Numeric "not equal" that accepts undefined values: two undefined values
# count as equal (returns 0), exactly one undefined value counts as
# different (returns 1), two defined values are compared with '!='.
my $safe_num_ne = sub {
    my ($lhs, $rhs) = @_;

    if (defined($lhs) && defined($rhs)) {
        return $lhs != $rhs;
    }

    return (defined($lhs) || defined($rhs)) ? 1 : 0;
};
4338
# String "not equal" that accepts undefined values: two undefined values
# count as equal (returns 0), exactly one undefined value counts as
# different (returns 1), two defined values are compared with 'ne'.
my $safe_string_ne = sub {
    my ($lhs, $rhs) = @_;

    if (defined($lhs) && defined($rhs)) {
        return $lhs ne $rhs;
    }

    return (defined($lhs) || defined($rhs)) ? 1 : 0;
};
4348
# Apply the new value $value of network option $opt to a running VM.
#
# If the option exists already and only bridge, tag, trunks, firewall,
# rate or link state differ, the change is applied to the existing tap
# device / link and 1 is returned. A change of model, macaddr or queues,
# or a missing bridge on either side, requires the old device to be
# unplugged first. The new device is then hot-plugged.
#
# Dies with "skip\n" when an unplug or plug is required but $hotplug is
# false.
sub vmconfig_update_net {
    my ($storecfg, $conf, $hotplug, $vmid, $opt, $value) = @_;

    my $newnet = parse_net($value);

    if ($conf->{$opt}) {
        my $oldnet = parse_net($conf->{$opt});

        my $str_changed = sub {
            my ($key) = @_;
            return $safe_string_ne->($oldnet->{$key}, $newnet->{$key});
        };
        my $num_changed = sub {
            my ($key) = @_;
            return $safe_num_ne->($oldnet->{$key}, $newnet->{$key});
        };

        my $needs_replug = $str_changed->('model')
            || $str_changed->('macaddr')
            || $num_changed->('queues')
            || !($newnet->{bridge} && $oldnet->{bridge}); # bridge/nat mode change

        if ($needs_replug) {
            # for non online change, we try to hot-unplug
            die "skip\n" if !$hotplug;
            vm_deviceunplug($vmid, $conf, $opt);
        } else {
            my ($netid) = $opt =~ m/net(\d+)/;
            die "internal error" if !defined($netid);
            my $iface = "tap${vmid}i$netid";

            if ($str_changed->('bridge')
                || $num_changed->('tag')
                || $str_changed->('trunks')
                || $num_changed->('firewall')) {
                PVE::Network::tap_unplug($iface);
                PVE::Network::tap_plug($iface, $newnet->{bridge}, $newnet->{tag}, $newnet->{firewall}, $newnet->{trunks}, $newnet->{rate});
            } elsif ($num_changed->('rate')) {
                # Rate can be applied on its own but any change above needs to
                # include the rate in tap_plug since OVS resets everything.
                PVE::Network::tap_rate_limit($iface, $newnet->{rate});
            }

            qemu_set_link_status($vmid, $opt, !$newnet->{link_down})
                if $str_changed->('link_down');

            return 1;
        }
    }

    die "skip\n" if !$hotplug;

    return vm_deviceplug($storecfg, $conf, $vmid, $opt, $newnet);
}
4396
# Apply the new value $value of drive option $opt to a running VM.
#
# For an existing drive the media type must stay the same (dies
# otherwise). A cdrom is ejected and, unless the new file is 'none', the
# new image is loaded. A disk that keeps its file only gets its I/O
# throttling updated; changes to discard, iothread, queues or cache
# cannot be applied online ("skip\n"). Both cases return 1. A disk with a
# different file is unplugged and registered as unused before the new
# drive is hot-plugged.
#
# Dies with "skip\n" when a hotplug would be needed but $hotplug is
# false, and for new ide/sata drives.
sub vmconfig_update_disk {
    my ($storecfg, $conf, $hotplug, $vmid, $opt, $value, $force) = @_;

    # fixme: do we need force?

    my $drive = parse_drive($opt, $value);

    my $old_drive;
    $old_drive = parse_drive($opt, $conf->{$opt}) if $conf->{$opt};

    if ($old_drive) {
        my $media = $drive->{media} || 'disk';
        my $oldmedia = $old_drive->{media} || 'disk';
        die "unable to change media type\n" if $media ne $oldmedia;

        if (drive_is_cdrom($old_drive)) {
            my $qdev = "drive-$opt";

            if ($drive->{file} eq 'none') {
                vm_mon_cmd($vmid, "eject", force => JSON::true, device => $qdev);
            } else {
                my $path = get_iso_path($storecfg, $vmid, $drive->{file});
                vm_mon_cmd($vmid, "eject", force => JSON::true, device => $qdev); # force eject if locked
                vm_mon_cmd($vmid, "change", device => $qdev, target => "$path") if $path;
            }

            return 1;
        }

        if ($drive->{file} eq $old_drive->{file}) {
            # update existing disk

            # skip non hotpluggable value
            foreach my $key (qw(discard iothread queues cache)) {
                die "skip\n" if $safe_string_ne->($drive->{$key}, $old_drive->{$key});
            }

            # apply throttle
            my @throttle_keys = qw(
                mbps mbps_rd mbps_wr
                iops iops_rd iops_wr
                mbps_max mbps_rd_max mbps_wr_max
                iops_max iops_rd_max iops_wr_max
                bps_max_length bps_rd_max_length bps_wr_max_length
                iops_max_length iops_rd_max_length iops_wr_max_length
            );

            my $throttle_changed = 0;
            foreach my $key (@throttle_keys) {
                next if !$safe_num_ne->($drive->{$key}, $old_drive->{$key});
                $throttle_changed = 1;
                last;
            }

            if ($throttle_changed) {
                # mbps values are converted to bytes per second, unset
                # limits become 0 and unset burst lengths become 1
                qemu_block_set_io_throttle(
                    $vmid, "drive-$opt",
                    (map { ($drive->{$_} || 0)*1024*1024 } qw(mbps mbps_rd mbps_wr)),
                    (map { $drive->{$_} || 0 } qw(iops iops_rd iops_wr)),
                    (map { ($drive->{$_} || 0)*1024*1024 } qw(mbps_max mbps_rd_max mbps_wr_max)),
                    (map { $drive->{$_} || 0 } qw(iops_max iops_rd_max iops_wr_max)),
                    (map { $drive->{$_} || 1 } qw(
                        bps_max_length bps_rd_max_length bps_wr_max_length
                        iops_max_length iops_rd_max_length iops_wr_max_length
                    )),
                );
            }

            return 1;
        }

        die "skip\n" if !$hotplug;

        # unplug and register as unused
        vm_deviceunplug($vmid, $conf, $opt);
        vmconfig_register_unused_drive($storecfg, $vmid, $conf, $old_drive);
    }

    die "skip\n" if !$hotplug || $opt =~ m/(ide|sata)(\d+)/;

    # hotplug new disks
    PVE::Storage::activate_volumes($storecfg, [$drive->{file}]) if $drive->{file} !~ m|^/dev/.+|;

    return vm_deviceplug($storecfg, $conf, $vmid, $opt, $drive);
}
4498
1e3baf05 4499sub vm_start {
ba9e1000 4500 my ($storecfg, $vmid, $statefile, $skiplock, $migratedfrom, $paused,
2189246c 4501 $forcemachine, $spice_ticket, $migration_network, $migration_type, $targetstorage) = @_;
1e3baf05 4502
ffda963f
FG
4503 PVE::QemuConfig->lock_config($vmid, sub {
4504 my $conf = PVE::QemuConfig->load_config($vmid, $migratedfrom);
1e3baf05 4505
ffda963f 4506 die "you can't start a vm if it's a template\n" if PVE::QemuConfig->is_template($conf);
3dcb98d5 4507
ffda963f 4508 PVE::QemuConfig->check_lock($conf) if !$skiplock;
1e3baf05 4509
7e8dcf2c 4510 die "VM $vmid already running\n" if check_running($vmid, undef, $migratedfrom);
1e3baf05 4511
055d554d 4512 if (!$statefile && scalar(keys %{$conf->{pending}})) {
3a11fadb 4513 vmconfig_apply_pending($vmid, $conf, $storecfg);
ffda963f 4514 $conf = PVE::QemuConfig->load_config($vmid); # update/reload
055d554d
DM
4515 }
4516
6c47d546
DM
4517 my $defaults = load_defaults();
4518
4519 # set environment variable useful inside network script
4520 $ENV{PVE_MIGRATED_FROM} = $migratedfrom if $migratedfrom;
4521
2189246c
AD
4522 my $local_volumes = {};
4523
3b4cf0f0 4524 if ($targetstorage) {
2189246c
AD
4525 foreach_drive($conf, sub {
4526 my ($ds, $drive) = @_;
4527
4528 return if drive_is_cdrom($drive);
4529
4530 my $volid = $drive->{file};
4531
4532 return if !$volid;
4533
4534 my ($storeid, $volname) = PVE::Storage::parse_volume_id($volid);
4535
4536 my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
4537 return if $scfg->{shared};
4538 $local_volumes->{$ds} = [$volid, $storeid, $volname];
4539 });
4540
4541 my $format = undef;
4542
4543 foreach my $opt (sort keys %$local_volumes) {
4544
4545 my ($volid, $storeid, $volname) = @{$local_volumes->{$opt}};
4546 my $drive = parse_drive($opt, $conf->{$opt});
4547
4548 #if remote storage is specified, use default format
4549 if ($targetstorage && $targetstorage ne "1") {
4550 $storeid = $targetstorage;
4551 my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($storecfg, $storeid);
4552 $format = $defFormat;
4553 } else {
4554 #else we use same format than original
4555 my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
4556 $format = qemu_img_format($scfg, $volid);
4557 }
4558
4559 my $newvolid = PVE::Storage::vdisk_alloc($storecfg, $storeid, $vmid, $format, undef, ($drive->{size}/1024));
4560 my $newdrive = $drive;
4561 $newdrive->{format} = $format;
4562 $newdrive->{file} = $newvolid;
4563 my $drivestr = PVE::QemuServer::print_drive($vmid, $newdrive);
4564 $local_volumes->{$opt} = $drivestr;
4565 #pass drive to conf for command line
4566 $conf->{$opt} = $drivestr;
4567 }
4568 }
4569
67812f9c 4570 my ($cmd, $vollist, $spice_port) = config_to_command($storecfg, $vmid, $conf, $defaults, $forcemachine);
6c47d546 4571
1e3baf05 4572 my $migrate_port = 0;
5bc1e039 4573 my $migrate_uri;
1e3baf05
DM
4574 if ($statefile) {
4575 if ($statefile eq 'tcp') {
5bc1e039
SP
4576 my $localip = "localhost";
4577 my $datacenterconf = PVE::Cluster::cfs_read_file('datacenter.cfg');
af0eba7e 4578 my $nodename = PVE::INotify::nodename();
2de2d6f7 4579
b7a5a225
TL
4580 if (!defined($migration_type)) {
4581 if (defined($datacenterconf->{migration}->{type})) {
4582 $migration_type = $datacenterconf->{migration}->{type};
4583 } else {
4584 $migration_type = 'secure';
4585 }
4586 }
4587
2de2d6f7
TL
4588 if ($migration_type eq 'insecure') {
4589 my $migrate_network_addr = PVE::Cluster::get_local_migration_ip($migration_network);
4590 if ($migrate_network_addr) {
4591 $localip = $migrate_network_addr;
4592 } else {
5bc1e039 4593 $localip = PVE::Cluster::remote_node_ip($nodename, 1);
2de2d6f7
TL
4594 }
4595
4596 $localip = "[$localip]" if Net::IP::ip_is_ipv6($localip);
5bc1e039 4597 }
2de2d6f7 4598
af0eba7e
WB
4599 my $pfamily = PVE::Tools::get_host_address_family($nodename);
4600 $migrate_port = PVE::Tools::next_migrate_port($pfamily);
407e0b8b 4601 $migrate_uri = "tcp:${localip}:${migrate_port}";
6c47d546
DM
4602 push @$cmd, '-incoming', $migrate_uri;
4603 push @$cmd, '-S';
1c9d54bf
TL
4604
4605 } elsif ($statefile eq 'unix') {
4606 # should be default for secure migrations as a ssh TCP forward
4607 # tunnel is not deterministic reliable ready and fails regurarly
4608 # to set up in time, so use UNIX socket forwards
54323eed
TL
4609 my $socket_addr = "/run/qemu-server/$vmid.migrate";
4610 unlink $socket_addr;
4611
4612 $migrate_uri = "unix:$socket_addr";
1c9d54bf
TL
4613
4614 push @$cmd, '-incoming', $migrate_uri;
4615 push @$cmd, '-S';
4616
1e3baf05 4617 } else {
6c47d546 4618 push @$cmd, '-loadstate', $statefile;
1e3baf05 4619 }
91bd6c90
DM
4620 } elsif ($paused) {
4621 push @$cmd, '-S';
1e3baf05
DM
4622 }
4623
1e3baf05 4624 # host pci devices
040b06b7
DA
4625 for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
4626 my $d = parse_hostpci($conf->{"hostpci$i"});
4627 next if !$d;
b1f72af6
AD
4628 my $pcidevices = $d->{pciid};
4629 foreach my $pcidevice (@$pcidevices) {
4630 my $pciid = $pcidevice->{id}.".".$pcidevice->{function};
000fc0a2 4631
b1f72af6
AD
4632 my $info = pci_device_info("0000:$pciid");
4633 die "IOMMU not present\n" if !check_iommu_support();
4634 die "no pci device info for device '$pciid'\n" if !$info;
6ea8cd3b 4635 die "can't unbind/bind pci group to vfio '$pciid'\n" if !pci_dev_group_bind_to_vfio($pciid);
8f3e88af 4636 die "can't reset pci device '$pciid'\n" if $info->{has_fl_reset} and !pci_dev_reset($info);
b1f72af6 4637 }
040b06b7 4638 }
1e3baf05
DM
4639
4640 PVE::Storage::activate_volumes($storecfg, $vollist);
4641
2b401189
AD
4642 if (!check_running($vmid, 1) && -d "/sys/fs/cgroup/systemd/qemu.slice/$vmid.scope") {
4643 my $cmd = [];
4644 push @$cmd, '/bin/systemctl', 'stop', "$vmid.scope";
4645 eval { run_command($cmd); };
4646 }
4647
8e59d952
WB
4648 my $cpuunits = defined($conf->{cpuunits}) ? $conf->{cpuunits}
4649 : $defaults->{cpuunits};
4650
7023f3ea
AD
4651 my %run_params = (timeout => $statefile ? undef : 30, umask => 0077);
4652
4653 my %properties = (
4654 Slice => 'qemu.slice',
4655 KillMode => 'none',
4656 CPUShares => $cpuunits
4657 );
4658
4659 if (my $cpulimit = $conf->{cpulimit}) {
4660 $properties{CPUQuota} = int($cpulimit * 100);
4661 }
4662 $properties{timeout} = 10 if $statefile; # setting up the scope shoul be quick
4663
4664 if ($conf->{hugepages}) {
4665
4666 my $code = sub {
4667 my $hugepages_topology = PVE::QemuServer::Memory::hugepages_topology($conf);
4668 my $hugepages_host_topology = PVE::QemuServer::Memory::hugepages_host_topology();
4669
4670 PVE::QemuServer::Memory::hugepages_mount();
4671 PVE::QemuServer::Memory::hugepages_allocate($hugepages_topology, $hugepages_host_topology);
4672
4673 eval {
4674 PVE::Tools::enter_systemd_scope($vmid, "Proxmox VE VM $vmid", %properties);
4675 run_command($cmd, %run_params);
4676 };
4677
4678 if (my $err = $@) {
4679 PVE::QemuServer::Memory::hugepages_reset($hugepages_host_topology);
4680 die $err;
4681 }
4682
4683 PVE::QemuServer::Memory::hugepages_pre_deallocate($hugepages_topology);
4684 };
4685 eval { PVE::QemuServer::Memory::hugepages_update_locked($code); };
4686
4687 } else {
4688 eval {
4689 PVE::Tools::enter_systemd_scope($vmid, "Proxmox VE VM $vmid", %properties);
4690 run_command($cmd, %run_params);
4691 };
4692 }
77cde36b
DC
4693
4694 if (my $err = $@) {
4695 # deactivate volumes if start fails
4696 eval { PVE::Storage::deactivate_volumes($storecfg, $vollist); };
4697 die "start failed: $err";
4698 }
1e3baf05 4699
5bc1e039 4700 print "migration listens on $migrate_uri\n" if $migrate_uri;
afdb31d5 4701
b37ecfe6 4702 if ($statefile && $statefile ne 'tcp' && $statefile ne 'unix') {
95381ce0 4703 eval { vm_mon_cmd_nocheck($vmid, "cont"); };
8c609afd 4704 warn $@ if $@;
62de2cbd
DM
4705 }
4706
2189246c
AD
4707 #start nbd server for storage migration
4708 if ($targetstorage) {
2189246c
AD
4709 my $nodename = PVE::INotify::nodename();
4710 my $migrate_network_addr = PVE::Cluster::get_local_migration_ip($migration_network);
4711 my $localip = $migrate_network_addr ? $migrate_network_addr : PVE::Cluster::remote_node_ip($nodename, 1);
4712 my $pfamily = PVE::Tools::get_host_address_family($nodename);
4713 $migrate_port = PVE::Tools::next_migrate_port($pfamily);
4714
4715 vm_mon_cmd_nocheck($vmid, "nbd-server-start", addr => { type => 'inet', data => { host => "${localip}", port => "${migrate_port}" } } );
4716
4717 $localip = "[$localip]" if Net::IP::ip_is_ipv6($localip);
4718
4719 foreach my $opt (sort keys %$local_volumes) {
4720 my $volid = $local_volumes->{$opt};
4721 vm_mon_cmd_nocheck($vmid, "nbd-server-add", device => "drive-$opt", writable => JSON::true );
4722 my $migrate_storage_uri = "nbd:${localip}:${migrate_port}:exportname=drive-$opt";
4723 print "storage migration listens on $migrate_storage_uri volume:$volid\n";
4724 }
4725 }
4726
1d794448 4727 if ($migratedfrom) {
a89fded1 4728 eval {
8e90138a 4729 set_migration_caps($vmid);
a89fded1 4730 };
1d794448 4731 warn $@ if $@;
a89fded1 4732
1d794448
DM
4733 if ($spice_port) {
4734 print "spice listens on port $spice_port\n";
4735 if ($spice_ticket) {
8e90138a
DM
4736 vm_mon_cmd_nocheck($vmid, "set_password", protocol => 'spice', password => $spice_ticket);
4737 vm_mon_cmd_nocheck($vmid, "expire_password", protocol => 'spice', time => "+30");
95a4b4a9
AD
4738 }
4739 }
4740
1d794448 4741 } else {
15b1fc93 4742 if (!$statefile && (!defined($conf->{balloon}) || $conf->{balloon})) {
be190583 4743 vm_mon_cmd_nocheck($vmid, "balloon", value => $conf->{balloon}*1024*1024)
4ec05c4c 4744 if $conf->{balloon};
4ec05c4c 4745 }
25088687
DM
4746
4747 foreach my $opt (keys %$conf) {
4748 next if $opt !~ m/^net\d+$/;
4749 my $nicconf = parse_net($conf->{$opt});
4750 qemu_set_link_status($vmid, $opt, 0) if $nicconf->{link_down};
4751 }
e18b0b99 4752 }
a1b7d579 4753
eb065317
AD
4754 vm_mon_cmd_nocheck($vmid, 'qom-set',
4755 path => "machine/peripheral/balloon0",
4756 property => "guest-stats-polling-interval",
4757 value => 2) if (!defined($conf->{balloon}) || $conf->{balloon});
4758
1e3baf05
DM
4759 });
4760}
4761
0eedc444
AD
# Send the QMP command $execute with the arguments %params to VM $vmid.
# Thin wrapper around vm_qmp_command() which leaves its $nocheck
# parameter unset.
sub vm_mon_cmd {
    my ($vmid, $execute, %params) = @_;

    return vm_qmp_command($vmid, {
        execute => $execute,
        arguments => \%params,
    });
}
4768
# Same as vm_mon_cmd(), but passes a true $nocheck value to
# vm_qmp_command().
sub vm_mon_cmd_nocheck {
    my ($vmid, $execute, %params) = @_;

    return vm_qmp_command($vmid, {
        execute => $execute,
        arguments => \%params,
    }, 1);
}
4775
# Execute a QMP command on a running VM.
#
# $vmid    - ID of the VM
# $cmd     - hash reference with the key 'execute' and an optional
#            'arguments' hash. A true 'timeout' entry inside 'arguments' is
#            removed from the hash and handed to the QMP client instead.
# $nocheck - passed through to check_running() and vm_monitor_command()
#
# Returns the result of PVE::QMPClient::cmd() when the QMP socket exists.
# Errors are written to syslog and re-thrown.
sub vm_qmp_command {
    my ($vmid, $cmd, $nocheck) = @_;

    my $res;

    my $timeout;
    if ($cmd->{arguments} && $cmd->{arguments}->{timeout}) {
        $timeout = delete $cmd->{arguments}->{timeout};
    }

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);
        my $sname = qmp_socket($vmid);
        if (-e $sname) { # test if VM is reasonably new and supports qmp/qga
            my $qmpclient = PVE::QMPClient->new();

            $res = $qmpclient->cmd($vmid, $cmd, $timeout);
        } elsif (-e "${var_run_tmpdir}/$vmid.mon") {
            # 'arguments' is optional (e.g. { execute => "quit" }), so only
            # dereference it when it is set - otherwise we would die with
            # an unrelated "undefined value as a HASH reference" error
            die "can't execute complex command on old monitor - stop/start your vm to fix the problem\n"
                if $cmd->{arguments} && scalar(%{$cmd->{arguments}});
            vm_monitor_command($vmid, $cmd->{execute}, $nocheck);
        } else {
            die "unable to open monitor socket\n";
        }
    };
    if (my $err = $@) {
        syslog("err", "VM $vmid qmp command failed - $err");
        die $err;
    }

    return $res;
}
4809
9df5cbcc
DM
# Run the human monitor (HMP) command line $cmdline on VM $vmid by wrapping
# it into the QMP command 'human-monitor-command'.
# Returns whatever vm_qmp_command() returns.
sub vm_human_monitor_command {
    my ($vmid, $cmdline) = @_;

    my $cmd = {
        execute => 'human-monitor-command',
        arguments => { 'command-line' => $cmdline},
    };

    return vm_qmp_command($vmid, $cmd);
}
4822
1e3baf05
DM
# Build the command for VM $vmid from its configuration and the defaults
# and return it as a single string (via PVE::Tools::cmd2string).
sub vm_commandline {
    my ($storecfg, $vmid) = @_;

    # Note: config_to_command() is called in scalar context on purpose
    my $cmd = config_to_command(
        $storecfg,
        $vmid,
        scalar(PVE::QemuConfig->load_config($vmid)),
        scalar(load_defaults()),
    );

    return PVE::Tools::cmd2string($cmd);
}
4834
# Send 'system_reset' to VM $vmid while holding the config lock.
# The lock check on the configuration is skipped when $skiplock is set.
sub vm_reset {
    my ($vmid, $skiplock) = @_;

    my $reset_locked = sub {
        my $conf = PVE::QemuConfig->load_config($vmid);

        PVE::QemuConfig->check_lock($conf) unless $skiplock;

        vm_mon_cmd($vmid, "system_reset");
    };

    PVE::QemuConfig->lock_config($vmid, $reset_locked);
}
4847
# Return an array reference with all volume IDs referenced by $conf (as
# visited by foreach_volid) which PVE::Storage::parse_volume_id() accepts.
# Entries starting with '/' (absolute paths) are left out.
sub get_vm_volumes {
    my ($conf) = @_;

    my @volids;

    foreach_volid($conf, sub {
        my ($volid) = @_;

        return if $volid =~ m|^/|;

        my ($sid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        push @volids, $volid;
    });

    return \@volids;
}
4865
# Clean up after a VM was stopped:
#  - deactivate the volumes of $conf, unless $keepActive is set
#  - remove the mon/qmp/pid/vnc/qga files below /var/run/qemu-server
#  - apply pending configuration changes if $apply_pending_changes is set
# Errors never propagate to the caller, they are only printed as warnings.
sub vm_stop_cleanup {
    my ($storecfg, $vmid, $conf, $keepActive, $apply_pending_changes) = @_;

    eval {
        unless ($keepActive) {
            my $volumes = get_vm_volumes($conf);
            PVE::Storage::deactivate_volumes($storecfg, $volumes);
        }

        for my $suffix (qw(mon qmp pid vnc qga)) {
            unlink("/var/run/qemu-server/${vmid}.$suffix");
        }

        if ($apply_pending_changes) {
            vmconfig_apply_pending($vmid, $conf, $storecfg);
        }
    };
    warn $@ if $@; # avoid errors - just warn
}
4884
# Note: use $nocheck to skip tests if VM configuration file exists.
# We need that when migrating VMs to other nodes (files already moved)
# Note: we set $keepActive in vzdump stop mode - volumes need to stay active
# Stop (or shut down) VM $vmid.
#
# Parameters:
#   $storecfg     - storage configuration, passed on to vm_stop_cleanup()
#   $skiplock     - do not call check_lock() on the configuration
#   $nocheck      - passed to check_running()/vm_qmp_command(); when set the
#                   configuration is not loaded at all (so no cleanup runs)
#   $timeout      - seconds to wait for the VM to stop; when undefined the
#                   'down' value of the 'startup' option is used for a
#                   shutdown, else 60
#   $shutdown     - ask the guest to shut down ('guest-shutdown' if the
#                   'agent' option is set, else 'system_powerdown') instead
#                   of sending 'quit'
#   $force        - send SIGTERM if the command fails or times out; defaults
#                   to 1 when this is not a shutdown
#   $keepActive   - passed to vm_stop_cleanup()
#   $migratedfrom - if set: send SIGTERM to the process, run the cleanup
#                   with the config loaded via load_config($vmid,
#                   $migratedfrom) and return without taking the config lock
#
# Dies if the VM does not stop and $force is not set.
sub vm_stop {
    my ($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive, $migratedfrom) = @_;

    $force = 1 if !defined($force) && !$shutdown;

    if ($migratedfrom){
        my $pid = check_running($vmid, $nocheck, $migratedfrom);
        kill 15, $pid if $pid;
        my $conf = PVE::QemuConfig->load_config($vmid, $migratedfrom);
        # last argument 0: do not apply pending changes here
        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive, 0);
        return;
    }

    PVE::QemuConfig->lock_config($vmid, sub {

        # nothing to do if the VM is not running
        my $pid = check_running($vmid, $nocheck);
        return if !$pid;

        my $conf;
        if (!$nocheck) {
            $conf = PVE::QemuConfig->load_config($vmid);
            PVE::QemuConfig->check_lock($conf) if !$skiplock;
            if (!defined($timeout) && $shutdown && $conf->{startup}) {
                my $opts = PVE::JSONSchema::pve_parse_startup_order($conf->{startup});
                $timeout = $opts->{down} if $opts->{down};
            }
        }

        $timeout = 60 if !defined($timeout);

        # step 1: ask qemu (or the guest) to stop
        eval {
            if ($shutdown) {
                if (defined($conf) && $conf->{agent}) {
                    vm_qmp_command($vmid, { execute => "guest-shutdown" }, $nocheck);
                } else {
                    vm_qmp_command($vmid, { execute => "system_powerdown" }, $nocheck);
                }
            } else {
                vm_qmp_command($vmid, { execute => "quit" }, $nocheck);
            }
        };
        my $err = $@;

        if (!$err) {
            # step 2: poll once per second until the VM is gone or the
            # timeout is reached
            my $count = 0;
            while (($count < $timeout) && check_running($vmid, $nocheck)) {
                $count++;
                sleep 1;
            }

            if ($count >= $timeout) {
                if ($force) {
                    warn "VM still running - terminating now with SIGTERM\n";
                    kill 15, $pid;
                } else {
                    die "VM quit/powerdown failed - got timeout\n";
                }
            } else {
                # VM stopped in time ($conf is undef with $nocheck)
                vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive, 1) if $conf;
                return;
            }
        } else {
            if ($force) {
                warn "VM quit/powerdown failed - terminating now with SIGTERM\n";
                kill 15, $pid;
            } else {
                die "VM quit/powerdown failed\n";
            }
        }

        # only reached after SIGTERM was sent
        # wait again
        $timeout = 10;

        my $count = 0;
        while (($count < $timeout) && check_running($vmid, $nocheck)) {
            $count++;
            sleep 1;
        }

        if ($count >= $timeout) {
            warn "VM still running - terminating now with SIGKILL\n";
            kill 9, $pid;
            sleep 1;
        }

        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive, 1) if $conf;
    });
}
4976
# Pause VM $vmid by sending the monitor command 'stop' while holding the
# config lock. The lock check is skipped if $skiplock is set or if the
# configuration carries a 'backup' lock.
sub vm_suspend {
    my ($vmid, $skiplock) = @_;

    my $suspend_locked = sub {
        my $conf = PVE::QemuConfig->load_config($vmid);

        if (!$skiplock && !PVE::QemuConfig->has_lock($conf, 'backup')) {
            PVE::QemuConfig->check_lock($conf);
        }

        vm_mon_cmd($vmid, "stop");
    };

    PVE::QemuConfig->lock_config($vmid, $suspend_locked);
}
4990
# Resume VM $vmid by sending the monitor command 'cont' while holding the
# config lock.
# With $nocheck the configuration is not loaded and the 'nocheck' variant
# of the monitor command is used. Otherwise the lock check is done unless
# $skiplock is set or the configuration carries a 'backup' lock.
sub vm_resume {
    my ($vmid, $skiplock, $nocheck) = @_;

    my $resume_locked = sub {
        return vm_mon_cmd_nocheck($vmid, "cont") if $nocheck;

        my $conf = PVE::QemuConfig->load_config($vmid);

        if (!$skiplock && !PVE::QemuConfig->has_lock($conf, 'backup')) {
            PVE::QemuConfig->check_lock($conf);
        }

        vm_mon_cmd($vmid, "cont");
    };

    PVE::QemuConfig->lock_config($vmid, $resume_locked);
}
5010
5fdbe4f0
DM
# Send the key (combination) $key to VM $vmid while holding the config lock.
# Note: $skiplock is accepted but not used by this function.
sub vm_sendkey {
    my ($vmid, $skiplock, $key) = @_;

    my $sendkey_locked = sub {
        # result is not used - NOTE(review): presumably loaded to make sure
        # the configuration exists, confirm
        my $conf = PVE::QemuConfig->load_config($vmid);

        # there is no qmp command, so we use the human monitor command
        vm_human_monitor_command($vmid, "sendkey $key");
    };

    PVE::QemuConfig->lock_config($vmid, $sendkey_locked);
}
5022
# Destroy VM $vmid (via destroy_vm) while holding the config lock.
# Dies if the VM is still running.
sub vm_destroy {
    my ($storecfg, $vmid, $skiplock) = @_;

    my $destroy_locked = sub {
        # result is not used - NOTE(review): presumably loaded to make sure
        # the configuration exists, confirm
        my $conf = PVE::QemuConfig->load_config($vmid);

        die "VM $vmid is running - destroy failed\n" if check_running($vmid);

        destroy_vm($storecfg, $vmid, undef, $skiplock);
    };

    PVE::QemuConfig->lock_config($vmid, $destroy_locked);
}
5037
1e3baf05
DM
5038# pci helpers
5039
# Write $buf to the file $filename (opened in mode "w").
#
# Returns a true value on success. Returns undef if the file can't be
# opened, or if writing or closing the file fails.
sub file_write {
    my ($filename, $buf) = @_;

    my $fh = IO::File->new($filename, "w");
    return undef if !$fh;

    my $res = print {$fh} $buf;

    # print only fills the I/O buffer - the data is written out when the
    # handle gets closed, so a failed write only shows up as close() error
    $res = undef if !$fh->close();

    return $res;
}
5052
# Collect information about the PCI device $name (full address in the form
# 'dddd:bb:ss.f', lower case hex digits) from "$pcisysfs/devices/$name".
#
# Returns a hash reference with the keys name, vendor, product (both
# without the leading '0x'), domain, bus, slot, func, irq and has_fl_reset
# (true if the device directory contains a 'reset' file).
# Returns undef if $name is not a valid address, or if the irq, vendor or
# device file can't be read or has unexpected content.
sub pci_device_info {
    my ($name) = @_;

    my ($domain, $bus, $slot, $func) =
        $name =~ m/^([a-f0-9]{4}):([a-f0-9]{2}):([a-f0-9]{2})\.([a-f0-9])$/;
    return undef if !defined($domain);

    my $devdir = "$pcisysfs/devices/$name";

    my $irq = file_read_firstline("$devdir/irq");
    return undef unless defined($irq) && $irq =~ m/^\d+$/;

    my $vendor = file_read_firstline("$devdir/vendor");
    return undef unless defined($vendor) && $vendor =~ s/^0x//;

    my $product = file_read_firstline("$devdir/device");
    return undef unless defined($product) && $product =~ s/^0x//;

    my $info = {
        name => $name,
        vendor => $vendor,
        product => $product,
        domain => $domain,
        bus => $bus,
        slot => $slot,
        func => $func,
        irq => $irq,
        has_fl_reset => -f "$devdir/reset" || 0,
    };

    return $info;
}
5084
# Trigger a reset of the PCI device described by $dev (a hash as returned
# by pci_device_info) by writing "1" to its sysfs 'reset' file.
# Returns the result of file_write().
sub pci_dev_reset {
    my ($dev) = @_;

    return file_write("$pcisysfs/devices/$dev->{name}/reset", "1");
}
5094
000fc0a2
SP
# Bind the PCI device described by $dev (a hash as returned by
# pci_device_info) to the vfio-pci driver.
#
# Returns 1 if the device is already bound, undef if one of the required
# sysfs writes fails, and otherwise the result of testing whether the
# device directory shows up below the vfio-pci driver directory.
# Dies if the vfio-pci driver directory is missing even after modprobe.
sub pci_dev_bind_to_vfio {
    my ($dev) = @_;

    my $name = $dev->{name};
    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    # try to load the module if the driver directory does not exist
    system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null") unless -d $vfio_basedir;
    die "Cannot find vfio-pci module!\n" unless -d $vfio_basedir;

    my $bound_dir = "$vfio_basedir/$name";
    return 1 if -d $bound_dir;

    # register the vendor/product ID with vfio-pci
    return undef unless file_write("$vfio_basedir/new_id", "$dev->{vendor} $dev->{product}");

    # unbind from the current driver - a failed write is only an error if
    # the unbind file exists (i.e. the device has a driver)
    my $unbind_fn = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind_fn, $name) && -f $unbind_fn;

    # bind explicitly, unless the device already showed up
    return undef if !(-d $bound_dir) && !file_write("$vfio_basedir/bind", $name);

    return -d $bound_dir;
}
5125
# Bind all devices in the IOMMU group of the PCI device $pciid (address
# without the '0000:' domain prefix) to the vfio-pci driver.
#
# Devices with a 'pci_bus' subdirectory are skipped.
# Returns 1 on success. Dies if the vfio-pci driver directory is missing,
# the IOMMU group can't be read, a group member has an invalid ID, no
# device info is available for a member, or a member can't be bound.
sub pci_dev_group_bind_to_vfio {
    my ($pciid) = @_;

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    if (!-d $vfio_basedir) {
        system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null");
    }
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    # get IOMMU group devices
    opendir(my $D, "$pcisysfs/devices/0000:$pciid/iommu_group/devices/") || die "Cannot open iommu_group: $!\n";
    my @devs = grep /^0000:/, readdir($D);
    closedir($D);

    foreach my $group_dev (@devs) {
        $group_dev =~ m/^([:\.\da-f]+)$/ or die "PCI ID $group_dev not valid!\n";
        my $name = $1; # keep the capture, $1 is easily clobbered

        # pci bridges, switches or root ports are not supported
        # they have a pci_bus subdirectory so skip them
        next if (-e "$pcisysfs/devices/$group_dev/pci_bus");

        # without this check an undef $info makes pci_dev_bind_to_vfio()
        # test the driver directory itself and wrongly report success
        my $info = pci_device_info($name);
        die "no pci device info for device '$group_dev'\n" if !$info;

        pci_dev_bind_to_vfio($info) || die "Cannot bind $group_dev to vfio\n";
    }

    return 1;
}
5154
3e16d5fc
DM
# vzdump restore implementation
5156
# Return the name of the first member of the tar archive $archive, as
# printed by 'tar tf' (without the trailing newline).
# Dies if $archive is not a regular file, if tar can't be started, or if
# no (true) first line is read.
sub tar_archive_read_firstfile {
    my ($archive) = @_;

    if (!-f $archive) {
        die "ERROR: file '$archive' does not exist\n";
    }

    # try to detect archive type first
    my $pid = open(my $fh, '-|', 'tar', 'tf', $archive);
    die "unable to open file '$archive'\n" if !$pid;

    # only the first line is needed, so terminate tar right after reading it
    my $firstfile = <$fh>;
    kill 15, $pid;
    close $fh;

    die "ERROR: archive contaions no data\n" if !$firstfile;

    chomp $firstfile;
    return $firstfile;
}
5174
ed221350
DM
# Remove the temporary volumes listed in $statfile.
#
# Every line is expected to contain 'vzdump:<name>:<volid>'. A <volid>
# starting with '/' is removed with unlink, anything else is freed with
# PVE::Storage::vdisk_free(). Progress and errors are printed to STDERR;
# a failure for one volume does not stop the cleanup of the others.
# Nothing is cleaned up if $statfile can't be opened.
sub tar_restore_cleanup {
    my ($storecfg, $statfile) = @_;

    print STDERR "starting cleanup\n";

    if (my $fd = IO::File->new($statfile, "r")) {
        while (defined(my $line = <$fd>)) {
            if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                my $volid = $2;
                eval {
                    if ($volid =~ m|^/|) {
                        # parentheses are required - without them '||'
                        # binds to $volid and the die can never trigger
                        unlink($volid) || die "unlink failed - $!\n";
                    } else {
                        PVE::Storage::vdisk_free($storecfg, $volid);
                    }
                    print STDERR "temporary volume '$volid' sucessfuly removed\n";
                };
                print STDERR "unable to cleanup '$volid' - $@" if $@;
            } else {
                print STDERR "unable to parse line in statfile - $line";
            }
        }
        $fd->close();
    }
}
5200
# Restore VM $vmid from the backup file $archive.
#
# The archive format ('tar' or 'vma') is taken from $opts->{format} if set,
# otherwise it is derived from the file name extension (default 'vma').
# The compression method (gzip/lzop) is always derived from the extension.
# Dispatches to restore_tar_archive() or restore_vma_archive() and returns
# their result.
sub restore_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    my $format = $opts->{format};
    my $comp;

    # try to detect archive format
    if ($archive =~ m/\.tgz$/ || $archive =~ m/\.tar\.gz$/) {
        $format = 'tar' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.tar$/) {
        $format = 'tar' if !$format;
    } elsif ($archive =~ m/\.tar\.lzo$/) { # dots must be escaped to match literally
        $format = 'tar' if !$format;
        $comp = 'lzop';
    } elsif ($archive =~ m/\.vma$/) {
        $format = 'vma' if !$format;
    } elsif ($archive =~ m/\.vma\.gz$/) {
        $format = 'vma' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.vma\.lzo$/) {
        $format = 'vma' if !$format;
        $comp = 'lzop';
    } else {
        $format = 'vma' if !$format; # default
    }

    if ($format eq 'tar') {
        return restore_tar_archive($archive, $vmid, $user, $opts);
    } else {
        return restore_vma_archive($archive, $vmid, $user, $opts, $comp);
    }
}
5234
# Filter/rewrite a single line of a backed up VM configuration and print
# the result to $outfd.
#
# Parameters:
#   $outfd  - file handle the resulting line(s) are printed to
#   $cookie - hash with a 'netcount' counter, used to number the netX
#             entries generated from old vlanX lines
#   $vmid   - VM ID, passed to print_drive()
#   $map    - hash mapping drive names (e.g. 'virtio0') to the new volume
#   $line   - the configuration line (including the trailing newline)
#   $unique - if set, assign new random MAC addresses
#
# '#qmdump#' and '#vzdump#' lines as well as the lock, unusedX, parent and
# template options are dropped.
sub restore_update_config_line {
    my ($outfd, $cookie, $vmid, $map, $line, $unique) = @_;

    return if $line =~ m/^\#qmdump\#/;
    return if $line =~ m/^\#vzdump\#/;
    return if $line =~ m/^lock:/;
    return if $line =~ m/^unused\d+:/;
    return if $line =~ m/^parent:/;
    return if $line =~ m/^template:/; # restored VM is never a template

    # only needed for the 'mac_prefix' setting below
    my $dc = PVE::Cluster::cfs_read_file('datacenter.cfg');
    if (($line =~ m/^(vlan(\d+)):\s*(\S+)\s*$/)) {
        # try to convert old 1.X settings
        my ($id, $ind, $ethcfg) = ($1, $2, $3);
        # each list entry has the form 'model=macaddr' and becomes one netX
        # entry on the bridge vmbr<vlan index>
        foreach my $devconfig (PVE::Tools::split_list($ethcfg)) {
            my ($model, $macaddr) = split(/\=/, $devconfig);
            $macaddr = PVE::Tools::random_ether_addr($dc->{mac_prefix}) if !$macaddr || $unique;
            my $net = {
                model => $model,
                bridge => "vmbr$ind",
                macaddr => $macaddr,
            };
            my $netstr = print_net($net);

            print $outfd "net$cookie->{netcount}: $netstr\n";
            $cookie->{netcount}++;
        }
    } elsif (($line =~ m/^(net\d+):\s*(\S+)\s*$/) && $unique) {
        # replace an existing MAC address with a new random one
        my ($id, $netstr) = ($1, $2);
        my $net = parse_net($netstr);
        $net->{macaddr} = PVE::Tools::random_ether_addr($dc->{mac_prefix}) if $net->{macaddr};
        $netstr = print_net($net);
        print $outfd "$id: $netstr\n";
    } elsif ($line =~ m/^((ide|scsi|virtio|sata|efidisk)\d+):\s*(\S+)\s*$/) {
        my $virtdev = $1;
        my $value = $3;
        my $di = parse_drive($virtdev, $value);
        if (defined($di->{backup}) && !$di->{backup}) {
            # drive was explicitly excluded from backup - keep the line as
            # comment only
            print $outfd "#$line";
        } elsif ($map->{$virtdev}) {
            # drive gets restored - point it to the new volume
            delete $di->{format}; # format can change on restore
            $di->{file} = $map->{$virtdev};
            $value = print_drive($vmid, $di);
            print $outfd "$virtdev: $value\n";
        } else {
            print $outfd $line;
        }
    } else {
        print $outfd $line;
    }
}
5286
# List the volumes PVE::Storage::vdisk_list() reports for $vmid.
#
# Returns a hash reference mapping volume ID => volume info hash. Entries
# without a (true) volid or size are skipped, and the path of the volume is
# added to each remaining info hash under the key 'path'.
sub scan_volids {
    my ($cfg, $vmid) = @_;

    my $info = PVE::Storage::vdisk_list($cfg, undef, $vmid);

    my %volid_hash;
    for my $volumes (values %$info) {
        for my $item (@$volumes) {
            next unless $item->{volid} && $item->{size};

            $item->{path} = PVE::Storage::path($cfg, $item->{volid});
            $volid_hash{$item->{volid}} = $item;
        }
    }

    return \%volid_hash;
}
5303
77019edf
WB
# Test if the volume $volid is referenced by a (non-cdrom) drive of the
# VM configuration $conf or of one of its snapshots.
#
# The drive named $skip_drive (if set) is ignored in the current
# configuration, but not in the snapshots. Drives are compared by volume ID
# and by the path the volume resolves to.
# Returns 1 if the volume is in use, else 0.
sub is_volume_in_use {
    my ($storecfg, $conf, $skip_drive, $volid) = @_;

    my $path = PVE::Storage::path($storecfg, $volid);

    my $references_volume = sub {
        my ($section, $snapname) = @_;

        for my $key (keys %$section) {
            next unless is_valid_drivename($key);
            next if $skip_drive && $key eq $skip_drive;

            my $drive = parse_drive($key, $section->{$key});
            next if !$drive || !$drive->{file} || drive_is_cdrom($drive);

            my $file = $drive->{file};
            return 1 if $volid eq $file;

            if ($file =~ m!^/!) {
                # absolute path - compare with the volume path directly
                return 1 if $file eq $path;
                next;
            }

            my ($storeid) = PVE::Storage::parse_volume_id($file, 1);
            next if !$storeid;
            next if !PVE::Storage::storage_config($storecfg, $storeid, 1);

            return 1 if $path eq PVE::Storage::path($storecfg, $file, $snapname);
        }

        return 0;
    };

    return 1 if $references_volume->($conf);

    # snapshots are always scanned completely
    $skip_drive = undef;

    for my $snapname (keys %{$conf->{snapshots}}) {
        return 1 if $references_volume->($conf->{snapshots}->{$snapname}, $snapname);
    }

    return 0;
}
5344
91bd6c90
DM
# Synchronize the drive entries of $conf with the volumes in $volid_hash
# (volume ID => info hash with 'size' and 'path', see scan_volids):
#  - update the size of all (non-cdrom) drives found in $volid_hash
#  - remove 'unusedX' entries for volumes which are used by a drive
#  - add volumes not referenced by any drive as unused volumes (except
#    'vm-$vmid-state-' volumes)
#
# Modifies $conf in place. Returns 1 if something was changed, else undef.
sub update_disksize {
    my ($vmid, $conf, $volid_hash) = @_;

    my $changes;

    my $used = {};

    # Note: it is allowed to define multiple storages with same path (alias), so
    # we need to check both 'volid' and real 'path' (two different volid can point
    # to the same path).

    my $usedpath = {};

    # update size info
    foreach my $opt (keys %$conf) {
        if (is_valid_drivename($opt)) {
            my $drive = parse_drive($opt, $conf->{$opt});
            my $volid = $drive->{file};
            next if !$volid;

            $used->{$volid} = 1;
            if ($volid_hash->{$volid} &&
                (my $path = $volid_hash->{$volid}->{path})) {
                $usedpath->{$path} = 1;
            }

            next if drive_is_cdrom($drive);
            next if !$volid_hash->{$volid};

            $drive->{size} = $volid_hash->{$volid}->{size};
            my $new = print_drive($vmid, $drive);
            if ($new ne $conf->{$opt}) {
                $changes = 1;
                $conf->{$opt} = $new;
            }
        }
    }

    # remove 'unusedX' entry if volume is used
    foreach my $opt (keys %$conf) {
        next if $opt !~ m/^unused\d+$/;
        my $volid = $conf->{$opt};
        # declare and assign separately - the behaviour of
        # 'my $x = ... if COND;' is undefined (see perlsyn)
        my $path;
        $path = $volid_hash->{$volid}->{path} if $volid_hash->{$volid};
        if ($used->{$volid} || ($path && $usedpath->{$path})) {
            $changes = 1;
            delete $conf->{$opt};
        }
    }

    # add all remaining volumes as unused
    foreach my $volid (sort keys %$volid_hash) {
        next if $volid =~ m/vm-$vmid-state-/;
        next if $used->{$volid};
        my $path = $volid_hash->{$volid}->{path};
        next if !$path; # just to be sure
        next if $usedpath->{$path};
        $changes = 1;
        PVE::QemuConfig->add_unused_volume($conf, $volid);
        $usedpath->{$path} = 1; # avoid to add more than once (aliases)
    }

    return $changes;
}
5407
# Rescan the storages and update the disk sizes and unused volumes of
# VM $vmid, or of all VMs returned by config_list() if $vmid is undefined.
# The configuration is only written if something changed.
# With $nolock the update runs without taking the config lock.
sub rescan {
    my ($vmid, $nolock) = @_;

    my $cfg = PVE::Storage::config();

    my $volid_hash = scan_volids($cfg, $vmid);

    my $updatefn = sub {
        my ($vmid) = @_;

        my $conf = PVE::QemuConfig->load_config($vmid);

        PVE::QemuConfig->check_lock($conf);

        # only consider the volumes owned by this VM
        my %vm_volids =
            map { $_ => $volid_hash->{$_} }
            grep {
                my $owner = $volid_hash->{$_}->{vmid};
                $owner && $owner == $vmid;
            } keys %$volid_hash;

        my $changes = update_disksize($vmid, $conf, \%vm_volids);

        PVE::QemuConfig->write_config($vmid, $conf) if $changes;
    };

    my $update_vm = sub {
        my ($id) = @_;

        return $nolock
            ? $updatefn->($id)
            : PVE::QemuConfig->lock_config($id, $updatefn, $id);
    };

    if (defined($vmid)) {
        $update_vm->($vmid);
    } else {
        my $vmlist = config_list();
        foreach my $id (keys %$vmlist) {
            $update_vm->($id);
        }
    }
}
5450
5451sub restore_vma_archive {
5452 my ($archive, $vmid, $user, $opts, $comp) = @_;
5453
5454 my $input = $archive eq '-' ? "<&STDIN" : undef;
5455 my $readfrom = $archive;
5456
5457 my $uncomp = '';
5458 if ($comp) {
5459 $readfrom = '-';
5460 my $qarchive = PVE::Tools::shellquote($archive);
5461 if ($comp eq 'gzip') {
5462 $uncomp = "zcat $qarchive|";
5463 } elsif ($comp eq 'lzop') {
5464 $uncomp = "lzop -d -c $qarchive|";
5465 } else {
5466 die "unknown compression method '$comp'\n";
5467 }
be190583 5468
91bd6c90
DM
5469 }
5470
5471 my $tmpdir = "/var/tmp/vzdumptmp$$";
5472 rmtree $tmpdir;
5473
5474 # disable interrupts (always do cleanups)
5475 local $SIG{INT} = $SIG{TERM} = $SIG{QUIT} = $SIG{HUP} = sub {
5476 warn "got interrupt - ignored\n";
5477 };
5478
5479 my $mapfifo = "/var/tmp/vzdumptmp$$.fifo";
5480 POSIX::mkfifo($mapfifo, 0600);
5481 my $fifofh;
5482
5483 my $openfifo = sub {
5484 open($fifofh, '>', $mapfifo) || die $!;
5485 };
5486
5487 my $cmd = "${uncomp}vma extract -v -r $mapfifo $readfrom $tmpdir";
5488
5489 my $oldtimeout;
5490 my $timeout = 5;
5491
5492 my $devinfo = {};
5493
5494 my $rpcenv = PVE::RPCEnvironment::get();
5495
ffda963f 5496 my $conffile = PVE::QemuConfig->config_file($vmid);
91bd6c90
DM
5497 my $tmpfn = "$conffile.$$.tmp";
5498
ed221350 5499 # Note: $oldconf is undef if VM does not exists
ffda963f
FG
5500 my $cfs_path = PVE::QemuConfig->cfs_config_path($vmid);
5501 my $oldconf = PVE::Cluster::cfs_read_file($cfs_path);
ed221350 5502
91bd6c90
DM
5503 my $print_devmap = sub {
5504 my $virtdev_hash = {};
5505
5506 my $cfgfn = "$tmpdir/qemu-server.conf";
5507
5508 # we can read the config - that is already extracted
5509 my $fh = IO::File->new($cfgfn, "r") ||
5510 "unable to read qemu-server.conf - $!\n";
5511
6738ab9c 5512 my $fwcfgfn = "$tmpdir/qemu-server.fw";
3457d090
WL
5513 if (-f $fwcfgfn) {
5514 my $pve_firewall_dir = '/etc/pve/firewall';
5515 mkdir $pve_firewall_dir; # make sure the dir exists
5516 PVE::Tools::file_copy($fwcfgfn, "${pve_firewall_dir}/$vmid.fw");
5517 }
6738ab9c 5518
91bd6c90
DM
5519 while (defined(my $line = <$fh>)) {
5520 if ($line =~ m/^\#qmdump\#map:(\S+):(\S+):(\S*):(\S*):$/) {
5521 my ($virtdev, $devname, $storeid, $format) = ($1, $2, $3, $4);
5522 die "archive does not contain data for drive '$virtdev'\n"
5523 if !$devinfo->{$devname};
5524 if (defined($opts->{storage})) {
5525 $storeid = $opts->{storage} || 'local';
5526 } elsif (!$storeid) {
5527 $storeid = 'local';
5528 }
5529 $format = 'raw' if !$format;
5530 $devinfo->{$devname}->{devname} = $devname;
5531 $devinfo->{$devname}->{virtdev} = $virtdev;
5532 $devinfo->{$devname}->{format} = $format;
5533 $devinfo->{$devname}->{storeid} = $storeid;
5534
be190583 5535 # check permission on storage
91bd6c90
DM
5536 my $pool = $opts->{pool}; # todo: do we need that?
5537 if ($user ne 'root@pam') {
5538 $rpcenv->check($user, "/storage/$storeid", ['Datastore.AllocateSpace']);
5539 }
5540
5541 $virtdev_hash->{$virtdev} = $devinfo->{$devname};
5542 }
5543 }
5544
5545 foreach my $devname (keys %$devinfo) {
be190583
DM
5546 die "found no device mapping information for device '$devname'\n"
5547 if !$devinfo->{$devname}->{virtdev};
91bd6c90
DM
5548 }
5549
20519efc 5550 my $cfg = PVE::Storage::config();
ed221350
DM
5551
5552 # create empty/temp config
be190583 5553 if ($oldconf) {
ed221350
DM
5554 PVE::Tools::file_set_contents($conffile, "memory: 128\n");
5555 foreach_drive($oldconf, sub {
5556 my ($ds, $drive) = @_;
5557
5558 return if drive_is_cdrom($drive);
5559
5560 my $volid = $drive->{file};
5561
5562 return if !$volid || $volid =~ m|^/|;
5563
5564 my ($path, $owner) = PVE::Storage::path($cfg, $volid);
5565 return if !$path || !$owner || ($owner != $vmid);
5566
5567 # Note: only delete disk we want to restore
5568 # other volumes will become unused
5569 if ($virtdev_hash->{$ds}) {
6b72854b
FG
5570 eval { PVE::Storage::vdisk_free($cfg, $volid); };
5571 if (my $err = $@) {
5572 warn $err;
5573 }
ed221350
DM
5574 }
5575 });
381b8fae
DC
5576
5577 # delete vmstate files
5578 # since after the restore we have no snapshots anymore
5579 foreach my $snapname (keys %{$oldconf->{snapshots}}) {
5580 my $snap = $oldconf->{snapshots}->{$snapname};
5581 if ($snap->{vmstate}) {
5582 eval { PVE::Storage::vdisk_free($cfg, $snap->{vmstate}); };
5583 if (my $err = $@) {
5584 warn $err;
5585 }
5586 }
5587 }
ed221350
DM
5588 }
5589
5590 my $map = {};
91bd6c90
DM
5591 foreach my $virtdev (sort keys %$virtdev_hash) {
5592 my $d = $virtdev_hash->{$virtdev};
5593 my $alloc_size = int(($d->{size} + 1024 - 1)/1024);
5594 my $scfg = PVE::Storage::storage_config($cfg, $d->{storeid});
8fd57431
DM
5595
5596 # test if requested format is supported
5597 my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($cfg, $d->{storeid});
5598 my $supported = grep { $_ eq $d->{format} } @$validFormats;
5599 $d->{format} = $defFormat if !$supported;
5600
91bd6c90
DM
5601 my $volid = PVE::Storage::vdisk_alloc($cfg, $d->{storeid}, $vmid,
5602 $d->{format}, undef, $alloc_size);
5603 print STDERR "new volume ID is '$volid'\n";
5604 $d->{volid} = $volid;
5605 my $path = PVE::Storage::path($cfg, $volid);
5606
5f96f4df
WL
5607 PVE::Storage::activate_volumes($cfg,[$volid]);
5608
91bd6c90 5609 my $write_zeros = 1;
88240a83 5610 if (PVE::Storage::volume_has_feature($cfg, 'sparseinit', $volid)) {
91bd6c90
DM
5611 $write_zeros = 0;
5612 }
5613
3c525055 5614 print $fifofh "format=$d->{format}:${write_zeros}:$d->{devname}=$path\n";
91bd6c90
DM
5615
5616 print "map '$d->{devname}' to '$path' (write zeros = ${write_zeros})\n";
5617 $map->{$virtdev} = $volid;
5618 }
5619
5620 $fh->seek(0, 0) || die "seek failed - $!\n";
5621
5622 my $outfd = new IO::File ($tmpfn, "w") ||
5623 die "unable to write config for VM $vmid\n";
5624
5625 my $cookie = { netcount => 0 };
5626 while (defined(my $line = <$fh>)) {
be190583 5627 restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
91bd6c90
DM
5628 }
5629
5630 $fh->close();
5631 $outfd->close();
5632 };
5633
5634 eval {
5635 # enable interrupts
5636 local $SIG{INT} = $SIG{TERM} = $SIG{QUIT} = $SIG{HUP} = $SIG{PIPE} = sub {
5637 die "interrupted by signal\n";
5638 };
5639 local $SIG{ALRM} = sub { die "got timeout\n"; };
5640
5641 $oldtimeout = alarm($timeout);
5642
5643 my $parser = sub {
5644 my $line = shift;
5645
5646 print "$line\n";
5647
5648 if ($line =~ m/^DEV:\sdev_id=(\d+)\ssize:\s(\d+)\sdevname:\s(\S+)$/) {
5649 my ($dev_id, $size, $devname) = ($1, $2, $3);
5650 $devinfo->{$devname} = { size => $size, dev_id => $dev_id };
5651 } elsif ($line =~ m/^CTIME: /) {
46f58b5f 5652 # we correctly received the vma config, so we can disable
3cf90d7a
DM
5653 # the timeout now for disk allocation (set to 10 minutes, so
5654 # that we always timeout if something goes wrong)
5655 alarm(600);
91bd6c90
DM
5656 &$print_devmap();
5657 print $fifofh "done\n";
5658 my $tmp = $oldtimeout || 0;
5659 $oldtimeout = undef;
5660 alarm($tmp);
5661 close($fifofh);
5662 }
5663 };
be190583 5664
91bd6c90
DM
5665 print "restore vma archive: $cmd\n";
5666 run_command($cmd, input => $input, outfunc => $parser, afterfork => $openfifo);
5667 };
5668 my $err = $@;
5669
5670 alarm($oldtimeout) if $oldtimeout;
5671
5f96f4df
WL
5672 my $vollist = [];
5673 foreach my $devname (keys %$devinfo) {
5674 my $volid = $devinfo->{$devname}->{volid};
5675 push @$vollist, $volid if $volid;
5676 }
5677
20519efc 5678 my $cfg = PVE::Storage::config();
5f96f4df
WL
5679 PVE::Storage::deactivate_volumes($cfg, $vollist);
5680
91bd6c90
DM
5681 unlink $mapfifo;
5682
5683 if ($err) {
5684 rmtree $tmpdir;
5685 unlink $tmpfn;
5686
91bd6c90
DM
5687 foreach my $devname (keys %$devinfo) {
5688 my $volid = $devinfo->{$devname}->{volid};
5689 next if !$volid;
5690 eval {
5691 if ($volid =~ m|^/|) {
5692 unlink $volid || die 'unlink failed\n';
5693 } else {
5694 PVE::Storage::vdisk_free($cfg, $volid);
5695 }
5696 print STDERR "temporary volume '$volid' sucessfuly removed\n";
5697 };
5698 print STDERR "unable to cleanup '$volid' - $@" if $@;
5699 }
5700 die $err;
5701 }
5702
5703 rmtree $tmpdir;
ed221350
DM
5704
5705 rename($tmpfn, $conffile) ||
91bd6c90
DM
5706 die "unable to commit configuration file '$conffile'\n";
5707
ed221350
DM
5708 PVE::Cluster::cfs_update(); # make sure we read new file
5709
91bd6c90
DM
5710 eval { rescan($vmid, 1); };
5711 warn $@ if $@;
5712}
5713
# Restore a VM from a vzdump tar archive by piping it through the
# qmextract helper and then rewriting the extracted configuration.
#
# Parameters:
#   $archive - path of the archive, or '-' to read the archive from STDIN
#   $vmid    - ID of the VM being restored
#   $user    - exported to the extraction helper as VZDUMP_USER
#   $opts    - hash ref; keys read here: storage, pool, prealloc, info, unique
#
# Dies if the first archive member is not 'qemu-server.conf', if the
# extraction or config rewrite fails, or if the new configuration file
# cannot be moved into place.
sub restore_tar_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    if ($archive ne '-') {
        my $firstfile = tar_archive_read_firstfile($archive);
        die "ERROR: file '$archive' dos not lock like a QemuServer vzdump backup\n"
            if $firstfile ne 'qemu-server.conf';
    }

    my $storecfg = PVE::Storage::config();

    # destroy existing data - keep empty config
    my $vmcfgfn = PVE::QemuConfig->config_file($vmid);
    destroy_vm($storecfg, $vmid, 1) if -f $vmcfgfn;

    my $tocmd = "/usr/lib/qemu-server/qmextract";

    $tocmd .= " --storage " . PVE::Tools::shellquote($opts->{storage}) if $opts->{storage};
    $tocmd .= " --pool " . PVE::Tools::shellquote($opts->{pool}) if $opts->{pool};
    $tocmd .= ' --prealloc' if $opts->{prealloc};
    $tocmd .= ' --info' if $opts->{info};

    # tar option "xf" does not autodetect compression when read from STDIN,
    # so we pipe to zcat
    my $cmd = "zcat -f|tar xf " . PVE::Tools::shellquote($archive) . " " .
        PVE::Tools::shellquote("--to-command=$tocmd");

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    mkpath $tmpdir;

    # the extraction helper receives its parameters through the environment
    local $ENV{VZDUMP_TMPDIR} = $tmpdir;
    local $ENV{VZDUMP_VMID} = $vmid;
    local $ENV{VZDUMP_USER} = $user;

    my $conffile = PVE::QemuConfig->config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # disable interrupts (always do cleanups)
    # Each handler is localized on its own: a chained
    # "local $SIG{INT} = $SIG{TERM} = ..." only localizes the first element
    # and permanently overwrites the remaining handlers.
    local $SIG{INT} =
        local $SIG{TERM} =
        local $SIG{QUIT} =
        local $SIG{HUP} = sub { print STDERR "got interrupt - ignored\n"; };

    eval {
        # enable interrupts
        local $SIG{INT} =
            local $SIG{TERM} =
            local $SIG{QUIT} =
            local $SIG{HUP} =
            local $SIG{PIPE} = sub { die "interrupted by signal\n"; };

        if ($archive eq '-') {
            print "extracting archive from STDIN\n";
            run_command($cmd, input => "<&STDIN");
        } else {
            print "extracting archive '$archive'\n";
            run_command($cmd);
        }

        # in info mode nothing is written, so there is no config to rewrite
        return if $opts->{info};

        # read new mapping
        my $map = {};
        my $statfile = "$tmpdir/qmrestore.stat";
        if (my $fd = IO::File->new($statfile, "r")) {
            while (defined (my $line = <$fd>)) {
                if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                    $map->{$1} = $2 if $1;
                } else {
                    print STDERR "unable to parse line in statfile - $line\n";
                }
            }
            $fd->close();
        }

        my $confsrc = "$tmpdir/qemu-server.conf";

        my $srcfd = IO::File->new($confsrc, "r") ||
            die "unable to open file '$confsrc'\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined (my $line = <$srcfd>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $srcfd->close();
        $outfd->close();
    };
    my $err = $@;

    if ($err) {
        unlink $tmpfn;

        tar_restore_cleanup($storecfg, "$tmpdir/qmrestore.stat") if !$opts->{info};

        die $err;
    }

    rmtree $tmpdir;

    # No temporary config exists in info mode (the eval block returned
    # early), so only commit when a config was actually written. The
    # parentheses matter: "rename $a, $b || die" binds the || to $b and
    # therefore never reports a failed rename.
    if (!$opts->{info}) {
        rename($tmpfn, $conffile)
            or die "unable to commit configuration file '$conffile'\n";
    }

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
5823
18bfb361
DM
# Invoke $func once per storage ID that backs a non-cdrom drive of $conf.
#
# Parameters:
#   $conf - VM configuration hash ref
#   $func - code ref, called as $func->($storage_id)
#
# Storage IDs are de-duplicated and visited in sorted order. Drives whose
# volume ID does not parse to a storage ID are ignored.
sub foreach_writable_storage {
    my ($conf, $func) = @_;

    my %seen_sid;

    for my $key (keys %$conf) {
        next if !is_valid_drivename($key);

        my $drive = parse_drive($key, $conf->{$key});
        next if !$drive || drive_is_cdrom($drive);

        # second argument is passed as 1 exactly like before
        # (presumably "no error on unparsable IDs" - confirm in PVE::Storage)
        my ($sid, $volname) = PVE::Storage::parse_volume_id($drive->{file}, 1);
        $seen_sid{$sid} = $sid if $sid;
    }

    for my $sid (sort keys %seen_sid) {
        $func->($sid);
    }
}
5846
e5eaa028
WL
# Decide whether snapshots of $volid are taken by QEMU itself.
#
# Returns 1 when the volume's storage type is listed in $qemu_snap_storage
# and the storage does not have 'krbd' set, or when the volume ID ends in
# '.qcow2' or '.qed'. Returns undef otherwise.
sub do_snapshots_with_qemu {
    my ($storecfg, $volid) = @_;

    # called in scalar context on purpose, as before
    my $storage_name = PVE::Storage::parse_volume_id($volid);

    return 1
        if $qemu_snap_storage->{$storecfg->{ids}->{$storage_name}->{type}}
        && !$storecfg->{ids}->{$storage_name}->{krbd};

    return 1 if $volid =~ m/\.(qcow2|qed)$/;

    return undef;
}
5863
4dcc780c
WL
# Ping the guest agent of VM $vmid (3 second timeout).
#
# Returns 1 if the 'guest-ping' monitor command succeeded; otherwise emits
# a warning and returns 0.
sub qga_check_running {
    my ($vmid) = @_;

    eval { vm_mon_cmd($vmid, "guest-ping", timeout => 3); };
    return 1 if !$@;

    warn "Qemu Guest Agent are not running - $@";
    return 0;
}
5874
04a69bb4
AD
# Convert the disks of a VM into base volumes.
#
# Parameters:
#   $vmid - VM ID
#   $conf - VM configuration hash ref (updated in place)
#   $disk - optional drive name; when set, only that drive is converted
#
# CD-ROM drives and volumes lacking the storage 'template' feature are
# skipped. The configuration is written back after every converted drive.
sub template_create {
    my ($vmid, $conf, $disk) = @_;

    my $storecfg = PVE::Storage::config();

    my $convert_drive = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);
        return if $disk && $ds ne $disk;

        my $volid = $drive->{file};
        return if !PVE::Storage::volume_has_feature($storecfg, 'template', $volid);

        $drive->{file} = PVE::Storage::vdisk_create_base($storecfg, $volid);
        $conf->{$ds} = print_drive($vmid, $drive);
        PVE::QemuConfig->write_config($vmid, $conf);
    };

    foreach_drive($conf, $convert_drive);
}
5895
# Copy a volume with 'qemu-img convert' and print progress lines.
#
# Parameters:
#   $src_volid           - source volume ID
#   $dst_volid           - destination volume ID (must already exist, '-n')
#   $size                - total size in bytes, used for progress output only
#   $snapname            - optional snapshot name to read the source from
#   $is_zero_initialized - when true, the target is wrapped in 'zeroinit:'
#
# Nothing is done unless both volume IDs parse to a storage ID.
# Dies with "copy failed: ..." if qemu-img fails.
sub qemu_img_convert {
    my ($src_volid, $dst_volid, $size, $snapname, $is_zero_initialized) = @_;

    my $storecfg = PVE::Storage::config();
    my ($src_storeid, $src_volname) = PVE::Storage::parse_volume_id($src_volid, 1);
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid, 1);

    return if !($src_storeid && $dst_storeid);

    PVE::Storage::activate_volumes($storecfg, [$src_volid], $snapname);

    my $src_scfg = PVE::Storage::storage_config($storecfg, $src_storeid);
    my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

    my $src_format = qemu_img_format($src_scfg, $src_volname);
    my $dst_format = qemu_img_format($dst_scfg, $dst_volname);

    my $src_path = PVE::Storage::path($storecfg, $src_volid, $snapname);
    my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

    my @convert = ('/usr/bin/qemu-img', 'convert', '-p', '-n');
    # the snapshot is only selected via '-s' for qcow2 sources
    push @convert, '-s', $snapname if $snapname && $src_format eq "qcow2";
    push @convert, '-f', $src_format, '-O', $dst_format, $src_path;
    push @convert, $is_zero_initialized ? "zeroinit:$dst_path" : $dst_path;

    # translate qemu-img's "(NN/100%)" progress output into byte counts
    my $report_progress = sub {
        my ($line) = @_;

        return if $line !~ m/\((\S+)\/100\%\)/;

        my $percent = $1;
        my $transferred = int($size * $percent / 100);
        my $remaining = $size - $transferred;

        print "transferred: $transferred bytes remaining: $remaining bytes total: $size bytes progression: $percent %\n";
    };

    eval { run_command(\@convert, timeout => undef, outfunc => $report_progress); };
    my $err = $@;
    die "copy failed: $err" if $err;
}
5943
# Determine the qemu-img format name for a volume.
#
# If the storage configuration has a 'path' and the volume name ends in
# one of the known image extensions, that extension is returned.
# Everything else is reported as "raw".
sub qemu_img_format {
    my ($scfg, $volname) = @_;

    return "raw" if !$scfg->{path};

    return $volname =~ m/\.(raw|cow|qcow|qcow2|qed|vmdk|cloop)$/ ? $1 : "raw";
}
5953
# Start a QMP 'drive-mirror' job for one drive and hand over to
# qemu_drive_mirror_monitor().
#
# Parameters:
#   $vmid                - source VM ID
#   $drive               - drive name; the block job is named "drive-$drive"
#   $dst_volid           - target volume ID, or an
#                          "nbd:<host>:<port>:exportname=<name>" target
#   $vmiddst             - target VM ID (passed on to the monitor loop)
#   $is_zero_initialized - wrap a local target in 'zeroinit:' when true
#   $jobs                - hash ref of tracked jobs (created if missing)
#   $skipcomplete, $qga  - passed on to the monitor loop
#
# For NBD targets a socat child is forked that bridges a local unix socket
# to the remote TCP endpoint; its PID is stored in the job entry.
# Dies with "mirroring error: ..." if the job cannot be started.
sub qemu_drive_mirror {
    my ($vmid, $drive, $dst_volid, $vmiddst, $is_zero_initialized, $jobs, $skipcomplete, $qga) = @_;

    $jobs = {} if !$jobs;

    my ($qemu_target, $format);
    $jobs->{"drive-$drive"} = {};

    if ($dst_volid =~ /^nbd:(localhost|[\d\.]+|\[[\d\.:a-fA-F]+\]):(\d+):exportname=(\S+)/) {
        my ($server, $port, $exportname) = ($1, $2, $3);

        $format = "nbd";
        my $unixsocket = "/run/qemu-server/$vmid.mirror-drive-$drive";
        $qemu_target = "nbd+unix:///$exportname?socket=$unixsocket";
        my @tunnel = ('socat', '-T30', "UNIX-LISTEN:$unixsocket,fork", "TCP:$server:$port,connect-timeout=5");

        my $pid = fork();
        die "forking socat tunnel failed\n" if !defined($pid);

        if ($pid == 0) {
            # child: only reached past exec() when exec itself failed
            exec(@tunnel);
            warn "exec failed: $!\n";
            POSIX::_exit(-1);
        }
        $jobs->{"drive-$drive"}->{pid} = $pid;

        # wait until the helper has created its listening socket
        my $timeout = 0;
        until (-S $unixsocket) {
            die "nbd connection helper timed out\n"
                if $timeout++ > 5;
            sleep 1;
        }
    } else {
        my $storecfg = PVE::Storage::config();
        my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid);

        my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

        $format = qemu_img_format($dst_scfg, $dst_volname);

        my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

        $qemu_target = "zeroinit:$dst_path";
        $qemu_target = $dst_path if !$is_zero_initialized;
    }

    my %mirror_args = (
        timeout => 10,
        device => "drive-$drive",
        mode => "existing",
        sync => "full",
        target => $qemu_target,
    );
    $mirror_args{format} = $format if $format;

    print "drive mirror is starting for drive-$drive\n";

    # this throws an error if a job is already running for the device
    eval { vm_mon_cmd($vmid, "drive-mirror", %mirror_args); };

    if (my $err = $@) {
        eval { PVE::QemuServer::qemu_blockjobs_cancel($vmid, $jobs) };
        die "mirroring error: $err";
    }

    qemu_drive_mirror_monitor ($vmid, $vmiddst, $jobs, $skipcomplete, $qga);
}
6016
# Poll the running mirror block jobs once per second until they are done.
#
# Parameters:
#   $vmid         - VM whose block jobs are polled
#   $vmiddst      - target VM ID; if set and different from $vmid the jobs
#                   are cancelled once ready instead of being completed
#   $jobs         - hash ref of tracked jobs, keyed by job/device name;
#                   finished jobs are removed from it
#   $skipcomplete - when true, return as soon as all jobs are ready
#   $qga          - when true, freeze/thaw the guest filesystem around the
#                   cancel; otherwise the VM is suspended/resumed
#
# On any error all tracked jobs are cancelled and the function dies with
# "mirroring error: ...".
sub qemu_drive_mirror_monitor {
    my ($vmid, $vmiddst, $jobs, $skipcomplete, $qga) = @_;

    eval {
        my $err_complete = 0;

        while (1) {
            die "storage migration timed out\n" if $err_complete > 300;

            my $stats = vm_mon_cmd($vmid, "query-block-jobs");

            # index the currently running mirror jobs by device name
            my $running_mirror_jobs = {};
            for my $stat (@$stats) {
                next if $stat->{type} ne 'mirror';
                $running_mirror_jobs->{$stat->{device}} = $stat;
            }

            my $readycounter = 0;

            for my $job (keys %$jobs) {
                my $mirror = $running_mirror_jobs->{$job};

                if (!defined($mirror)) {
                    # a vanished job is only fine if we completed it ourselves
                    die "$job: mirroring has been cancelled\n"
                        if !defined($jobs->{$job}->{complete});

                    print "$job : finished\n";
                    delete $jobs->{$job};
                    next;
                }

                my $busy = $mirror->{busy};
                my $ready = $mirror->{ready};
                if (my $total = $mirror->{len}) {
                    my $transferred = $mirror->{offset} || 0;
                    my $remaining = $total - $transferred;
                    my $percent = sprintf "%.2f", ($transferred * 100 / $total);

                    print "$job: transferred: $transferred bytes remaining: $remaining bytes total: $total bytes progression: $percent % busy: $busy ready: $ready \n";
                }

                $readycounter++ if $mirror->{ready};
            }

            last if scalar(keys %$jobs) == 0;

            if ($readycounter == scalar(keys %$jobs)) {
                print "all mirroring jobs are ready \n";
                last if $skipcomplete; #do the complete later

                if ($vmiddst && $vmiddst != $vmid) {
                    if ($qga) {
                        print "freeze filesystem\n";
                        eval { PVE::QemuServer::vm_mon_cmd($vmid, "guest-fsfreeze-freeze"); };
                    } else {
                        print "suspend vm\n";
                        eval { PVE::QemuServer::vm_suspend($vmid, 1); };
                    }

                    # if we clone a disk for a new target vm, we don't switch the disk
                    PVE::QemuServer::qemu_blockjobs_cancel($vmid, $jobs);

                    if ($qga) {
                        print "unfreeze filesystem\n";
                        eval { PVE::QemuServer::vm_mon_cmd($vmid, "guest-fsfreeze-thaw"); };
                    } else {
                        print "resume vm\n";
                        eval { PVE::QemuServer::vm_resume($vmid, 1, 1); };
                    }

                    last;
                }

                for my $job (keys %$jobs) {
                    # try to switch the disk if source and destination are on the same guest
                    print "$job: Completing block job...\n";

                    eval { vm_mon_cmd($vmid, "block-job-complete", device => $job) };
                    # NOTE(review): any error other than "cannot be completed"
                    # is treated like success here - confirm this is intended
                    if ($@ =~ m/cannot be completed/) {
                        print "$job: Block job cannot be completed, try again.\n";
                        $err_complete++;
                    } else {
                        print "$job: Completed successfully.\n";
                        $jobs->{$job}->{complete} = 1;
                        eval { qemu_blockjobs_finish_tunnel($vmid, $job, $jobs->{$job}->{pid}) } ;
                    }
                }
            }
            sleep 1;
        }
    };
    my $err = $@;

    if ($err) {
        eval { PVE::QemuServer::qemu_blockjobs_cancel($vmid, $jobs) };
        die "mirroring error: $err";
    }
}
6115
# Cancel all block jobs listed in $jobs and wait until they are gone.
#
# Parameters:
#   $vmid - VM ID
#   $jobs - hash ref keyed by job/device name; each entry is marked with
#           'cancel' and removed once the job no longer shows up in
#           'query-block-jobs'
#
# Errors of the individual 'block-job-cancel' commands are ignored; the
# function polls once per second until $jobs is empty.
sub qemu_blockjobs_cancel {
    my ($vmid, $jobs) = @_;

    for my $job (keys %$jobs) {
        print "$job: Cancelling block job\n";
        eval { vm_mon_cmd($vmid, "block-job-cancel", device => $job); };
        $jobs->{$job}->{cancel} = 1;
    }

    while (1) {
        my $stats = vm_mon_cmd($vmid, "query-block-jobs");

        my %still_running = map { $_->{device} => $_ } @$stats;

        for my $job (keys %$jobs) {
            next if !defined($jobs->{$job}->{cancel});
            next if defined($still_running{$job});

            print "$job: Done.\n";
            # also tear down the helper process/socket tracked for this job
            eval { qemu_blockjobs_finish_tunnel($vmid, $job, $jobs->{$job}->{pid}) } ;
            delete $jobs->{$job};
        }

        last if scalar(keys %$jobs) == 0;

        sleep 1;
    }
}
6147
35e4ab04
AD
# Reap the helper process of a mirror job and remove its socket file.
#
# Parameters:
#   $vmid - VM ID (part of the socket path)
#   $job  - job name (part of the socket path)
#   $cpid - PID of the helper child; nothing is done when it is false
#
# Waits up to 19 one-second rounds for the child to exit, sending SIGTERM
# in round 10 and SIGKILL from round 15 onwards.
sub qemu_blockjobs_finish_tunnel {
    my ($vmid, $job, $cpid) = @_;

    return if !$cpid;

    for my $round (1 .. 19) {
        my $reaped = waitpid($cpid, WNOHANG);
        last if defined($reaped) && $reaped == $cpid;

        if ($round == 10) {
            kill(15, $cpid);
        } elsif ($round >= 15) {
            kill(9, $cpid);
        }
        sleep (1);
    }
    unlink "/run/qemu-server/$vmid.mirror-$job";
}
6166
# Clone one drive of a VM, either as linked clone or as full copy.
#
# Parameters:
#   $storecfg     - storage configuration
#   $vmid         - source VM ID
#   $running      - true if the source VM is running
#   $drivename    - name of the drive being cloned
#   $drive        - parsed drive hash ref (modified and returned, see below)
#   $snapname     - optional snapshot to clone from
#   $newvmid      - VM ID owning the new volume
#   $storage      - optional target storage for full clones
#   $format       - optional target format for full clones
#   $full         - true for a full copy, false for a linked clone
#   $newvollist   - array ref; every newly created volume ID is appended
#   $jobs, $skipcomplete, $qga - passed on to qemu_drive_mirror()
#
# A full clone of a running VM without snapshot uses drive-mirror; all
# other full clones use qemu_img_convert().
#
# Returns the $drive hash ref itself, with 'file' and 'size' pointing to
# the new volume and 'format' reset to undef.
sub clone_disk {
    my ($storecfg, $vmid, $running, $drivename, $drive, $snapname,
        $newvmid, $storage, $format, $full, $newvollist, $jobs, $skipcomplete, $qga) = @_;

    my $newvolid;

    if ($full) {
        my ($storeid, $volname) = PVE::Storage::parse_volume_id($drive->{file});
        $storeid = $storage if $storage;

        my $dst_format = resolve_dst_disk_format($storecfg, $storeid, $volname, $format);
        my ($size) = PVE::Storage::volume_size_info($storecfg, $drive->{file}, 3);

        print "create full clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_alloc($storecfg, $storeid, $newvmid, $dst_format, undef, ($size/1024));
        push @$newvollist, $newvolid;

        PVE::Storage::activate_volumes($storecfg, [$newvolid]);

        my $sparseinit = PVE::Storage::volume_has_feature($storecfg, 'sparseinit', $newvolid);
        if ($running && !$snapname) {
            my $kvmver = get_running_qemu_version ($vmid);
            if (!qemu_machine_feature_enabled (undef, $kvmver, 2, 7)) {
                die "drive-mirror with iothread requires qemu version 2.7 or higher\n"
                    if $drive->{iothread};
            }

            qemu_drive_mirror($vmid, $drivename, $newvolid, $newvmid, $sparseinit, $jobs, $skipcomplete, $qga);
        } else {
            qemu_img_convert($drive->{file}, $newvolid, $size, $snapname, $sparseinit);
        }
    } else {
        print "create linked clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_clone($storecfg, $drive->{file}, $newvmid, $snapname);
        push @$newvollist, $newvolid;
    }

    my ($size) = PVE::Storage::volume_size_info($storecfg, $newvolid, 3);

    # note: this is the caller's hash, not a copy
    my $disk = $drive;
    $disk->{format} = undef;
    $disk->{file} = $newvolid;
    $disk->{size} = $size;

    return $disk;
}
6215
ff556cf2
DM
# Ask a VM for its machine type via the QMP 'query-machines' command.
# this only works if VM is running
#
# Returns the name of the entry flagged 'is-current', else the one flagged
# 'is-default', else 'pc'.
sub get_current_qemu_machine {
    my ($vmid) = @_;

    my $machines = vm_qmp_command($vmid, {
        execute => 'query-machines',
        arguments => {},
    });

    my ($current, $default);
    for my $entry (@$machines) {
        $default = $entry->{name} if $entry->{'is-default'};
        $current = $entry->{name} if $entry->{'is-current'};
    }

    # fallback to the default machine if current is not supported by qemu
    return $current || $default || 'pc';
}
6232
98cfd8b6
AD
# Return the "<major>.<minor>" version string reported by the QMP
# 'query-version' command of VM $vmid.
sub get_running_qemu_version {
    my ($vmid) = @_;

    my $res = vm_qmp_command($vmid, { execute => 'query-version', arguments => {} });
    my $qemu = $res->{qemu};

    return "$qemu->{major}.$qemu->{minor}";
}
6239
23f73120
AD
# Check whether the effective QEMU version is at least
# $version_major.$version_minor.
#
# Parameters:
#   $machine       - optional machine type; for names of the form
#                    pc-<major>.<minor>, pc-i440fx-<major>.<minor> or
#                    pc-q35-<major>.<minor> the embedded version is used
#   $kvmver        - QEMU version string ("<major>.<minor>..."), used when
#                    $machine carries no version
#   $version_major - required major version
#   $version_minor - required minor version
#
# Returns 1 if the requirement is met, 0 otherwise (also when no version
# can be determined).
sub qemu_machine_feature_enabled {
    my ($machine, $kvmver, $version_major, $version_minor) = @_;

    my ($current_major, $current_minor);

    if ($machine && $machine =~ m/^(pc(-i440fx|-q35)?-(\d+)\.(\d+))/) {
        ($current_major, $current_minor) = ($3, $4);
    } elsif (defined($kvmver) && $kvmver =~ m/^(\d+)\.(\d+)/) {
        ($current_major, $current_minor) = ($1, $2);
    }

    return 0 if !defined($current_major);

    # A newer major version satisfies the requirement regardless of its
    # minor number (e.g. 3.0 is newer than 2.7); the minor number only
    # matters when the major versions are equal.
    return 1 if $current_major > $version_major;
    return 1 if $current_major == $version_major && $current_minor >= $version_minor;

    return 0;
}
6261
42dbd2ee
AD
# Return the machine type of a VM, with ".pxe" appended when the 'romfile'
# property of a network device matches /pxe/.
#
# Parameters:
#   $vmid    - VM ID
#   $conf    - VM configuration hash ref
#   $machine - optional machine type; queried from the VM when not given
#
# Only the first parsable netN entry encountered is inspected.
sub qemu_machine_pxe {
    my ($vmid, $conf, $machine) = @_;

    $machine = PVE::QemuServer::get_current_qemu_machine($vmid) if !$machine;

    for my $opt (keys %$conf) {
        next if $opt !~ m/^net(\d+)$/;
        next if !PVE::QemuServer::parse_net($conf->{$opt});

        my $romfile = PVE::QemuServer::vm_mon_cmd_nocheck($vmid, 'qom-get', path => $opt, property => 'romfile');
        return $machine.".pxe" if $romfile =~ m/pxe/;
        last;
    }

    return $machine;
}
6278
249c4a6c
AD
# Decide whether the old (non-efi) pxe bios files have to be used.
#
# Parameter:
#   $machine_type - machine type, optionally carrying a ".pxe" suffix
#
# Returns nothing if $machine_type is empty. Otherwise returns the list
# ($use_old_bios_files, $machine_type), where $machine_type has the
# ".pxe" suffix removed.
sub qemu_use_old_bios_files {
    my ($machine_type) = @_;

    return if !$machine_type;

    # an explicit .pxe suffix always selects the old files
    return (1, $1) if $machine_type =~ m/^(\S+)\.pxe$/;

    my $kvmver = kvm_user_version();
    # Note: kvm version < 2.4 use non-efi pxe files, and have problems when we
    # load new efi bios files on migration. So this hack is required to allow
    # live migration from qemu-2.2 to qemu-2.4, which is sometimes used when
    # updrading from proxmox-ve-3.X to proxmox-ve 4.0
    my $use_old_bios_files = !qemu_machine_feature_enabled ($machine_type, $kvmver, 2, 4);

    return ($use_old_bios_files, $machine_type);
}
6300
4543ecf0
AD
# Enumerate the entries below "$pcisysfs/devices".
#
# Returns a hash ref keyed by the bus:slot part of each matching entry
# name; each value is an array ref of
# { id => <bus:slot>, function => <n> } hashes, sorted by function number.
sub lspci {

    my $devices = {};

    my $collect = sub {
        my (undef, $id, $function) = @_;
        push @{$devices->{$id}}, { id => $id, function => $function};
    };
    dir_glob_foreach("$pcisysfs/devices", '[a-f0-9]{4}:([a-f0-9]{2}:[a-f0-9]{2})\.([0-9])', $collect);

    # Entries should be sorted by functions.
    for my $id (keys %$devices) {
        my @by_function = sort { $a->{function} <=> $b->{function} } @{$devices->{$id}};
        $devices->{$id} = \@by_function;
    }

    return $devices;
}
6319
22de899a
AD
# Query the iothreads of VM $vmid ('query-iothreads').
#
# Returns a hash ref mapping each reported 'id' to its 'thread-id'.
sub vm_iothreads_list {
    my ($vmid) = @_;

    my $res = vm_mon_cmd($vmid, 'query-iothreads');

    my %thread_id_of = map { $_->{id} => $_->{"thread-id"} } @$res;

    return \%thread_id_of;
}
6332
ee034f5c
AD
# Compute SCSI controller placement for a drive.
#
# Parameters:
#   $conf  - VM configuration hash ref (only 'scsihw' is read)
#   $drive - parsed drive hash ref (only 'index' is read)
#
# Returns the list ($maxdev, $controller, $controller_prefix):
#   $maxdev            - 7 when scsihw is unset or starts with 'lsi',
#                        1 for 'virtio-scsi-single', 256 otherwise
#   $controller        - int(drive index / $maxdev)
#   $controller_prefix - 'virtioscsi' for 'virtio-scsi-single',
#                        'scsihw' otherwise
sub scsihw_infos {
    my ($conf, $drive) = @_;

    my $scsihw = $conf->{scsihw};
    my $is_single = $scsihw && $scsihw eq 'virtio-scsi-single';

    my $maxdev = (!$scsihw || $scsihw =~ m/^lsi/) ? 7
               : $is_single                       ? 1
               :                                    256;

    my $controller = int($drive->{index} / $maxdev);
    my $controller_prefix = $is_single ? "virtioscsi" : "scsihw";

    return ($maxdev, $controller, $controller_prefix);
}
a1511b3c 6351
4317f69f
AD
# Append Hyper-V enlightenment CPU flags to @$cpuFlags.
#
# Parameters:
#   $cpuFlags        - array ref the flags are pushed onto
#   $winversion      - numeric Windows version (see windows_version())
#   $machine_type    - machine type, used for the QEMU version checks
#   $kvmver          - QEMU version string, used for the version checks
#   $nokvm           - when true, nothing is added
#   $bios            - BIOS type; with 'ovmf' nothing is added below
#                      Windows version 8
#   $gpu_passthrough - when true, 'hv_vendor_id=proxmox' is added
#
# Nothing is added for Windows versions below 6.
sub add_hyperv_enlighments {
    my ($cpuFlags, $winversion, $machine_type, $kvmver, $nokvm, $bios, $gpu_passthrough) = @_;

    return if $nokvm;
    return if $winversion < 6;
    return if $bios && $bios eq 'ovmf' && $winversion < 8;

    push @$cpuFlags, 'hv_vendor_id=proxmox' if $gpu_passthrough;

    if (qemu_machine_feature_enabled ($machine_type, $kvmver, 2, 3)) {
        push @$cpuFlags, 'hv_spinlocks=0x1fff', 'hv_vapic', 'hv_time';
    } else {
        push @$cpuFlags, 'hv_spinlocks=0xffff';
    }

    if (qemu_machine_feature_enabled ($machine_type, $kvmver, 2, 6)) {
        push @$cpuFlags, 'hv_reset', 'hv_vpindex', 'hv_runtime';
    }

    if ($winversion >= 7) {
        push @$cpuFlags, 'hv_relaxed';
    }
}
6379
# Map an 'ostype' configuration value to a numeric Windows version.
#
# Returns 5 for wxp/w2k3/w2k, 6 for w2k8/wvista, the number N for
# "winN", and 0 for anything else (including an empty ostype).
sub windows_version {
    my ($ostype) = @_;

    return 0 if !$ostype;

    my %legacy_version = (
        wxp    => 5,
        w2k3   => 5,
        w2k    => 5,
        w2k8   => 6,
        wvista => 6,
    );

    return $legacy_version{$ostype} if exists $legacy_version{$ostype};
    return $1 if $ostype =~ m/^win(\d+)$/;

    return 0;
}
6397
44549149
EK
# Choose the image format for a new volume on storage $storeid.
#
# Parameters:
#   $storecfg    - storage configuration
#   $storeid     - target storage ID
#   $src_volname - optional source volume name, used as format hint
#   $format      - optional explicitly requested format
#
# Returns the requested (or hinted) format if the storage lists it as
# valid, otherwise the storage's default format.
sub resolve_dst_disk_format {
    my ($storecfg, $storeid, $src_volname, $format) = @_;
    my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($storecfg, $storeid);

    if (!$format) {
        # without a hint there is nothing to validate
        return $defFormat if !$src_volname;

        # if no target format is specified, use the source disk format as hint
        my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
        $format = qemu_img_format($scfg, $src_volname);
    }

    # test if requested format is supported - else use default
    my $supported = grep { $_ eq $format } @$validFormats;

    return $supported ? $format : $defFormat;
}
6417
65e866e5
DM
6418# bash completion helper
6419
# Bash completion helper: list backup archive volume IDs.
#
# Parameters:
#   $cmdname, $pname - not used here
#   $cvalue          - current value; a leading "<storeid>:" restricts the
#                      listing to that storage
#
# Returns an array ref with the volume IDs of all backups whose format is
# vma.gz or vma.lzo.
sub complete_backup_archives {
    my ($cmdname, $pname, $cvalue) = @_;

    my $cfg = PVE::Storage::config();

    # stays undef when $cvalue has no storage prefix
    my ($storeid) = $cvalue =~ m/^([^:]+):/;

    my $data = PVE::Storage::template_list($cfg, $storeid, 'backup');

    my @volids;
    for my $items (values %$data) {
        for my $item (@$items) {
            next if $item->{format} !~ m/^vma\.(gz|lzo)$/;
            next if !defined($item->{volid});
            push @volids, $item->{volid};
        }
    }

    return \@volids;
}
6443
# Shared implementation of the VMID completion helpers.
#
# Parameter:
#   $running - undef: list every VM returned by vmstatus();
#              true:  only non-template VMs with status 'running';
#              false (but defined): only non-template VMs that are not
#              running
#
# Returns an array ref of VM IDs.
my $complete_vmid_full = sub {
    my ($running) = @_;

    my $idlist = vmstatus();

    my @vmids;

    for my $id (keys %$idlist) {
        my $d = $idlist->{$id};

        if (defined($running)) {
            next if $d->{template};

            my $is_running = $d->{status} eq 'running';
            next if $running ? !$is_running : $is_running;
        }

        push @vmids, $id;
    }

    return \@vmids;
};
6463
# Completion helper: all VM IDs, without any status filter.
sub complete_vmid {
    return $complete_vmid_full->();
}
6467
# Completion helper: IDs of non-template VMs that are not running.
sub complete_vmid_stopped {
    return $complete_vmid_full->(0);
}
6471
# Completion helper: IDs of non-template VMs that are running.
sub complete_vmid_running {
    return $complete_vmid_full->(1);
}
6475
335af808
DM
# Completion helper: list the storage IDs that pass
# storage_check_enabled() and have the 'images' content type configured.
#
# Returns an array ref of storage IDs.
sub complete_storage {

    my $cfg = PVE::Storage::config();
    my $ids = $cfg->{ids};

    my @usable = grep {
        PVE::Storage::storage_check_enabled($cfg, $_, undef, 1)
            && $ids->{$_}->{content}->{images}
    } keys %$ids;

    return \@usable;
}
6490
63a09370
AD
# Send the 'nbd-server-stop' monitor command to VM $vmid.
sub nbd_stop {
    my ($vmid) = @_;

    my @command = ($vmid, 'nbd-server-stop');
    vm_mon_cmd(@command);
}
6496
1e3baf05 64971;