]> git.proxmox.com Git - qemu-server.git/blame - PVE/QemuServer.pm
vmconfig_hotplug_pending : add update_net
[qemu-server.git] / PVE / QemuServer.pm
CommitLineData
1e3baf05
DM
1package PVE::QemuServer;
2
3use strict;
990fc5e2 4use warnings;
1e3baf05
DM
5use POSIX;
6use IO::Handle;
7use IO::Select;
8use IO::File;
9use IO::Dir;
10use IO::Socket::UNIX;
11use File::Basename;
12use File::Path;
13use File::stat;
14use Getopt::Long;
fc1ddcdc 15use Digest::SHA;
1e3baf05
DM
16use Fcntl ':flock';
17use Cwd 'abs_path';
18use IPC::Open3;
c971c4f2 19use JSON;
1e3baf05
DM
20use Fcntl;
21use PVE::SafeSyslog;
22use Storable qw(dclone);
23use PVE::Exception qw(raise raise_param_exc);
24use PVE::Storage;
4543ecf0 25use PVE::Tools qw(run_command lock_file lock_file_full file_read_firstline dir_glob_foreach);
b7ba6b79 26use PVE::JSONSchema qw(get_standard_option);
1e3baf05
DM
27use PVE::Cluster qw(cfs_register_file cfs_read_file cfs_write_file cfs_lock_file);
28use PVE::INotify;
29use PVE::ProcFSTools;
26f11676 30use PVE::QMPClient;
91bd6c90 31use PVE::RPCEnvironment;
6b64503e 32use Time::HiRes qw(gettimeofday);
1e3baf05 33
7f0b5beb 34my $cpuinfo = PVE::ProcFSTools::read_cpuinfo();
1e3baf05 35
# Note about locking: we use flock on the config file to protect
# against concurrent actions.
# Additionally, we have a 'lock' setting in the config file. This
# can be set to 'migrate', 'backup', 'snapshot' or 'rollback'. Most actions are not
# allowed when such a lock is set. But you can ignore this kind of
# lock with the --skiplock flag.
42
97d62eb7 43cfs_register_file('/qemu-server/',
1858638f
DM
44 \&parse_vm_config,
45 \&write_vm_config);
1e3baf05 46
3ea94c60
DM
47PVE::JSONSchema::register_standard_option('skiplock', {
48 description => "Ignore locks - only root is allowed to use this option.",
afdb31d5 49 type => 'boolean',
3ea94c60
DM
50 optional => 1,
51});
52
53PVE::JSONSchema::register_standard_option('pve-qm-stateuri', {
54 description => "Some command save/restore state from this location.",
55 type => 'string',
56 maxLength => 128,
57 optional => 1,
58});
59
8abd398b
DM
60PVE::JSONSchema::register_standard_option('pve-snapshot-name', {
61 description => "The name of the snapshot.",
62 type => 'string', format => 'pve-configid',
63 maxLength => 40,
64});
65
1e3baf05
DM
66#no warnings 'redefine';
67
# Define the fairsched/luid syscall numbers and the KVM_GET_API_VERSION ioctl
# request as constant subs. Everything is guarded by 'unless defined', so
# values that already exist (e.g. from a previously loaded .ph file) win.
# The names suggest this mirrors a vzsyscalls.h header - TODO confirm.
unless(defined(&_VZSYSCALLS_H_)) {
    eval 'sub _VZSYSCALLS_H_ () {1;}' unless defined(&_VZSYSCALLS_H_);
    require 'sys/syscall.ph';
    if(defined(&__x86_64__)) {
        eval 'sub __NR_fairsched_vcpus () {499;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_fairsched_mknod () {504;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {505;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {506;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {507;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {508;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_setluid () {501;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {502;}' unless defined(&__NR_setublimit);
    }
    elsif(defined( &__i386__) ) {
        eval 'sub __NR_fairsched_mknod () {500;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {501;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {502;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {503;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {504;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_fairsched_vcpus () {505;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_setluid () {511;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {512;}' unless defined(&__NR_setublimit);
    } else {
        die("no fairsched syscall for this arch");
    }
    require 'asm/ioctl.ph';
    # KVM ioctl group 0xAE, request number 0x00. The request number used to be
    # spelled as the digit-less literal '0x'; write the intended value explicitly.
    eval 'sub KVM_GET_API_VERSION () { &_IO(0xAE, 0x00);}' unless defined(&KVM_GET_API_VERSION);
}
96
# Invoke the fairsched_mknod syscall.
# All three arguments are coerced to integers before being handed to
# syscall(); the raw syscall() result is returned to the caller.
sub fairsched_mknod {
    my ($parent, $weight, $desired) = @_;

    my @int_args = (int($parent), int($weight), int($desired));

    return syscall(&__NR_fairsched_mknod, @int_args);
}
102
# Invoke the fairsched_rmnod syscall for the given node id.
# The id is coerced to an integer; the raw syscall() result is returned.
sub fairsched_rmnod {
    my ($id) = @_;

    my $node_id = int($id);

    return syscall(&__NR_fairsched_rmnod, $node_id);
}
108
# Invoke the fairsched_mvpr syscall with a process id and a node id.
# Both values are coerced to integers; the raw syscall() result is returned.
sub fairsched_mvpr {
    my ($pid, $newid) = @_;

    my @int_args = (int($pid), int($newid));

    return syscall(&__NR_fairsched_mvpr, @int_args);
}
114
# Invoke the fairsched_vcpus syscall with a node id and a vcpu count.
# Both values are coerced to integers; the raw syscall() result is returned.
sub fairsched_vcpus {
    my ($id, $vcpus) = @_;

    my @int_args = (int($id), int($vcpus));

    return syscall(&__NR_fairsched_vcpus, @int_args);
}
120
# Invoke the fairsched_rate syscall.
# $op is expected to be one of the FAIRSCHED_*_RATE constants. All three
# arguments are coerced to integers; the raw syscall() result is returned.
sub fairsched_rate {
    my ($id, $op, $rate) = @_;

    my @int_args = (int($id), int($op), int($rate));

    return syscall(&__NR_fairsched_rate, @int_args);
}
126
127use constant FAIRSCHED_SET_RATE => 0;
128use constant FAIRSCHED_DROP_RATE => 1;
129use constant FAIRSCHED_GET_RATE => 2;
130
# Apply a CPU limit (given in percent) to a fairsched node.
# The percentage is rescaled to 1/1024 units and truncated to an integer.
# A resulting rate of zero drops the limit instead of setting it.
sub fairsched_cpulimit {
    my ($id, $limit) = @_;

    my $rate = int($limit * 1024 / 100);

    if (!$rate) {
        return fairsched_rate($id, FAIRSCHED_DROP_RATE, $rate);
    }

    return fairsched_rate($id, FAIRSCHED_SET_RATE, $rate);
}
139
140my $nodename = PVE::INotify::nodename();
141
142mkdir "/etc/pve/nodes/$nodename";
143my $confdir = "/etc/pve/nodes/$nodename/qemu-server";
144mkdir $confdir;
145
146my $var_run_tmpdir = "/var/run/qemu-server";
147mkdir $var_run_tmpdir;
148
149my $lock_dir = "/var/lock/qemu-server";
150mkdir $lock_dir;
151
152my $pcisysfs = "/sys/bus/pci";
153
1e3baf05 154my $confdesc = {
7183bd9a
AD
155 iothread => {
156 optional => 1,
157 type => 'boolean',
158 description => "Enable iothread dataplane.",
159 default => 0,
160 },
1e3baf05
DM
161 onboot => {
162 optional => 1,
163 type => 'boolean',
164 description => "Specifies whether a VM will be started during system bootup.",
165 default => 0,
166 },
167 autostart => {
168 optional => 1,
169 type => 'boolean',
170 description => "Automatic restart after crash (currently ignored).",
171 default => 0,
172 },
2ff09f52
DA
173 hotplug => {
174 optional => 1,
e8b9c17c 175 type => 'boolean',
6c52b679 176 description => "Allow hotplug for disk and network device",
2dbe827e 177 default => 0,
2ff09f52 178 },
1e3baf05
DM
179 reboot => {
180 optional => 1,
181 type => 'boolean',
182 description => "Allow reboot. If set to '0' the VM exit on reboot.",
183 default => 1,
184 },
185 lock => {
186 optional => 1,
187 type => 'string',
188 description => "Lock/unlock the VM.",
22c377f0 189 enum => [qw(migrate backup snapshot rollback)],
1e3baf05
DM
190 },
191 cpulimit => {
192 optional => 1,
193 type => 'integer',
194 description => "Limit of CPU usage in per cent. Note if the computer has 2 CPUs, it has total of 200% CPU time. Value '0' indicates no CPU limit.\n\nNOTE: This option is currently ignored.",
195 minimum => 0,
196 default => 0,
197 },
198 cpuunits => {
199 optional => 1,
200 type => 'integer',
201 description => "CPU weight for a VM. Argument is used in the kernel fair scheduler. The larger the number is, the more CPU time this VM gets. Number is relative to weights of all the other running VMs.\n\nNOTE: You can disable fair-scheduler configuration by setting this to 0.",
202 minimum => 0,
203 maximum => 500000,
204 default => 1000,
205 },
206 memory => {
207 optional => 1,
208 type => 'integer',
7878afeb 209 description => "Amount of RAM for the VM in MB. This is the maximum available memory when you use the balloon device.",
1e3baf05
DM
210 minimum => 16,
211 default => 512,
212 },
13a48620
DA
213 balloon => {
214 optional => 1,
215 type => 'integer',
8b1accf7
DM
216 description => "Amount of target RAM for the VM in MB. Using zero disables the ballon driver.",
217 minimum => 0,
218 },
219 shares => {
220 optional => 1,
221 type => 'integer',
222 description => "Amount of memory shares for auto-ballooning. The larger the number is, the more memory this VM gets. Number is relative to weights of all other running VMs. Using zero disables auto-ballooning",
223 minimum => 0,
224 maximum => 50000,
225 default => 1000,
13a48620 226 },
1e3baf05
DM
227 keyboard => {
228 optional => 1,
229 type => 'string',
230 description => "Keybord layout for vnc server. Default is read from the datacenter configuration file.",
e95fe75f 231 enum => PVE::Tools::kvmkeymaplist(),
1e3baf05
DM
232 default => 'en-us',
233 },
234 name => {
235 optional => 1,
7fabe17d 236 type => 'string', format => 'dns-name',
1e3baf05
DM
237 description => "Set a name for the VM. Only used on the configuration web interface.",
238 },
cdd20088
AD
239 scsihw => {
240 optional => 1,
241 type => 'string',
242 description => "scsi controller model",
5b952ff5 243 enum => [qw(lsi lsi53c810 virtio-scsi-pci megasas pvscsi)],
cdd20088
AD
244 default => 'lsi',
245 },
1e3baf05
DM
246 description => {
247 optional => 1,
248 type => 'string',
0581fe4f 249 description => "Description for the VM. Only used on the configuration web interface. This is saved as comment inside the configuration file.",
1e3baf05
DM
250 },
251 ostype => {
252 optional => 1,
253 type => 'string',
6b9d84cf 254 enum => [qw(other wxp w2k w2k3 w2k8 wvista win7 win8 l24 l26 solaris)],
1e3baf05
DM
255 description => <<EODESC,
256Used to enable special optimization/features for specific
257operating systems:
258
259other => unspecified OS
260wxp => Microsoft Windows XP
261w2k => Microsoft Windows 2000
262w2k3 => Microsoft Windows 2003
263w2k8 => Microsoft Windows 2008
264wvista => Microsoft Windows Vista
265win7 => Microsoft Windows 7
a70ebde3 266win8 => Microsoft Windows 8/2012
1e3baf05
DM
267l24 => Linux 2.4 Kernel
268l26 => Linux 2.6/3.X Kernel
6b9d84cf 269solaris => solaris/opensolaris/openindiania kernel
1e3baf05 270
6b9d84cf 271other|l24|l26|solaris ... no special behaviour
a70ebde3 272wxp|w2k|w2k3|w2k8|wvista|win7|win8 ... use --localtime switch
1e3baf05
DM
273EODESC
274 },
275 boot => {
276 optional => 1,
277 type => 'string',
278 description => "Boot on floppy (a), hard disk (c), CD-ROM (d), or network (n).",
279 pattern => '[acdn]{1,4}',
32baffb4 280 default => 'cdn',
1e3baf05
DM
281 },
282 bootdisk => {
283 optional => 1,
284 type => 'string', format => 'pve-qm-bootdisk',
285 description => "Enable booting from specified disk.",
03e480fc 286 pattern => '(ide|sata|scsi|virtio)\d+',
1e3baf05
DM
287 },
288 smp => {
289 optional => 1,
290 type => 'integer',
291 description => "The number of CPUs. Please use option -sockets instead.",
292 minimum => 1,
293 default => 1,
294 },
295 sockets => {
296 optional => 1,
297 type => 'integer',
298 description => "The number of CPU sockets.",
299 minimum => 1,
300 default => 1,
301 },
302 cores => {
303 optional => 1,
304 type => 'integer',
305 description => "The number of cores per socket.",
306 minimum => 1,
307 default => 1,
308 },
8a010eae
AD
309 numa => {
310 optional => 1,
311 type => 'boolean',
312 description => "Enable/disable Numa.",
313 default => 0,
314 },
3bd18e48
AD
315 maxcpus => {
316 optional => 1,
317 type => 'integer',
318 description => "Maximum cpus for hotplug.",
319 minimum => 1,
320 default => 1,
321 },
1e3baf05
DM
322 acpi => {
323 optional => 1,
324 type => 'boolean',
325 description => "Enable/disable ACPI.",
326 default => 1,
327 },
bc84dcca 328 agent => {
ab6a046f
AD
329 optional => 1,
330 type => 'boolean',
331 description => "Enable/disable Qemu GuestAgent.",
be79c214 332 default => 0,
ab6a046f 333 },
1e3baf05
DM
334 kvm => {
335 optional => 1,
336 type => 'boolean',
337 description => "Enable/disable KVM hardware virtualization.",
338 default => 1,
339 },
340 tdf => {
341 optional => 1,
342 type => 'boolean',
8c559505
DM
343 description => "Enable/disable time drift fix.",
344 default => 0,
1e3baf05 345 },
19672434 346 localtime => {
1e3baf05
DM
347 optional => 1,
348 type => 'boolean',
349 description => "Set the real time clock to local time. This is enabled by default if ostype indicates a Microsoft OS.",
350 },
351 freeze => {
352 optional => 1,
353 type => 'boolean',
354 description => "Freeze CPU at startup (use 'c' monitor command to start execution).",
355 },
356 vga => {
357 optional => 1,
358 type => 'string',
ef5e2be2 359 description => "Select VGA type. If you want to use high resolution modes (>= 1280x1024x16) then you should use option 'std' or 'vmware'. Default is 'std' for win8/win7/w2k8, and 'cirrur' for other OS types. Option 'qxl' enables the SPICE display sever. You can also run without any graphic card using a serial devive as terminal.",
2fa3151e 360 enum => [qw(std cirrus vmware qxl serial0 serial1 serial2 serial3 qxl2 qxl3 qxl4)],
1e3baf05 361 },
0ea9541d
DM
362 watchdog => {
363 optional => 1,
364 type => 'string', format => 'pve-qm-watchdog',
365 typetext => '[[model=]i6300esb|ib700] [,[action=]reset|shutdown|poweroff|pause|debug|none]',
366 description => "Create a virtual hardware watchdog device. Once enabled (by a guest action), the watchdog must be periodically polled by an agent inside the guest or else the guest will be restarted (or execute the action specified)",
367 },
1e3baf05
DM
368 startdate => {
369 optional => 1,
19672434 370 type => 'string',
1e3baf05
DM
371 typetext => "(now | YYYY-MM-DD | YYYY-MM-DDTHH:MM:SS)",
372 description => "Set the initial date of the real time clock. Valid format for date are: 'now' or '2006-06-17T16:01:21' or '2006-06-17'.",
373 pattern => '(now|\d{4}-\d{1,2}-\d{1,2}(T\d{1,2}:\d{1,2}:\d{1,2})?)',
374 default => 'now',
375 },
59411c4e
DM
376 startup => {
377 optional => 1,
378 type => 'string', format => 'pve-qm-startup',
379 typetext => '[[order=]\d+] [,up=\d+] [,down=\d+] ',
380 description => "Startup and shutdown behavior. Order is a non-negative number defining the general startup order. Shutdown in done with reverse ordering. Additionally you can set the 'up' or 'down' delay in seconds, which specifies a delay to wait before the next VM is started or stopped.",
381 },
68eda3ab
AD
382 template => {
383 optional => 1,
384 type => 'boolean',
385 description => "Enable/disable Template.",
386 default => 0,
387 },
1e3baf05
DM
388 args => {
389 optional => 1,
390 type => 'string',
391 description => <<EODESCR,
392Note: this option is for experts only. It allows you to pass arbitrary arguments to kvm, for example:
393
394args: -no-reboot -no-hpet
395EODESCR
396 },
397 tablet => {
398 optional => 1,
399 type => 'boolean',
400 default => 1,
5acbfe9e 401 description => "Enable/disable the usb tablet device. This device is usually needed to allow absolute mouse positioning with VNC. Else the mouse runs out of sync with normal VNC clients. If you're running lots of console-only guests on one host, you may consider disabling this to save some context switches. This is turned of by default if you use spice (vga=qxl).",
1e3baf05
DM
402 },
403 migrate_speed => {
404 optional => 1,
405 type => 'integer',
406 description => "Set maximum speed (in MB/s) for migrations. Value 0 is no limit.",
407 minimum => 0,
408 default => 0,
409 },
410 migrate_downtime => {
411 optional => 1,
04432191 412 type => 'number',
1e3baf05
DM
413 description => "Set maximum tolerated downtime (in seconds) for migrations.",
414 minimum => 0,
04432191 415 default => 0.1,
1e3baf05
DM
416 },
417 cdrom => {
418 optional => 1,
419 type => 'string', format => 'pve-qm-drive',
420 typetext => 'volume',
421 description => "This is an alias for option -ide2",
422 },
423 cpu => {
424 optional => 1,
425 description => "Emulated CPU type.",
426 type => 'string',
3aefd6fd 427 enum => [ qw(486 athlon pentium pentium2 pentium3 coreduo core2duo kvm32 kvm64 qemu32 qemu64 phenom Conroe Penryn Nehalem Westmere SandyBridge Haswell Broadwell Opteron_G1 Opteron_G2 Opteron_G3 Opteron_G4 Opteron_G5 host) ],
eac6899d 428 default => 'kvm64',
1e3baf05 429 },
b7ba6b79
DM
430 parent => get_standard_option('pve-snapshot-name', {
431 optional => 1,
432 description => "Parent snapshot name. This is used internally, and should not be modified.",
433 }),
982c7f12
DM
434 snaptime => {
435 optional => 1,
436 description => "Timestamp for snapshots.",
437 type => 'integer',
438 minimum => 0,
439 },
18bfb361
DM
440 vmstate => {
441 optional => 1,
442 type => 'string', format => 'pve-volume-id',
443 description => "Reference to a volume which stores the VM state. This is used internally for snapshots.",
444 },
3bafc510
DM
445 machine => {
446 description => "Specific the Qemu machine type.",
447 type => 'string',
448 pattern => '(pc|pc(-i440fx)?-\d+\.\d+|q35|pc-q35-\d+\.\d+)',
449 maxLength => 40,
450 optional => 1,
451 },
2796e7d5
DM
452 smbios1 => {
453 description => "Specify SMBIOS type 1 fields.",
454 type => 'string', format => 'pve-qm-smbios1',
455 typetext => "[manufacturer=str][,product=str][,version=str][,serial=str] [,uuid=uuid][,sku=str][,family=str]",
456 maxLength => 256,
457 optional => 1,
458 },
1e3baf05
DM
459};
460
461# what about other qemu settings ?
462#cpu => 'string',
463#machine => 'string',
464#fda => 'file',
465#fdb => 'file',
466#mtdblock => 'file',
467#sd => 'file',
468#pflash => 'file',
469#snapshot => 'bool',
470#bootp => 'file',
471##tftp => 'dir',
472##smb => 'dir',
473#kernel => 'file',
474#append => 'string',
475#initrd => 'file',
476##soundhw => 'string',
477
478while (my ($k, $v) = each %$confdesc) {
479 PVE::JSONSchema::register_standard_option("pve-qm-$k", $v);
480}
481
482my $MAX_IDE_DISKS = 4;
f62db2a4 483my $MAX_SCSI_DISKS = 14;
a2650619 484my $MAX_VIRTIO_DISKS = 16;
cdb0931f 485my $MAX_SATA_DISKS = 6;
1e3baf05 486my $MAX_USB_DEVICES = 5;
5bdcf937 487my $MAX_NETS = 32;
1e3baf05 488my $MAX_UNUSED_DISKS = 8;
5cffb2d2 489my $MAX_HOSTPCI_DEVICES = 4;
bae179aa 490my $MAX_SERIAL_PORTS = 4;
1989a89c 491my $MAX_PARALLEL_PORTS = 3;
2ed5d572
AD
492my $MAX_NUMA = 8;
493
# Schema shared by every numaN option (numa0 .. numa<$MAX_NUMA - 1>).
# The typetext is purely informational; parsing is delegated to the
# 'pve-qm-numanode' format.
my $numadesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-numanode',
    typetext => "cpus=<id[-id]>,memory=<mb>[[,hostnodes=<id[-id]>][,policy=<preferred|bind|interleave>]]",
    description => "numa topology",
};
500PVE::JSONSchema::register_standard_option("pve-qm-numanode", $numadesc);
501
502for (my $i = 0; $i < $MAX_NUMA; $i++) {
503 $confdesc->{"numa$i"} = $numadesc;
504}
1e3baf05
DM
505
506my $nic_model_list = ['rtl8139', 'ne2k_pci', 'e1000', 'pcnet', 'virtio',
e4c6e0b8 507 'ne2k_isa', 'i82551', 'i82557b', 'i82559er', 'vmxnet3'];
6b64503e 508my $nic_model_list_txt = join(' ', sort @$nic_model_list);
1e3baf05 509
1e3baf05
DM
510my $netdesc = {
511 optional => 1,
512 type => 'string', format => 'pve-qm-net',
a9410357 513 typetext => "MODEL=XX:XX:XX:XX:XX:XX [,bridge=<dev>][,queues=<nbqueues>][,rate=<mbps>][,tag=<vlanid>][,firewall=0|1]",
1e3baf05 514 description => <<EODESCR,
19672434 515Specify network devices.
1e3baf05
DM
516
517MODEL is one of: $nic_model_list_txt
518
19672434 519XX:XX:XX:XX:XX:XX should be an unique MAC address. This is
1e3baf05
DM
520automatically generated if not specified.
521
522The bridge parameter can be used to automatically add the interface to a bridge device. The Proxmox VE standard bridge is called 'vmbr0'.
523
524Option 'rate' is used to limit traffic bandwidth from and to this interface. It is specified as floating point number, unit is 'Megabytes per second'.
525
526If you specify no bridge, we create a kvm 'user' (NATed) network device, which provides DHCP and DNS services. The following addresses are used:
527
52810.0.2.2 Gateway
52910.0.2.3 DNS Server
53010.0.2.4 SMB Server
531
532The DHCP server assign addresses to the guest starting from 10.0.2.15.
533
534EODESCR
535};
536PVE::JSONSchema::register_standard_option("pve-qm-net", $netdesc);
537
538for (my $i = 0; $i < $MAX_NETS; $i++) {
539 $confdesc->{"net$i"} = $netdesc;
540}
541
542my $drivename_hash;
19672434 543
1e3baf05
DM
# Human readable syntax summary shared by all drive buses (ide, scsi, sata,
# virtio). Kept in one place so the four schemas cannot drift apart.
my $drive_typetext = '[volume=]volume [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]';

# Schema for the ideN options.
my $idedesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as IDE hard disk or CD-ROM (n is 0 to " .($MAX_IDE_DISKS -1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-ide", $idedesc);

# Schema for the scsiN options.
my $scsidesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as SCSI hard disk or CD-ROM (n is 0 to " . ($MAX_SCSI_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-scsi", $scsidesc);

# Schema for the sataN options.
my $satadesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as SATA hard disk or CD-ROM (n is 0 to " . ($MAX_SATA_DISKS - 1). ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-sata", $satadesc);

# Schema for the virtioN options.
my $virtiodesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as VIRTIO hard disk (n is 0 to " . ($MAX_VIRTIO_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-virtio", $virtiodesc);
575
# Schema for the usbN options. The value is either a host USB device
# reference or the keyword 'spice' (see typetext).
my $usbdesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-usb-device',
    typetext => 'host=HOSTUSBDEVICE|spice',
    description => <<EODESCR,
Configure a USB device (n is 0 to 4). This can be used to
pass-through usb devices to the guest. HOSTUSBDEVICE syntax is:

'bus-port(.port)*' (decimal numbers) or
'vendor_id:product_id' (hexadecimal numbers)

You can use the 'lsusb -t' command to list existing usb devices.

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

The value 'spice' can be used to add a usb redirection device for spice.

EODESCR
};
595PVE::JSONSchema::register_standard_option("pve-qm-usb", $usbdesc);
596
040b06b7
DA
# Schema for the hostpciN options (host PCI device pass-through).
my $hostpcidesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-hostpci',
    typetext => "[host=]HOSTPCIDEVICE [,driver=kvm|vfio] [,rombar=on|off] [,pcie=0|1] [,x-vga=on|off]",
    description => <<EODESCR,
Map host pci devices. HOSTPCIDEVICE syntax is:

'bus:dev.func' (hexadecimal numbers)

You can use the 'lspci' command to list existing pci devices.

The 'rombar' option determines whether or not the device's ROM will be visible in the guest's memory map (default is 'on').

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};
615PVE::JSONSchema::register_standard_option("pve-qm-hostpci", $hostpcidesc);
616
bae179aa
DA
617my $serialdesc = {
618 optional => 1,
ca0cef26 619 type => 'string',
1b0b51ed 620 pattern => '(/dev/.+|socket)',
bae179aa 621 description => <<EODESCR,
1b0b51ed 622Create a serial device inside the VM (n is 0 to 3), and pass through a host serial device (i.e. /dev/ttyS0), or create a unix socket on the host side (use 'qm terminal' to open a terminal connection).
bae179aa
DA
623
624Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
625
626Experimental: user reported problems with this option.
627EODESCR
628};
bae179aa 629
1989a89c
DA
630my $paralleldesc= {
631 optional => 1,
ca0cef26 632 type => 'string',
9ecc8431 633 pattern => '/dev/parport\d+|/dev/usb/lp\d+',
1989a89c 634 description => <<EODESCR,
19672434 635Map host parallel devices (n is 0 to 2).
1989a89c
DA
636
637Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
638
639Experimental: user reported problems with this option.
640EODESCR
641};
1989a89c
DA
642
643for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
644 $confdesc->{"parallel$i"} = $paralleldesc;
645}
646
bae179aa
DA
647for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
648 $confdesc->{"serial$i"} = $serialdesc;
649}
650
040b06b7
DA
651for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
652 $confdesc->{"hostpci$i"} = $hostpcidesc;
653}
1e3baf05
DM
654
655for (my $i = 0; $i < $MAX_IDE_DISKS; $i++) {
656 $drivename_hash->{"ide$i"} = 1;
657 $confdesc->{"ide$i"} = $idedesc;
658}
659
cdb0931f
DA
660for (my $i = 0; $i < $MAX_SATA_DISKS; $i++) {
661 $drivename_hash->{"sata$i"} = 1;
662 $confdesc->{"sata$i"} = $satadesc;
663}
664
1e3baf05
DM
665for (my $i = 0; $i < $MAX_SCSI_DISKS; $i++) {
666 $drivename_hash->{"scsi$i"} = 1;
667 $confdesc->{"scsi$i"} = $scsidesc ;
668}
669
670for (my $i = 0; $i < $MAX_VIRTIO_DISKS; $i++) {
671 $drivename_hash->{"virtio$i"} = 1;
672 $confdesc->{"virtio$i"} = $virtiodesc;
673}
674
675for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
676 $confdesc->{"usb$i"} = $usbdesc;
677}
678
679my $unuseddesc = {
680 optional => 1,
681 type => 'string', format => 'pve-volume-id',
682 description => "Reference to unused volumes.",
683};
684
685for (my $i = 0; $i < $MAX_UNUSED_DISKS; $i++) {
686 $confdesc->{"unused$i"} = $unuseddesc;
687}
688
689my $kvm_api_version = 0;
690
# Return the KVM API version reported by /dev/kvm.
# The value is cached in $kvm_api_version once a true value was obtained.
# Returns 0 when /dev/kvm cannot be opened; when the ioctl yields no true
# value the (still false) cached value is returned.
sub kvm_version {

    return $kvm_api_version if $kvm_api_version;

    my $fh = IO::File->new("</dev/kvm");
    return 0 if !$fh;

    my $v = $fh->ioctl(KVM_GET_API_VERSION(), 0);
    $kvm_api_version = $v if $v;

    $fh->close();

    return $kvm_api_version;
}
706
707my $kvm_user_version;
708
# Return the version string of the userspace 'kvm' binary.
# The version is parsed from the output of 'kvm -help'; if it cannot be
# found there, the string 'unknown' is returned. The result is cached in
# $kvm_user_version.
sub kvm_user_version {

    return $kvm_user_version if $kvm_user_version;

    my $help_output = `kvm -help 2>/dev/null`;

    # the second capture group holds the dotted version number
    my (undef, $version) =
        $help_output =~ m/^QEMU( PC)? emulator version (\d+\.\d+(\.\d+)?)[,\s]/;

    $kvm_user_version = defined($version) ? $version : 'unknown';

    return $kvm_user_version;
}
724
725my $kernel_has_vhost_net = -c '/dev/vhost-net';
726
# Return the names of all possible drive slots: ide*, scsi*, virtio*, sata*.
# order is important - used to autoselect boot disk
sub disknames {
    # expands one bus prefix into "<bus>0" .. "<bus><max - 1>"
    my $slots = sub {
        my ($bus, $max) = @_;
        return map { "$bus$_" } (0 .. ($max - 1));
    };

    return ($slots->('ide', $MAX_IDE_DISKS),
            $slots->('scsi', $MAX_SCSI_DISKS),
            $slots->('virtio', $MAX_VIRTIO_DISKS),
            $slots->('sata', $MAX_SATA_DISKS));
}
734
# Tell whether $dev is a known drive slot name, i.e. has an entry in
# $drivename_hash (filled for ide/sata/scsi/virtio slots at load time).
sub valid_drivename {
    my ($dev) = @_;

    my $known = defined($drivename_hash->{$dev});

    return $known;
}
740
# Tell whether $key is a configuration option described in $confdesc.
sub option_exists {
    my ($key) = @_;

    my $known = defined($confdesc->{$key});

    return $known;
}
1e3baf05
DM
745
# Accessor for the list of supported NIC models.
# Returns the module-level array reference itself, not a copy.
sub nic_models {
    my $models = $nic_model_list;

    return $models;
}
749
# Return a hash reference mapping each 'ostype' value to a short,
# human readable label. Every value allowed by the ostype enum has an
# entry here, including 'solaris'.
sub os_list_description {

    return {
        other => 'Other',
        wxp => 'Windows XP',
        w2k => 'Windows 2000',
        w2k3 => 'Windows 2003',
        w2k8 => 'Windows 2008',
        wvista => 'Windows Vista',
        win7 => 'Windows 7',
        win8 => 'Windows 8/2012',
        l24 => 'Linux 2.4',
        l26 => 'Linux 2.6',
        solaris => 'Solaris/OpenSolaris/OpenIndiana',
    };
}
765
1e3baf05
DM
766my $cdrom_path;
767
# Locate the host CD-ROM device.
# Checks /dev/cdrom, /dev/cdrom1 and /dev/cdrom2 (in that order) and returns
# the first one that is a symbolic link. A successful lookup is cached in
# $cdrom_path. Returns undef when none of the candidates exists as a symlink
# (previously the result of the last failed file test leaked out as the
# implicit return value).
sub get_cdrom_path {

    return $cdrom_path if $cdrom_path;

    foreach my $candidate ("/dev/cdrom", "/dev/cdrom1", "/dev/cdrom2") {
        return $cdrom_path = $candidate if -l $candidate;
    }

    # explicit scalar undef keeps the one-element shape callers got before
    return undef;
}
776
# Resolve the 'file' value of a CD-ROM drive to a filesystem path:
#   'cdrom'        -> host CD-ROM device as found by get_cdrom_path()
#   'none'         -> empty string
#   absolute path  -> returned unchanged
#   anything else  -> handed to PVE::Storage::path() together with $storecfg
# $vmid is accepted but not used here.
sub get_iso_path {
    my ($storecfg, $vmid, $cdrom) = @_;

    return get_cdrom_path() if $cdrom eq 'cdrom';
    return '' if $cdrom eq 'none';
    return $cdrom if $cdrom =~ m|^/|;

    return PVE::Storage::path($storecfg, $cdrom);
}
790
# try to convert old style file names to volume IDs
#
# 'none', 'cdrom', /dev/... paths and values that already look like
# 'storage:volume' are returned unchanged. Any other value containing a
# slash is rejected (undef). A plain file name becomes 'local:iso/<file>'
# for media 'cdrom' and 'local:<vmid>/<file>' otherwise.
sub filename_to_volume_id {
    my ($vmid, $file, $media) = @_;

    # values that need no conversion
    return $file if $file eq 'none' || $file eq 'cdrom';
    return $file if $file =~ m|^/dev/.+|;
    return $file if $file =~ m/^([^:]+):(.+)$/;

    # other paths cannot be mapped to a volume
    return undef if $file =~ m|/|;

    my $subdir = ($media && $media eq 'cdrom') ? 'iso' : $vmid;

    return "local:$subdir/$file";
}
809
# Check that the storage volume type $vtype fits the drive's media setting.
# Media 'disk' expects volume type 'images', media 'cdrom' expects 'iso'.
# Nothing is checked when $media is not set. Any other media value dies
# with an internal error; a mismatch raises a parameter exception for $opt.
sub verify_media_type {
    my ($opt, $vtype, $media) = @_;

    return if !$media;

    my %expected_type_for = (
        disk => 'images',
        cdrom => 'iso',
    );

    my $etype = $expected_type_for{$media};
    die "internal error" if !defined($etype);

    return if ($vtype eq $etype);

    raise_param_exc({ $opt => "unexpected media type ($vtype != $etype)" });
}
828
# Normalize the 'file' and 'media' settings of a parsed drive in place.
# A value that is neither 'cdrom'/'none', a /dev/ path, a 'storage:volume'
# id nor a plain number is treated as a filesystem path and mapped to a
# volume id via PVE::Storage::path_to_volume_id(); failure to map raises
# a parameter exception for $opt. Media defaults to 'cdrom' for iso
# volumes and for the special values 'cdrom' and 'none'.
sub cleanup_drive_path {
    my ($opt, $storecfg, $drive) = @_;

    # try to convert filesystem paths to volume IDs

    my $file = $drive->{file};

    my $is_fs_path = ($file !~ m/^(cdrom|none)$/)
        && ($file !~ m|^/dev/.+|)
        && ($file !~ m/^([^:]+):(.+)$/)
        && ($file !~ m/^\d+$/);

    if ($is_fs_path) {
        my ($vtype, $volid) = PVE::Storage::path_to_volume_id($storecfg, $drive->{file});
        if (!$vtype) {
            raise_param_exc({ $opt => "unable to associate path '$drive->{file}' to any storage"});
        }
        if (!$drive->{media} && $vtype eq 'iso') {
            $drive->{media} = 'cdrom';
        }
        verify_media_type($opt, $vtype, $drive->{media});
        $drive->{file} = $volid;
    }

    $drive->{media} = 'cdrom' if !$drive->{media} && $drive->{file} =~ m/^(cdrom|none)$/;
}
# Write an initial configuration file for VM $vmid (no locking is done here).
# Dies if the file already exists. Missing 'name' and 'memory' settings are
# filled in ("vm<vmid>" and the default memory size). Only options known to
# $confdesc that carry a true value are written, one "key: value" per line.
sub create_conf_nolock {
    my ($vmid, $settings) = @_;

    my $filename = config_file($vmid);

    die "configuration file '$filename' already exists\n" if -f $filename;

    my $defaults = load_defaults();

    $settings->{name} ||= "vm$vmid";
    $settings->{memory} ||= $defaults->{memory};

    # keep only known options with a true value
    my @wanted = grep { $confdesc->{$_} && $settings->{$_} } keys %$settings;

    my $data = join('', map { "$_: $settings->{$_}\n" } @wanted);

    PVE::Tools::file_set_contents($filename, $data);
}
872
f36ed4f4
DM
# Parse a size such as '512', '1.5K', '32M' or '4G' into a number of bytes.
# K, M and G are powers of 1024; the result is truncated to an integer.
# Returns undef when the value does not have that form.
my $parse_size = sub {
    my ($value) = @_;

    my %bytes_per_unit = (
        K => 1024,
        M => 1024 * 1024,
        G => 1024 * 1024 * 1024,
    );

    if ($value =~ m/^(\d+(\.\d+)?)([KMG])?$/) {
        my ($amount, $suffix) = ($1, $3);
        $amount = $amount * $bytes_per_unit{$suffix} if $suffix;
        return int($amount);
    }

    return undef;
};
889
# Render a byte count using the largest unit (K, M or G, powers of 1024)
# that divides it without remainder. Values that are not a multiple of
# 1024 are returned as a plain integer. The input is truncated to an
# integer first.
my $format_size = sub {
    my ($size) = @_;

    my $bytes = int($size);

    my $kib = int($bytes / 1024);
    if ($kib * 1024 == $bytes) {
        my $mib = int($kib / 1024);
        if ($mib * 1024 == $kib) {
            my $gib = int($mib / 1024);
            return ($gib * 1024 == $mib) ? "${gib}G" : "${mib}M";
        }
        return "${kib}K";
    }

    return $bytes;
};
906
1e3baf05
DM
907# ideX = [volume=]volume-id[,media=d][,cyls=c,heads=h,secs=s[,trans=t]]
908# [,snapshot=on|off][,cache=on|off][,format=f][,backup=yes|no]
036e0e2b 909# [,rerror=ignore|report|stop][,werror=enospc|ignore|report|stop]
8d87f8aa 910# [,aio=native|threads][,discard=ignore|on]
1e3baf05
DM
911
# Parse a drive property string (format described in the comment above)
# into a hash.
#
# $key  - config key such as "ide0" or "virtio1"; it supplies the
#         'interface' and 'index' entries of the result. May be undef when
#         the function is only used to verify a value.
# $data - comma separated list of "option=value" pairs; the first element
#         may be a bare volume id / path without "file=".
#
# Returns the hash reference, or undef when anything is invalid. The byte
# based limits bps, bps_rd and bps_wr are stored as mbps, mbps_rd and
# mbps_wr (megabytes per second, three decimals).
sub parse_drive {
    my ($key, $data) = @_;

    my $res = {};

    # $key may be undefined - used to verify JSON parameters
    if (!defined($key)) {
        $res->{interface} = 'unknown'; # should not harm when used to verify parameters
        $res->{index} = 0;
    } elsif ($key =~ m/^([^\d]+)(\d+)$/) {
        $res->{interface} = $1;
        $res->{index} = $2;
    } else {
        return undef;
    }

    foreach my $p (split (/,/, $data)) {
        next if $p =~ m/^\s*$/;

        if ($p =~ m/^(file|volume|cyls|heads|secs|trans|media|snapshot|cache|format|rerror|werror|backup|aio|bps|mbps|mbps_max|bps_rd|mbps_rd|mbps_rd_max|bps_wr|mbps_wr|mbps_wr_max|iops|iops_max|iops_rd|iops_rd_max|iops_wr|iops_wr_max|size|discard)=(.+)$/) {
            my ($k, $v) = ($1, $2);

            $k = 'file' if $k eq 'volume';

            if ($k eq 'bps' || $k eq 'bps_rd' || $k eq 'bps_wr') {
                # the whole value has to be numeric, not just its beginning
                return undef if !$v || $v !~ m/^\d+(?:\.\d+)?$/;
                $k = "m$k";
                $v = sprintf("%.3f", $v / (1024*1024));
            }

            # checked after the bps -> mbps renaming, so that giving both
            # spellings of one limit counts as a duplicate as well
            return undef if defined $res->{$k};

            $res->{$k} = $v;
        } else {
            # a single bare element is accepted as the volume
            if (!$res->{file} && $p !~ m/=/) {
                $res->{file} = $p;
            } else {
                return undef;
            }
        }
    }

    return undef if !$res->{file};

    # a known image file extension determines the format
    if ($res->{file} =~ m/\.(raw|cow|qcow|qcow2|vmdk|cloop)$/) {
        $res->{format} = $1;
    }

    # value syntax per option; options that are unset (or false) are not checked
    my $integer_re = qr/^\d+$/;
    my $decimal_re = qr/^\d+(\.\d+)?$/;
    my %value_re_for = (
        cache    => qr/^(off|none|writethrough|writeback|unsafe|directsync)$/,
        snapshot => qr/^(on|off)$/,
        cyls     => $integer_re,
        heads    => $integer_re,
        secs     => $integer_re,
        media    => qr/^(disk|cdrom)$/,
        trans    => qr/^(none|lba|auto)$/,
        format   => qr/^(raw|cow|qcow|qcow2|vmdk|cloop)$/,
        rerror   => qr/^(ignore|report|stop)$/,
        werror   => qr/^(enospc|ignore|report|stop)$/,
        backup   => qr/^(yes|no)$/,
        aio      => qr/^(native|threads)$/,
        discard  => qr/^(ignore|on)$/,
        (map { ($_ => $decimal_re) } qw(mbps mbps_max mbps_rd mbps_rd_max mbps_wr mbps_wr_max)),
        (map { ($_ => $integer_re) } qw(iops iops_max iops_rd iops_rd_max iops_wr iops_wr_max)),
    );
    foreach my $opt (keys %value_re_for) {
        my $value = $res->{$opt};
        return undef if $value && $value !~ $value_re_for{$opt};
    }

    # a combined limit cannot be mixed with a separate read or write limit
    return undef if $res->{mbps} && ($res->{mbps_rd} || $res->{mbps_wr});
    return undef if $res->{iops} && ($res->{iops_rd} || $res->{iops_wr});

    if ($res->{size}) {
        return undef if !defined($res->{size} = $parse_size->($res->{size}));
    }

    if ($res->{media} && ($res->{media} eq 'cdrom')) {
        return undef if $res->{snapshot} || $res->{trans} || $res->{format};
        return undef if $res->{heads} || $res->{secs} || $res->{cyls};
        return undef if $res->{interface} eq 'virtio';
    }

    # rerror does not work with scsi drives
    if ($res->{rerror}) {
        return undef if $res->{interface} eq 'scsi';
    }

    return $res;
}
1013
# Drive options that print_drive() writes to the config and that
# print_drive_full() also copies into the qemu drive string.
my @qemu_drive_options = qw(heads secs cyls trans media format cache snapshot rerror werror aio discard iops iops_rd iops_wr iops_max iops_rd_max iops_wr_max);

# Turn a parsed drive hash back into its property string: the volume,
# followed by ",option=value" for every option with a true value and by
# the formatted size.
sub print_drive {
    my ($vmid, $drive) = @_;

    my @config_options = (
        @qemu_drive_options,
        qw(mbps mbps_rd mbps_wr mbps_max mbps_rd_max mbps_wr_max backup),
    );

    my @set_options = grep { $drive->{$_} } @config_options;
    my $opts = join('', map { ",$_=$drive->{$_}" } @set_options);

    $opts .= ",size=" . $format_size->($drive->{size}) if $drive->{size};

    return "$drive->{file}$opts";
}
1030
28ef82d3
DM
# Send a SCSI INQUIRY command through the Linux SG_IO ioctl interface.
#
# $fh    - open file handle of the device to query
# $noerr - when true, failures return undef instead of raising an exception
#
# Returns a hash with 'vendor', 'product' and 'revision' (strings taken from
# the inquiry data), 'removable' (0/1, bit 7 of byte 1) and 'type' (low five
# bits of byte 0).
sub scsi_inquiry {
    my($fh, $noerr) = @_;

    my $SG_IO = 0x2285;
    my $SG_GET_VERSION_NUM = 0x2282;

    my $versionbuf = "\x00" x 8;
    my $ret = ioctl($fh, $SG_GET_VERSION_NUM, $versionbuf);
    if (!$ret) {
        die "scsi ioctl SG_GET_VERSION_NUM failed - $!\n" if !$noerr;
        return undef;
    }
    my $version = unpack("I", $versionbuf);
    if ($version < 30000) {
        die "scsi generic interface too old\n" if !$noerr;
        return undef;
    }

    my $buf = "\x00" x 36;
    my $sensebuf = "\x00" x 8;
    # 6 byte command block: opcode 0x12, allocation length 36 (size of $buf)
    my $cmd = pack("C x3 C x1", 0x12, 36);

    # see /usr/include/scsi/sg.h
    my $sg_io_hdr_t = "i i C C s I P P P I I i P C C C C S S i I I";

    my $packet = pack($sg_io_hdr_t, ord('S'), -3, length($cmd),
                      length($sensebuf), 0, length($buf), $buf,
                      $cmd, $sensebuf, 6000);

    $ret = ioctl($fh, $SG_IO, $packet);
    if (!$ret) {
        die "scsi ioctl SG_IO failed - $!\n" if !$noerr;
        return undef;
    }

    # elements 17 and 18 of the header are host_status and driver_status
    my @res = unpack($sg_io_hdr_t, $packet);
    if ($res[17] || $res[18]) {
        # the ioctl itself succeeded, so $! carries no information here;
        # report the status fields instead
        die "scsi ioctl SG_IO status error - host_status=$res[17], driver_status=$res[18]\n"
            if !$noerr;
        return undef;
    }

    my $res = {};
    my ($byte0, $byte1);
    ($byte0, $byte1, @{$res}{qw(vendor product revision)}) =
        unpack("C C x6 A8 A16 A4", $buf);

    $res->{removable} = ($byte1 & 128) ? 1 : 0;
    $res->{type} = $byte0 & 31;

    return $res;
}
1081
# Open $path read/write and run a SCSI inquiry on it.
# Returns the hash from scsi_inquiry(), or undef when the path cannot be
# opened or the inquiry fails (errors are suppressed).
sub path_is_scsi {
    my ($path) = @_;

    # pass the mode separately, so that no character of $path is
    # interpreted as part of an open mode string
    my $fh = IO::File->new($path, '+<') || return undef;
    my $res = scsi_inquiry($fh, 1);
    close($fh);

    return $res;
}
1091
db656e5f
DM
# Returns 1 when the 'machine' setting of $conf contains "q35", else 0.
sub machine_type_is_q35 {
    my ($conf) = @_;

    my $machine = $conf->{machine};
    return 0 if !$machine;

    return ($machine =~ m/q35/) ? 1 : 0;
}
1097
# Build the qemu device string of the USB tablet; the USB bus it is
# attached to depends on the machine type.
sub print_tabletdevice_full {
    my ($conf) = @_;

    # we use uhci for old VMs because tablet driver was buggy in older qemu
    my $usbbus = 'uhci';
    $usbbus = 'ehci' if machine_type_is_q35($conf);

    return "usb-tablet,id=tablet,bus=${usbbus}.0,port=1";
}
1108
# Build the qemu device string for a parsed drive.
# The device model and its bus address are derived from the interface
# (virtio, scsi, ide, sata) and the index of the drive; dies for any other
# interface.
sub print_drivedevice_full {
    my ($storecfg, $conf, $vmid, $drive, $bridges) = @_;

    my $interface = $drive->{interface};
    my $driveid = "$drive->{interface}$drive->{index}";

    my $device = '';

    if ($interface eq 'virtio') {
        my $pciaddr = print_pci_addr($driveid, $bridges);
        $device = "virtio-blk-pci,drive=drive-${driveid},id=${driveid}${pciaddr}";
        $device .= ",iothread=iothread0" if $conf->{iothread};
    } elsif ($interface eq 'scsi') {
        # an unset scsihw is treated like an lsi controller
        my $is_lsi = !$conf->{scsihw} || ($conf->{scsihw} =~ m/^lsi/);
        my $maxdev = $is_lsi ? 7 : 256;
        my $controller = int($drive->{index} / $maxdev);
        my $unit = $drive->{index} % $maxdev;

        my $devicetype = 'hd';
        if (drive_is_cdrom($drive)) {
            $devicetype = 'cd';
        } else {
            my $path = '';
            if ($drive->{file} =~ m|^/|) {
                $path = $drive->{file};
            } else {
                $path = PVE::Storage::path($storecfg, $drive->{file});
            }

            if ($path =~ m/^iscsi\:\/\//) {
                $devicetype = 'generic';
            } elsif (my $info = path_is_scsi($path)) {
                if ($info->{type} == 0) {
                    $devicetype = 'block';
                } elsif ($info->{type} == 1) { # tape
                    $devicetype = 'generic';
                }
            }
        }

        if ($is_lsi) {
            $device = "scsi-$devicetype,bus=scsihw$controller.0,scsi-id=$unit,drive=drive-${driveid},id=${driveid}";
        } else {
            $device = "scsi-$devicetype,bus=scsihw$controller.0,channel=0,scsi-id=0,lun=$drive->{index},drive=drive-${driveid},id=${driveid}";
        }
    } elsif ($interface eq 'ide') {
        my $maxdev = 2;
        my $controller = int($drive->{index} / $maxdev);
        my $unit = $drive->{index} % $maxdev;
        my $devicetype = 'hd';
        $devicetype = 'cd' if $drive->{media} && $drive->{media} eq 'cdrom';

        $device = "ide-$devicetype,bus=ide.$controller,unit=$unit,drive=drive-${driveid},id=${driveid}";
    } elsif ($interface eq 'sata') {
        my $controller = int($drive->{index} / $MAX_SATA_DISKS);
        my $unit = $drive->{index} % $MAX_SATA_DISKS;
        $device = "ide-drive,bus=ahci$controller.$unit,drive=drive-${driveid},id=${driveid}";
    } elsif ($interface eq 'usb') {
        die "implement me";
        # -device ide-drive,bus=ide.1,unit=0,drive=drive-ide0-1-0,id=ide0-1-0
    } else {
        die "unsupported interface type";
    }

    $device .= ",bootindex=$drive->{bootindex}" if $drive->{bootindex};

    return $device;
}
1175
# Read the iSCSI initiator name from /etc/iscsi/initiatorname.iscsi.
# Returns undef when the file cannot be opened or has no InitiatorName line.
sub get_initiator_name {
    my $fh = IO::File->new('/etc/iscsi/initiatorname.iscsi') || return undef;

    my $initiator;
    while (defined(my $line = <$fh>)) {
        # the first matching line wins
        if ($line =~ m/^\s*InitiatorName\s*=\s*([\.\-:\w]+)/) {
            $initiator = $1;
            last;
        }
    }
    $fh->close();

    return $initiator;
}
1189
1e3baf05
DM
# Build the qemu drive string (file, id and options) for a parsed drive.
sub print_drive_full {
    my ($storecfg, $vmid, $drive) = @_;

    my $is_cdrom = drive_is_cdrom($drive);

    my @opts;
    foreach my $o (@qemu_drive_options) {
        next if $o eq 'bootindex';
        push @opts, "$o=$drive->{$o}" if $drive->{$o};
    }

    # the limits are kept in megabytes, the drive string takes bytes
    foreach my $o (qw(bps bps_rd bps_wr)) {
        my $v = $drive->{"m$o"};
        push @opts, "$o=" . int($v*1024*1024) if $v;
    }

    # use linux-aio by default (qemu default is threads)
    push @opts, "aio=native" if !$drive->{aio};

    my $path;
    my $volid = $drive->{file};
    if ($is_cdrom) {
        $path = get_iso_path($storecfg, $vmid, $volid);
    } elsif ($volid =~ m|^/|) {
        $path = $volid;
    } else {
        $path = PVE::Storage::path($storecfg, $volid);
    }

    if (!$is_cdrom) {
        push @opts, "cache=none" if !$drive->{cache};

        my $detectzeroes = $drive->{discard} ? "unmap" : "on";
        push @opts, "detect-zeroes=$detectzeroes";
    }

    my $pathinfo = $path ? "file=$path," : '';
    my $opts = join('', map { ",$_" } @opts);

    return "${pathinfo}if=none,id=drive-$drive->{interface}$drive->{index}$opts";
}
1228
# Build the qemu device string for the network device $netid.
sub print_netdevice_full {
    my ($vmid, $conf, $net, $netid, $bridges) = @_;

    my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};

    my $device = ($net->{model} eq 'virtio') ? 'virtio-net-pci' : $net->{model};

    # qemu > 0.15 always try to boot from network - we disable that by
    # not loading the pxe rom file
    my $extra = ($bootorder =~ m/n/) ? '' : "romfile=,";
    my $pciaddr = print_pci_addr("$netid", $bridges);

    my @parts = ("$device,${extra}mac=$net->{macaddr},netdev=$netid$pciaddr,id=$netid");

    if ($net->{queues} && $net->{queues} > 1 && $net->{model} eq 'virtio') {
        # with N queues, the number of vectors needed is 2*N + 2
        # (plus one config interrupt and control vq)
        my $vectors = $net->{queues} * 2 + 2;
        push @parts, "vectors=$vectors,mq=on";
    }

    push @parts, "bootindex=$net->{bootindex}" if $net->{bootindex};

    return join(',', @parts);
}
1252
# Build the qemu netdev string for the network device $netid.
#
# $netid has to look like "net<N>" with N below $MAX_NETS; anything else
# raises an exception. A device with a bridge becomes a tap device named
# "tap<vmid>i<N>", all others use user mode networking.
sub print_netdev_full {
    my ($vmid, $conf, $net, $netid) = @_;

    # reject ids that do not have the form net<N>, instead of silently
    # continuing with an empty index
    my ($i) = $netid =~ m/^net(\d+)$/;
    die "got strange net id '$netid'\n" if !defined($i);
    $i = int($i);

    die "got strange net id '$i'\n" if $i >= $MAX_NETS;

    my $ifname = "tap${vmid}i$i";

    # kvm uses TUNSETIFF ioctl, and that limits ifname length
    die "interface name '$ifname' is too long (max 15 character)\n"
        if length($ifname) >= 16;

    my $vhostparam = '';
    $vhostparam = ',vhost=on' if $kernel_has_vhost_net && $net->{model} eq 'virtio';

    my $vmname = $conf->{name} || "vm$vmid";

    my $netdev = "";

    if ($net->{bridge}) {
        $netdev = "type=tap,id=$netid,ifname=${ifname},script=/var/lib/qemu-server/pve-bridge,downscript=/var/lib/qemu-server/pve-bridgedown$vhostparam";
    } else {
        $netdev = "type=user,id=$netid,hostname=$vmname";
    }

    $netdev .= ",queues=$net->{queues}" if ($net->{queues} && $net->{model} eq 'virtio');

    return $netdev;
}
1e3baf05
DM
1286
# True when $drive is set and its 'media' entry equals 'cdrom'.
sub drive_is_cdrom {
    my ($drive) = @_;

    return $drive if !$drive;

    my $media = $drive->{media};
    return $media if !$media;

    return $media eq 'cdrom';
}
1293
2ed5d572
AD
# Parse a numa property string, a comma separated list made of memory=..,
# policy=.., cpus=<n>[-<m>] and hostnodes=<n>[-<m>], into a hash.
# Ranges are stored as { start => n, end => m } ('end' is undef for a single
# number). Returns undef as soon as one element is not recognized.
sub parse_numa {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        if ($kvp =~ m/^memory=(\S+)$/) {
            $res->{memory} = $1;
            next;
        }
        if ($kvp =~ m/^policy=(preferred|bind|interleave)$/) {
            $res->{policy} = $1;
            next;
        }
        if ($kvp =~ m/^cpus=(\d+)(-(\d+))?$/) {
            @{$res->{cpus}}{qw(start end)} = ($1, $3);
            next;
        }
        if ($kvp =~ m/^hostnodes=(\d+)(-(\d+))?$/) {
            @{$res->{hostnodes}}{qw(start end)} = ($1, $3);
            next;
        }

        return undef;
    }

    return $res;
}
1318
040b06b7
DA
# Parse a hostpci property string into a hash.
# The PCI address may be given with a function ("00:1f.2"), which yields a
# single { id, function } entry in 'pciid', or without one, in which case
# 'pciid' is taken from what lspci() reports for that id. Further elements:
# driver=kvm|vfio, rombar=on|off, x-vga=on|off and pcie=<n>.
# Unknown elements only produce a warning; undef is returned when the value
# is empty or contains no PCI address.
sub parse_hostpci {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};
    my $found;

    foreach my $kv (split(/,/, $value)) {
        if ($kv =~ m/^(host=)?([a-f0-9]{2}:[a-f0-9]{2})(\.([a-f0-9]))?$/) {
            my ($id, $function) = ($2, $4);
            $found = 1;
            if (defined($function)) {
                push @{$res->{pciid}}, { id => $id, function => $function };
            } else {
                my $pcidevices = lspci($id);
                $res->{pciid} = $pcidevices->{$id};
            }
        } elsif ($kv =~ m/^driver=(kvm|vfio)$/) {
            $res->{driver} = $1;
        } elsif ($kv =~ m/^rombar=(on|off)$/) {
            $res->{rombar} = $1;
        } elsif ($kv =~ m/^x-vga=(on|off)$/) {
            $res->{'x-vga'} = $1;
        } elsif ($kv =~ m/^pcie=(\d+)$/) {
            $res->{pcie} = 1 if $1 == 1;
        } else {
            warn "unknown hostpci setting '$kv'\n";
        }
    }

    return $found ? $res : undef;
}
1357
1e3baf05
DM
# netX: e1000=XX:XX:XX:XX:XX:XX,bridge=vmbr0,rate=<mbps>
#
# Parse a network property string into a hash with the keys model, macaddr,
# bridge, queues, rate, tag and firewall. A model given without MAC address
# gets a random one. Returns undef when an element is not recognized or when
# no model is given.
sub parse_net {
    my ($data) = @_;

    # options that are stored exactly as captured
    my @plain_options = (
        [ bridge   => qr/^bridge=(\S+)$/ ],
        [ queues   => qr/^queues=(\d+)$/ ],
        [ rate     => qr/^rate=(\d+(\.\d+)?)$/ ],
        [ tag      => qr/^tag=(\d+)$/ ],
        [ firewall => qr/^firewall=(\d+)$/ ],
    );

    my $res = {};

    KVP: foreach my $kvp (split(/,/, $data)) {
        if ($kvp =~ m/^(ne2k_pci|e1000|rtl8139|pcnet|virtio|ne2k_isa|i82551|i82557b|i82559er|vmxnet3)(=([0-9a-f]{2}(:[0-9a-f]{2}){5}))?$/i) {
            $res->{model} = lc($1);
            $res->{macaddr} = defined($3) ? uc($3) : PVE::Tools::random_ether_addr();
            next KVP;
        }

        foreach my $option (@plain_options) {
            my ($name, $re) = @$option;
            if ($kvp =~ $re) {
                $res->{$name} = $1;
                next KVP;
            }
        }

        return undef;
    }

    return undef if !$res->{model};

    return $res;
}
1391
# Turn a parsed network hash (see parse_net) back into its property string.
# Only settings with a true value are printed.
sub print_net {
    my $net = shift;

    my $res = "$net->{model}";
    $res .= "=$net->{macaddr}" if $net->{macaddr};
    $res .= ",bridge=$net->{bridge}" if $net->{bridge};
    $res .= ",rate=$net->{rate}" if $net->{rate};
    $res .= ",tag=$net->{tag}" if $net->{tag};
    $res .= ",firewall=$net->{firewall}" if $net->{firewall};
    # parse_net() accepts 'queues', so it has to be printed as well -
    # otherwise the setting is lost whenever a value is parsed and re-printed
    $res .= ",queues=$net->{queues}" if $net->{queues};

    return $res;
}
1404
# Re-write every parsable netX entry of $settings through parse_net() and
# print_net(); parse_net() assigns a random MAC address where none is given.
# Entries that cannot be parsed are left untouched.
sub add_random_macs {
    my ($settings) = @_;

    my @net_options = grep { m/^net(\d+)$/ } keys %$settings;

    foreach my $opt (@net_options) {
        my $net = parse_net($settings->{$opt});
        $settings->{$opt} = print_net($net) if $net;
    }
}
1415
# Record $volid in the lowest free unusedN slot of $config.
# Returns the key that was used, or nothing when the volume is already
# listed as unused. Dies when all slots are taken.
sub add_unused_volume {
    my ($config, $volid) = @_;

    my $key;

    # walk downwards, so that $key ends up as the lowest free slot
    foreach my $ind (reverse(0 .. $MAX_UNUSED_DISKS - 1)) {
        my $test = "unused$ind";
        my $vid = $config->{$test};

        if (!$vid) {
            $key = $test;
            next;
        }

        return if $vid eq $volid; # do not add duplicates
    }

    die "To many unused volume - please delete them first.\n" if !$key;

    $config->{$key} = $volid;

    return $key;
}
1435
055d554d
DM
# Returns 1 when the storage layer reports $vmid as owner of $volid.
# Absolute paths never have an owner, and errors from the storage lookup
# are ignored; undef is returned in both cases.
sub vm_is_volid_owner {
    my ($storecfg, $vmid, $volid) = @_;

    return undef if $volid =~ m|^/|;

    my ($path, $owner);
    eval { ($path, $owner) = PVE::Storage::path($storecfg, $volid); };

    return 1 if $owner && ($owner == $vmid);

    return undef;
}
1449
# Mark $key for deletion: drop a pending value for it and add it to the
# 'delete' list of the pending section.
sub vmconfig_delete_pending_option {
    my ($conf, $key) = @_;

    delete $conf->{pending}->{$key};

    # a hash keeps every option in the list only once
    my %to_delete = map { $_ => 1 }
        ($key, PVE::Tools::split_list($conf->{pending}->{delete}));

    $conf->{pending}->{delete} = join(',', keys %to_delete);
}
1460
# Remove $key from the 'delete' list of the pending section; the list
# entry itself is removed when nothing is left in it.
sub vmconfig_undelete_pending_option {
    my ($conf, $key) = @_;

    my %to_delete = map { $_ => 1 }
        PVE::Tools::split_list($conf->{pending}->{delete});
    delete $to_delete{$key};

    my @keylist = keys %to_delete;
    if (!scalar(@keylist)) {
        delete $conf->{pending}->{delete};
    } else {
        $conf->{pending}->{delete} = join(',', @keylist);
    }
}
1477
# Add the volume of $drive to the unused volumes of $conf, provided the
# drive is no cdrom and the volume is owned by this VM.
sub vmconfig_register_unused_drive {
    my ($storecfg, $vmid, $conf, $drive) = @_;

    my $is_disk = !drive_is_cdrom($drive);

    if ($is_disk && vm_is_volid_owner($storecfg, $vmid, $drive->{file})) {
        add_unused_volume($conf, $drive->{file}, $vmid);
    }
}
1488
c750e90a
DM
# Drop entries of the pending section that have no effect.
# Returns a true value when something was removed.
sub vmconfig_cleanup_pending {
    my ($conf) = @_;

    my $changes;

    # remove pending changes when nothing changed
    foreach my $opt (keys %{$conf->{pending}}) {
        next if !defined($conf->{$opt});
        next if $conf->{pending}->{$opt} ne $conf->{$opt};

        $changes = 1;
        delete $conf->{pending}->{$opt};
    }

    # remove delete if option is not set
    my %still_to_delete;
    foreach my $opt (PVE::Tools::split_list($conf->{pending}->{delete})) {
        if (!defined($conf->{$opt})) {
            $changes = 1;
        } else {
            $still_to_delete{$opt} = 1;
        }
    }

    my @keylist = keys %still_to_delete;
    if (!scalar(@keylist)) {
        delete $conf->{pending}->{delete};
    } else {
        $conf->{pending}->{delete} = join(',', @keylist);
    }

    return $changes;
}
1520
2796e7d5
DM
# Allowed smbios (type 1) options, each mapped to the pattern its whole
# value has to match.
my $valid_smbios1_options = {
    manufacturer => '\S+',
    product => '\S+',
    version => '\S+',
    serial => '\S+',
    uuid => '[a-fA-F0-9]{8}(?:-[a-fA-F0-9]{4}){3}-[a-fA-F0-9]{12}',
    sku => '\S+',
    family => '\S+',
};

# smbios: [manufacturer=str][,product=str][,version=str][,serial=str][,uuid=uuid][,sku=str][,family=str]
#
# Parse an smbios1 property string into a hash.
# Returns undef when an element is no key=value pair, uses an unknown key,
# or has a value that does not match the pattern of its key.
sub parse_smbios1 {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        return undef if $kvp !~ m/^(\S+)=(.+)$/;
        # split at the first '=' only, so that a value which itself
        # contains '=' is kept complete instead of being cut off
        my ($k, $v) = split(/=/, $kvp, 2);
        return undef if !defined($k) || !defined($v);
        return undef if !$valid_smbios1_options->{$k};
        return undef if $v !~ m/^$valid_smbios1_options->{$k}$/;
        $res->{$k} = $v;
    }

    return $res;
}
1548
cd11416f
DM
# Turn a parsed smbios1 hash back into a comma separated key=value string.
# Undefined values and keys that are no valid smbios1 option are left out.
sub print_smbios1 {
    my ($smbios1) = @_;

    my @printable = grep {
        defined($smbios1->{$_}) && $valid_smbios1_options->{$_}
    } keys %$smbios1;

    return join(',', map { "$_=$smbios1->{$_}" } @printable);
}
1561
2796e7d5
DM
PVE::JSONSchema::register_format('pve-qm-smbios1', \&verify_smbios1);
# Format check for 'pve-qm-smbios1': returns $value when parse_smbios1()
# accepts it; otherwise returns undef if $noerr is set, and dies if not.
sub verify_smbios1 {
    my ($value, $noerr) = @_;

    if (!parse_smbios1($value)) {
        return undef if $noerr;
        die "unable to parse smbios (type 1) options\n";
    }

    return $value;
}
1572
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-bootdisk', \&verify_bootdisk);
# Format check for 'pve-qm-bootdisk': returns $value when valid_drivename()
# accepts it; otherwise returns undef if $noerr is set, and dies if not.
sub verify_bootdisk {
    my ($value, $noerr) = @_;

    if (!valid_drivename($value)) {
        return undef if $noerr;
        die "invalid boot disk '$value'\n";
    }

    return $value;
}
1583
2ed5d572
AD
PVE::JSONSchema::register_format('pve-qm-numanode', \&verify_numa);
# Format check for 'pve-qm-numanode': returns $value when parse_numa()
# accepts it; otherwise returns undef if $noerr is set, and dies if not.
sub verify_numa {
    my ($value, $noerr) = @_;

    if (!parse_numa($value)) {
        return undef if $noerr;
        die "unable to parse numa options\n";
    }

    return $value;
}
1594
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-net', \&verify_net);
# Format check for 'pve-qm-net': returns $value when parse_net() accepts
# it; otherwise returns undef if $noerr is set, and dies if not.
sub verify_net {
    my ($value, $noerr) = @_;

    if (!parse_net($value)) {
        return undef if $noerr;
        die "unable to parse network options\n";
    }

    return $value;
}
1605
PVE::JSONSchema::register_format('pve-qm-drive', \&verify_drive);
# Format check for 'pve-qm-drive': returns $value when parse_drive()
# (called without a key) accepts it; otherwise returns undef if $noerr is
# set, and dies if not.
sub verify_drive {
    my ($value, $noerr) = @_;

    if (!parse_drive(undef, $value)) {
        return undef if $noerr;
        die "unable to parse drive options\n";
    }

    return $value;
}
1616
PVE::JSONSchema::register_format('pve-qm-hostpci', \&verify_hostpci);
# Format check for 'pve-qm-hostpci': returns $value when parse_hostpci()
# accepts it; otherwise returns undef if $noerr is set, and dies if not.
sub verify_hostpci {
    my ($value, $noerr) = @_;

    if (!parse_hostpci($value)) {
        return undef if $noerr;
        die "unable to parse pci id\n";
    }

    return $value;
}
1627
0ea9541d
DM
PVE::JSONSchema::register_format('pve-qm-watchdog', \&verify_watchdog);
# Format check for 'pve-qm-watchdog': returns $value when parse_watchdog()
# accepts it; otherwise returns undef if $noerr is set, and dies if not.
sub verify_watchdog {
    my ($value, $noerr) = @_;

    if (!parse_watchdog($value)) {
        return undef if $noerr;
        die "unable to parse watchdog options\n";
    }

    return $value;
}
1638
# Parse a watchdog property string ("[model=]<model>[,[action=]<action>]")
# into a hash with the keys 'model' and 'action'.
# Returns undef for an empty value or an unrecognized element.
sub parse_watchdog {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};

    foreach my $p (split(/,/, $value)) {
        next if $p =~ m/^\s*$/;

        if ($p =~ m/^(model=)?(i6300esb|ib700)$/) {
            $res->{model} = $2;
            next;
        }
        if ($p =~ m/^(action=)?(reset|shutdown|poweroff|pause|debug|none)$/) {
            $res->{action} = $2;
            next;
        }

        return undef;
    }

    return $res;
}
1660
59411c4e
DM
PVE::JSONSchema::register_format('pve-qm-startup', \&verify_startup);
# Format check for 'pve-qm-startup': returns $value when parse_startup()
# accepts it; otherwise returns undef if $noerr is set, and dies if not.
sub verify_startup {
    my ($value, $noerr) = @_;

    if (!parse_startup($value)) {
        return undef if $noerr;
        die "unable to parse startup options\n";
    }

    return $value;
}
1671
# Parse a startup property string ("[order=]<n>[,up=<n>][,down=<n>]") into
# a hash with the keys 'order', 'up' and 'down'.
# Returns undef for an empty value or an unrecognized element.
sub parse_startup {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};

    foreach my $p (split(/,/, $value)) {
        next if $p =~ m/^\s*$/;

        if ($p =~ m/^(order=)?(\d+)$/) {
            $res->{order} = $2;
            next;
        }
        if ($p =~ m/^up=(\d+)$/) {
            $res->{up} = $1;
            next;
        }
        if ($p =~ m/^down=(\d+)$/) {
            $res->{down} = $1;
            next;
        }

        return undef;
    }

    return $res;
}
1695
1e3baf05
DM
# Parse a usb property string into a hash. Accepted elements are
# "host=<vendorid>:<productid>" (hex, optional 0x prefix),
# "host=<bus>-<port>[.<port>...]" and "spice".
# Returns undef for an empty value or an unrecognized element.
sub parse_usb_device {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};
    my $found;

    foreach my $v (split(/,/, $value)) {
        if ($v =~ m/^host=(0x)?([0-9A-Fa-f]{4}):(0x)?([0-9A-Fa-f]{4})$/) {
            @{$res}{qw(vendorid productid)} = ($2, $4);
        } elsif ($v =~ m/^host=(\d+)\-(\d+(\.\d+)*)$/) {
            @{$res}{qw(hostbus hostport)} = ($1, $2);
        } elsif ($v =~ m/^spice$/) {
            $res->{spice} = 1;
        } else {
            return undef;
        }
        $found = 1;
    }

    return $found ? $res : undef;
}
19672434 1725
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-usb-device', \&verify_usb_device);
# Format check for 'pve-qm-usb-device': returns $value when
# parse_usb_device() accepts it; otherwise returns undef if $noerr is set,
# and dies if not.
sub verify_usb_device {
    my ($value, $noerr) = @_;

    if (!parse_usb_device($value)) {
        return undef if $noerr;
        die "unable to parse usb device\n";
    }

    return $value;
}
1736
1e3baf05
DM
# add JSON properties for create and set function
# Copies every entry of $confdesc except 'parent', 'snaptime' and 'vmstate'
# into the given hash and returns that hash.
sub json_config_properties {
    my $prop = shift;

    my %skip = map { $_ => 1 } qw(parent snaptime vmstate);

    foreach my $opt (grep { !$skip{$_} } keys %$confdesc) {
        $prop->{$opt} = $confdesc->{$opt};
    }

    return $prop;
}
1748
# Check $value against the type that $confdesc declares for $key and return
# the normalized value: 1/0 for booleans, an integer for integers, the
# value itself for numbers and strings (strings without a format lose one
# pair of enclosing double quotes). Dies when the key is unknown or the
# value does not fit.
sub check_type {
    my ($key, $value) = @_;

    die "unknown setting '$key'\n" if !$confdesc->{$key};

    my $type = $confdesc->{$key}->{type};

    die "got undefined value\n" if !defined($value);
    die "property contains a line feed\n" if $value =~ m/[\n\r]/;

    if ($type eq 'boolean') {
        return 1 if ($value eq '1') || ($value =~ m/^(on|yes|true)$/i);
        return 0 if ($value eq '0') || ($value =~ m/^(off|no|false)$/i);
        die "type check ('boolean') failed - got '$value'\n";
    }

    if ($type eq 'integer') {
        return int($1) if $value =~ m/^(\d+)$/;
        die "type check ('integer') failed - got '$value'\n";
    }

    if ($type eq 'number') {
        return $value if $value =~ m/^(\d+)(\.\d+)?$/;
        die "type check ('number') failed - got '$value'\n";
    }

    if ($type eq 'string') {
        my $fmt = $confdesc->{$key}->{format};

        if (!$fmt) {
            $value =~ s/^\"(.*)\"$/$1/;
            return $value;
        }

        if ($fmt eq 'pve-qm-drive') {
            # special case - we need to pass $key to parse_drive()
            return $value if parse_drive($key, $value);
            die "unable to parse drive options\n";
        }

        PVE::JSONSchema::check_format($fmt, $value);
        return $value;
    }

    die "internal error"
}
1791
191435c6
DM
# Run $code (with @param) via lock_file() on the lock file of VM $vmid,
# passing $timeout through. Re-throws an error left in $@ and returns the
# result of lock_file() otherwise.
sub lock_config_full {
    my ($vmid, $timeout, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);

    my $res = lock_file($lockfile, $timeout, $code, @param);
    if ($@) {
        die $@;
    }

    return $res;
}
1803
4e4f83fe
DM
# Like lock_config_full(), but goes through lock_file_full() and hands the
# additional $shared argument on to it.
sub lock_config_mode {
    my ($vmid, $timeout, $shared, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);

    my $res = lock_file_full($lockfile, $timeout, $shared, $code, @param);
    if ($@) {
        die $@;
    }

    return $res;
}
1815
191435c6
DM
# Shortcut for lock_config_full() with a timeout value of 10.
sub lock_config {
    my ($vmid, $code, @param) = @_;

    my $timeout = 10;

    return lock_config_full($vmid, $timeout, $code, @param);
}
1821
# Path of the configuration file of VM $vmid, relative to the cluster file
# system; $node defaults to $nodename.
sub cfs_config_path {
    my ($vmid, $node) = @_;

    my $owner_node = $node ? $node : $nodename;

    return "nodes/${owner_node}/qemu-server/${vmid}.conf";
}
1828
040b06b7
DA
# Placeholder: always reports IOMMU support as present (returns 1).
sub check_iommu_support{
    #fixme : need to check IOMMU support
    #http://www.linux-kvm.org/page/How_to_assign_devices_with_VT-d_in_KVM

    return 1;
}
1837
# Absolute path (below /etc/pve) of the configuration file of VM $vmid on
# $node.
sub config_file {
    my ($vmid, $node) = @_;

    return "/etc/pve/" . cfs_config_path($vmid, $node);
}
1844
# Name of the lock file of VM $vmid inside $lock_dir.
sub config_file_lock {
    my ($vmid) = @_;

    return join('/', $lock_dir, "lock-${vmid}.conf");
}
1850
# Set access and modification time of the configuration file of VM $vmid
# to the current time.
sub touch_config {
    my ($vmid) = @_;

    utime(undef, undef, config_file($vmid));
}
1857
# Destroy VM $vmid: free the disks it owns, remove its configuration file
# (or replace it by a minimal one when $keep_empty_config is set) and free
# any volume the storage layer still lists for this VM.
# Dies when the config cannot be loaded or check_lock() objects; errors
# while removing the left-over volumes are only reported as warnings.
sub destroy_vm {
    my ($storecfg, $vmid, $keep_empty_config) = @_;

    my $conffile = config_file($vmid);

    my $conf = load_config($vmid);

    check_lock($conf);

    # only remove disks owned by this VM
    my $free_owned_disk = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};

        # absolute paths are not managed by the storage layer
        return if !$volid || $volid =~ m|^/|;

        my ($path, $owner) = PVE::Storage::path($storecfg, $volid);
        return if !$path || !$owner || ($owner != $vmid);

        PVE::Storage::vdisk_free($storecfg, $volid);
    };
    foreach_drive($conf, $free_owned_disk);

    if (!$keep_empty_config) {
        unlink $conffile;
    } else {
        PVE::Tools::file_set_contents($conffile, "memory: 128\n");
    }

    # also remove unused disk
    eval {
        my $dl = PVE::Storage::vdisk_list($storecfg, undef, $vmid);

        my $free_volume = sub {
            my ($volid, $sid, $volname, $d) = @_;
            PVE::Storage::vdisk_free($storecfg, $volid);
        };

        eval {
            PVE::Storage::foreach_volid($dl, $free_volume);
        };
        warn $@ if $@;

    };
    warn $@ if $@;
}
1904
# Read the configuration of VM $vmid (on $node) through the cluster file
# system. Dies when no configuration is returned.
sub load_config {
    my ($vmid, $node) = @_;

    my $conf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid, $node));

    if (!defined($conf)) {
        die "no such VM ('$vmid')\n";
    }

    return $conf;
}
1e3baf05
DM
1916
# Parse the raw text of a VM configuration file into a hash.
#
# Parameters:
#   $filename - path of the file; must end in /qemu-server/<vmid>.conf
#   $raw      - file content, or undef
#
# Returns undef when $raw is undef. Otherwise returns a hash reference that
# holds the top-level settings plus these keys:
#   digest    - SHA1 hex digest of $raw
#   pending   - settings read from the [PENDING] section
#   snapshots - { <name> => settings } for every other [<name>] section
#
# Lines starting with '#' and 'description:' lines are collected into the
# 'description' of the section they belong to. Values that fail check_type()
# and drive values that cannot be mapped to a volume ID are reported with
# warn() and skipped. Dies when $filename does not have the expected form.
sub parse_vm_config {
    my ($filename, $raw) = @_;

    return undef if !defined($raw);

    my $res = {
        digest => Digest::SHA::sha1_hex($raw),
        snapshots => {},
        pending => {},
    };

    $filename =~ m|/qemu-server/(\d+)\.conf$|
        || die "got strange filename '$filename'";

    my $vmid = $1;

    # $conf always points at the section that is currently being filled
    my $conf = $res;
    my $descr = '';
    my $section = '';

    my @lines = split(/\n/, $raw);
    foreach my $line (@lines) {
        next if $line =~ m/^\s*$/;

        if ($line =~ m/^\[PENDING\]\s*$/i) {
            $section = 'pending';
            # store the description collected for the previous section
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{$section} = {};
            next;

        } elsif ($line =~ m/^\[([a-z][a-z0-9_\-]+)\]\s*$/i) {
            # any other section header starts a snapshot
            $section = $1;
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{snapshots}->{$section} = {};
            next;
        }

        if ($line =~ m/^\#(.*)\s*$/) {
            $descr .= PVE::Tools::decode_text($1) . "\n";
            next;
        }

        if ($line =~ m/^(description):\s*(.*\S)\s*$/) {
            $descr .= PVE::Tools::decode_text($2);
        } elsif ($line =~ m/^snapstate:\s*(prepare|delete)\s*$/) {
            # anchored like every other key: without '^' a free-form value
            # such as "args: ... snapstate: delete" would be taken for a
            # snapstate line and the real setting would be lost
            $conf->{snapstate} = $1;
        } elsif ($line =~ m/^(args):\s*(.*\S)\s*$/) {
            # 'args' may contain spaces, so it is stored without type check
            my $key = $1;
            my $value = $2;
            $conf->{$key} = $value;
        } elsif ($line =~ m/^delete:\s*(.*\S)\s*$/) {
            my $value = $1;
            if ($section eq 'pending') {
                $conf->{delete} = $value; # we parse this later
            } else {
                warn "vm $vmid - property 'delete' is only allowed in [PENDING]\n";
            }
        } elsif ($line =~ m/^([a-z][a-z_]*\d*):\s*(\S+)\s*$/) {
            my $key = $1;
            my $value = $2;
            eval { $value = check_type($key, $value); };
            if ($@) {
                warn "vm $vmid - unable to parse value of '$key' - $@";
            } else {
                my $fmt = $confdesc->{$key}->{format};
                if ($fmt && $fmt eq 'pve-qm-drive') {
                    # rewrite the drive so that it refers to a volume ID
                    my $v = parse_drive($key, $value);
                    if (my $volid = filename_to_volume_id($vmid, $v->{file}, $v->{media})) {
                        $v->{file} = $volid;
                        $value = print_drive($vmid, $v);
                    } else {
                        warn "vm $vmid - unable to parse value of '$key'\n";
                        next;
                    }
                }

                # the legacy 'cdrom' setting is stored as 'ide2'
                if ($key eq 'cdrom') {
                    $conf->{ide2} = $value;
                } else {
                    $conf->{$key} = $value;
                }
            }
        }
    }

    # description of the last section
    $conf->{description} = $descr if $descr;

    delete $res->{snapstate}; # just to be sure

    return $res;
}
2010
1858638f
DM
# Serialize a VM configuration hash into the text of a config file.
#
# $conf is normalized in place before it is rendered:
#   - 'snapstate' is removed from the top level
#   - 'cdrom' is stored as 'ide2' (dies if both are set)
#   - 'smp' is replaced by 'sockets'
#   - 'sockets' is dropped when 'maxcpus' is set
#   - every value is passed through check_type() (dies on failure)
#   - 'unusedX' entries naming a volume that is used by a drive of the
#     current or pending configuration are removed
#
# Returns the raw text: top-level settings, then an optional [PENDING]
# section, then one section per snapshot sorted by name.
sub write_vm_config {
    my ($filename, $conf) = @_;

    delete $conf->{snapstate}; # just to be sure

    if ($conf->{cdrom}) {
        die "option ide2 conflicts with cdrom\n" if $conf->{ide2};
        $conf->{ide2} = delete $conf->{cdrom};
    }

    # we do not use 'smp' any longer
    if ($conf->{sockets}) {
        delete $conf->{smp};
    } elsif ($conf->{smp}) {
        $conf->{sockets} = delete $conf->{smp};
        delete $conf->{cores};
    }

    delete $conf->{sockets} if $conf->{maxcpus} && $conf->{sockets};

    # volumes referenced by drives outside of snapshots
    my $used_volids = {};

    # keys that carry structure or meta data and are never type checked
    my $unchecked = { map { $_ => 1 } qw(digest description snapshots snapstate pending) };

    my $cleanup_config = sub {
        my ($cref, $pending, $snapname) = @_;

        foreach my $key (keys %$cref) {
            next if $unchecked->{$key};

            if ($key eq 'delete') {
                die "propertry 'delete' is only allowed in [PENDING]\n"
                    if !$pending;
                # fixme: check syntax?
                next;
            }

            my $value = $cref->{$key};
            eval { $value = check_type($key, $value); };
            die "unable to parse value of '$key' - $@" if $@;

            $cref->{$key} = $value;

            # drives inside snapshots do not count as "used"
            next if $snapname || !valid_drivename($key);

            my $drive = parse_drive($key, $value);
            $used_volids->{$drive->{file}} = 1 if $drive && $drive->{file};
        }
    };

    $cleanup_config->($conf);

    $cleanup_config->($conf->{pending}, 1);

    foreach my $snapname (keys %{$conf->{snapshots}}) {
        die "internal error" if $snapname eq 'pending';
        $cleanup_config->($conf->{snapshots}->{$snapname}, undef, $snapname);
    }

    # remove 'unusedX' settings if we re-add a volume
    foreach my $key (grep { m/^unused/ } keys %$conf) {
        delete $conf->{$key} if $used_volids->{$conf->{$key}};
    }

    my $generate_raw_config = sub {
        my ($section) = @_;

        my $text = '';

        # add description as comment to top of file
        my $descr = $section->{description} || '';
        foreach my $descr_line (split(/\n/, $descr)) {
            $text .= '#' . PVE::Tools::encode_text($descr_line) . "\n";
        }

        foreach my $key (sort keys %$section) {
            next if $key eq 'digest' || $key eq 'description' || $key eq 'pending' || $key eq 'snapshots';
            $text .= "$key: $section->{$key}\n";
        }

        return $text;
    };

    my $raw = $generate_raw_config->($conf);

    if (scalar(keys %{$conf->{pending}})) {
        $raw .= "\n[PENDING]\n" . $generate_raw_config->($conf->{pending});
    }

    foreach my $snapname (sort keys %{$conf->{snapshots}}) {
        $raw .= "\n[$snapname]\n" . $generate_raw_config->($conf->{snapshots}->{$snapname});
    }

    return $raw;
}
1e3baf05 2111
1858638f
DM
# Write $conf as the configuration of VM $vmid without taking the
# config file lock. Unless $skiplock is true, check_lock() is asked
# first and dies when the configuration carries a 'lock' setting.
sub update_config_nolock {
    my ($vmid, $conf, $skiplock) = @_;

    check_lock($conf) unless $skiplock;

    my $path = cfs_config_path($vmid);

    return PVE::Cluster::cfs_write_file($path, $conf);
}
1e3baf05 2121
1858638f
DM
# Write $conf as the configuration of VM $vmid while lock_config() is
# in charge of the call.
#
# The work is handed over as a closure. The former argument
# '&update_config_nolock' (no parentheses, no backslash) did not pass a
# code reference: Perl calls the sub right there with the caller's @_,
# i.e. before lock_config() runs, and passes its return value on instead.
# The closure also guarantees that update_config_nolock() receives
# ($vmid, $conf, $skiplock), whatever parameters lock_config() forwards.
#
# NOTE(review): assumes lock_config($vmid, $code, ...) invokes $code while
# holding the lock - lock_config is not visible here, confirm.
sub update_config {
    my ($vmid, $conf, $skiplock) = @_;

    lock_config($vmid, sub {
        update_config_nolock($vmid, $conf, $skiplock);
    });
}
2127
# Build the hash of default settings: every 'default' declared in
# $confdesc, with 'keyboard' replaced by the value from datacenter.cfg
# when one is set there.
sub load_defaults {

    my $res = {};

    # we use static defaults from our JSON schema configuration
    foreach my $key (keys %$confdesc) {
        my $default = $confdesc->{$key}->{default};
        next if !defined($default);
        $res->{$key} = $default;
    }

    my $dc_conf = PVE::Cluster::cfs_read_file('datacenter.cfg');
    if (my $keyboard = $dc_conf->{keyboard}) {
        $res->{keyboard} = $keyboard;
    }

    return $res;
}
2144
# Return { <vmid> => { exists => 1 } } for every entry of the cluster
# VM list whose node equals $nodename and whose type is 'qemu'.
sub config_list {
    my $vmlist = PVE::Cluster::get_vmlist();
    my $res = {};

    my $ids = $vmlist ? $vmlist->{ids} : undef;
    return $res if !$ids;

    foreach my $vmid (keys %$ids) {
        my $entry = $ids->{$vmid};

        my $on_this_node = $entry->{node} && $entry->{node} eq $nodename;
        next if !$on_this_node;

        my $is_qemu = $entry->{type} && $entry->{type} eq 'qemu';
        next if !$is_qemu;

        $res->{$vmid}->{exists} = 1;
    }

    return $res;
}
2159
64e13401
DM
# test if VM uses local resources (to prevent migration)
#
# Returns 1 when $conf contains 'hostusb' or 'hostpci' (old syntax) or
# any usbN, hostpciN, serialN or parallelN entry, else 0. Keys starting
# with 'usb' whose value is 'spice' are not counted. Dies instead of
# returning 1 unless $noerr is true.
sub check_local_resources {
    my ($conf, $noerr) = @_;

    # old syntax
    my $loc_res = ($conf->{hostusb} || $conf->{hostpci}) ? 1 : 0;

    foreach my $key (keys %$conf) {
        if ($key =~ m/^usb/ && ($conf->{$key} eq 'spice')) {
            next;
        }
        if ($key =~ m/^(usb|hostpci|serial|parallel)\d+$/) {
            $loc_res = 1;
        }
    }

    if ($loc_res && !$noerr) {
        die "VM uses local resources\n";
    }

    return $loc_res;
}
2178
# check if used storages are available on all nodes (used by migrate)
#
# For every drive of $conf whose file parses as a volume ID, the storage
# is checked with PVE::Storage::storage_check_node(), once without a node
# argument and once for $node. Drives without a file or without a storage
# ID are ignored.
sub check_storage_availability {
    my ($storecfg, $conf, $node) = @_;

    my $check_drive = sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($sid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        # check if storage is available on both nodes
        PVE::Storage::storage_check_node($storecfg, $sid);
        PVE::Storage::storage_check_node($storecfg, $sid, $node);
    };

    foreach_drive($conf, $check_drive);
}
2197
719893a9
DM
# list nodes where all VM images are available (used by has_feature API)
#
# Starts with all nodes from PVE::Cluster::get_nodelist() and narrows
# the set for every drive that lives on a storage:
#   - storage disabled:           no node remains
#   - storage restricted to nodes: only those nodes remain
#   - storage not shared:         only the local node remains
# Returns a hash reference { <node> => 1 }.
sub shared_nodes {
    my ($conf, $storecfg) = @_;

    my $nodelist = PVE::Cluster::get_nodelist();
    my $nodehash = { map { $_ => 1 } @$nodelist };
    my $nodename = PVE::INotify::nodename();

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($storeid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        my $scfg = PVE::Storage::storage_config($storecfg, $storeid);

        if ($scfg->{disable}) {
            $nodehash = {};
        } elsif (my $avail = $scfg->{nodes}) {
            my @missing = grep { !$avail->{$_} } keys %$nodehash;
            delete @{$nodehash}{@missing};
        } elsif (!$scfg->{shared}) {
            my @remote = grep { $_ ne $nodename } keys %$nodehash;
            delete @{$nodehash}{@remote};
        }
    });

    return $nodehash;
}
2231
1e3baf05
DM
# Die with "VM is locked (<lock>)" when $conf has a true 'lock' value.
sub check_lock {
    my ($conf) = @_;

    if ($conf->{lock}) {
        die "VM is locked ($conf->{lock})\n";
    }
}
2237
# Check whether process $pid was started with '-pidfile $pidfile'.
#
# Reads the first line of /proc/$pid/cmdline and splits it at NUL bytes.
# Returns 1 when the first word ends in 'kvm' or 'qemu-system-x86_64'
# and the word following the first '-pidfile' / '--pidfile' equals
# $pidfile. Every other case yields a false value.
sub check_cmdline {
    my ($pidfile, $pid) = @_;

    my $fh = IO::File->new("/proc/$pid/cmdline", "r");
    return undef if !defined($fh);

    my $line = <$fh>;
    $fh->close;
    return undef if !$line;

    my @param = split(/\0/, $line);

    my $cmd = $param[0];
    return if !$cmd || ($cmd !~ m|kvm$| && $cmd !~ m|qemu-system-x86_64$|);

    foreach my $i (0 .. $#param) {
        my $opt = $param[$i];
        next if !$opt;
        next if ($opt ne '-pidfile') && ($opt ne '--pidfile');

        # only the first pidfile option is considered
        my $value = $param[$i+1];
        return 1 if $value && ($value eq $pidfile);
        return undef;
    }

    return undef;
}
2263
# Return the PID of the running process of VM $vmid, or undef.
#
# Parameters:
#   $vmid    - VM ID
#   $nocheck - when true, a missing configuration file is not an error
#   $node    - handed on unchanged to config_file()
#
# The PID is read from the file named by pidfile_name($vmid). It is only
# returned when check_cmdline() accepts the process for that pid file and
# PVE::ProcFSTools::check_process_running() confirms it.
#
# Dies when the configuration file does not exist and $nocheck is false.
sub check_running {
    my ($vmid, $nocheck, $node) = @_;

    my $filename = config_file($vmid, $node);

    die "unable to find configuration file for VM $vmid - no such machine\n"
        if !$nocheck && ! -f $filename;

    my $pidfile = pidfile_name($vmid);

    # explicit read mode, so the path is never parsed for an open mode
    my $fd = IO::File->new($pidfile, 'r');
    return undef if !$fd;

    my $st = stat($fd);
    my $line = <$fd>;
    close($fd);

    # the time stamp examined here belongs to the pid file, so that is
    # the file the warning has to name
    if ($st && $st->mtime > time()) {
        warn "file '$pidfile' modified in future\n";
    }

    # an empty pid file yields an undefined $line
    if (defined($line) && $line =~ m/^(\d+)$/) {
        my $pid = $1;
        if (check_cmdline($pidfile, $pid)) {
            if (my $pinfo = PVE::ProcFSTools::check_process_running($pid)) {
                return $pid;
            }
        }
    }

    return undef;
}
2296
# Return the result of config_list() with a 'pid' entry added for every
# listed VM that has a <vmid>.pid file in $var_run_tmpdir and for which
# check_running() returns a PID. When the directory cannot be opened the
# plain list is returned.
sub vzlist {

    my $vzlist = config_list();

    my $dir = IO::Dir->new($var_run_tmpdir);
    return $vzlist if !$dir;

    while (defined(my $entry = $dir->read)) {
        my ($vmid) = $entry =~ m/^(\d+)\.pid$/
            or next;

        # ignore pid files of VMs that are not in the list
        next if !defined($vzlist->{$vmid});

        my $pid = check_running($vmid);
        $vzlist->{$vmid}->{pid} = $pid if $pid;
    }

    return $vzlist;
}
2314
1e3baf05
DM
# Return the 'size' property of the boot disk drive of $conf.
#
# Returns undef when 'bootdisk' is unset, is not a valid drive name, has
# no entry in $conf, cannot be parsed, is a cdrom, or has no file.
# $storecfg is accepted but not used.
sub disksize {
    my ($storecfg, $conf) = @_;

    my $bootdisk = $conf->{bootdisk};
    return undef
        if !$bootdisk || !valid_drivename($bootdisk) || !$conf->{$bootdisk};

    my $drive = parse_drive($bootdisk, $conf->{$bootdisk});
    return undef if !defined($drive) || drive_is_cdrom($drive);

    return undef if !$drive->{file};

    return $drive->{size};
}
2334
# CPU accounting remembered between vmstatus() calls, keyed by PID:
# { time => <sample time>, used => <utime + stime>, cpu => <last value> }
my $last_proc_pid_stat;

# get VM status information
# This must be fast and should not block ($full == false)
# We only query KVM using QMP if $full == true (this can be slow)
#
# Parameters:
#   $opt_vmid - when set, only this VM is reported
#   $full     - when true, running VMs are additionally queried via QMP
#               (query-status, query-blockstats, query-balloon)
#
# Returns a hash reference { <vmid> => { pid, status, disk, maxdisk, cpus,
# name, maxmem, uptime, cpu, mem, netin, netout, diskread, diskwrite,
# template, ... } }.
sub vmstatus {
    my ($opt_vmid, $full) = @_;

    my $res = {};

    my $storecfg = PVE::Storage::config();

    my $list = vzlist();
    my ($uptime) = PVE::ProcFSTools::read_proc_uptime(1);

    my $cpucount = $cpuinfo->{cpus} || 1;

    # static information taken from the configuration
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);

        my $cfspath = cfs_config_path($vmid);
        my $conf = PVE::Cluster::cfs_read_file($cfspath) || {};

        my $pid = $list->{$vmid}->{pid};
        my $size = disksize($storecfg, $conf);

        # never report more cpus than the host has
        my $vcpus = ($conf->{sockets} || 1) * ($conf->{cores} || 1);
        $vcpus = $cpucount if $vcpus > $cpucount;

        my $d = {
            pid => $pid,
            # fixme: better status?
            status => $pid ? 'running' : 'stopped',
            disk => 0, # no info available
            maxdisk => defined($size) ? $size : 0,
            cpus => $vcpus,
            name => $conf->{name} || "VM $vmid",
            maxmem => $conf->{memory} ? $conf->{memory}*(1024*1024) : 0,
            uptime => 0,
            cpu => 0,
            mem => 0,
            netout => 0,
            netin => 0,
            diskread => 0,
            diskwrite => 0,
        };

        if ($conf->{balloon}) {
            $d->{balloon_min} = $conf->{balloon}*(1024*1024);
            $d->{shares} = defined($conf->{shares}) ? $conf->{shares} : 1000;
        }

        $d->{template} = is_template($conf);

        $res->{$vmid} = $d;
    }

    # network counters of the tap devices; what the tap device receives
    # is accounted as 'netout' and what it transmits as 'netin'
    my $netdev = PVE::ProcFSTools::read_proc_net_dev();
    foreach my $dev (keys %$netdev) {
        next if $dev !~ m/^tap([1-9]\d*)i/;
        my $vmid = $1;
        my $d = $res->{$vmid};
        next if !$d;

        my $counters = $netdev->{$dev};
        $d->{netout} += $counters->{receive};
        $d->{netin} += $counters->{transmit};
    }

    my $ctime = gettimeofday;

    # uptime, memory and cpu usage from /proc for running VMs
    foreach my $vmid (keys %$list) {

        my $d = $res->{$vmid};
        my $pid = $d->{pid};
        next if !$pid;

        my $pstat = PVE::ProcFSTools::read_proc_pid_stat($pid);
        next if !$pstat; # not running

        my $used = $pstat->{utime} + $pstat->{stime};

        $d->{uptime} = int(($uptime - $pstat->{starttime})/$cpuinfo->{user_hz});

        if ($pstat->{vsize}) {
            $d->{mem} = int(($pstat->{rss}/$pstat->{vsize})*$d->{maxmem});
        }

        my $old = $last_proc_pid_stat->{$pid};
        if (!$old) {
            # first sample for this process - no usage can be computed yet
            $last_proc_pid_stat->{$pid} = {
                time => $ctime,
                used => $used,
                cpu => 0,
            };
            next;
        }

        my $dtime = ($ctime - $old->{time}) * $cpucount * $cpuinfo->{user_hz};

        if (!($dtime > 1000)) {
            # interval too short - repeat the previous value
            $d->{cpu} = $old->{cpu};
            next;
        }

        my $dutime = $used - $old->{used};

        $d->{cpu} = (($dutime/$dtime)* $cpucount) / $d->{cpus};
        $last_proc_pid_stat->{$pid} = {
            time => $ctime,
            used => $used,
            cpu => $d->{cpu},
        };
    }

    return $res if !$full;

    my $qmpclient = PVE::QMPClient->new();

    my $ballooncb = sub {
        my ($vmid, $resp) = @_;

        my $info = $resp->{'return'};
        return if !$info->{max_mem};

        my $d = $res->{$vmid};

        # use memory assigned to VM
        $d->{maxmem} = $info->{max_mem};
        $d->{balloon} = $info->{actual};

        if (defined($info->{total_mem}) && defined($info->{free_mem})) {
            $d->{mem} = $info->{total_mem} - $info->{free_mem};
            $d->{freemem} = $info->{free_mem};
        }
    };

    my $blockstatscb = sub {
        my ($vmid, $resp) = @_;

        my $data = $resp->{'return'} || [];

        my ($rd_total, $wr_total) = (0, 0);
        foreach my $blockstat (@$data) {
            $rd_total += $blockstat->{stats}->{rd_bytes};
            $wr_total += $blockstat->{stats}->{wr_bytes};
        }

        $res->{$vmid}->{diskread} = $rd_total;
        $res->{$vmid}->{diskwrite} = $wr_total;
    };

    my $statuscb = sub {
        my ($vmid, $resp) = @_;

        $qmpclient->queue_cmd($vmid, $blockstatscb, 'query-blockstats');
        # query-balloon fails if the balloon driver is not loaded, so it
        # must be the last command (commands queued after a failing one
        # are aborted).
        $qmpclient->queue_cmd($vmid, $ballooncb, 'query-balloon');

        my $status = $resp->{'return'}->{status};
        if (!defined($status)) {
            warn "unable to get VM status\n";
            return;
        }

        $res->{$vmid}->{qmpstatus} = $status;
    };

    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        next if !$res->{$vmid}->{pid}; # not running
        $qmpclient->queue_cmd($vmid, $statuscb, 'query-status');
    }

    $qmpclient->queue_execute(undef, 1);

    # fall back to the process based status where QMP gave no answer
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        my $d = $res->{$vmid};
        $d->{qmpstatus} = $d->{status} if !$d->{qmpstatus};
    }

    return $res;
}
2523
# Call $func->($drivename, $drive) for every key of $conf that is a
# valid drive name and whose value parse_drive() can parse.
sub foreach_drive {
    my ($conf, $func) = @_;

    foreach my $key (keys %$conf) {
        if (valid_drivename($key)) {
            my $drive = parse_drive($key, $conf->{$key});
            $func->($key, $drive) if $drive;
        }
    }
}
2536
d5769dc2
DM
# Call $func->($volid, $is_cdrom) once for every distinct volume that is
# referenced by a drive of $conf, by a drive of one of its snapshots, or
# by a snapshot's 'vmstate' (always reported with $is_cdrom 0). When a
# volume is seen more than once, the flag recorded last is passed on.
sub foreach_volid {
    my ($conf, $func) = @_;

    my $volhash = {};

    my $remember = sub {
        my ($volid, $is_cdrom) = @_;

        $volhash->{$volid} = $is_cdrom || 0 if $volid;
    };

    my $visit_drive = sub {
        my ($ds, $drive) = @_;
        $remember->($drive->{file}, drive_is_cdrom($drive));
    };

    foreach_drive($conf, $visit_drive);

    foreach my $snapname (keys %{$conf->{snapshots}}) {
        my $snap = $conf->{snapshots}->{$snapname};
        $remember->($snap->{vmstate}, 0);
        foreach_drive($snap, $visit_drive);
    }

    foreach my $volid (keys %$volhash) {
        $func->($volid, $volhash->{$volid});
    }
}
2568
86b8228b
DM
# Interpret a 'vga' setting of the form qxl, qxl2, qxl3 or qxl4.
#
# Returns the digit that follows 'qxl', or 1 for plain 'qxl'. Every
# other value (including undef and the empty string) yields 0.
sub vga_conf_has_spice {
    my ($vga) = @_;

    if ($vga && $vga =~ m/^qxl([234])?$/) {
        my $count = $1;
        return $count || 1;
    }

    return 0;
}
2576
1e3baf05 2577sub config_to_command {
952958bc 2578 my ($storecfg, $vmid, $conf, $defaults, $forcemachine) = @_;
1e3baf05
DM
2579
2580 my $cmd = [];
8c559505
DM
2581 my $globalFlags = [];
2582 my $machineFlags = [];
2583 my $rtcFlags = [];
519ed28c 2584 my $cpuFlags = [];
5bdcf937 2585 my $devices = [];
b78ebef7 2586 my $pciaddr = '';
5bdcf937 2587 my $bridges = {};
1e3baf05
DM
2588 my $kvmver = kvm_user_version();
2589 my $vernum = 0; # unknown
a3c52213
DM
2590 if ($kvmver =~ m/^(\d+)\.(\d+)$/) {
2591 $vernum = $1*1000000+$2*1000;
2592 } elsif ($kvmver =~ m/^(\d+)\.(\d+)\.(\d+)$/) {
1e3baf05
DM
2593 $vernum = $1*1000000+$2*1000+$3;
2594 }
2595
a3c52213 2596 die "detected old qemu-kvm binary ($kvmver)\n" if $vernum < 15000;
1e3baf05
DM
2597
2598 my $have_ovz = -f '/proc/vz/vestat';
2599
db656e5f
DM
2600 my $q35 = machine_type_is_q35($conf);
2601
1e3baf05
DM
2602 push @$cmd, '/usr/bin/kvm';
2603
2604 push @$cmd, '-id', $vmid;
2605
2606 my $use_virtio = 0;
2607
c971c4f2
AD
2608 my $qmpsocket = qmp_socket($vmid);
2609 push @$cmd, '-chardev', "socket,id=qmp,path=$qmpsocket,server,nowait";
2610 push @$cmd, '-mon', "chardev=qmp,mode=control";
2611
7b7c6d1b 2612 my $socket = vnc_socket($vmid);
1e3baf05
DM
2613 push @$cmd, '-vnc', "unix:$socket,x509,password";
2614
6b64503e 2615 push @$cmd, '-pidfile' , pidfile_name($vmid);
19672434 2616
1e3baf05
DM
2617 push @$cmd, '-daemonize';
2618
2796e7d5
DM
2619 if ($conf->{smbios1}) {
2620 push @$cmd, '-smbios', "type=1,$conf->{smbios1}";
2621 }
2622
7183bd9a
AD
2623 push @$cmd, '-object', "iothread,id=iothread0" if $conf->{iothread};
2624
db656e5f 2625 if ($q35) {
b467f79a 2626 # the q35 chipset support native usb2, so we enable usb controller
db656e5f 2627 # by default for this machine type
f8e83f05 2628 push @$devices, '-readconfig', '/usr/share/qemu-server/pve-q35.cfg';
db656e5f 2629 } else {
f8e83f05
AD
2630 $pciaddr = print_pci_addr("piix3", $bridges);
2631 push @$devices, '-device', "piix3-usb-uhci,id=uhci$pciaddr.0x2";
24f0d39a 2632
f8e83f05 2633 my $use_usb2 = 0;
db656e5f
DM
2634 for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
2635 next if !$conf->{"usb$i"};
2636 $use_usb2 = 1;
2637 }
2638 # include usb device config
2639 push @$devices, '-readconfig', '/usr/share/qemu-server/pve-usb.cfg' if $use_usb2;
fcc573ab 2640 }
19672434 2641
5acbfe9e 2642 my $vga = $conf->{vga};
2fa3151e 2643
590e698c
DM
2644 my $qxlnum = vga_conf_has_spice($vga);
2645 $vga = 'qxl' if $qxlnum;
2fa3151e 2646
5acbfe9e 2647 if (!$vga) {
264e519f
DM
2648 if ($conf->{ostype} && ($conf->{ostype} eq 'win8' ||
2649 $conf->{ostype} eq 'win7' ||
5acbfe9e
DM
2650 $conf->{ostype} eq 'w2k8')) {
2651 $vga = 'std';
2652 } else {
2653 $vga = 'cirrus';
2654 }
2655 }
2656
1e3baf05 2657 # enable absolute mouse coordinates (needed by vnc)
5acbfe9e
DM
2658 my $tablet;
2659 if (defined($conf->{tablet})) {
2660 $tablet = $conf->{tablet};
2661 } else {
2662 $tablet = $defaults->{tablet};
590e698c 2663 $tablet = 0 if $qxlnum; # disable for spice because it is not needed
ef5e2be2 2664 $tablet = 0 if $vga =~ m/^serial\d+$/; # disable if we use serial terminal (no vga card)
5acbfe9e
DM
2665 }
2666
db656e5f 2667 push @$devices, '-device', print_tabletdevice_full($conf) if $tablet;
b467f79a 2668
1e3baf05 2669 # host pci devices
040b06b7 2670 for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
2e3b7e2a
AD
2671 my $d = parse_hostpci($conf->{"hostpci$i"});
2672 next if !$d;
2673
2674 my $pcie = $d->{pcie};
2675 if($pcie){
2676 die "q35 machine model is not enabled" if !$q35;
2677 $pciaddr = print_pcie_addr("hostpci$i");
2678 }else{
2679 $pciaddr = print_pci_addr("hostpci$i", $bridges);
2680 }
2681
2682 my $rombar = $d->{rombar} && $d->{rombar} eq 'off' ? ",rombar=0" : "";
2683 my $driver = $d->{driver} && $d->{driver} eq 'vfio' ? "vfio-pci" : "pci-assign";
2684 my $xvga = $d->{'x-vga'} && $d->{'x-vga'} eq 'on' ? ",x-vga=on" : "";
137483c0
AD
2685 if ($xvga && $xvga ne '') {
2686 push @$cpuFlags, 'kvm=off';
2687 $vga = 'none';
2688 }
2e3b7e2a 2689 $driver = "vfio-pci" if $xvga ne '';
4543ecf0
AD
2690 my $pcidevices = $d->{pciid};
2691 my $multifunction = 1 if @$pcidevices > 1;
2e3b7e2a 2692
4543ecf0
AD
2693 my $j=0;
2694 foreach my $pcidevice (@$pcidevices) {
2e3b7e2a 2695
4543ecf0
AD
2696 my $id = "hostpci$i";
2697 $id .= ".$j" if $multifunction;
2698 my $addr = $pciaddr;
2699 $addr .= ".$j" if $multifunction;
2700 my $devicestr = "$driver,host=$pcidevice->{id}.$pcidevice->{function},id=$id$addr";
2701
2702 if($j == 0){
2703 $devicestr .= "$rombar$xvga";
2704 $devicestr .= ",multifunction=on" if $multifunction;
2705 }
2706
2707 push @$devices, '-device', $devicestr;
2708 $j++;
2709 }
1e3baf05
DM
2710 }
2711
2712 # usb devices
2713 for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
2714 my $d = parse_usb_device($conf->{"usb$i"});
2715 next if !$d;
2716 if ($d->{vendorid} && $d->{productid}) {
5bdcf937 2717 push @$devices, '-device', "usb-host,vendorid=0x$d->{vendorid},productid=0x$d->{productid}";
1e3baf05 2718 } elsif (defined($d->{hostbus}) && defined($d->{hostport})) {
5bdcf937 2719 push @$devices, '-device', "usb-host,hostbus=$d->{hostbus},hostport=$d->{hostport}";
80401dd8
DM
2720 } elsif ($d->{spice}) {
2721 # usb redir support for spice
2722 push @$devices, '-chardev', "spicevmc,id=usbredirchardev$i,name=usbredir";
2723 push @$devices, '-device', "usb-redir,chardev=usbredirchardev$i,id=usbredirdev$i,bus=ehci.0";
1e3baf05
DM
2724 }
2725 }
2726
1e3baf05 2727 # serial devices
bae179aa 2728 for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
34978be3 2729 if (my $path = $conf->{"serial$i"}) {
9f9d2fb2
DM
2730 if ($path eq 'socket') {
2731 my $socket = "/var/run/qemu-server/${vmid}.serial$i";
2732 push @$devices, '-chardev', "socket,id=serial$i,path=$socket,server,nowait";
2733 push @$devices, '-device', "isa-serial,chardev=serial$i";
2734 } else {
2735 die "no such serial device\n" if ! -c $path;
2736 push @$devices, '-chardev', "tty,id=serial$i,path=$path";
2737 push @$devices, '-device', "isa-serial,chardev=serial$i";
2738 }
34978be3 2739 }
1e3baf05
DM
2740 }
2741
2742 # parallel devices
1989a89c 2743 for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
34978be3 2744 if (my $path = $conf->{"parallel$i"}) {
19672434 2745 die "no such parallel device\n" if ! -c $path;
32e69805 2746 my $devtype = $path =~ m!^/dev/usb/lp! ? 'tty' : 'parport';
4c5dbaf6 2747 push @$devices, '-chardev', "$devtype,id=parallel$i,path=$path";
5bdcf937 2748 push @$devices, '-device', "isa-parallel,chardev=parallel$i";
34978be3 2749 }
1e3baf05
DM
2750 }
2751
2752 my $vmname = $conf->{name} || "vm$vmid";
2753
2754 push @$cmd, '-name', $vmname;
19672434 2755
1e3baf05
DM
2756 my $sockets = 1;
2757 $sockets = $conf->{smp} if $conf->{smp}; # old style - no longer iused
2758 $sockets = $conf->{sockets} if $conf->{sockets};
2759
2760 my $cores = $conf->{cores} || 1;
3bd18e48
AD
2761 my $maxcpus = $conf->{maxcpus} if $conf->{maxcpus};
2762
76267728
WL
2763 my $total_cores = $sockets * $cores;
2764 my $allowed_cores = $cpuinfo->{cpus};
2765
f34ebd52 2766 die "MAX $allowed_cores cores allowed per VM on this node\n"
76267728
WL
2767 if ($allowed_cores < $total_cores);
2768
264e519f 2769 if ($maxcpus) {
3bd18e48 2770 push @$cmd, '-smp', "cpus=$cores,maxcpus=$maxcpus";
264e519f 2771 } else {
3bd18e48
AD
2772 push @$cmd, '-smp', "sockets=$sockets,cores=$cores";
2773 }
1e3baf05 2774
1e3baf05
DM
2775 push @$cmd, '-nodefaults';
2776
32baffb4 2777 my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};
3b408e82 2778
0888fdce
DM
2779 my $bootindex_hash = {};
2780 my $i = 1;
2781 foreach my $o (split(//, $bootorder)) {
2782 $bootindex_hash->{$o} = $i*100;
2783 $i++;
afdb31d5 2784 }
3b408e82
DM
2785
2786 push @$cmd, '-boot', "menu=on";
1e3baf05 2787
6b64503e 2788 push @$cmd, '-no-acpi' if defined($conf->{acpi}) && $conf->{acpi} == 0;
1e3baf05 2789
6b64503e 2790 push @$cmd, '-no-reboot' if defined($conf->{reboot}) && $conf->{reboot} == 0;
1e3baf05 2791
ef5e2be2 2792 push @$cmd, '-vga', $vga if $vga && $vga !~ m/^serial\d+$/; # for kvm 77 and later
1e3baf05
DM
2793
2794 # time drift fix
6b64503e 2795 my $tdf = defined($conf->{tdf}) ? $conf->{tdf} : $defaults->{tdf};
1e3baf05 2796
6b64503e 2797 my $nokvm = defined($conf->{kvm}) && $conf->{kvm} == 0 ? 1 : 0;
8c559505 2798 my $useLocaltime = $conf->{localtime};
1e3baf05
DM
2799
2800 if (my $ost = $conf->{ostype}) {
6b9d84cf 2801 # other, wxp, w2k, w2k3, w2k8, wvista, win7, win8, l24, l26, solaris
1e3baf05
DM
2802
2803 if ($ost =~ m/^w/) { # windows
8c559505 2804 $useLocaltime = 1 if !defined($conf->{localtime});
1e3baf05 2805
8c559505 2806 # use time drift fix when acpi is enabled
6b64503e 2807 if (!(defined($conf->{acpi}) && $conf->{acpi} == 0)) {
8c559505 2808 $tdf = 1 if !defined($conf->{tdf});
1e3baf05
DM
2809 }
2810 }
2811
be190583 2812 if ($ost eq 'win7' || $ost eq 'win8' || $ost eq 'w2k8' ||
a70ebde3 2813 $ost eq 'wvista') {
8c559505 2814 push @$globalFlags, 'kvm-pit.lost_tick_policy=discard';
b7e0c8bf 2815 push @$cmd, '-no-hpet';
462e8d19
AD
2816 #push @$cpuFlags , 'hv_vapic" if !$nokvm; #fixme, my win2008R2 hang at boot with this
2817 push @$cpuFlags , 'hv_spinlocks=0xffff' if !$nokvm;
2818 }
2819
2820 if ($ost eq 'win7' || $ost eq 'win8') {
2821 push @$cpuFlags , 'hv_relaxed' if !$nokvm;
b7e0c8bf 2822 }
1e3baf05
DM
2823 }
2824
8c559505
DM
2825 push @$rtcFlags, 'driftfix=slew' if $tdf;
2826
7f0b5beb 2827 if ($nokvm) {
8c559505 2828 push @$machineFlags, 'accel=tcg';
7f0b5beb
DM
2829 } else {
2830 die "No accelerator found!\n" if !$cpuinfo->{hvm};
2831 }
1e3baf05 2832
952958bc
DM
2833 my $machine_type = $forcemachine || $conf->{machine};
2834 if ($machine_type) {
2835 push @$machineFlags, "type=${machine_type}";
3bafc510
DM
2836 }
2837
8c559505
DM
2838 if ($conf->{startdate}) {
2839 push @$rtcFlags, "base=$conf->{startdate}";
2840 } elsif ($useLocaltime) {
2841 push @$rtcFlags, 'base=localtime';
2842 }
1e3baf05 2843
519ed28c
AD
2844 my $cpu = $nokvm ? "qemu64" : "kvm64";
2845 $cpu = $conf->{cpu} if $conf->{cpu};
2846
4dc339e7
AD
2847 push @$cpuFlags , '+lahf_lm' if $cpu eq 'kvm64';
2848
6b9d84cf
AD
2849 push @$cpuFlags , '+x2apic' if !$nokvm && $conf->{ostype} ne 'solaris';
2850
2851 push @$cpuFlags , '-x2apic' if $conf->{ostype} eq 'solaris';
519ed28c 2852
2e1a5389
AD
2853 push @$cpuFlags, '+sep' if $cpu eq 'kvm64' || $cpu eq 'kvm32';
2854
be190583 2855 $cpu .= "," . join(',', @$cpuFlags) if scalar(@$cpuFlags);
519ed28c 2856
c0efd8cd
DM
2857 # Note: enforce needs kernel 3.10, so we do not use it for now
2858 # push @$cmd, '-cpu', "$cpu,enforce";
2859 push @$cmd, '-cpu', $cpu;
519ed28c 2860
67fb9de6 2861 my $memory = $conf->{memory} || $defaults->{memory};
8a010eae
AD
2862 push @$cmd, '-m', $memory;
2863
67fb9de6 2864 if ($conf->{numa}) {
8a010eae 2865
2ed5d572
AD
2866 my $numa_totalmemory = undef;
2867 for (my $i = 0; $i < $MAX_NUMA; $i++) {
2868 next if !$conf->{"numa$i"};
2869 my $numa = parse_numa($conf->{"numa$i"});
2870 next if !$numa;
67fb9de6
DM
2871 # memory
2872 die "missing numa node$i memory value\n" if !$numa->{memory};
2ed5d572
AD
2873 my $numa_memory = $numa->{memory};
2874 $numa_totalmemory += $numa_memory;
2875 my $numa_object = "memory-backend-ram,id=ram-node$i,size=$numa_memory"."M";
2876
67fb9de6 2877 # cpus
2ed5d572 2878 my $cpus_start = $numa->{cpus}->{start};
67fb9de6 2879 die "missing numa node$i cpus\n" if !defined($cpus_start);
2ed5d572
AD
2880 my $cpus_end = $numa->{cpus}->{end} if defined($numa->{cpus}->{end});
2881 my $cpus = $cpus_start;
2882 if (defined($cpus_end)) {
2883 $cpus .= "-$cpus_end";
67fb9de6 2884 die "numa node$i : cpu range $cpus is incorrect\n" if $cpus_end <= $cpus_start;
2ed5d572 2885 }
8a010eae 2886
67fb9de6 2887 # hostnodes
2ed5d572
AD
2888 my $hostnodes_start = $numa->{hostnodes}->{start};
2889 if (defined($hostnodes_start)) {
2890 my $hostnodes_end = $numa->{hostnodes}->{end} if defined($numa->{hostnodes}->{end});
2891 my $hostnodes = $hostnodes_start;
2892 if (defined($hostnodes_end)) {
2893 $hostnodes .= "-$hostnodes_end";
67fb9de6 2894 die "host node $hostnodes range is incorrect\n" if $hostnodes_end <= $hostnodes_start;
2ed5d572 2895 }
8a010eae 2896
2ed5d572
AD
2897 my $hostnodes_end_range = defined($hostnodes_end) ? $hostnodes_end : $hostnodes_start;
2898 for (my $i = $hostnodes_start; $i <= $hostnodes_end_range; $i++ ) {
67fb9de6 2899 die "host numa node$i don't exist\n" if ! -d "/sys/devices/system/node/node$i/";
2ed5d572 2900 }
8a010eae 2901
67fb9de6 2902 # policy
2ed5d572 2903 my $policy = $numa->{policy};
67fb9de6
DM
2904 die "you need to define a policy for hostnode $hostnodes\n" if !$policy;
2905 $numa_object .= ",host-nodes=$hostnodes,policy=$policy";
2ed5d572
AD
2906 }
2907
2908 push @$cmd, '-object', $numa_object;
8a010eae
AD
2909 push @$cmd, '-numa', "node,nodeid=$i,cpus=$cpus,memdev=ram-node$i";
2910 }
67fb9de6
DM
2911
2912 die "total memory for NUMA nodes must be equal to vm memory\n"
2913 if $numa_totalmemory && $numa_totalmemory != $memory;
2ed5d572
AD
2914
2915 #if no custom tology, we split memory and cores across numa nodes
2916 if(!$numa_totalmemory) {
2917
67fb9de6 2918 my $numa_memory = ($memory / $sockets) . "M";
2ed5d572
AD
2919
2920 for (my $i = 0; $i < $sockets; $i++) {
2921
2922 my $cpustart = ($cores * $i);
2923 my $cpuend = ($cpustart + $cores - 1) if $cores && $cores > 1;
2924 my $cpus = $cpustart;
2925 $cpus .= "-$cpuend" if $cpuend;
2926
2927 push @$cmd, '-object', "memory-backend-ram,size=$numa_memory,id=ram-node$i";
2928 push @$cmd, '-numa', "node,nodeid=$i,cpus=$cpus,memdev=ram-node$i";
2929 }
2930 }
8a010eae
AD
2931 }
2932
1e3baf05
DM
2933 push @$cmd, '-S' if $conf->{freeze};
2934
2935 # set keyboard layout
2936 my $kb = $conf->{keyboard} || $defaults->{keyboard};
2937 push @$cmd, '-k', $kb if $kb;
2938
2939 # enable sound
2940 #my $soundhw = $conf->{soundhw} || $defaults->{soundhw};
2941 #push @$cmd, '-soundhw', 'es1370';
2942 #push @$cmd, '-soundhw', $soundhw if $soundhw;
ab6a046f 2943
bc84dcca 2944 if($conf->{agent}) {
7a6c2150 2945 my $qgasocket = qmp_socket($vmid, 1);
ab6a046f
AD
2946 my $pciaddr = print_pci_addr("qga0", $bridges);
2947 push @$devices, '-chardev', "socket,path=$qgasocket,server,nowait,id=qga0";
2948 push @$devices, '-device', "virtio-serial,id=qga0$pciaddr";
2949 push @$devices, '-device', 'virtserialport,chardev=qga0,name=org.qemu.guest_agent.0';
2950 }
2951
1d794448 2952 my $spice_port;
2fa3151e 2953
590e698c
DM
2954 if ($qxlnum) {
2955 if ($qxlnum > 1) {
2956 if ($conf->{ostype} && $conf->{ostype} =~ m/^w/){
2957 for(my $i = 1; $i < $qxlnum; $i++){
2958 my $pciaddr = print_pci_addr("vga$i", $bridges);
2959 push @$cmd, '-device', "qxl,id=vga$i,ram_size=67108864,vram_size=33554432$pciaddr";
2960 }
2961 } else {
2962 # assume other OS works like Linux
2963 push @$cmd, '-global', 'qxl-vga.ram_size=134217728';
2964 push @$cmd, '-global', 'qxl-vga.vram_size=67108864';
2fa3151e
AD
2965 }
2966 }
2967
1011b570 2968 my $pciaddr = print_pci_addr("spice", $bridges);
95a4b4a9 2969
cd339d1f 2970 $spice_port = PVE::Tools::next_spice_port();
943340a6 2971
d2da6d9b 2972 push @$devices, '-spice', "tls-port=${spice_port},addr=127.0.0.1,tls-ciphers=DES-CBC3-SHA,seamless-migration=on";
1011b570 2973
d2da6d9b
AD
2974 push @$devices, '-device', "virtio-serial,id=spice$pciaddr";
2975 push @$devices, '-chardev', "spicevmc,id=vdagent,name=vdagent";
2976 push @$devices, '-device', "virtserialport,chardev=vdagent,name=com.redhat.spice.0";
1011b570
DM
2977 }
2978
8d9ae0d2
DM
2979 # enable balloon by default, unless explicitly disabled
2980 if (!defined($conf->{balloon}) || $conf->{balloon}) {
2981 $pciaddr = print_pci_addr("balloon0", $bridges);
2982 push @$devices, '-device', "virtio-balloon-pci,id=balloon0$pciaddr";
2983 }
1e3baf05 2984
0ea9541d
DM
2985 if ($conf->{watchdog}) {
2986 my $wdopts = parse_watchdog($conf->{watchdog});
5bdcf937 2987 $pciaddr = print_pci_addr("watchdog", $bridges);
0a40e8ea 2988 my $watchdog = $wdopts->{model} || 'i6300esb';
5bdcf937
AD
2989 push @$devices, '-device', "$watchdog$pciaddr";
2990 push @$devices, '-watchdog-action', $wdopts->{action} if $wdopts->{action};
0ea9541d
DM
2991 }
2992
1e3baf05 2993 my $vollist = [];
941e0c42 2994 my $scsicontroller = {};
26ee04b6 2995 my $ahcicontroller = {};
cdd20088 2996 my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : $defaults->{scsihw};
1e3baf05 2997
5881b913
DM
2998 # Add iscsi initiator name if available
2999 if (my $initiator = get_initiator_name()) {
3000 push @$devices, '-iscsi', "initiator-name=$initiator";
3001 }
3002
1e3baf05
DM
3003 foreach_drive($conf, sub {
3004 my ($ds, $drive) = @_;
3005
ff1a2432 3006 if (PVE::Storage::parse_volume_id($drive->{file}, 1)) {
1e3baf05 3007 push @$vollist, $drive->{file};
ff1a2432 3008 }
afdb31d5 3009
1e3baf05 3010 $use_virtio = 1 if $ds =~ m/^virtio/;
3b408e82
DM
3011
3012 if (drive_is_cdrom ($drive)) {
3013 if ($bootindex_hash->{d}) {
3014 $drive->{bootindex} = $bootindex_hash->{d};
3015 $bootindex_hash->{d} += 1;
3016 }
3017 } else {
3018 if ($bootindex_hash->{c}) {
3019 $drive->{bootindex} = $bootindex_hash->{c} if $conf->{bootdisk} && ($conf->{bootdisk} eq $ds);
3020 $bootindex_hash->{c} += 1;
3021 }
3022 }
3023
941e0c42 3024 if ($drive->{interface} eq 'scsi') {
cdd20088 3025
5b952ff5 3026 my $maxdev = ($scsihw !~ m/^lsi/) ? 256 : 7;
cdd20088 3027 my $controller = int($drive->{index} / $maxdev);
5bdcf937
AD
3028 $pciaddr = print_pci_addr("scsihw$controller", $bridges);
3029 push @$devices, '-device', "$scsihw,id=scsihw$controller$pciaddr" if !$scsicontroller->{$controller};
cdd20088 3030 $scsicontroller->{$controller}=1;
941e0c42 3031 }
3b408e82 3032
26ee04b6
DA
3033 if ($drive->{interface} eq 'sata') {
3034 my $controller = int($drive->{index} / $MAX_SATA_DISKS);
5bdcf937
AD
3035 $pciaddr = print_pci_addr("ahci$controller", $bridges);
3036 push @$devices, '-device', "ahci,id=ahci$controller,multifunction=on$pciaddr" if !$ahcicontroller->{$controller};
26ee04b6
DA
3037 $ahcicontroller->{$controller}=1;
3038 }
46f58b5f 3039
15b21acc
MR
3040 my $drive_cmd = print_drive_full($storecfg, $vmid, $drive);
3041 push @$devices, '-drive',$drive_cmd;
46f58b5f 3042 push @$devices, '-device', print_drivedevice_full($storecfg, $conf, $vmid, $drive, $bridges);
1e3baf05
DM
3043 });
3044
cc4d6182 3045 for (my $i = 0; $i < $MAX_NETS; $i++) {
5f0c4c32 3046 next if !$conf->{"net$i"};
cc4d6182
DA
3047 my $d = parse_net($conf->{"net$i"});
3048 next if !$d;
1e3baf05 3049
cc4d6182 3050 $use_virtio = 1 if $d->{model} eq 'virtio';
1e3baf05 3051
cc4d6182
DA
3052 if ($bootindex_hash->{n}) {
3053 $d->{bootindex} = $bootindex_hash->{n};
3054 $bootindex_hash->{n} += 1;
3055 }
1e3baf05 3056
cc4d6182 3057 my $netdevfull = print_netdev_full($vmid,$conf,$d,"net$i");
5bdcf937
AD
3058 push @$devices, '-netdev', $netdevfull;
3059
3060 my $netdevicefull = print_netdevice_full($vmid,$conf,$d,"net$i",$bridges);
3061 push @$devices, '-device', $netdevicefull;
3062 }
1e3baf05 3063
db656e5f
DM
3064 if (!$q35) {
3065 # add pci bridges
f8e83f05
AD
3066 while (my ($k, $v) = each %$bridges) {
3067 $pciaddr = print_pci_addr("pci.$k");
3068 unshift @$devices, '-device', "pci-bridge,id=pci.$k,chassis_nr=$k$pciaddr" if $k > 0;
3069 }
19672434
DM
3070 }
3071
1e3baf05
DM
3072 # hack: virtio with fairsched is unreliable, so we do not use fairsched
3073 # when the VM uses virtio devices.
19672434
DM
3074 if (!$use_virtio && $have_ovz) {
3075
6b64503e 3076 my $cpuunits = defined($conf->{cpuunits}) ?
1e3baf05
DM
3077 $conf->{cpuunits} : $defaults->{cpuunits};
3078
3079 push @$cmd, '-cpuunits', $cpuunits if $cpuunits;
3080
3081 # fixme: cpulimit is currently ignored
3082 #push @$cmd, '-cpulimit', $conf->{cpulimit} if $conf->{cpulimit};
3083 }
3084
3085 # add custom args
3086 if ($conf->{args}) {
3ada46c9 3087 my $aa = PVE::Tools::split_args($conf->{args});
1e3baf05
DM
3088 push @$cmd, @$aa;
3089 }
3090
5bdcf937 3091 push @$cmd, @$devices;
be190583 3092 push @$cmd, '-rtc', join(',', @$rtcFlags)
8c559505 3093 if scalar(@$rtcFlags);
be190583 3094 push @$cmd, '-machine', join(',', @$machineFlags)
8c559505
DM
3095 if scalar(@$machineFlags);
3096 push @$cmd, '-global', join(',', @$globalFlags)
3097 if scalar(@$globalFlags);
3098
1d794448 3099 return wantarray ? ($cmd, $vollist, $spice_port) : $cmd;
1e3baf05 3100}
19672434 3101
1e3baf05
DM
# Build the per-VM path "<var_run_tmpdir>/<vmid>.vnc".
sub vnc_socket {
    my ($vmid) = @_;

    return $var_run_tmpdir . "/$vmid.vnc";
}
3106
# Query the VM monitor ('query-spice') and return the spice port.
# The 'tls-port' entry is preferred, 'port' is the fallback; dies with
# "no spice port" when neither holds a true value.
sub spice_port {
    my ($vmid) = @_;

    my $info = vm_mon_cmd($vmid, 'query-spice');

    my $port = $info->{'tls-port'} || $info->{'port'};
    die "no spice port\n" if !$port;

    return $port;
}
3114
# Build the per-VM monitor socket path "<var_run_tmpdir>/<vmid>.<type>".
# <type> is 'qga' when $qga is true, otherwise 'qmp'.
sub qmp_socket {
    my ($vmid, $qga) = @_;

    my $suffix = 'qmp';
    $suffix = 'qga' if $qga;

    return "${var_run_tmpdir}/$vmid.$suffix";
}
3120
1e3baf05
DM
# Build the per-VM pid file path "<var_run_tmpdir>/<vmid>.pid".
sub pidfile_name {
    my ($vmid) = @_;

    return join('/', $var_run_tmpdir, "$vmid.pid");
}
3125
86fdcfb2
DA
# Collect the ids of devices currently known to the VM monitor.
#
# Returns a hash ref { <id> => 1, ... } built from three monitor queries:
#  - 'query-pci':   every device that reports a true 'qdev_id'
#  - 'query-block': every block device named "drive-<id>" (stored as <id>)
#  - 'query-mice':  the key 'tablet' if a 'QEMU HID Tablet' is listed
sub vm_devices_list {
    my ($vmid) = @_;

    my $pci_info = vm_mon_cmd($vmid, 'query-pci');
    my $found = {};
    foreach my $bus (@$pci_info) {
        foreach my $dev (@{$bus->{devices}}) {
            my $qdev_id = $dev->{'qdev_id'};
            $found->{$qdev_id} = 1 if $qdev_id;
        }
    }

    my $block_info = vm_mon_cmd($vmid, 'query-block');
    foreach my $blk (@$block_info) {
        next if $blk->{device} !~ m/^drive-(\S+)/;
        $found->{$1} = 1;
    }

    my $mice_info = vm_mon_cmd($vmid, 'query-mice');
    foreach my $mouse (@$mice_info) {
        next if $mouse->{name} ne 'QEMU HID Tablet';
        $found->{tablet} = 1;
        last;
    }

    return $found;
}
3155
3eec5767 3156# fixme: this should raise exceptions on error!
# Hot-plug a device into a running VM.
#
# $deviceid selects the kind of device: 'tablet', 'virtioN', 'scsihwN',
# 'scsiN', 'netN' or 'pci.N'. $device is the parsed drive/net description
# handed on to the print_*/qemu_* helpers.
#
# Returns 1 when nothing has to be done (VM not running, hotplug disabled
# in $conf, device already present) or when plugging went through, and
# undef when one of the checked steps failed.
sub vm_deviceplug {
    my ($storecfg, $conf, $vmid, $deviceid, $device) = @_;

    return 1 if !check_running($vmid);

    my $q35 = machine_type_is_q35($conf);

    return 1 if !$conf->{hotplug};

    # device is already part of the running VM
    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$deviceid});

    if ($deviceid eq 'tablet') {
        qemu_deviceadd($vmid, print_tabletdevice_full($conf));
        return 1;
    }

    # add PCI bridge if we need it for the device
    qemu_add_pci_bridge($storecfg, $conf, $vmid, $deviceid);

    if ($deviceid =~ m/^(virtio)(\d+)$/) {

        return undef if !qemu_driveadd($storecfg, $vmid, $device);
        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);
        qemu_deviceadd($vmid, $devicefull);
        if (!qemu_deviceaddverify($vmid, $deviceid)) {
            # roll back the drive added above
            qemu_drivedel($vmid, $deviceid);
            return undef;
        }

    } elsif ($deviceid =~ m/^(scsihw)(\d+)$/) {

        my $scsihw = "lsi";
        $scsihw = $conf->{scsihw} if defined($conf->{scsihw});
        my $pciaddr = print_pci_addr($deviceid);
        my $devicefull = "$scsihw,id=$deviceid$pciaddr";
        qemu_deviceadd($vmid, $devicefull);
        return undef if !qemu_deviceaddverify($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        return undef if !qemu_findorcreatescsihw($storecfg, $conf, $vmid, $device);
        return undef if !qemu_driveadd($storecfg, $vmid, $device);
        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);
        # fixme: use qemu_deviceaddverify?
        if (!qemu_deviceadd($vmid, $devicefull)) {
            qemu_drivedel($vmid, $deviceid);
            return undef;
        }

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        return undef if !qemu_netdevadd($vmid, $conf, $device, $deviceid);
        my $netdevicefull = print_netdevice_full($vmid, $conf, $device, $deviceid);
        qemu_deviceadd($vmid, $netdevicefull);
        if (!qemu_deviceaddverify($vmid, $deviceid)) {
            # roll back the netdev backend added above
            qemu_netdevdel($vmid, $deviceid);
            return undef;
        }

    } elsif (!$q35 && $deviceid =~ m/^(pci\.)(\d+)$/) {

        my $bridgeid = $2;
        my $pciaddr = print_pci_addr($deviceid);
        my $devicefull = "pci-bridge,id=pci.$bridgeid,chassis_nr=$bridgeid$pciaddr";
        qemu_deviceadd($vmid, $devicefull);
        return undef if !qemu_deviceaddverify($vmid, $deviceid);

    }

    return 1;
}
3225
3eec5767 3226# fixme: this should raise exceptions on error!
# Hot-unplug a device from a running VM.
#
# $deviceid selects the kind of device: 'tablet', 'virtioN', a SCSI
# controller ('scsihwN', or the legacy id 'lsiN'), 'scsiN' or 'netN'.
#
# Returns 1 when nothing has to be done (VM not running, hotplug disabled
# in $conf, device not present) or when unplugging went through, and undef
# when one of the checked steps failed. Dies when asked to unplug the
# configured boot disk.
sub vm_deviceunplug {
    my ($vmid, $conf, $deviceid) = @_;

    return 1 if !check_running ($vmid);

    return 1 if !$conf->{hotplug};

    my $devices_list = vm_devices_list($vmid);
    return 1 if !defined($devices_list->{$deviceid});

    if ($deviceid eq 'tablet') {
        qemu_devicedel($vmid, $deviceid);
        return 1;
    }

    die "can't unplug bootdisk" if $conf->{bootdisk} && $conf->{bootdisk} eq $deviceid;

    if ($deviceid =~ m/^(virtio)(\d+)$/) {
        qemu_devicedel($vmid, $deviceid);
        # device_del is asynchronous, wait until the device is really gone
        return undef if !qemu_devicedelverify($vmid, $deviceid);
        return undef if !qemu_drivedel($vmid, $deviceid);
    }

    # SCSI controllers are plugged with the id "scsihwN" (see vm_deviceplug
    # and qemu_findorcreatescsihw); "lsiN" is kept for controllers that
    # still carry the old id.
    if ($deviceid =~ m/^(lsi|scsihw)(\d+)$/) {
        return undef if !qemu_devicedel($vmid, $deviceid);
    }

    if ($deviceid =~ m/^(scsi)(\d+)$/) {
        return undef if !qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_drivedel($vmid, $deviceid);
    }

    if ($deviceid =~ m/^(net)(\d+)$/) {
        qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_devicedelverify($vmid, $deviceid);
        return undef if !qemu_netdevdel($vmid, $deviceid);
    }

    return 1;
}
3267
# Send a 'device_add' monitor command.
# $devicefull is a "<driver>,key=value,..." string; it is prefixed with
# "driver=" and split on '=' and ',' into the command's named arguments.
# Always returns 1.
sub qemu_deviceadd {
    my ($vmid, $devicefull) = @_;

    my %options = split(/[=,]/, "driver=" . $devicefull);

    vm_mon_cmd($vmid, "device_add" , %options);

    return 1;
}
afdb31d5 3277
5e5dcb73
DA
# Send a 'device_del' monitor command for $deviceid.
# The monitor reply is not inspected; always returns 1.
sub qemu_devicedel {
    my ($vmid, $deviceid) = @_;

    my $reply = vm_mon_cmd($vmid, "device_del", id => $deviceid);

    return 1;
}
3283
# Add a drive backend through the human monitor ("drive_add auto ...").
# Returns 1 when the monitor answer contains "OK"; otherwise logs the
# answer to syslog and returns undef.
sub qemu_driveadd {
    my ($storecfg, $vmid, $device) = @_;

    my $drive = print_drive_full($storecfg, $vmid, $device);
    my $reply = vm_human_monitor_command($vmid, "drive_add auto $drive");

    # If the command succeeds qemu prints: "OK"
    return 1 if $reply =~ m/OK/s;

    syslog("err", "adding drive failed: $reply");
    return undef;
}
afdb31d5 3296
5e5dcb73
DA
# Remove the drive backend "drive-<deviceid>" through the human monitor.
# Returns 1 on an empty answer or a "Device '...' not found" answer;
# any other answer is logged to syslog and undef is returned.
sub qemu_drivedel {
    my ($vmid, $deviceid) = @_;

    my $reply = vm_human_monitor_command($vmid, "drive_del drive-$deviceid");
    $reply =~ s/^\s+//;

    # NB: device not found errors mean the drive was auto-deleted and we ignore the error
    return 1 if $reply =~ m/Device \'.*?\' not found/s;

    return 1 if $reply eq "";

    syslog("err", "deleting drive $deviceid failed : $reply");
    return undef;
}
f19d1c47 3311
5e5dcb73
DA
# Poll the device list until $deviceid shows up.
# Checks up to six times, sleeping one second after each miss. Returns 1 as
# soon as the device is listed; otherwise logs an error and returns undef.
sub qemu_deviceaddverify {
    my ($vmid, $deviceid) = @_;

    foreach my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if defined($present->{$deviceid});
        sleep 1;
    }

    syslog("err", "error on hotplug device $deviceid");
    return undef;
}
afdb31d5 3323
5e5dcb73
DA
3324
# Poll the device list until $deviceid has disappeared.
# device_del is asynchronous and its empty reply is not reliable, so the
# removal is verified by checking up to six times, sleeping one second
# after each check that still lists the device. Returns 1 once the device
# is gone; otherwise logs an error and returns undef.
sub qemu_devicedelverify {
    my ($vmid, $deviceid) = @_;

    foreach my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if !defined($present->{$deviceid});
        sleep 1;
    }

    syslog("err", "error on hot-unplugging device $deviceid");
    return undef;
}
3337
# Make sure the SCSI controller serving $device exists in the running VM.
# The controller number is int(index / maxdev), where maxdev is 256 for a
# configured non-lsi 'scsihw' and 7 otherwise. A missing controller
# "scsihw<N>" is hot-plugged. Returns 1 on success, undef if plugging failed.
sub qemu_findorcreatescsihw {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $maxdev = 7;
    $maxdev = 256 if $conf->{scsihw} && ($conf->{scsihw} !~ m/^lsi/);

    my $controller = int($device->{index} / $maxdev);
    my $scsihwid = "scsihw$controller";

    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$scsihwid});

    return undef if !vm_deviceplug($storecfg, $conf, $vmid, $scsihwid);

    return 1;
}
3351
# Hot-plug the PCI bridge required by $device, if any.
# print_pci_addr() records the bridge it uses for $device in a scratch
# hash; the last key found there is taken as the bridge id. Nothing is
# done (plain return) when no bridge id > 0 was recorded. Otherwise the
# bridge "pci.<id>" is plugged unless already present.
# Returns 1 on success, undef if plugging the bridge failed.
sub qemu_add_pci_bridge {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $bridges = {};
    print_pci_addr($device, $bridges);

    my $bridgeid;
    foreach my $id (keys %$bridges) {
        $bridgeid = $id;
    }

    return if !defined($bridgeid) || $bridgeid < 1;

    my $bridge = "pci.$bridgeid";

    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$bridge});

    return undef if !vm_deviceplug($storecfg, $conf, $vmid, $bridge);

    return 1;
}
3375
2630d2a9
DA
# Send a 'netdev_add' monitor command.
# The "key=value,..." string from print_netdev_full() is split on '=' and
# ',' into the command's named arguments. Always returns 1.
sub qemu_netdevadd {
    my ($vmid, $conf, $device, $deviceid) = @_;

    my $netdev = print_netdev_full($vmid, $conf, $device, $deviceid);
    my %netdev_args = split(/[=,]/, $netdev);

    vm_mon_cmd($vmid, "netdev_add", %netdev_args);

    return 1;
}
3385
# Send a 'netdev_del' monitor command for $deviceid. Always returns 1.
sub qemu_netdevdel {
    my ($vmid, $deviceid) = @_;

    my @del_args = (id => $deviceid);
    vm_mon_cmd($vmid, "netdev_del", @del_args);

    return 1;
}
3392
838776ab
AD
# Hot-add CPU cores to a running VM until it has $cores cores.
#
# Dies when
#  - the VM is configured with more than one socket,
#  - 'maxcpus' is not set in $conf, or $cores exceeds it,
#  - $cores is lower than the configured core count (no hot-unplug),
#  - the number of CPUs reported by 'query-cpus' differs from the
#    configured core count.
# Otherwise one 'cpu-add' monitor command is sent per additional core.
sub qemu_cpu_hotplug {
    my ($vmid, $conf, $cores) = @_;

    my $sockets = $conf->{sockets} || 1;
    die "cpu hotplug only works with one socket\n"
        if $sockets > 1;

    die "maxcpus is not defined\n"
        if !$conf->{maxcpus};

    die "you can't add more cores than maxcpus\n"
        if $cores > $conf->{maxcpus};

    my $currentcores = $conf->{cores} || 1;
    die "online cpu unplug is not yet possible\n"
        if $cores < $currentcores;

    my $currentrunningcores = vm_mon_cmd($vmid, "query-cpus");
    die "cores number of running vm is different than configuration\n"
        if scalar(@{$currentrunningcores}) != $currentcores;

    for (my $i = $currentcores; $i < $cores; $i++) {
        vm_mon_cmd($vmid, "cpu-add", id => int($i));
    }
}
3418
affd2f88
AD
# Apply I/O throttling limits to a block device of a running VM.
# Does nothing when the VM is not running. All six limits are passed to
# the 'block_set_io_throttle' monitor command as integers.
sub qemu_block_set_io_throttle {
    my ($vmid, $deviceid, $bps, $bps_rd, $bps_wr, $iops, $iops_rd, $iops_wr) = @_;

    return if !check_running($vmid);

    return vm_mon_cmd(
        $vmid, "block_set_io_throttle",
        device => $deviceid,
        bps => int($bps),
        bps_rd => int($bps_rd),
        bps_wr => int($bps_wr),
        iops => int($iops),
        iops_rd => int($iops_rd),
        iops_wr => int($iops_wr),
    );
}
3427
f5eb281a 3428# old code, only used to shutdown old VM after update
dab36e1e
DM
# Read monitor output from $fh until the "(qemu) " prompt or EOF.
#
# Data is read in chunks of up to 8192 bytes, waiting at most $timeout
# seconds for each chunk. A chunk ending in "(qemu) " terminates reading;
# the prompt itself is not part of the result. Returns the collected text.
# Dies with the system error text when sysread fails, and with
# "monitor read timeout" when waiting for data timed out.
sub __read_avail {
    my ($fh, $timeout) = @_;

    my $select = IO::Select->new();
    $select->add($fh);

    my $output = '';
    my $chunk;

    my @ready;
    while (@ready = $select->can_read($timeout)) {
        my $got = $fh->sysread($chunk, 8192);

        die "$!\n" if !defined($got);

        last if !$got; # nothing more to read

        if ($chunk =~ /^(.*)\(qemu\) $/s) {
            $output .= $1;
            last;
        }

        $output .= $chunk;
    }

    die "monitor read timeout\n" if !@ready;

    return $output;
}
3460
f5eb281a 3461# old code, only used to shutdown old VM after update
dab36e1e
DM
# Run a command on the old human monitor socket "<var_run_tmpdir>/<vmid>.mon".
#
# Connects to the socket, reads and checks the monitor banner, writes
# "$cmdstr\r" and returns the answer with its first line (the command
# echo) removed, unless that line starts with "unknown command".
# Nothing is read back for 'q'/'quit'; undef is returned in that case.
# Any failure is logged to syslog and re-raised.
sub vm_monitor_command {
    my ($vmid, $cmdstr, $nocheck) = @_;

    my $res;

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);

        my $sname = "${var_run_tmpdir}/$vmid.mon";

        my $sock = IO::Socket::UNIX->new( Peer => $sname ) ||
            die "unable to connect to VM $vmid socket - $!\n";

        # hack: migrate sometime blocks the monitor (when migrate_downtime
        # is set)
        my $is_migrate = ($cmdstr =~ m/^(info\s+migrate|migrate\s)/) ? 1 : 0;

        my $timeout = $is_migrate ? 60*60 : 3; # 1 hour for migrate

        # read banner;
        my $banner = __read_avail($sock, $timeout);

        die "got unexpected qemu monitor banner\n"
            if $banner !~ m/^QEMU\s+(\S+)\s+monitor\s/;

        my $select = IO::Select->new();
        $select->add($sock);

        my @writable = $select->can_write($timeout);
        die "monitor write error - timeout" if !scalar(@writable);

        my $fullcmd = "$cmdstr\r";

        # syslog('info', "VM $vmid monitor command: $cmdstr");

        my $written = $sock->syswrite($fullcmd);
        if (!$written || ($written != length($fullcmd))) {
            die "monitor write error - $!";
        }

        # leaves the eval only; the sub then returns the still undefined $res
        return if ($cmdstr eq 'q') || ($cmdstr eq 'quit');

        if ($is_migrate) {
            $timeout = 60*60; # 1 hour
        } elsif ($cmdstr =~ m/^(eject|change)/) {
            $timeout = 60; # note: cdrom mount command is slow
        } else {
            $timeout = 20;
        }

        if ($res = __read_avail($sock, $timeout)) {

            my @lines = split("\r?\n", $res);

            shift @lines if $lines[0] !~ m/^unknown command/; # skip echo

            $res = join("\n", @lines) . "\n";
        }
    };

    if (my $err = $@) {
        syslog("err", "VM $vmid monitor command failed - $err");
        die $err;
    }

    return $res;
}
3535
c1175c92
AD
# Resize a volume and, for a running VM, tell qemu about the new size.
# Stops early when PVE::Storage::volume_resize() returns false or when the
# VM is not running; otherwise sends 'block_resize' with the integer size.
sub qemu_block_resize {
    my ($vmid, $deviceid, $storecfg, $volid, $size) = @_;

    my $is_running = check_running($vmid);

    my $resized = PVE::Storage::volume_resize($storecfg, $volid, $size, $is_running);
    return if !$resized;

    return if !$is_running;

    return vm_mon_cmd($vmid, "block_resize", device => $deviceid, size => int($size));
}
3548
1ab0057c
AD
# Snapshot a volume; for a running VM the snapshot is taken through qemu.
# Stops early when PVE::Storage::volume_snapshot() returns false or when
# the VM is not running; otherwise sends 'snapshot-drive' to the monitor.
sub qemu_volume_snapshot {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $is_running = check_running($vmid);

    my $storage_res = PVE::Storage::volume_snapshot($storecfg, $volid, $snap, $is_running);
    return if !$storage_res;

    return if !$is_running;

    return vm_mon_cmd($vmid, "snapshot-drive", device => $deviceid, name => $snap);
}
3561
fc46aff9
AD
# Delete a volume snapshot; for a running VM the deletion goes through qemu.
# Stops early when PVE::Storage::volume_snapshot_delete() returns false or
# when the VM is not running; otherwise sends 'delete-drive-snapshot'.
sub qemu_volume_snapshot_delete {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $is_running = check_running($vmid);

    my $storage_res = PVE::Storage::volume_snapshot_delete($storecfg, $volid, $snap, $is_running);
    return if !$storage_res;

    return if !$is_running;

    return vm_mon_cmd($vmid, "delete-drive-snapshot", device => $deviceid, name => $snap);
}
3573
264e519f
DM
# Set the migration capabilities of a VM.
# Every capability reported by 'query-migrate-capabilities' is sent back
# through 'migrate-set-capabilities', switched on only if it is marked
# with a true value in the table below (currently just "auto-converge").
sub set_migration_caps {
    my ($vmid) = @_;

    my %enabled_cap = (
        "auto-converge" => 1,
        "xbzrle" => 0,
        "x-rdma-pin-all" => 0,
        "zero-blocks" => 0,
    );

    my $supported_capabilities = vm_mon_cmd_nocheck($vmid, "query-migrate-capabilities");

    my @cap_list;
    foreach my $entry (@$supported_capabilities) {
        my $cap_name = $entry->{capability};
        my $cap_state = $enabled_cap{$cap_name} ? JSON::true : JSON::false;
        push @cap_list, { capability => $cap_name, state => $cap_state };
    }

    vm_mon_cmd_nocheck($vmid, "migrate-set-capabilities", capabilities => \@cap_list);
}
a89fded1 3597
3a11fadb
DM
3598# hotplug changes in [PENDING]
3599# $selection hash can be used to only apply specified options, for
3600# example: { cores => 1 } (only apply changed 'cores')
3601# $errors ref is used to return error messages
# Apply pending configuration changes to a running VM where possible.
#
# Works in three steps, writing and reloading the config after each
# successful change:
#  1. pending 'name', 'hotplug', 'onboot' and 'shares' values are
#     committed unconditionally,
#  2. pending deletes of 'tablet', 'cores' and 'netN' are hot-applied,
#  3. pending values of 'tablet', 'cores', 'balloon' and 'netN' are
#     hot-applied.
# Steps 2 and 3 honour $selection (hash of option names to consider, all
# options when not set). Options that cannot be hot-applied stay pending.
# Error messages are stored in the $errors hash, keyed by option name.
sub vmconfig_hotplug_pending {
    my ($vmid, $conf, $storecfg, $selection, $errors) = @_;

    my $defaults = load_defaults();

    my $add_error = sub {
        my ($opt, $msg) = @_;
        $errors->{$opt} = "hotplug problem - $msg";
    };

    # commit values which do not have any impact on running VM first
    # Note: those options cannot raise errors, so we do not care about
    # $selection and always apply them.
    my %no_impact = map { $_ => 1 } qw(name hotplug onboot shares);
    my @instant = grep { $no_impact{$_} } keys %{$conf->{pending}};

    foreach my $opt (@instant) { # add/change
        $conf->{$opt} = $conf->{pending}->{$opt};
        delete $conf->{pending}->{$opt};
    }

    if (scalar(@instant)) {
        update_config_nolock($vmid, $conf, 1);
        $conf = load_config($vmid); # update/reload
    }

    my $hotplug = $defaults->{hotplug};
    $hotplug = $conf->{hotplug} if defined($conf->{hotplug});

    # pending deletes
    my @delete = PVE::Tools::split_list($conf->{pending}->{delete});
    foreach my $opt (@delete) {
        next if $selection && !$selection->{$opt};

        eval {
            my $is_net = ($opt =~ m/^net(\d+)$/);

            # only tablet, cores and netX can be handled here, and all of
            # them need the hotplug feature
            die "skip\n" if !($opt eq 'tablet' || $opt eq 'cores' || $is_net);
            die "skip\n" if !$hotplug;

            if ($opt eq 'tablet') {
                # deleting the option means falling back to the default
                if ($defaults->{tablet}) {
                    vm_deviceplug($storecfg, $conf, $vmid, $opt);
                } else {
                    vm_deviceunplug($vmid, $conf, $opt);
                }
            } elsif ($opt eq 'cores') {
                qemu_cpu_hotplug($vmid, $conf, 1);
            } else {
                vm_deviceunplug($vmid, $conf, $opt);
            }
        };
        my $err = $@;
        if ($err) {
            $add_error->($opt, $err) if $err ne "skip\n";
            next;
        }

        # save new config if hotplug was successful
        delete $conf->{$opt};
        vmconfig_undelete_pending_option($conf, $opt);
        update_config_nolock($vmid, $conf, 1);
        $conf = load_config($vmid); # update/reload
    }

    # pending adds/changes
    foreach my $opt (keys %{$conf->{pending}}) {
        next if $selection && !$selection->{$opt};

        my $value = $conf->{pending}->{$opt};

        eval {
            if ($opt eq 'tablet') {
                die "skip\n" if !$hotplug;
                if ($value == 1) {
                    vm_deviceplug($storecfg, $conf, $vmid, $opt);
                } elsif ($value == 0) {
                    vm_deviceunplug($vmid, $conf, $opt);
                }
            } elsif ($opt eq 'cores') {
                die "skip\n" if !$hotplug;
                qemu_cpu_hotplug($vmid, $conf, $value);
            } elsif ($opt eq 'balloon') {
                # allow manual ballooning if shares is set to zero
                my $manual = defined($conf->{shares}) && ($conf->{shares} == 0);
                die "skip\n" if !$manual;
                my $balloon = $conf->{pending}->{balloon} || $conf->{memory} || $defaults->{memory};
                vm_mon_cmd($vmid, "balloon", value => $balloon*1024*1024);
            } elsif ($opt =~ m/^net(\d+)$/) {
                # some changes can be done without hotplug
                vmconfig_update_net($storecfg, $conf, $vmid, $opt, $value);
            } else {
                die "skip\n"; # skip non-hot-pluggable options
            }
        };
        my $err = $@;
        if ($err) {
            $add_error->($opt, $err) if $err ne "skip\n";
            next;
        }

        # save new config if hotplug was successful
        $conf->{$opt} = $value;
        delete $conf->{pending}->{$opt};
        update_config_nolock($vmid, $conf, 1);
        $conf = load_config($vmid); # update/reload
    }
}
055d554d
DM
3701
# Apply all pending configuration changes to the stored config (cold plug).
#
# First every option listed in the pending 'delete' list is removed, then
# every pending value is copied into the config. When a drive option is
# deleted or replaced, its old value is first handed to
# vmconfig_register_unused_drive(). The config is reloaded before and
# written after each single option.
# Dies with "internal error" if an 'unused*' option is in the delete list.
sub vmconfig_apply_pending {
    my ($vmid, $conf, $storecfg) = @_;

    # cold plug

    my @delete = PVE::Tools::split_list($conf->{pending}->{delete});
    foreach my $opt (@delete) { # delete
        die "internal error" if $opt =~ m/^unused/;
        $conf = load_config($vmid); # update/reload

        if (defined($conf->{$opt})) {
            if (valid_drivename($opt)) {
                vmconfig_register_unused_drive($storecfg, $vmid, $conf, parse_drive($opt, $conf->{$opt}));
            }
            vmconfig_undelete_pending_option($conf, $opt);
            delete $conf->{$opt};
        } else {
            # option is not set at all, just drop the delete request
            vmconfig_undelete_pending_option($conf, $opt);
        }

        update_config_nolock($vmid, $conf, 1);
    }

    $conf = load_config($vmid); # update/reload

    foreach my $opt (keys %{$conf->{pending}}) { # add/change
        $conf = load_config($vmid); # update/reload

        my $unchanged = defined($conf->{$opt}) && ($conf->{$opt} eq $conf->{pending}->{$opt});

        if (!$unchanged) {
            if (valid_drivename($opt) && defined($conf->{$opt})) {
                vmconfig_register_unused_drive($storecfg, $vmid, $conf, parse_drive($opt, $conf->{$opt}));
            }
            $conf->{$opt} = $conf->{pending}->{$opt};
        }

        delete $conf->{pending}->{$opt};
        update_config_nolock($vmid, $conf, 1);
    }
}
3745
3eec5767
DM
# Numeric "not equal" that tolerates undefined operands:
# two undefined values are equal (0), exactly one undefined value is
# different (1), otherwise the result of '!=' is returned.
my $safe_num_ne = sub {
    my ($left, $right) = @_;

    if (defined($left) && defined($right)) {
        return $left != $right;
    }

    return (defined($left) || defined($right)) ? 1 : 0;
};
3755
# String "not equal" that tolerates undefined operands:
# two undefined values are equal (0), exactly one undefined value is
# different (1), otherwise the result of 'ne' is returned.
my $safe_string_ne = sub {
    my ($left, $right) = @_;

    if (defined($left) && defined($right)) {
        return $left ne $right;
    }

    return (defined($left) || defined($right)) ? 1 : 0;
};
3765
# Apply a changed 'netN' setting ($value) to a running VM.
#
# If the option is already configured and model, MAC address, queues or
# the bridge/nat mode changed, the old device is hot-unplugged (dies with
# "skip" when hotplug is disabled in $conf). Otherwise rate limit and
# bridge/tag/firewall changes are applied to the tap device
# "tap<vmid>i<N>" directly. In every case vm_deviceplug() is called at
# the end with the new settings.
sub vmconfig_update_net {
    my ($storecfg, $conf, $vmid, $opt, $value) = @_;

    my $newnet = parse_net($value);

    if ($conf->{$opt}) {
        my $oldnet = parse_net($conf->{$opt});

        my $needs_replug =
            $safe_string_ne->($oldnet->{model}, $newnet->{model}) ||
            $safe_string_ne->($oldnet->{macaddr}, $newnet->{macaddr}) ||
            $safe_num_ne->($oldnet->{queues}, $newnet->{queues}) ||
            !($newnet->{bridge} && $oldnet->{bridge}); # bridge/nat mode change

        if ($needs_replug) {

            # for non online change, we try to hot-unplug
            die "skip\n" if !$conf->{hotplug};
            vm_deviceunplug($vmid, $conf, $opt);

        } else {

            my ($netid) = $opt =~ m/net(\d+)/;
            die "internal error" if !defined($netid);
            my $iface = "tap${vmid}i$netid";

            if ($safe_num_ne->($oldnet->{rate}, $newnet->{rate})) {
                PVE::Network::tap_rate_limit($iface, $newnet->{rate});
            }

            my $replug_tap =
                $safe_string_ne->($oldnet->{bridge}, $newnet->{bridge}) ||
                $safe_num_ne->($oldnet->{tag}, $newnet->{tag}) ||
                $safe_num_ne->($oldnet->{firewall}, $newnet->{firewall});

            if ($replug_tap) {
                PVE::Network::tap_unplug($iface);
                PVE::Network::tap_plug($iface, $newnet->{bridge}, $newnet->{tag}, $newnet->{firewall});
            }
        }
    }

    return vm_deviceplug($storecfg, $conf, $vmid, $opt, $newnet);
}
3802
# Start VM $vmid. All work happens while holding the VM config lock.
#
# Parameters:
#   $storecfg      - storage configuration handed to the storage layer
#   $vmid          - id of the VM to start
#   $statefile     - 'tcp' to wait for an incoming migration stream, any other
#                    true value is passed to the emulator via -loadstate
#   $skiplock      - skip the check_lock() test on the VM config
#   $migratedfrom  - source node when started as a migration target
#   $paused        - start with -S when no state file is given
#   $forcemachine  - forwarded to config_to_command()
#   $spice_ticket  - spice password set on a migrated VM that has a spice port
#
# Dies when the VM is a template, is locked, is already running, when a host
# PCI device cannot be prepared, or when the emulator fails to start.
sub vm_start {
    my ($storecfg, $vmid, $statefile, $skiplock, $migratedfrom, $paused, $forcemachine, $spice_ticket) = @_;

    lock_config($vmid, sub {
        my $conf = load_config($vmid, $migratedfrom);

        if (is_template($conf)) {
            die "you can't start a vm if it's a template\n";
        }

        check_lock($conf) if !$skiplock;

        if (check_running($vmid, undef, $migratedfrom)) {
            die "VM $vmid already running\n";
        }

        # pending changes are only applied when we do not resume from a state
        if (!$statefile && scalar(keys %{$conf->{pending}})) {
            vmconfig_apply_pending($vmid, $conf, $storecfg);
            $conf = load_config($vmid); # update/reload
        }

        my $defaults = load_defaults();

        # set environment variable useful inside network script
        if ($migratedfrom) {
            $ENV{PVE_MIGRATED_FROM} = $migratedfrom;
        }

        my ($cmd, $vollist, $spice_port) = config_to_command($storecfg, $vmid, $conf, $defaults, $forcemachine);

        my $migrate_port = 0;
        my $migrate_uri;
        my $incoming_tcp = $statefile && $statefile eq 'tcp';

        if ($incoming_tcp) {
            # listen on localhost unless unsecure migration is configured
            my $localip = "localhost";
            my $datacenterconf = PVE::Cluster::cfs_read_file('datacenter.cfg');
            if ($datacenterconf->{migration_unsecure}) {
                my $nodename = PVE::INotify::nodename();
                $localip = PVE::Cluster::remote_node_ip($nodename, 1);
            }
            $migrate_port = PVE::Tools::next_migrate_port();
            $migrate_uri = "tcp:${localip}:${migrate_port}";
            push @$cmd, '-incoming', $migrate_uri, '-S';
        } elsif ($statefile) {
            push @$cmd, '-loadstate', $statefile;
        } elsif ($paused) {
            push @$cmd, '-S';
        }

        # host pci devices
        foreach my $i (0 .. $MAX_HOSTPCI_DEVICES - 1) {
            my $hostpci = parse_hostpci($conf->{"hostpci$i"});
            next if !$hostpci;

            my $use_vfio = $hostpci->{driver} && $hostpci->{driver} eq "vfio";

            foreach my $pcidevice (@{$hostpci->{pciid}}) {
                my $pciid = $pcidevice->{id}.".".$pcidevice->{function};

                my $devinfo = pci_device_info("0000:$pciid");
                die "IOMMU not present\n" if !check_iommu_support();
                die "no pci device info for device '$pciid'\n" if !$devinfo;

                if ($use_vfio) {
                    pci_dev_group_bind_to_vfio($pciid)
                        or die "can't unbind/bind pci group to vfio '$pciid'\n";
                } else {
                    pci_dev_bind_to_stub($devinfo)
                        or die "can't unbind/bind to stub pci device '$pciid'\n";
                }

                if ($devinfo->{has_fl_reset} && !pci_dev_reset($devinfo)) {
                    die "can't reset pci device '$pciid'\n";
                }
            }
        }

        PVE::Storage::activate_volumes($storecfg, $vollist);

        # no timeout when a state has to be loaded/received
        my $start_timeout = $statefile ? undef : 30;
        eval {
            run_command($cmd, timeout => $start_timeout, umask => 0077);
        };
        if (my $err = $@) {
            die "start failed: $err";
        }

        print "migration listens on $migrate_uri\n" if $migrate_uri;

        # a VM restored from a state file has to be continued explicitly
        if ($statefile && !$incoming_tcp) {
            eval { vm_mon_cmd_nocheck($vmid, "cont"); };
            warn $@ if $@;
        }

        if ($migratedfrom) {

            eval { set_migration_caps($vmid); };
            warn $@ if $@;

            if ($spice_port) {
                print "spice listens on port $spice_port\n";
                if ($spice_ticket) {
                    vm_mon_cmd_nocheck($vmid, "set_password", protocol => 'spice', password => $spice_ticket);
                    vm_mon_cmd_nocheck($vmid, "expire_password", protocol => 'spice', time => "+30");
                }
            }

        } else {

            if (!$statefile && (!defined($conf->{balloon}) || $conf->{balloon})) {
                # the configured balloon value is multiplied up before use
                if ($conf->{balloon}) {
                    vm_mon_cmd_nocheck($vmid, "balloon", value => $conf->{balloon}*1024*1024);
                }
                vm_mon_cmd_nocheck(
                    $vmid, 'qom-set',
                    path => "machine/peripheral/balloon0",
                    property => "guest-stats-polling-interval",
                    value => 2,
                );
            }
        }
    });
}
3912
0eedc444
AD
# Send the QMP command $execute to VM $vmid, using %params as its arguments.
# Returns the result of vm_qmp_command().
sub vm_mon_cmd {
    my ($vmid, $execute, %params) = @_;

    return vm_qmp_command($vmid, {
        execute   => $execute,
        arguments => \%params,
    });
}
3919
# Same as vm_mon_cmd(), but calls vm_qmp_command() with its $nocheck
# argument set to 1.
sub vm_mon_cmd_nocheck {
    my ($vmid, $execute, %params) = @_;

    my $request = {
        execute   => $execute,
        arguments => \%params,
    };

    return vm_qmp_command($vmid, $request, 1);
}
3926
# Execute the QMP command $cmd (hash with 'execute' and optional 'arguments')
# on VM $vmid and return the result.
#
# A true 'timeout' entry inside the arguments is removed from the command and
# used as the client timeout instead. $nocheck is forwarded to check_running().
#
# If no QMP socket exists but an old style monitor socket does, only commands
# without arguments can be run (through vm_monitor_command()).
#
# Errors are written to syslog and then re-thrown.
sub vm_qmp_command {
    my ($vmid, $cmd, $nocheck) = @_;

    my $res;

    my $arguments = $cmd->{arguments};

    my $timeout;
    if ($arguments && $arguments->{timeout}) {
        $timeout = delete $arguments->{timeout};
    }

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);
        my $sname = qmp_socket($vmid);
        if (-e $sname) { # test if VM is reasonably new and supports qmp/qga
            my $qmpclient = PVE::QMPClient->new();

            $res = $qmpclient->cmd($vmid, $cmd, $timeout);
        } elsif (-e "${var_run_tmpdir}/$vmid.mon") {
            # 'arguments' is optional (e.g. { execute => "quit" }), so it must
            # not be dereferenced unconditionally under 'use strict'
            die "can't execute complex command on old monitor - stop/start your vm to fix the problem\n"
                if $arguments && scalar(%$arguments);
            vm_monitor_command($vmid, $cmd->{execute}, $nocheck);
        } else {
            die "unable to open monitor socket\n";
        }
    };
    if (my $err = $@) {
        syslog("err", "VM $vmid qmp command failed - $err");
        die $err;
    }

    return $res;
}
3960
9df5cbcc
DM
# Run the human monitor command line $cmdline on VM $vmid by wrapping it into
# the QMP 'human-monitor-command'. Returns the result of vm_qmp_command().
sub vm_human_monitor_command {
    my ($vmid, $cmdline) = @_;

    my %request = (
        execute => 'human-monitor-command',
        arguments => { 'command-line' => $cmdline },
    );

    return vm_qmp_command($vmid, \%request);
}
3973
1e3baf05
DM
# Return the command built by config_to_command() for VM $vmid as a single
# string, with the individual arguments joined by one space.
sub vm_commandline {
    my ($storecfg, $vmid) = @_;

    my $conf = load_config($vmid);
    my $defaults = load_defaults();

    # config_to_command() is deliberately called in scalar context here
    my $argv = config_to_command($storecfg, $vmid, $conf, $defaults);

    return join(' ', @$argv);
}
3985
# Send 'system_reset' to VM $vmid while holding the config lock.
# The check_lock() test is skipped when $skiplock is true.
sub vm_reset {
    my ($vmid, $skiplock) = @_;

    my $code = sub {
        my $conf = load_config($vmid);

        if (!$skiplock) {
            check_lock($conf);
        }

        vm_mon_cmd($vmid, "system_reset");
    };

    return lock_config($vmid, $code);
}
3998
# Collect the volume IDs referenced by $conf. Entries that are absolute paths
# and entries PVE::Storage::parse_volume_id() cannot resolve to a storage ID
# are left out. Returns an array reference.
sub get_vm_volumes {
    my ($conf) = @_;

    my @volumes;

    foreach_volid($conf, sub {
        my ($volid, $is_cdrom) = @_;

        # absolute paths are not storage volumes
        return if $volid =~ m|^/|;

        my ($storeid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        push @volumes, $volid;
    });

    return \@volumes;
}
4016
# Clean up after VM $vmid was stopped: remove the fairsched node, deactivate
# the VM volumes (unless $keepActive is set) and unlink the per-VM runtime
# files. Errors are only reported with warn.
sub vm_stop_cleanup {
    my ($storecfg, $vmid, $conf, $keepActive) = @_;

    eval {
        fairsched_rmnod($vmid); # try to destroy group

        if (!$keepActive) {
            PVE::Storage::deactivate_volumes($storecfg, get_vm_volumes($conf));
        }

        for my $ext (qw(mon qmp pid vnc qga)) {
            unlink "/var/run/qemu-server/${vmid}.$ext";
        }
    };
    if ($@) {
        warn $@; # avoid errors - just warn
    }
}
4034
# Stop or shut down VM $vmid.
#
# Note: use $nocheck to skip tests if VM configuration file exists.
# We need that when migrating VMs to other nodes (files already moved)
# Note: we set $keepActive in vzdump stop mode - volumes need to stay active
#
# Without $shutdown the VM is asked to 'quit' and $force defaults to 1. With
# $shutdown a guest shutdown/powerdown is requested. If the VM does not go
# away within $timeout seconds (default 60, or the 'down' value of the
# 'startup' setting) it is sent SIGTERM when $force is set, and SIGKILL if it
# is still there 10 seconds later.
# With $migratedfrom set the process is simply sent SIGTERM and cleaned up.
sub vm_stop {
    my ($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive, $migratedfrom) = @_;

    if (!defined($force) && !$shutdown) {
        $force = 1;
    }

    if ($migratedfrom) {
        my $pid = check_running($vmid, $nocheck, $migratedfrom);
        kill 15, $pid if $pid;
        my $conf = load_config($vmid, $migratedfrom);
        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive);
        return;
    }

    # poll once per second until the VM is gone or $limit seconds have passed;
    # returns true when the limit was reached
    my $wait_timed_out = sub {
        my ($limit) = @_;

        my $elapsed = 0;
        while (($elapsed < $limit) && check_running($vmid, $nocheck)) {
            $elapsed++;
            sleep 1;
        }

        return $elapsed >= $limit;
    };

    lock_config($vmid, sub {

        my $pid = check_running($vmid, $nocheck);
        return if !$pid;

        my $conf;
        if (!$nocheck) {
            $conf = load_config($vmid);
            check_lock($conf) if !$skiplock;
            if (!defined($timeout) && $shutdown && $conf->{startup}) {
                my $opts = parse_startup($conf->{startup});
                $timeout = $opts->{down} if $opts->{down};
            }
        }

        $timeout = 60 if !defined($timeout);

        eval {
            if (!$shutdown) {
                vm_qmp_command($vmid, { execute => "quit" }, $nocheck);
            } elsif (!$nocheck && $conf->{agent}) {
                vm_qmp_command($vmid, { execute => "guest-shutdown" }, $nocheck);
            } else {
                vm_qmp_command($vmid, { execute => "system_powerdown" }, $nocheck);
            }
        };
        my $err = $@;

        if ($err) {
            die "VM quit/powerdown failed\n" if !$force;

            warn "VM quit/powerdown failed - terminating now with SIGTERM\n";
            kill 15, $pid;
        } elsif ($wait_timed_out->($timeout)) {
            die "VM quit/powerdown failed - got timeout\n" if !$force;

            warn "VM still running - terminating now with SIGTERM\n";
            kill 15, $pid;
        } else {
            # VM went away in time
            vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
            return;
        }

        # wait again
        $timeout = 10;

        if ($wait_timed_out->($timeout)) {
            warn "VM still running - terminating now with SIGKILL\n";
            kill 9, $pid;
            sleep 1;
        }

        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
    });
}
4126
# Send 'stop' to VM $vmid while holding the config lock.
# check_lock() is skipped when $skiplock is set or the config carries the
# 'backup' lock.
sub vm_suspend {
    my ($vmid, $skiplock) = @_;

    my $code = sub {
        my $conf = load_config($vmid);

        my $backup_locked = $conf->{lock} && $conf->{lock} eq 'backup';
        if (!$skiplock && !$backup_locked) {
            check_lock($conf);
        }

        vm_mon_cmd($vmid, "stop");
    };

    return lock_config($vmid, $code);
}
4139
# Send 'cont' to VM $vmid while holding the config lock.
# check_lock() is skipped when $skiplock is set or the config carries the
# 'backup' lock.
sub vm_resume {
    my ($vmid, $skiplock) = @_;

    my $code = sub {
        my $conf = load_config($vmid);

        my $backup_locked = $conf->{lock} && $conf->{lock} eq 'backup';
        if (!$skiplock && !$backup_locked) {
            check_lock($conf);
        }

        vm_mon_cmd($vmid, "cont");
    };

    return lock_config($vmid, $code);
}
4152
5fdbe4f0
DM
# Send the key (combination) $key to VM $vmid while holding the config lock.
# $skiplock is accepted but not used by this function.
sub vm_sendkey {
    my ($vmid, $skiplock, $key) = @_;

    my $code = sub {
        # the loaded config itself is not used afterwards
        my $conf = load_config($vmid);

        # there is no qmp command, so we use the human monitor command
        vm_human_monitor_command($vmid, "sendkey $key");
    };

    return lock_config($vmid, $code);
}
4164
# Destroy VM $vmid while holding the config lock. Dies if the VM is locked
# (unless $skiplock is set) or still running.
sub vm_destroy {
    my ($storecfg, $vmid, $skiplock) = @_;

    my $code = sub {
        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        if (check_running($vmid)) {
            die "VM $vmid is running - destroy failed\n";
        }

        fairsched_rmnod($vmid); # try to destroy group
        destroy_vm($storecfg, $vmid);
    };

    return lock_config($vmid, $code);
}
4182
1e3baf05
DM
4183# pci helpers
4184
# Write $buf to $filename (opened in "w" mode).
# Returns undef if the file cannot be opened, otherwise the result of print.
# The result of close is intentionally not taken into account.
sub file_write {
    my ($filename, $buf) = @_;

    my $out = IO::File->new($filename, "w");
    if (!$out) {
        return undef;
    }

    my $printed = print {$out} $buf;
    $out->close();

    return $printed;
}
4197
# Read basic information about PCI device $name ("dddd:bb:ss.f", lower case
# hex) from sysfs.
# Returns undef if the name is malformed or the irq/vendor/device attributes
# cannot be read in the expected form. Otherwise returns a hash reference with
# name, vendor, product (both without the "0x" prefix), domain, bus, slot,
# func, irq and has_fl_reset (whether a 'reset' file exists for the device).
sub pci_device_info {
    my ($name) = @_;

    if ($name !~ m/^([a-f0-9]{4}):([a-f0-9]{2}):([a-f0-9]{2})\.([a-f0-9])$/) {
        return undef;
    }
    my ($domain, $bus, $slot, $func) = ($1, $2, $3, $4);

    my $irq = file_read_firstline("$pcisysfs/devices/$name/irq");
    return undef if !(defined($irq) && $irq =~ m/^\d+$/);

    # vendor and device id must carry a "0x" prefix, which is stripped
    my $vendor = file_read_firstline("$pcisysfs/devices/$name/vendor");
    return undef if !defined($vendor);
    return undef if !($vendor =~ s/^0x//);

    my $product = file_read_firstline("$pcisysfs/devices/$name/device");
    return undef if !defined($product);
    return undef if !($product =~ s/^0x//);

    my $has_reset = -f "$pcisysfs/devices/$name/reset" || 0;

    return {
        name => $name,
        vendor => $vendor,
        product => $product,
        domain => $domain,
        bus => $bus,
        slot => $slot,
        func => $func,
        irq => $irq,
        has_fl_reset => $has_reset,
    };
}
4229
# Write "1" to the sysfs 'reset' file of the device described by $dev
# (a hash as returned by pci_device_info()). Returns the result of file_write().
sub pci_dev_reset {
    my ($dev) = @_;

    my $devname = $dev->{name};
    my $reset_file = "$pcisysfs/devices/$devname/reset";

    return file_write($reset_file, "1");
}
4239
# Bind the device described by $dev (see pci_device_info()) to the pci-stub
# driver. Returns 1 if it is already bound, undef if one of the required
# sysfs writes fails, otherwise whether the device directory shows up below
# the pci-stub driver afterwards.
sub pci_dev_bind_to_stub {
    my ($dev) = @_;

    my $name = $dev->{name};

    my $bound_dir = "$pcisysfs/drivers/pci-stub/$name";
    return 1 if -d $bound_dir;

    # register the vendor/product id with the driver
    my $id = "$dev->{vendor} $dev->{product}";
    file_write("$pcisysfs/drivers/pci-stub/new_id", $id) or return undef;

    # a failed unbind only matters if the unbind file actually exists
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    my $bind = "$pcisysfs/drivers/pci-stub/bind";
    return undef if !-d $bound_dir && !file_write($bind, $name);

    return -d $bound_dir;
}
4263
000fc0a2
SP
# Bind the device described by $dev (see pci_device_info()) to the vfio-pci
# driver, running modprobe for vfio-pci first if its sysfs directory is
# missing. Dies if the driver directory is still missing afterwards.
# Returns 1 if the device is already bound, undef if one of the required
# sysfs writes fails, otherwise whether the device directory shows up below
# the vfio-pci driver afterwards.
sub pci_dev_bind_to_vfio {
    my ($dev) = @_;

    my $name = $dev->{name};

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null") if !-d $vfio_basedir;
    if (!-d $vfio_basedir) {
        die "Cannot find vfio-pci module!\n";
    }

    my $bound_dir = "$vfio_basedir/$name";
    return 1 if -d $bound_dir;

    # register the vendor/product id with the driver
    my $id = "$dev->{vendor} $dev->{product}";
    file_write("$vfio_basedir/new_id", $id) or return undef;

    # a failed unbind only matters if the unbind file actually exists
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    my $bind = "$vfio_basedir/bind";
    return undef if !-d $bound_dir && !file_write($bind, $name);

    return -d $bound_dir;
}
4294
# Bind every device in the IOMMU group of PCI device $pciid ("bb:ss.f",
# without the 0000 domain) to the vfio-pci driver.
# Runs modprobe for vfio-pci if its sysfs directory is missing.
# Dies if the driver cannot be found, the IOMMU group cannot be read, a group
# member has an invalid name, no device info can be read for it, or binding
# fails. Returns 1 on success.
sub pci_dev_group_bind_to_vfio {
    my ($pciid) = @_;

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    if (!-d $vfio_basedir) {
        system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null");
    }
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    # get IOMMU group devices
    opendir(my $D, "$pcisysfs/devices/0000:$pciid/iommu_group/devices/") || die "Cannot open iommu_group: $!\n";
    my @devs = grep /^0000:/, readdir($D);
    closedir($D);

    foreach my $member (@devs) {
        $member =~ m/^([:\.\da-f]+)$/ or die "PCI ID $member not valid!\n";
        my $info = pci_device_info($1);
        # without device info pci_dev_bind_to_vfio() would test the driver
        # directory itself and wrongly report the device as already bound
        die "no pci device info for device '$member'\n" if !$info;
        pci_dev_bind_to_vfio($info) || die "Cannot bind $member to vfio\n";
    }

    return 1;
}
4318
# Return the ",bus=pci.<bus>,addr=<hex addr>" suffix for the device with the
# fixed id $id, or an empty string for ids without a reserved slot.
# If $bridges (hash reference) is given, the bus number used is recorded in it.
sub print_pci_addr {
    my ($id, $bridges) = @_;

    # reserved slots on bus 0
    my %root_addr = (
        piix3    => 1,
        #addr2 : first videocard
        balloon0 => 3,
        watchdog => 4,
        scsihw0  => 5,
        scsihw1  => 6,
        ahci0    => 7,
        qga0     => 8,
        spice    => 9,
        virtio0  => 10,
        virtio1  => 11,
        virtio2  => 12,
        virtio3  => 13,
        virtio4  => 14,
        virtio5  => 15,
        hostpci0 => 16,
        hostpci1 => 17,
        net0     => 18,
        net1     => 19,
        net2     => 20,
        net3     => 21,
        net4     => 22,
        net5     => 23,
        vga1     => 24,
        vga2     => 25,
        vga3     => 26,
        hostpci2 => 27,
        hostpci3 => 28,
        #addr29 : usb-host (pve-usb.cfg)
        'pci.1'  => 30,
        'pci.2'  => 31,
    );

    # devices on bus 1 and bus 2, listed in slot order starting at addr 1
    my @bus1 = qw(
        net6 net7 net8 net9 net10 net11 net12 net13 net14 net15 net16 net17 net18
        net19 net20 net21 net22 net23 net24 net25 net26 net27 net28 net29 net30 net31
    );
    my @bus2 = qw(
        virtio6 virtio7 virtio8 virtio9 virtio10
        virtio11 virtio12 virtio13 virtio14 virtio15
    );

    my %devices;
    foreach my $dev (keys %root_addr) {
        $devices{$dev} = { bus => 0, addr => $root_addr{$dev} };
    }
    foreach my $idx (0 .. $#bus1) {
        $devices{$bus1[$idx]} = { bus => 1, addr => $idx + 1 };
    }
    foreach my $idx (0 .. $#bus2) {
        $devices{$bus2[$idx]} = { bus => 2, addr => $idx + 1 };
    }

    my $slot = $devices{$id};
    return '' if !$slot;

    my $addr = sprintf("0x%x", $slot->{addr});
    my $bus = $slot->{bus};
    $bridges->{$bus} = 1 if $bridges;

    return ",bus=pci.$bus,addr=$addr";
}
4402
2e3b7e2a
AD
# Return the ",bus=<pcie port>,addr=<hex addr>" suffix for the device with
# the fixed id $id, or an empty string for ids without a reserved port.
sub print_pcie_addr {
    my ($id) = @_;

    my %devices = (
        hostpci0 => { bus => "ich9-pcie-port-1", addr => 0 },
        hostpci1 => { bus => "ich9-pcie-port-2", addr => 0 },
        hostpci2 => { bus => "ich9-pcie-port-3", addr => 0 },
        hostpci3 => { bus => "ich9-pcie-port-4", addr => 0 },
    );

    my $port = $devices{$id};
    return '' if !$port;

    my $addr = sprintf("0x%x", $port->{addr});
    my $bus = $port->{bus};

    return ",bus=$bus,addr=$addr";
}
4422
3e16d5fc
DM
4423# vzdump restore implementation
4424
# Return the name of the first member of the tar archive $archive.
# Dies if the file does not exist, 'tar' cannot be started, or the listing
# is empty.
sub tar_archive_read_firstfile {
    my $archive = shift;

    die "ERROR: file '$archive' does not exist\n" if ! -f $archive;

    # try to detect archive type first
    # list form of open: the archive name never passes through a shell, so
    # quotes or other special characters in it are harmless
    my $pid = open(my $tarfh, '-|', 'tar', 'tf', $archive) ||
        die "unable to open file '$archive'\n";
    my $firstfile = <$tarfh>;
    # only the first line is needed - stop tar instead of reading the rest
    kill 15, $pid;
    close $tarfh;

    die "ERROR: archive contaions no data\n" if !$firstfile;
    chomp $firstfile;

    return $firstfile;
}
4442
ed221350
DM
# Remove the temporary volumes recorded in $statfile.
# Every line is expected to end in "vzdump:<name>:<volid>". Absolute paths are
# unlinked, everything else is freed with PVE::Storage::vdisk_free().
# Progress and failures are reported on STDERR; a failure for one volume does
# not stop the cleanup. Nothing beyond the initial message happens if
# $statfile cannot be opened.
sub tar_restore_cleanup {
    my ($storecfg, $statfile) = @_;

    print STDERR "starting cleanup\n";

    if (my $fd = IO::File->new($statfile, "r")) {
        while (defined(my $line = <$fd>)) {
            if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                my $volid = $2;
                eval {
                    if ($volid =~ m|^/|) {
                        # parentheses are required: 'unlink $volid || die'
                        # would never die because || binds to $volid
                        unlink($volid) || die "unlink failed - $!\n";
                    } else {
                        PVE::Storage::vdisk_free($storecfg, $volid);
                    }
                    print STDERR "temporary volume '$volid' sucessfuly removed\n";
                };
                print STDERR "unable to cleanup '$volid' - $@" if $@;
            } else {
                print STDERR "unable to parse line in statfile - $line";
            }
        }
        $fd->close();
    }
}
4468
# Restore VM $vmid from $archive.
# The archive format ('tar' or 'vma') is taken from $opts->{format} if set,
# otherwise it is guessed from the file name (default 'vma'). The compression
# method is always guessed from the file name.
# Dispatches to restore_tar_archive() or restore_vma_archive() and returns
# their result.
sub restore_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    my $format = $opts->{format};
    my $comp;

    if ($archive =~ m/\.tgz$/ || $archive =~ m/\.tar\.gz$/) {
        $format = 'tar' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.tar$/) {
        $format = 'tar' if !$format;
    } elsif ($archive =~ m/\.tar\.lzo$/) {
        # dots are escaped so that only a real ".tar.lzo" suffix matches
        $format = 'tar' if !$format;
        $comp = 'lzop';
    } elsif ($archive =~ m/\.vma$/) {
        $format = 'vma' if !$format;
    } elsif ($archive =~ m/\.vma\.gz$/) {
        $format = 'vma' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.vma\.lzo$/) {
        $format = 'vma' if !$format;
        $comp = 'lzop';
    } else {
        $format = 'vma' if !$format; # default
    }

    # the detected compression is only handed to the vma restore
    if ($format eq 'tar') {
        return restore_tar_archive($archive, $vmid, $user, $opts);
    } else {
        return restore_vma_archive($archive, $vmid, $user, $opts, $comp);
    }
}
4502
# Filter/convert one line of a backed up VM config and print the result to
# $outfd.
#
#   $cookie - state shared between calls; {netcount} is the index used for
#             the next converted 'vlanX' network device
#   $map    - maps drive names (e.g. 'virtio0') to the restored volume
#   $unique - if set, network devices get new random MAC addresses
#
# Backup marker comments and lock/unused/parent/template lines are dropped.
sub restore_update_config_line {
    my ($outfd, $cookie, $vmid, $map, $line, $unique) = @_;

    my @dropped = (
        qr/^\#qmdump\#/,
        qr/^\#vzdump\#/,
        qr/^lock:/,
        qr/^unused\d+:/,
        qr/^parent:/,
        qr/^template:/, # restored VM is never a template
    );
    foreach my $re (@dropped) {
        return if $line =~ $re;
    }

    if (($line =~ m/^(vlan(\d+)):\s*(\S+)\s*$/)) {
        # try to convert old 1.X settings
        my ($id, $ind, $ethcfg) = ($1, $2, $3);
        foreach my $devconfig (PVE::Tools::split_list($ethcfg)) {
            my ($model, $macaddr) = split(/\=/, $devconfig);
            if (!$macaddr || $unique) {
                $macaddr = PVE::Tools::random_ether_addr();
            }
            my $netstr = print_net({
                model => $model,
                bridge => "vmbr$ind",
                macaddr => $macaddr,
            });

            print $outfd "net$cookie->{netcount}: $netstr\n";
            $cookie->{netcount}++;
        }
    } elsif (($line =~ m/^(net\d+):\s*(\S+)\s*$/) && $unique) {
        my ($id, $netstr) = ($1, $2);
        my $net = parse_net($netstr);
        # only replace a MAC address that was set in the first place
        if ($net->{macaddr}) {
            $net->{macaddr} = PVE::Tools::random_ether_addr();
        }
        $netstr = print_net($net);
        print $outfd "$id: $netstr\n";
    } elsif ($line =~ m/^((ide|scsi|virtio|sata)\d+):\s*(\S+)\s*$/) {
        my ($virtdev, $value) = ($1, $3);
        if ($line =~ m/backup=no/) {
            # drives excluded from the backup are commented out
            print $outfd "#$line";
        } elsif ($virtdev && $map->{$virtdev}) {
            my $di = parse_drive($virtdev, $value);
            delete $di->{format}; # format can change on restore
            $di->{file} = $map->{$virtdev};
            $value = print_drive($vmid, $di);
            print $outfd "$virtdev: $value\n";
        } else {
            print $outfd $line;
        }
    } else {
        print $outfd $line;
    }
}
4553
# List the volumes PVE::Storage::vdisk_list() reports for $vmid.
# Returns a hash reference mapping volume ID to the volume info, extended by
# a 'path' entry. Entries without volid or size are skipped.
sub scan_volids {
    my ($cfg, $vmid) = @_;

    my $info = PVE::Storage::vdisk_list($cfg, undef, $vmid);

    my %volumes;
    foreach my $storeid (keys %$info) {
        foreach my $item (@{$info->{$storeid}}) {
            my $volid = $item->{volid};
            next if !$volid || !$item->{size};

            $item->{path} = PVE::Storage::path($cfg, $volid);
            $volumes{$volid} = $item;
        }
    }

    return \%volumes;
}
4570
a8e2f942
DM
# Count how often each disk path is referenced by the drives in $conf and,
# if $scan_snapshots is set, by the drives of all its snapshots.
# $skip_drive names a drive to ignore in the current config (it is not
# ignored inside snapshots). CD-ROM drives are not counted.
# Returns a hash reference mapping path to reference count.
sub get_used_paths {
    my ($vmid, $storecfg, $conf, $scan_snapshots, $skip_drive) = @_;

    my %count_of;

    my $scan_config = sub {
        my ($cref, $snapname) = @_;

        foreach my $key (keys %$cref) {
            my $value = $cref->{$key};
            next if !valid_drivename($key);
            next if $skip_drive && $key eq $skip_drive;

            my $drive = parse_drive($key, $value);
            next if !$drive || !$drive->{file} || drive_is_cdrom($drive);

            my $file = $drive->{file};
            if ($file =~ m!^/!) {
                # absolute path, use it as is
                $count_of{$file}++;
                next;
            }

            my ($storeid, $volname) = PVE::Storage::parse_volume_id($file, 1);
            next if !$storeid;
            my $scfg = PVE::Storage::storage_config($storecfg, $storeid, 1);
            next if !$scfg;
            my $path = PVE::Storage::path($storecfg, $file, $snapname);
            $count_of{$path}++;
        }
    };

    $scan_config->($conf);

    # snapshots are always scanned completely
    undef $skip_drive;

    if ($scan_snapshots) {
        my $snapshots = $conf->{snapshots};
        foreach my $snapname (keys %$snapshots) {
            $scan_config->($snapshots->{$snapname}, $snapname);
        }
    }

    return \%count_of;
}
4611
91bd6c90
DM
# Synchronize the drive entries of $conf with the volumes in $volid_hash
# (as returned by scan_volids()):
#  - refresh the 'size' of every non-CD-ROM drive whose volume is known
#  - drop 'unusedX' entries whose volume is in use by a drive
#  - add the remaining, unreferenced volumes as unused volumes
# $conf is modified in place. Returns 1 if anything changed, undef otherwise.
sub update_disksize {
    my ($vmid, $conf, $volid_hash) = @_;

    my $changes;

    my $used = {};

    # Note: it is allowed to define multiple storages with same path (alias), so
    # we need to check both 'volid' and real 'path' (two different volid can point
    # to the same path).

    my $usedpath = {};

    # update size info
    foreach my $opt (keys %$conf) {
        next if !valid_drivename($opt);

        my $drive = parse_drive($opt, $conf->{$opt});
        my $volid = $drive->{file};
        next if !$volid;

        $used->{$volid} = 1;
        my $volinfo = $volid_hash->{$volid};
        if ($volinfo && (my $path = $volinfo->{path})) {
            $usedpath->{$path} = 1;
        }

        next if drive_is_cdrom($drive);
        next if !$volinfo;

        $drive->{size} = $volinfo->{size};
        my $new = print_drive($vmid, $drive);
        if ($new ne $conf->{$opt}) {
            $changes = 1;
            $conf->{$opt} = $new;
        }
    }

    # remove 'unusedX' entry if volume is used
    foreach my $opt (keys %$conf) {
        next if $opt !~ m/^unused\d+$/;
        my $volid = $conf->{$opt};
        # plain ternary instead of 'my $path = ... if ...', whose behaviour
        # is undefined according to perlsyn
        my $path = $volid_hash->{$volid} ? $volid_hash->{$volid}->{path} : undef;
        if ($used->{$volid} || ($path && $usedpath->{$path})) {
            $changes = 1;
            delete $conf->{$opt};
        }
    }

    foreach my $volid (sort keys %$volid_hash) {
        next if $volid =~ m/vm-$vmid-state-/;
        next if $used->{$volid};
        my $path = $volid_hash->{$volid}->{path};
        next if !$path; # just to be sure
        next if $usedpath->{$path};
        $changes = 1;
        add_unused_volume($conf, $volid);
        $usedpath->{$path} = 1; # avoid to add more than once (aliases)
    }

    return $changes;
}
4674
# Rescan the storages and update disk sizes and unused volumes in the config
# of VM $vmid, or of every VM returned by config_list() if $vmid is undefined.
# Each config is updated under its config lock unless $nolock is set.
sub rescan {
    my ($vmid, $nolock) = @_;

    my $cfg = PVE::Cluster::cfs_read_file("storage.cfg");

    my $volid_hash = scan_volids($cfg, $vmid);

    my $updatefn = sub {
        my ($vmid) = @_;

        my $conf = load_config($vmid);

        check_lock($conf);

        # only consider the volumes that belong to this VM
        my $vm_volids = {};
        foreach my $volid (keys %$volid_hash) {
            my $info = $volid_hash->{$volid};
            next if !($info->{vmid} && $info->{vmid} == $vmid);
            $vm_volids->{$volid} = $info;
        }

        my $changes = update_disksize($vmid, $conf, $vm_volids);

        update_config_nolock($vmid, $conf, 1) if $changes;
    };

    # run the update for one VM, with or without taking the config lock
    my $update_vm = sub {
        my ($id) = @_;

        return $nolock ? $updatefn->($id) : lock_config($id, $updatefn, $id);
    };

    if (defined($vmid)) {
        $update_vm->($vmid);
    } else {
        my $vmlist = config_list();
        foreach my $id (keys %$vmlist) {
            $update_vm->($id);
        }
    }
}
4717
4718sub restore_vma_archive {
4719 my ($archive, $vmid, $user, $opts, $comp) = @_;
4720
4721 my $input = $archive eq '-' ? "<&STDIN" : undef;
4722 my $readfrom = $archive;
4723
4724 my $uncomp = '';
4725 if ($comp) {
4726 $readfrom = '-';
4727 my $qarchive = PVE::Tools::shellquote($archive);
4728 if ($comp eq 'gzip') {
4729 $uncomp = "zcat $qarchive|";
4730 } elsif ($comp eq 'lzop') {
4731 $uncomp = "lzop -d -c $qarchive|";
4732 } else {
4733 die "unknown compression method '$comp'\n";
4734 }
be190583 4735
91bd6c90
DM
4736 }
4737
4738 my $tmpdir = "/var/tmp/vzdumptmp$$";
4739 rmtree $tmpdir;
4740
4741 # disable interrupts (always do cleanups)
4742 local $SIG{INT} = $SIG{TERM} = $SIG{QUIT} = $SIG{HUP} = sub {
4743 warn "got interrupt - ignored\n";
4744 };
4745
4746 my $mapfifo = "/var/tmp/vzdumptmp$$.fifo";
4747 POSIX::mkfifo($mapfifo, 0600);
4748 my $fifofh;
4749
4750 my $openfifo = sub {
4751 open($fifofh, '>', $mapfifo) || die $!;
4752 };
4753
4754 my $cmd = "${uncomp}vma extract -v -r $mapfifo $readfrom $tmpdir";
4755
4756 my $oldtimeout;
4757 my $timeout = 5;
4758
4759 my $devinfo = {};
4760
4761 my $rpcenv = PVE::RPCEnvironment::get();
4762
ed221350 4763 my $conffile = config_file($vmid);
91bd6c90
DM
4764 my $tmpfn = "$conffile.$$.tmp";
4765
ed221350
DM
4766 # Note: $oldconf is undef if VM does not exists
4767 my $oldconf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid));
4768
91bd6c90
DM
4769 my $print_devmap = sub {
4770 my $virtdev_hash = {};
4771
4772 my $cfgfn = "$tmpdir/qemu-server.conf";
4773
4774 # we can read the config - that is already extracted
4775 my $fh = IO::File->new($cfgfn, "r") ||
4776 "unable to read qemu-server.conf - $!\n";
4777
4778 while (defined(my $line = <$fh>)) {
4779 if ($line =~ m/^\#qmdump\#map:(\S+):(\S+):(\S*):(\S*):$/) {
4780 my ($virtdev, $devname, $storeid, $format) = ($1, $2, $3, $4);
4781 die "archive does not contain data for drive '$virtdev'\n"
4782 if !$devinfo->{$devname};
4783 if (defined($opts->{storage})) {
4784 $storeid = $opts->{storage} || 'local';
4785 } elsif (!$storeid) {
4786 $storeid = 'local';
4787 }
4788 $format = 'raw' if !$format;
4789 $devinfo->{$devname}->{devname} = $devname;
4790 $devinfo->{$devname}->{virtdev} = $virtdev;
4791 $devinfo->{$devname}->{format} = $format;
4792 $devinfo->{$devname}->{storeid} = $storeid;
4793
be190583 4794 # check permission on storage
91bd6c90
DM
4795 my $pool = $opts->{pool}; # todo: do we need that?
4796 if ($user ne 'root@pam') {
4797 $rpcenv->check($user, "/storage/$storeid", ['Datastore.AllocateSpace']);
4798 }
4799
4800 $virtdev_hash->{$virtdev} = $devinfo->{$devname};
4801 }
4802 }
4803
4804 foreach my $devname (keys %$devinfo) {
be190583
DM
4805 die "found no device mapping information for device '$devname'\n"
4806 if !$devinfo->{$devname}->{virtdev};
91bd6c90
DM
4807 }
4808
91bd6c90 4809 my $cfg = cfs_read_file('storage.cfg');
ed221350
DM
4810
4811 # create empty/temp config
be190583 4812 if ($oldconf) {
ed221350
DM
4813 PVE::Tools::file_set_contents($conffile, "memory: 128\n");
4814 foreach_drive($oldconf, sub {
4815 my ($ds, $drive) = @_;
4816
4817 return if drive_is_cdrom($drive);
4818
4819 my $volid = $drive->{file};
4820
4821 return if !$volid || $volid =~ m|^/|;
4822
4823 my ($path, $owner) = PVE::Storage::path($cfg, $volid);
4824 return if !$path || !$owner || ($owner != $vmid);
4825
4826 # Note: only delete disk we want to restore
4827 # other volumes will become unused
4828 if ($virtdev_hash->{$ds}) {
4829 PVE::Storage::vdisk_free($cfg, $volid);
4830 }
4831 });
4832 }
4833
4834 my $map = {};
91bd6c90
DM
4835 foreach my $virtdev (sort keys %$virtdev_hash) {
4836 my $d = $virtdev_hash->{$virtdev};
4837 my $alloc_size = int(($d->{size} + 1024 - 1)/1024);
4838 my $scfg = PVE::Storage::storage_config($cfg, $d->{storeid});
8fd57431
DM
4839
4840 # test if requested format is supported
4841 my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($cfg, $d->{storeid});
4842 my $supported = grep { $_ eq $d->{format} } @$validFormats;
4843 $d->{format} = $defFormat if !$supported;
4844
91bd6c90
DM
4845 my $volid = PVE::Storage::vdisk_alloc($cfg, $d->{storeid}, $vmid,
4846 $d->{format}, undef, $alloc_size);
4847 print STDERR "new volume ID is '$volid'\n";
4848 $d->{volid} = $volid;
4849 my $path = PVE::Storage::path($cfg, $volid);
4850
4851 my $write_zeros = 1;
4852 # fixme: what other storages types initialize volumes with zero?
244f2577 4853 if ($scfg->{type} eq 'dir' || $scfg->{type} eq 'nfs' || $scfg->{type} eq 'glusterfs' ||
013d5275 4854 $scfg->{type} eq 'sheepdog' || $scfg->{type} eq 'rbd') {
91bd6c90
DM
4855 $write_zeros = 0;
4856 }
4857
4858 print $fifofh "${write_zeros}:$d->{devname}=$path\n";
4859
4860 print "map '$d->{devname}' to '$path' (write zeros = ${write_zeros})\n";
4861 $map->{$virtdev} = $volid;
4862 }
4863
4864 $fh->seek(0, 0) || die "seek failed - $!\n";
4865
4866 my $outfd = new IO::File ($tmpfn, "w") ||
4867 die "unable to write config for VM $vmid\n";
4868
4869 my $cookie = { netcount => 0 };
4870 while (defined(my $line = <$fh>)) {
be190583 4871 restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
91bd6c90
DM
4872 }
4873
4874 $fh->close();
4875 $outfd->close();
4876 };
4877
4878 eval {
4879 # enable interrupts
4880 local $SIG{INT} = $SIG{TERM} = $SIG{QUIT} = $SIG{HUP} = $SIG{PIPE} = sub {
4881 die "interrupted by signal\n";
4882 };
4883 local $SIG{ALRM} = sub { die "got timeout\n"; };
4884
4885 $oldtimeout = alarm($timeout);
4886
4887 my $parser = sub {
4888 my $line = shift;
4889
4890 print "$line\n";
4891
4892 if ($line =~ m/^DEV:\sdev_id=(\d+)\ssize:\s(\d+)\sdevname:\s(\S+)$/) {
4893 my ($dev_id, $size, $devname) = ($1, $2, $3);
4894 $devinfo->{$devname} = { size => $size, dev_id => $dev_id };
4895 } elsif ($line =~ m/^CTIME: /) {
46f58b5f 4896 # we correctly received the vma config, so we can disable
3cf90d7a
DM
4897 # the timeout now for disk allocation (set to 10 minutes, so
4898 # that we always timeout if something goes wrong)
4899 alarm(600);
91bd6c90
DM
4900 &$print_devmap();
4901 print $fifofh "done\n";
4902 my $tmp = $oldtimeout || 0;
4903 $oldtimeout = undef;
4904 alarm($tmp);
4905 close($fifofh);
4906 }
4907 };
be190583 4908
91bd6c90
DM
4909 print "restore vma archive: $cmd\n";
4910 run_command($cmd, input => $input, outfunc => $parser, afterfork => $openfifo);
4911 };
4912 my $err = $@;
4913
4914 alarm($oldtimeout) if $oldtimeout;
4915
4916 unlink $mapfifo;
4917
4918 if ($err) {
4919 rmtree $tmpdir;
4920 unlink $tmpfn;
4921
4922 my $cfg = cfs_read_file('storage.cfg');
4923 foreach my $devname (keys %$devinfo) {
4924 my $volid = $devinfo->{$devname}->{volid};
4925 next if !$volid;
4926 eval {
4927 if ($volid =~ m|^/|) {
4928 unlink $volid || die 'unlink failed\n';
4929 } else {
4930 PVE::Storage::vdisk_free($cfg, $volid);
4931 }
4932 print STDERR "temporary volume '$volid' sucessfuly removed\n";
4933 };
4934 print STDERR "unable to cleanup '$volid' - $@" if $@;
4935 }
4936 die $err;
4937 }
4938
4939 rmtree $tmpdir;
ed221350
DM
4940
4941 rename($tmpfn, $conffile) ||
91bd6c90
DM
4942 die "unable to commit configuration file '$conffile'\n";
4943
ed221350
DM
4944 PVE::Cluster::cfs_update(); # make sure we read new file
4945
91bd6c90
DM
4946 eval { rescan($vmid, 1); };
4947 warn $@ if $@;
4948}
4949
# Restore a VM from a tar-based vzdump archive.
#
# Parameters:
#   $archive - path of the archive, or '-' to read the archive from STDIN
#   $vmid    - ID of the VM that is restored
#   $user    - exported to the extraction helper as VZDUMP_USER
#   $opts    - hash reference; the keys read here are 'storage', 'pool',
#              'prealloc', 'info' and 'unique'
#
# The archive is unpacked with tar, piping every member through
# /usr/lib/qemu-server/qmextract. Afterwards the extracted qemu-server.conf
# is rewritten line by line (restore_update_config_line) into a temporary
# file which is then renamed over the real VM configuration.
#
# Dies if the archive does not start with 'qemu-server.conf', if extraction
# or config rewriting fails, or if the new configuration cannot be committed.
sub restore_tar_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    if ($archive ne '-') {
        my $firstfile = tar_archive_read_firstfile($archive);
        die "ERROR: file '$archive' dos not lock like a QemuServer vzdump backup\n"
            if $firstfile ne 'qemu-server.conf';
    }

    my $storecfg = cfs_read_file('storage.cfg');

    # destroy existing data - keep empty config
    my $vmcfgfn = config_file($vmid);
    destroy_vm($storecfg, $vmid, 1) if -f $vmcfgfn;

    my $tocmd = "/usr/lib/qemu-server/qmextract";

    $tocmd .= " --storage " . PVE::Tools::shellquote($opts->{storage}) if $opts->{storage};
    $tocmd .= " --pool " . PVE::Tools::shellquote($opts->{pool}) if $opts->{pool};
    $tocmd .= ' --prealloc' if $opts->{prealloc};
    $tocmd .= ' --info' if $opts->{info};

    # tar option "xf" does not autodetect compression when read from STDIN,
    # so we pipe to zcat
    my $cmd = "zcat -f|tar xf " . PVE::Tools::shellquote($archive) . " " .
        PVE::Tools::shellquote("--to-command=$tocmd");

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    mkpath $tmpdir;

    local $ENV{VZDUMP_TMPDIR} = $tmpdir;
    local $ENV{VZDUMP_VMID} = $vmid;
    local $ENV{VZDUMP_USER} = $user;

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # disable interrupts (always do cleanups)
    # Each handler needs its own 'local': in a chained assignment only the
    # leftmost element is localized, the others would stay overwritten after
    # this sub returns.
    local $SIG{INT} =
        local $SIG{TERM} =
        local $SIG{QUIT} =
        local $SIG{HUP} = sub {
            print STDERR "got interrupt - ignored\n";
        };

    eval {
        # enable interrupts (restored to the "ignore" handlers above as soon
        # as this eval block is left, so the cleanup code is not interrupted)
        local $SIG{INT} =
            local $SIG{TERM} =
            local $SIG{QUIT} =
            local $SIG{HUP} =
            local $SIG{PIPE} = sub {
                die "interrupted by signal\n";
            };

        if ($archive eq '-') {
            print "extracting archive from STDIN\n";
            run_command($cmd, input => "<&STDIN");
        } else {
            print "extracting archive '$archive'\n";
            run_command($cmd);
        }

        return if $opts->{info};

        # read new mapping
        my $map = {};
        my $statfile = "$tmpdir/qmrestore.stat";
        if (my $fd = IO::File->new($statfile, "r")) {
            while (defined (my $line = <$fd>)) {
                if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                    $map->{$1} = $2 if $1;
                } else {
                    print STDERR "unable to parse line in statfile - $line\n";
                }
            }
            $fd->close();
        }

        my $confsrc = "$tmpdir/qemu-server.conf";

        my $srcfd = IO::File->new($confsrc, "r") ||
            die "unable to open file '$confsrc'\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined (my $line = <$srcfd>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $srcfd->close();
        $outfd->close();
    };
    my $err = $@;

    if ($err) {

        unlink $tmpfn;

        tar_restore_cleanup($storecfg, "$tmpdir/qmrestore.stat") if !$opts->{info};

        # the stat file has been consumed above, so the temporary directory
        # is no longer needed - do not leave it behind
        rmtree $tmpdir;

        die $err;
    }

    rmtree $tmpdir;

    # In info mode the eval block returns before any config is written to
    # $tmpfn, so there is nothing to commit.
    if (!$opts->{info}) {
        # parentheses are required: 'rename A, B || die' would attach the
        # '||' to B and never report a failed rename
        rename($tmpfn, $conffile) ||
            die "unable to commit configuration file '$conffile'\n";
    }

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
5059
0d18dcfc
DM
5060
5061# Internal snapshots
5062
# NOTE: Snapshot create/delete involves several non-atomic
# actions and can take a long time.
# So we try to avoid locking the file and use the 'lock' variable
# inside the config file instead.
5067
ef59d1ca
DM
# Copy configuration entries from $source into $dest (both hash references).
#
# Entries that describe snapshot bookkeeping or per-config state are left
# out: 'snapshots', 'snapstate', 'snaptime', 'vmstate', 'lock', 'digest',
# 'description' and every 'unusedN' key. Existing keys in $dest are
# overwritten by copied ones; all other keys in $dest are left alone.
my $snapshot_copy_config = sub {
    my ($source, $dest) = @_;

    my %excluded = map { $_ => 1 }
        qw(snapshots snapstate snaptime vmstate lock digest description);

    for my $key (keys %$source) {
        next if $excluded{$key} || $key =~ m/^unused\d+$/;

        $dest->{$key} = $source->{$key};
    }
};
5084
# Build the configuration that results from applying snapshot $snap to the
# current configuration $conf. Returns a new hash reference; $conf and $snap
# themselves are not modified.
#
# Taken from $conf: the snapshot list, the description and all 'unusedN'
# entries. Everything else comes from $snap via $snapshot_copy_config.
my $snapshot_apply_config = sub {
    my ($conf, $snap) = @_;

    # start with the snapshot list of the current config
    my $newconf = { snapshots => $conf->{snapshots} };

    # keep description and list of unused disks
    my @carried_over = grep { $_ eq 'description' || m/^unused\d+$/ } keys %$conf;
    for my $key (@carried_over) {
        $newconf->{$key} = $conf->{$key};
    }

    $snapshot_copy_config->($snap, $newconf);

    return $newconf;
};
5103
18bfb361
DM
# Call $func->($storeid) once for every storage that backs a non-cdrom drive
# of $conf, in sorted storage ID order.
#
# Config keys that are not valid drive names, drives that cannot be parsed
# and cdrom drives are skipped, as are volumes for which
# PVE::Storage::parse_volume_id yields no storage ID.
sub foreach_writable_storage {
    my ($conf, $func) = @_;

    my %storeids;

    for my $key (keys %$conf) {
        next if !valid_drivename($key);

        my $drive = parse_drive($key, $conf->{$key});
        next if !$drive || drive_is_cdrom($drive);

        # second argument 1: as used throughout this file for volumes that
        # may not belong to a storage
        my ($sid) = PVE::Storage::parse_volume_id($drive->{file}, 1);
        $storeids{$sid} = $sid if $sid;
    }

    for my $sid (sort keys %storeids) {
        $func->($sid);
    }
}
5126
# Allocate a raw volume that will hold the saved VM state of snapshot
# $snapname and return its volume ID.
#
# The target storage is chosen among the storages already used by the VM's
# drives: shared storages are considered first, then non-shared ones; within
# each group a storage with a 'path' property (file based) is preferred.
# If none is found, the storage named 'local' is used.
my $alloc_vmstate_volid = sub {
    my ($storecfg, $vmid, $conf, $snapname) = @_;

    # Note: we try to be smart when selecting a $target storage
    my $target;

    # Scan the VM's storages, looking only at shared ($want_shared true)
    # or only at non-shared ones.
    my $scan_storages = sub {
        my ($want_shared) = @_;

        foreach_writable_storage($conf, sub {
            my ($sid) = @_;
            my $scfg = PVE::Storage::storage_config($storecfg, $sid);
            return if $want_shared ? !$scfg->{shared} : $scfg->{shared};

            $target = $sid if !$target || $scfg->{path}; # prefer file based storage
        });
    };

    $scan_storages->(1);                # search shared storage first
    $scan_storages->(0) if !$target;    # now search local storage

    $target ||= 'local';

    # Flat allowance for the device/driver state.
    # NOTE(review): the previous comment here said "assume 32MB is enough",
    # which does not match the value 500 - confirm the intended figure.
    my $driver_state_size = 500;
    # we abort live save after $conf->{memory}, so we need at max twice that space
    my $size = $conf->{memory}*2 + $driver_state_size;

    my $name = "vm-$vmid-state-$snapname";
    my $scfg = PVE::Storage::storage_config($storecfg, $target);
    $name .= ".raw" if $scfg->{path}; # add filename extension for file base storage

    my $volid = PVE::Storage::vdisk_alloc($storecfg, $target, $vmid, 'raw', $name, $size*1024);

    return $volid;
};
5167
# First phase of snapshot creation: register snapshot $snapname in the VM
# configuration in state 'prepare' and set the config lock to 'snapshot'.
#
# Runs under lock_config. Dies if the VM is a template, if check_lock
# rejects the config, if the snapshot name is already used or if
# has_feature('snapshot', ...) reports the feature as unavailable.
#
# When $save_vmstate is set and the VM is running, a state volume is
# allocated and recorded as 'vmstate' in the snapshot. $comment, if given,
# becomes the snapshot description.
#
# Returns the new snapshot hash (the same reference that was stored in the
# configuration).
my $snapshot_prepare = sub {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap;

    my $register_snapshot = sub {
        my $conf = load_config($vmid);

        die "you can't take a snapshot if it's a template\n"
            if is_template($conf);

        check_lock($conf);

        $conf->{lock} = 'snapshot';

        die "snapshot name '$snapname' already used\n"
            if defined($conf->{snapshots}->{$snapname});

        my $storecfg = PVE::Storage::config();
        if (!has_feature('snapshot', $conf, $storecfg)) {
            die "snapshot feature is not available";
        }

        $snap = {};
        $conf->{snapshots}->{$snapname} = $snap;

        if ($save_vmstate && check_running($vmid)) {
            $snap->{vmstate} = $alloc_vmstate_volid->($storecfg, $vmid, $conf, $snapname);
        }

        # copies the current settings; 'vmstate' is not touched by the copy
        $snapshot_copy_config->($conf, $snap);

        $snap->{snapstate} = "prepare";
        $snap->{snaptime} = time();
        $snap->{description} = $comment if $comment;

        # always overwrite machine if we save vmstate. This makes sure we
        # can restore it later using correct machine type
        if ($snap->{vmstate}) {
            $snap->{machine} = get_current_qemu_machine($vmid);
        }

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $register_snapshot);

    return $snap;
};
5213
# Final phase of snapshot creation: turn the prepared snapshot $snapname
# into a finished one.
#
# Runs under lock_config. Requires the config lock to be 'snapshot' and the
# snapshot to be in state 'prepare'; dies otherwise. The 'snapstate' marker
# and the config lock are removed, the current configuration is rebuilt from
# the snapshot via $snapshot_apply_config and its 'parent' is set to
# $snapname.
my $snapshot_commit = sub {
    my ($vmid, $snapname) = @_;

    my $finish_snapshot = sub {
        my $conf = load_config($vmid);

        my $lock = $conf->{lock};
        die "missing snapshot lock\n"
            if !($lock && $lock eq 'snapshot');

        # remember whether 'machine' was set explicitly before applying
        my $had_machine = defined($conf->{machine});

        my $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        my $state = $snap->{snapstate};
        die "wrong snapshot state\n"
            if !($state && $state eq "prepare");

        delete $snap->{snapstate};
        delete $conf->{lock};

        my $newconf = $snapshot_apply_config->($conf, $snap);

        # the snapshot may carry a 'machine' entry that the live config
        # never had - do not leak it into the current config
        delete $newconf->{machine} if !$had_machine;

        $newconf->{parent} = $snapname;

        update_config_nolock($vmid, $newconf, 1);
    };

    lock_config($vmid, $finish_snapshot);
};
5247
22c377f0
DM
# Roll VM $vmid back to snapshot $snapname.
#
# Works in two locked phases with the volume rollback in between:
#   1. prepare: validate, stop the VM, set the config lock to 'rollback'
#   2. roll back every non-cdrom drive of the snapshot on storage level
#   3. commit: verify and drop the 'rollback' lock, replace the current
#      config with the snapshot's config and, if the snapshot has a saved
#      VM state, start the VM from that state file
#
# Dies if the VM is a template, the snapshot does not exist or is
# incomplete (has a 'snapstate'), or the VM is still running after the stop.
sub snapshot_rollback {
    my ($vmid, $snapname) = @_;

    my $storecfg = PVE::Storage::config();

    my $snap;
    my $preparing = 1;

    my $run_phase = sub {
        my $conf = load_config($vmid);

        die "you can't rollback if vm is a template\n" if is_template($conf);

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        die "unable to rollback to incomplete snapshot (snapstate = $snap->{snapstate})\n"
            if $snap->{snapstate};

        if ($preparing) {
            check_lock($conf);
            vm_stop($storecfg, $vmid, undef, undef, 5, undef, undef);
        }

        die "unable to rollback vm $vmid: vm is running\n"
            if check_running($vmid);

        my $forcemachine;

        if ($preparing) {
            $conf->{lock} = 'rollback';
        } else {
            die "got wrong lock\n" if !($conf->{lock} && $conf->{lock} eq 'rollback');
            delete $conf->{lock};

            my $had_machine = defined($conf->{machine});

            # copy snapshot config to current config
            $conf = $snapshot_apply_config->($conf, $snap);
            $conf->{parent} = $snapname;

            # Note: old code did not store 'machine', so we try to be smart
            # and guess the snapshot was generated with kvm 1.4 (pc-i440fx-1.4).
            $forcemachine = $conf->{machine} || 'pc-i440fx-1.4';
            # we remove the 'machine' configuration if not explicitly specified
            # in the original config.
            delete $conf->{machine} if $snap->{vmstate} && !$had_machine;
        }

        update_config_nolock($vmid, $conf, 1);

        if (!$preparing && $snap->{vmstate}) {
            my $statefile = PVE::Storage::path($storecfg, $snap->{vmstate});
            vm_start($storecfg, $vmid, $statefile, undef, undef, undef, $forcemachine);
        }
    };

    lock_config($vmid, $run_phase);

    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        PVE::Storage::volume_snapshot_rollback($storecfg, $drive->{file}, $snapname);
    });

    $preparing = 0;
    lock_config($vmid, $run_phase);
}
5326
9dcf4909
DM
# Poll the monitor command "query-savevm" once per second until it reports
# status 'completed'.
#
# Dies if no status is reported ("savevm not active") or if the status is
# anything other than 'active' or 'completed'.
my $savevm_wait = sub {
    my ($vmid) = @_;

    while (1) {
        my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");
        my $status = $stat->{status};

        die "savevm not active\n" if !$status;

        last if $status eq 'completed';

        die "query-savevm returned status '$stat->{status}'\n"
            if $status ne 'active';

        # still active - try again shortly
        sleep(1);
    }
};
5344
# Create snapshot $snapname of VM $vmid.
#
# Parameters:
#   $save_vmstate - also save the VM state if the VM is running
#   $comment      - optional snapshot description
#
# Steps: prepare the snapshot in the config, optionally freeze the guest
# filesystems (running VM with 'agent' configured and no VM state being
# saved), issue "savevm-start" on a running VM, snapshot every non-cdrom
# drive, issue "savevm-end", thaw the guest and wait until "query-savevm"
# reports no more bytes. On failure the partially created snapshot is
# removed again (only the drives already snapshotted) and the error is
# re-thrown; on success the snapshot is committed.
sub snapshot_create {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap = $snapshot_prepare->($vmid, $snapname, $save_vmstate, $comment);

    my $config = load_config($vmid);

    my $running = check_running($vmid);

    # freezing is not needed if we save RAM
    my $freezefs = !$snap->{vmstate} && $running && $config->{agent};

    # drives for which a snapshot has been created so far
    my $drivehash = {};

    if ($freezefs) {
        eval { vm_mon_cmd($vmid, "guest-fsfreeze-freeze"); };
        warn "guest-fsfreeze-freeze problems - $@" if $@;
    }

    eval {
        # create internal snapshots of all drives

        my $storecfg = PVE::Storage::config();

        if ($running) {
            if (my $vmstate = $snap->{vmstate}) {
                my $path = PVE::Storage::path($storecfg, $vmstate);
                vm_mon_cmd($vmid, "savevm-start", statefile => $path);
                $savevm_wait->($vmid);
            } else {
                vm_mon_cmd($vmid, "savevm-start");
            }
        }

        foreach_drive($snap, sub {
            my ($ds, $drive) = @_;

            return if drive_is_cdrom($drive);

            qemu_volume_snapshot($vmid, "drive-$ds", $storecfg, $drive->{file}, $snapname);
            $drivehash->{$ds} = 1;
        });
    };
    my $err = $@;

    if ($running) {
        eval { vm_mon_cmd($vmid, "savevm-end") };
        warn $@ if $@;

        if ($freezefs) {
            eval { vm_mon_cmd($vmid, "guest-fsfreeze-thaw"); };
            warn "guest-fsfreeze-thaw problems - $@" if $@;
        }

        # savevm-end is async, we need to wait
        while (1) {
            my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");
            last if !$stat->{bytes};

            print "savevm not yet finished\n";
            sleep(1);
        }
    }

    if ($err) {
        warn "snapshot create failed: starting cleanup\n";
        eval { snapshot_delete($vmid, $snapname, 0, $drivehash); };
        warn $@ if $@;
        die $err;
    }

    $snapshot_commit->($vmid, $snapname);
}
5426
# Delete snapshot $snapname of VM $vmid.
#
# Parameters:
#   $force     - on storage errors only warn and carry on; the intermediate
#                per-volume config updates are skipped in this mode
#   $drivehash - Note: only set when called from snapshot_create. Limits
#                the volume snapshot removal to the listed drives, skips the
#                lock/template checks and makes the final step drop the
#                config lock.
#
# Sequence: mark the snapshot as 'delete' in the config, free the VM state
# volume (if any), delete the snapshot of every non-cdrom drive, then remove
# the snapshot from the config, re-linking 'parent' references that pointed
# to it.
sub snapshot_delete {
    my ($vmid, $snapname, $force, $drivehash) = @_;

    my $preparing = 1;

    my $snap;
    my $unused_volids = [];

    # If $confref has the deleted snapshot as parent, point it to
    # $new_parent instead, or drop the parent entry when there is none.
    my $relink_parent = sub {
        my ($confref, $new_parent) = @_;

        my $parent = $confref->{parent};
        if ($parent && $parent eq $snapname) {
            if ($new_parent) {
                $confref->{parent} = $new_parent;
            } else {
                delete $confref->{parent};
            }
        }
    };

    # Config update step, always run under lock_config. The optional
    # argument names a snapshot entry ('vmstate' or a drive) to remove.
    my $update_config = sub {
        my ($remove_drive) = @_;

        my $conf = load_config($vmid);

        if (!$drivehash) {
            check_lock($conf);
            die "you can't delete a snapshot if vm is a template\n"
                if is_template($conf);
        }

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        # remove parent refs
        if (!$preparing) {
            $relink_parent->($conf, $snap->{parent});
            for my $other (keys %{$conf->{snapshots}}) {
                next if $other eq $snapname;
                $relink_parent->($conf->{snapshots}->{$other}, $snap->{parent});
            }
        }

        if ($remove_drive) {
            if ($remove_drive eq 'vmstate') {
                delete $snap->{$remove_drive};
            } else {
                my $drive = parse_drive($remove_drive, $snap->{$remove_drive});
                my $volid = $drive->{file};
                delete $snap->{$remove_drive};
                add_unused_volume($conf, $volid);
            }
        }

        if ($preparing) {
            $snap->{snapstate} = 'delete';
        } else {
            delete $conf->{snapshots}->{$snapname};
            delete $conf->{lock} if $drivehash;
            for my $volid (@$unused_volids) {
                add_unused_volume($conf, $volid);
            }
        }

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $update_config);

    # now remove vmstate file

    my $storecfg = PVE::Storage::config();

    if ($snap->{vmstate}) {
        eval { PVE::Storage::vdisk_free($storecfg, $snap->{vmstate}); };
        if (my $err = $@) {
            die $err if !$force;
            warn $err;
        }
        # save changes (remove vmstate from snapshot)
        lock_config($vmid, $update_config, 'vmstate') if !$force;
    }

    # now remove all internal snapshots
    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};
        my $device = "drive-$ds";

        if (!$drivehash || $drivehash->{$ds}) {
            eval { qemu_volume_snapshot_delete($vmid, $device, $storecfg, $volid, $snapname); };
            if (my $err = $@) {
                die $err if !$force;
                warn $err;
            }
        }

        # save changes (remove drive from snapshot)
        lock_config($vmid, $update_config, $ds) if !$force;
        push @$unused_volids, $volid;
    });

    # now cleanup config
    $preparing = 0;
    lock_config($vmid, $update_config);
}
5538
# Check whether every non-cdrom drive of $conf supports $feature.
#
# $snapname and $running are passed through unchanged to
# PVE::Storage::volume_has_feature. Returns 1 if all drives support the
# feature (also when there is no such drive), 0 otherwise.
sub has_feature {
    my ($feature, $conf, $storecfg, $snapname, $running) = @_;

    my $supported = 1;

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};
        if (!PVE::Storage::volume_has_feature($storecfg, $feature, $volid, $snapname, $running)) {
            $supported = 0;
        }
    });

    return $supported;
}
04a69bb4
AD
5553
# Convert the drives of VM $vmid into base volumes.
#
# Parameters:
#   $conf - VM configuration; updated in place and written after every
#           converted drive
#   $disk - optional drive name; when given, only that drive is converted
#
# cdrom drives and volumes whose storage does not offer the 'template'
# feature are skipped.
sub template_create {
    my ($vmid, $conf, $disk) = @_;

    my $storecfg = PVE::Storage::config();

    my $convert_drive = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);
        return if $disk && $ds ne $disk;

        my $volid = $drive->{file};
        return if !PVE::Storage::volume_has_feature($storecfg, 'template', $volid);

        $drive->{file} = PVE::Storage::vdisk_create_base($storecfg, $volid);
        $conf->{$ds} = print_drive($vmid, $drive);
        update_config_nolock($vmid, $conf, 1);
    };

    foreach_drive($conf, $convert_drive);
}
5574
624361b3
AD
# Return 1 if the configuration $conf has 'template' set to 1, and a false
# value otherwise.
sub is_template {
    my ($conf) = @_;

    my $flag = $conf->{template};
    my $is_template = defined($flag) && $flag == 1;

    return 1 if $is_template;
    return $is_template;
}
5580
5133de42
AD
# Copy volume $src_volid (optionally its snapshot $snapname) onto the
# already allocated volume $dst_volid using "qemu-img convert".
#
# $size is only used for the progress output. Nothing is done unless both
# volume IDs resolve to a storage ID. Dies with "copy failed: ..." if the
# command fails.
sub qemu_img_convert {
    my ($src_volid, $dst_volid, $size, $snapname) = @_;

    my $storecfg = PVE::Storage::config();
    my ($src_storeid, $src_volname) = PVE::Storage::parse_volume_id($src_volid, 1);
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid, 1);

    if ($src_storeid && $dst_storeid) {
        my $src_scfg = PVE::Storage::storage_config($storecfg, $src_storeid);
        my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

        my $src_format = qemu_img_format($src_scfg, $src_volname);
        my $dst_format = qemu_img_format($dst_scfg, $dst_volname);

        my $src_path = PVE::Storage::path($storecfg, $src_volid, $snapname);
        my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

        my @cmd = ('/usr/bin/qemu-img', 'convert', '-t', 'writeback', '-p', '-n');
        # qcow2 snapshots are selected by name
        if ($snapname && $src_format eq "qcow2") {
            push @cmd, '-s', $snapname;
        }
        push @cmd, '-f', $src_format, '-O', $dst_format, $src_path, $dst_path;

        # translate qemu-img's "(NN/100%)" progress lines into byte counts
        my $report_progress = sub {
            my $line = shift;
            if($line =~ m/\((\S+)\/100\%\)/){
                my $percent = $1;
                my $transferred = int($size * $percent / 100);
                my $remaining = $size - $transferred;

                print "transferred: $transferred bytes remaining: $remaining bytes total: $size bytes progression: $percent %\n";
            }
        };

        eval { run_command(\@cmd, timeout => undef, outfunc => $report_progress); };
        if (my $err = $@) {
            die "copy failed: $err";
        }
    }
}
5620
# Determine the qemu-img format name for volume $volname on the storage
# described by $scfg.
#
# On storages with a 'path' property the format is the file extension if it
# is one of raw, qcow2, qed or vmdk. Otherwise 'host_device' is returned for
# storages of type 'iscsi' and 'raw' for everything else.
sub qemu_img_format {
    my ($scfg, $volname) = @_;

    return $1
        if $scfg->{path} && $volname =~ m/\.(raw|qcow2|qed|vmdk)$/;

    return $scfg->{type} eq 'iscsi' ? "host_device" : "raw";
}
5632
# Mirror drive $drive of the running VM $vmid onto the existing volume
# $dst_volid using the QMP "drive-mirror" block job.
#
# Parameters:
#   $vmid      - VM owning the source drive
#   $drive     - drive name (the QMP device is "drive-$drive")
#   $dst_volid - target volume; must already exist (mode "existing")
#   $vmiddst   - VM that will own the target volume. If it equals $vmid the
#                drive is switched to the target ("block-job-complete"),
#                otherwise the job is cancelled once source and target are
#                in sync.
#
# If the job does not settle within $maxwait polls after reaching the end,
# the VM is suspended so the mirror can complete; it is resumed again
# before this sub returns or dies.
#
# Dies with "mirroring error: ..." on failure, after trying to cancel the job.
sub qemu_drive_mirror {
    my ($vmid, $drive, $dst_volid, $vmiddst) = @_;

    my $count = 0;
    my $frozen = undef;
    my $maxwait = 120;

    my $storecfg = PVE::Storage::config();
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid);

    # The returned storage config is not needed here; the lookup itself is
    # kept as in the original code.
    PVE::Storage::storage_config($storecfg, $dst_storeid);

    my $format;
    if ($dst_volname =~ m/\.(raw|qcow2)$/){
        $format = $1;
    }

    my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

    my $opts = { timeout => 10, device => "drive-$drive", mode => "existing", sync => "full", target => $dst_path };
    $opts->{format} = $format if $format;

    #fixme : sometime drive-mirror timeout, but works fine after.
    # (I have see the problem with big volume > 200GB), so we need to eval
    eval { vm_mon_cmd($vmid, "drive-mirror", %$opts); };
    # ignore errors here

    eval {
        while (1) {
            my $stats = vm_mon_cmd($vmid, "query-block-jobs");
            my $stat = $stats->[0];
            die "mirroring job seem to have die. Maybe do you have bad sectors?" if !$stat;
            die "error job is not mirroring" if $stat->{type} ne "mirror";

            my $busy = $stat->{busy};

            if (my $total = $stat->{len}) {
                my $transferred = $stat->{offset} || 0;
                my $remaining = $total - $transferred;
                my $percent = sprintf "%.2f", ($transferred * 100 / $total);

                print "transferred: $transferred bytes remaining: $remaining bytes total: $total bytes progression: $percent % busy: $busy\n";
            }

            if ($stat->{len} == $stat->{offset}) {
                if ($busy eq 'false') {

                    last if $vmiddst != $vmid;

                    # try to switch the disk if source and destination are on the same guest
                    eval { vm_mon_cmd($vmid, "block-job-complete", device => "drive-$drive") };
                    last if !$@;
                    die $@ if $@ !~ m/cannot be completed/;
                }

                if ($count > $maxwait) {
                    # if too much writes to disk occurs at the end of migration
                    #the disk needs to be freezed to be able to complete the migration
                    vm_suspend($vmid,1);
                    $frozen = 1;
                }
                $count++;
            }
            sleep 1;
        }
    };
    my $err = $@;

    # Resume outside of the eval above so that a guest we suspended is also
    # resumed when the polling loop died; otherwise it would stay paused.
    if ($frozen) {
        eval { vm_resume($vmid, 1); };
        if (my $resume_err = $@) {
            if ($err) {
                warn $resume_err; # keep the original error as the primary one
            } else {
                $err = $resume_err;
            }
        }
    }

    my $cancel_job = sub {
        vm_mon_cmd($vmid, "block-job-cancel", device => "drive-$drive");
        # wait until the job has disappeared from the job list
        while (1) {
            my $stats = vm_mon_cmd($vmid, "query-block-jobs");
            my $stat = $stats->[0];
            last if !$stat;
            sleep 1;
        }
    };

    if ($err) {
        eval { $cancel_job->(); };
        die "mirroring error: $err";
    }

    if ($vmiddst != $vmid) {
        # if we clone a disk for a new target vm, we don't switch the disk
        $cancel_job->(); # so we call block-job-cancel
    }
}
5726
# Clone one drive of VM $vmid for VM $newvmid.
#
# Parameters:
#   $storecfg   - storage configuration
#   $vmid       - source VM
#   $running    - true if the source VM is running
#   $drivename  - name of the drive (e.g. used for the mirror device)
#   $drive      - parsed drive hash; NOTE: it is modified in place and is
#                 also the return value
#   $snapname   - optional snapshot to clone from
#   $newvmid    - owner of the new volume
#   $storage    - optional target storage for full clones
#   $format     - optional target format for full clones; falls back to the
#                 drive's format, then to the storage default, and is
#                 replaced by the storage default if unsupported
#   $full       - true for a full copy, false for a linked clone
#   $newvollist - array reference; the new volume ID is appended to it
#
# A full clone is copied with qemu-img when the VM is not running or a
# snapshot is cloned, and with a drive mirror job otherwise.
#
# Returns $drive with 'file' set to the new volume, 'size' set to its size
# and 'format' reset to undef.
sub clone_disk {
    my ($storecfg, $vmid, $running, $drivename, $drive, $snapname,
        $newvmid, $storage, $format, $full, $newvollist) = @_;

    my $newvolid;

    if ($full) {
        my ($storeid) = PVE::Storage::parse_volume_id($drive->{file});
        $storeid = $storage if $storage;

        my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($storecfg, $storeid);
        $format ||= $drive->{format} || $defFormat;

        # test if requested format is supported - else use default
        $format = $defFormat if !grep { $_ eq $format } @$validFormats;

        my ($src_size) = PVE::Storage::volume_size_info($storecfg, $drive->{file}, 3);

        print "create full clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_alloc($storecfg, $storeid, $newvmid, $format, undef, ($src_size/1024));
        push @$newvollist, $newvolid;

        if ($running && !$snapname) {
            qemu_drive_mirror($vmid, $drivename, $newvolid, $newvmid);
        } else {
            qemu_img_convert($drive->{file}, $newvolid, $src_size, $snapname);
        }
    } else {
        print "create linked clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_clone($storecfg, $drive->{file}, $newvmid, $snapname);
        push @$newvollist, $newvolid;
    }

    my ($size) = PVE::Storage::volume_size_info($storecfg, $newvolid, 3);

    # the caller's drive hash is reused for the result
    @$drive{qw(format file size)} = (undef, $newvolid, $size);

    return $drive;
}
5772
ff556cf2
DM
# Return the machine type name of VM $vmid as reported by the QMP command
# 'query-machines'. This only works if the VM is running.
#
# The entry flagged 'is-current' wins; otherwise the one flagged
# 'is-default' is used, and 'pc' if neither is present.
sub get_current_qemu_machine {
    my ($vmid) = @_;

    my $machines = vm_qmp_command($vmid, { execute => 'query-machines', arguments => {} });

    my %name_of;
    for my $entry (@$machines) {
        for my $kind (qw(default current)) {
            $name_of{$kind} = $entry->{name} if $entry->{"is-$kind"};
        }
    }

    # fallback to the default machine if current is not supported by qemu
    return $name_of{current} || $name_of{default} || 'pc';
}
5789
4543ecf0
AD
# List the entries found below "$pcisysfs/devices".
#
# Returns a hash reference keyed by the "bus:slot" part of the entry name
# (e.g. "00:1f"); each value is an array reference with one
# { id => ..., function => ... } hash per matching entry.
sub lspci {

    my %devices;

    my $collect = sub {
        my (undef, $id, $function) = @_;
        push @{$devices{$id}}, { id => $id, function => $function};
    };

    dir_glob_foreach("$pcisysfs/devices", '[a-f0-9]{4}:([a-f0-9]{2}:[a-f0-9]{2})\.([0-9])', $collect);

    return \%devices;
}
5802
1e3baf05 58031;