]> git.proxmox.com Git - qemu-server.git/blame - PVE/QemuServer.pm
vmconfig_hotplug_pending : add update_disk
[qemu-server.git] / PVE / QemuServer.pm
CommitLineData
1e3baf05
DM
1package PVE::QemuServer;
2
3use strict;
990fc5e2 4use warnings;
1e3baf05
DM
5use POSIX;
6use IO::Handle;
7use IO::Select;
8use IO::File;
9use IO::Dir;
10use IO::Socket::UNIX;
11use File::Basename;
12use File::Path;
13use File::stat;
14use Getopt::Long;
fc1ddcdc 15use Digest::SHA;
1e3baf05
DM
16use Fcntl ':flock';
17use Cwd 'abs_path';
18use IPC::Open3;
c971c4f2 19use JSON;
1e3baf05
DM
20use Fcntl;
21use PVE::SafeSyslog;
22use Storable qw(dclone);
23use PVE::Exception qw(raise raise_param_exc);
24use PVE::Storage;
4543ecf0 25use PVE::Tools qw(run_command lock_file lock_file_full file_read_firstline dir_glob_foreach);
b7ba6b79 26use PVE::JSONSchema qw(get_standard_option);
1e3baf05
DM
27use PVE::Cluster qw(cfs_register_file cfs_read_file cfs_write_file cfs_lock_file);
28use PVE::INotify;
29use PVE::ProcFSTools;
26f11676 30use PVE::QMPClient;
91bd6c90 31use PVE::RPCEnvironment;
6b64503e 32use Time::HiRes qw(gettimeofday);
1e3baf05 33
7f0b5beb 34my $cpuinfo = PVE::ProcFSTools::read_cpuinfo();
1e3baf05 35
19672434 36# Note about locking: we use flock on the config file to protect
1e3baf05
DM
37# against concurrent actions.
38# Additionally, we have a 'lock' setting in the config file. This
22c377f0 39# can be set to 'migrate', 'backup', 'snapshot' or 'rollback'. Most actions are not
1e3baf05
DM
40# allowed when such lock is set. But you can ignore this kind of
41# lock with the --skiplock flag.
42
97d62eb7 43cfs_register_file('/qemu-server/',
1858638f
DM
44 \&parse_vm_config,
45 \&write_vm_config);
1e3baf05 46
3ea94c60
DM
47PVE::JSONSchema::register_standard_option('skiplock', {
48 description => "Ignore locks - only root is allowed to use this option.",
afdb31d5 49 type => 'boolean',
3ea94c60
DM
50 optional => 1,
51});
52
53PVE::JSONSchema::register_standard_option('pve-qm-stateuri', {
54 description => "Some command save/restore state from this location.",
55 type => 'string',
56 maxLength => 128,
57 optional => 1,
58});
59
8abd398b
DM
60PVE::JSONSchema::register_standard_option('pve-snapshot-name', {
61 description => "The name of the snapshot.",
62 type => 'string', format => 'pve-configid',
63 maxLength => 40,
64});
65
1e3baf05
DM
66#no warnings 'redefine';
67
# Fallback definitions for the fair-scheduler syscall numbers and the KVM
# ioctl request code. Everything is guarded so that a value already defined
# elsewhere (e.g. by a system .ph header) is never overridden.
unless (defined(&_VZSYSCALLS_H_)) {
    # Guard symbol: marks this table as loaded. The enclosing test already
    # established that it is undefined, so no second check is needed here.
    eval 'sub _VZSYSCALLS_H_ () {1;}';
    require 'sys/syscall.ph';
    if (defined(&__x86_64__)) {
        eval 'sub __NR_fairsched_vcpus () {499;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_fairsched_mknod () {504;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {505;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {506;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {507;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {508;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_setluid () {501;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {502;}' unless defined(&__NR_setublimit);
    }
    elsif (defined(&__i386__)) {
        eval 'sub __NR_fairsched_mknod () {500;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {501;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {502;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {503;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {504;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_fairsched_vcpus () {505;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_setluid () {511;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {512;}' unless defined(&__NR_setublimit);
    } else {
        die("no fairsched syscall for this arch");
    }
    require 'asm/ioctl.ph';
    # Request number written out in full (0x00) instead of the truncated
    # literal '0x'; _IO() comes from asm/ioctl.ph required just above.
    eval 'sub KVM_GET_API_VERSION () { &_IO(0xAE, 0x00);}' unless defined(&KVM_GET_API_VERSION);
}
96
# Thin wrapper around the fairsched_mknod syscall.
# Each of the three arguments is coerced with int() before the call; the
# value returned by syscall() is passed back unchanged.
sub fairsched_mknod {
    my ($parent, $weight, $desired) = @_;

    my @int_args = map { int($_) } ($parent, $weight, $desired);

    return syscall(__NR_fairsched_mknod(), @int_args);
}
102
# Thin wrapper around the fairsched_rmnod syscall.
# $id is coerced with int(); the syscall() result is returned as-is.
sub fairsched_rmnod {
    my ($id) = @_;

    my $node_id = int($id);

    return syscall(__NR_fairsched_rmnod(), $node_id);
}
108
# Thin wrapper around the fairsched_mvpr syscall.
# Both arguments are coerced with int(); the syscall() result is returned
# as-is.
sub fairsched_mvpr {
    my ($pid, $newid) = @_;

    my @int_args = map { int($_) } ($pid, $newid);

    return syscall(__NR_fairsched_mvpr(), @int_args);
}
114
# Thin wrapper around the fairsched_vcpus syscall.
# Both arguments are coerced with int(); the syscall() result is returned
# as-is.
sub fairsched_vcpus {
    my ($id, $vcpus) = @_;

    my @int_args = map { int($_) } ($id, $vcpus);

    return syscall(__NR_fairsched_vcpus(), @int_args);
}
120
# Thin wrapper around the fairsched_rate syscall.
# $op is expected to be one of the FAIRSCHED_*_RATE constants declared right
# after this sub. All arguments are coerced with int(); the syscall() result
# is returned as-is.
sub fairsched_rate {
    my ($id, $op, $rate) = @_;

    my @int_args = map { int($_) } ($id, $op, $rate);

    return syscall(__NR_fairsched_rate(), @int_args);
}
126
127use constant FAIRSCHED_SET_RATE => 0;
128use constant FAIRSCHED_DROP_RATE => 1;
129use constant FAIRSCHED_GET_RATE => 2;
130
# Apply a CPU limit, given in per cent, to fairsched node $id.
# The percentage is rescaled to 1/1024 units (truncated to an integer).
# A rescaled value of zero drops the rate limit; anything else sets it.
# Returns whatever fairsched_rate() returns.
sub fairsched_cpulimit {
    my ($id, $limit) = @_;

    my $scaled_limit = int($limit * 1024 / 100);

    my $op;
    if ($scaled_limit) {
        $op = FAIRSCHED_SET_RATE;
    } else {
        $op = FAIRSCHED_DROP_RATE;
    }

    return fairsched_rate($id, $op, $scaled_limit);
}
139
# Paths used throughout this module. The directories are created at load
# time; mkdir failures (for example "already exists") are deliberately
# ignored, exactly as before.
my $nodename = PVE::INotify::nodename();

my $confdir = "/etc/pve/nodes/$nodename/qemu-server";
my $var_run_tmpdir = "/var/run/qemu-server";
my $lock_dir = "/var/lock/qemu-server";

# Creation order matters: the node directory must exist before $confdir.
mkdir $_ for ("/etc/pve/nodes/$nodename", $confdir, $var_run_tmpdir, $lock_dir);

my $pcisysfs = "/sys/bus/pci";
153
1e3baf05 154my $confdesc = {
7183bd9a
AD
155 iothread => {
156 optional => 1,
157 type => 'boolean',
158 description => "Enable iothread dataplane.",
159 default => 0,
160 },
1e3baf05
DM
161 onboot => {
162 optional => 1,
163 type => 'boolean',
164 description => "Specifies whether a VM will be started during system bootup.",
165 default => 0,
166 },
167 autostart => {
168 optional => 1,
169 type => 'boolean',
170 description => "Automatic restart after crash (currently ignored).",
171 default => 0,
172 },
2ff09f52
DA
173 hotplug => {
174 optional => 1,
e8b9c17c 175 type => 'boolean',
6c52b679 176 description => "Allow hotplug for disk and network device",
2dbe827e 177 default => 0,
2ff09f52 178 },
1e3baf05
DM
179 reboot => {
180 optional => 1,
181 type => 'boolean',
182 description => "Allow reboot. If set to '0' the VM exit on reboot.",
183 default => 1,
184 },
185 lock => {
186 optional => 1,
187 type => 'string',
188 description => "Lock/unlock the VM.",
22c377f0 189 enum => [qw(migrate backup snapshot rollback)],
1e3baf05
DM
190 },
191 cpulimit => {
192 optional => 1,
193 type => 'integer',
194 description => "Limit of CPU usage in per cent. Note if the computer has 2 CPUs, it has total of 200% CPU time. Value '0' indicates no CPU limit.\n\nNOTE: This option is currently ignored.",
195 minimum => 0,
196 default => 0,
197 },
198 cpuunits => {
199 optional => 1,
200 type => 'integer',
201 description => "CPU weight for a VM. Argument is used in the kernel fair scheduler. The larger the number is, the more CPU time this VM gets. Number is relative to weights of all the other running VMs.\n\nNOTE: You can disable fair-scheduler configuration by setting this to 0.",
202 minimum => 0,
203 maximum => 500000,
204 default => 1000,
205 },
206 memory => {
207 optional => 1,
208 type => 'integer',
7878afeb 209 description => "Amount of RAM for the VM in MB. This is the maximum available memory when you use the balloon device.",
1e3baf05
DM
210 minimum => 16,
211 default => 512,
212 },
13a48620
DA
213 balloon => {
214 optional => 1,
215 type => 'integer',
8b1accf7
DM
216 description => "Amount of target RAM for the VM in MB. Using zero disables the ballon driver.",
217 minimum => 0,
218 },
219 shares => {
220 optional => 1,
221 type => 'integer',
222 description => "Amount of memory shares for auto-ballooning. The larger the number is, the more memory this VM gets. Number is relative to weights of all other running VMs. Using zero disables auto-ballooning",
223 minimum => 0,
224 maximum => 50000,
225 default => 1000,
13a48620 226 },
1e3baf05
DM
227 keyboard => {
228 optional => 1,
229 type => 'string',
230 description => "Keybord layout for vnc server. Default is read from the datacenter configuration file.",
e95fe75f 231 enum => PVE::Tools::kvmkeymaplist(),
1e3baf05
DM
232 default => 'en-us',
233 },
234 name => {
235 optional => 1,
7fabe17d 236 type => 'string', format => 'dns-name',
1e3baf05
DM
237 description => "Set a name for the VM. Only used on the configuration web interface.",
238 },
cdd20088
AD
239 scsihw => {
240 optional => 1,
241 type => 'string',
242 description => "scsi controller model",
5b952ff5 243 enum => [qw(lsi lsi53c810 virtio-scsi-pci megasas pvscsi)],
cdd20088
AD
244 default => 'lsi',
245 },
1e3baf05
DM
246 description => {
247 optional => 1,
248 type => 'string',
0581fe4f 249 description => "Description for the VM. Only used on the configuration web interface. This is saved as comment inside the configuration file.",
1e3baf05
DM
250 },
251 ostype => {
252 optional => 1,
253 type => 'string',
6b9d84cf 254 enum => [qw(other wxp w2k w2k3 w2k8 wvista win7 win8 l24 l26 solaris)],
1e3baf05
DM
255 description => <<EODESC,
256Used to enable special optimization/features for specific
257operating systems:
258
259other => unspecified OS
260wxp => Microsoft Windows XP
261w2k => Microsoft Windows 2000
262w2k3 => Microsoft Windows 2003
263w2k8 => Microsoft Windows 2008
264wvista => Microsoft Windows Vista
265win7 => Microsoft Windows 7
a70ebde3 266win8 => Microsoft Windows 8/2012
1e3baf05
DM
267l24 => Linux 2.4 Kernel
268l26 => Linux 2.6/3.X Kernel
6b9d84cf 269solaris => solaris/opensolaris/openindiania kernel
1e3baf05 270
6b9d84cf 271other|l24|l26|solaris ... no special behaviour
a70ebde3 272wxp|w2k|w2k3|w2k8|wvista|win7|win8 ... use --localtime switch
1e3baf05
DM
273EODESC
274 },
275 boot => {
276 optional => 1,
277 type => 'string',
278 description => "Boot on floppy (a), hard disk (c), CD-ROM (d), or network (n).",
279 pattern => '[acdn]{1,4}',
32baffb4 280 default => 'cdn',
1e3baf05
DM
281 },
282 bootdisk => {
283 optional => 1,
284 type => 'string', format => 'pve-qm-bootdisk',
285 description => "Enable booting from specified disk.",
03e480fc 286 pattern => '(ide|sata|scsi|virtio)\d+',
1e3baf05
DM
287 },
288 smp => {
289 optional => 1,
290 type => 'integer',
291 description => "The number of CPUs. Please use option -sockets instead.",
292 minimum => 1,
293 default => 1,
294 },
295 sockets => {
296 optional => 1,
297 type => 'integer',
298 description => "The number of CPU sockets.",
299 minimum => 1,
300 default => 1,
301 },
302 cores => {
303 optional => 1,
304 type => 'integer',
305 description => "The number of cores per socket.",
306 minimum => 1,
307 default => 1,
308 },
8a010eae
AD
309 numa => {
310 optional => 1,
311 type => 'boolean',
312 description => "Enable/disable Numa.",
313 default => 0,
314 },
3bd18e48
AD
315 maxcpus => {
316 optional => 1,
317 type => 'integer',
318 description => "Maximum cpus for hotplug.",
319 minimum => 1,
320 default => 1,
321 },
1e3baf05
DM
322 acpi => {
323 optional => 1,
324 type => 'boolean',
325 description => "Enable/disable ACPI.",
326 default => 1,
327 },
bc84dcca 328 agent => {
ab6a046f
AD
329 optional => 1,
330 type => 'boolean',
331 description => "Enable/disable Qemu GuestAgent.",
be79c214 332 default => 0,
ab6a046f 333 },
1e3baf05
DM
334 kvm => {
335 optional => 1,
336 type => 'boolean',
337 description => "Enable/disable KVM hardware virtualization.",
338 default => 1,
339 },
340 tdf => {
341 optional => 1,
342 type => 'boolean',
8c559505
DM
343 description => "Enable/disable time drift fix.",
344 default => 0,
1e3baf05 345 },
19672434 346 localtime => {
1e3baf05
DM
347 optional => 1,
348 type => 'boolean',
349 description => "Set the real time clock to local time. This is enabled by default if ostype indicates a Microsoft OS.",
350 },
351 freeze => {
352 optional => 1,
353 type => 'boolean',
354 description => "Freeze CPU at startup (use 'c' monitor command to start execution).",
355 },
356 vga => {
357 optional => 1,
358 type => 'string',
ef5e2be2 359 description => "Select VGA type. If you want to use high resolution modes (>= 1280x1024x16) then you should use option 'std' or 'vmware'. Default is 'std' for win8/win7/w2k8, and 'cirrur' for other OS types. Option 'qxl' enables the SPICE display sever. You can also run without any graphic card using a serial devive as terminal.",
2fa3151e 360 enum => [qw(std cirrus vmware qxl serial0 serial1 serial2 serial3 qxl2 qxl3 qxl4)],
1e3baf05 361 },
0ea9541d
DM
362 watchdog => {
363 optional => 1,
364 type => 'string', format => 'pve-qm-watchdog',
365 typetext => '[[model=]i6300esb|ib700] [,[action=]reset|shutdown|poweroff|pause|debug|none]',
366 description => "Create a virtual hardware watchdog device. Once enabled (by a guest action), the watchdog must be periodically polled by an agent inside the guest or else the guest will be restarted (or execute the action specified)",
367 },
1e3baf05
DM
368 startdate => {
369 optional => 1,
19672434 370 type => 'string',
1e3baf05
DM
371 typetext => "(now | YYYY-MM-DD | YYYY-MM-DDTHH:MM:SS)",
372 description => "Set the initial date of the real time clock. Valid format for date are: 'now' or '2006-06-17T16:01:21' or '2006-06-17'.",
373 pattern => '(now|\d{4}-\d{1,2}-\d{1,2}(T\d{1,2}:\d{1,2}:\d{1,2})?)',
374 default => 'now',
375 },
59411c4e
DM
376 startup => {
377 optional => 1,
378 type => 'string', format => 'pve-qm-startup',
379 typetext => '[[order=]\d+] [,up=\d+] [,down=\d+] ',
380 description => "Startup and shutdown behavior. Order is a non-negative number defining the general startup order. Shutdown in done with reverse ordering. Additionally you can set the 'up' or 'down' delay in seconds, which specifies a delay to wait before the next VM is started or stopped.",
381 },
68eda3ab
AD
382 template => {
383 optional => 1,
384 type => 'boolean',
385 description => "Enable/disable Template.",
386 default => 0,
387 },
1e3baf05
DM
388 args => {
389 optional => 1,
390 type => 'string',
391 description => <<EODESCR,
392Note: this option is for experts only. It allows you to pass arbitrary arguments to kvm, for example:
393
394args: -no-reboot -no-hpet
395EODESCR
396 },
397 tablet => {
398 optional => 1,
399 type => 'boolean',
400 default => 1,
5acbfe9e 401 description => "Enable/disable the usb tablet device. This device is usually needed to allow absolute mouse positioning with VNC. Else the mouse runs out of sync with normal VNC clients. If you're running lots of console-only guests on one host, you may consider disabling this to save some context switches. This is turned of by default if you use spice (vga=qxl).",
1e3baf05
DM
402 },
403 migrate_speed => {
404 optional => 1,
405 type => 'integer',
406 description => "Set maximum speed (in MB/s) for migrations. Value 0 is no limit.",
407 minimum => 0,
408 default => 0,
409 },
410 migrate_downtime => {
411 optional => 1,
04432191 412 type => 'number',
1e3baf05
DM
413 description => "Set maximum tolerated downtime (in seconds) for migrations.",
414 minimum => 0,
04432191 415 default => 0.1,
1e3baf05
DM
416 },
417 cdrom => {
418 optional => 1,
419 type => 'string', format => 'pve-qm-drive',
420 typetext => 'volume',
421 description => "This is an alias for option -ide2",
422 },
423 cpu => {
424 optional => 1,
425 description => "Emulated CPU type.",
426 type => 'string',
3aefd6fd 427 enum => [ qw(486 athlon pentium pentium2 pentium3 coreduo core2duo kvm32 kvm64 qemu32 qemu64 phenom Conroe Penryn Nehalem Westmere SandyBridge Haswell Broadwell Opteron_G1 Opteron_G2 Opteron_G3 Opteron_G4 Opteron_G5 host) ],
eac6899d 428 default => 'kvm64',
1e3baf05 429 },
b7ba6b79
DM
430 parent => get_standard_option('pve-snapshot-name', {
431 optional => 1,
432 description => "Parent snapshot name. This is used internally, and should not be modified.",
433 }),
982c7f12
DM
434 snaptime => {
435 optional => 1,
436 description => "Timestamp for snapshots.",
437 type => 'integer',
438 minimum => 0,
439 },
18bfb361
DM
440 vmstate => {
441 optional => 1,
442 type => 'string', format => 'pve-volume-id',
443 description => "Reference to a volume which stores the VM state. This is used internally for snapshots.",
444 },
3bafc510
DM
445 machine => {
446 description => "Specific the Qemu machine type.",
447 type => 'string',
448 pattern => '(pc|pc(-i440fx)?-\d+\.\d+|q35|pc-q35-\d+\.\d+)',
449 maxLength => 40,
450 optional => 1,
451 },
2796e7d5
DM
452 smbios1 => {
453 description => "Specify SMBIOS type 1 fields.",
454 type => 'string', format => 'pve-qm-smbios1',
455 typetext => "[manufacturer=str][,product=str][,version=str][,serial=str] [,uuid=uuid][,sku=str][,family=str]",
456 maxLength => 256,
457 optional => 1,
458 },
1e3baf05
DM
459};
460
461# what about other qemu settings ?
462#cpu => 'string',
463#machine => 'string',
464#fda => 'file',
465#fdb => 'file',
466#mtdblock => 'file',
467#sd => 'file',
468#pflash => 'file',
469#snapshot => 'bool',
470#bootp => 'file',
471##tftp => 'dir',
472##smb => 'dir',
473#kernel => 'file',
474#append => 'string',
475#initrd => 'file',
476##soundhw => 'string',
477
478while (my ($k, $v) = each %$confdesc) {
479 PVE::JSONSchema::register_standard_option("pve-qm-$k", $v);
480}
481
482my $MAX_IDE_DISKS = 4;
f62db2a4 483my $MAX_SCSI_DISKS = 14;
a2650619 484my $MAX_VIRTIO_DISKS = 16;
cdb0931f 485my $MAX_SATA_DISKS = 6;
1e3baf05 486my $MAX_USB_DEVICES = 5;
5bdcf937 487my $MAX_NETS = 32;
1e3baf05 488my $MAX_UNUSED_DISKS = 8;
5cffb2d2 489my $MAX_HOSTPCI_DEVICES = 4;
bae179aa 490my $MAX_SERIAL_PORTS = 4;
1989a89c 491my $MAX_PARALLEL_PORTS = 3;
2ed5d572
AD
492my $MAX_NUMA = 8;
493
494my $numadesc = {
495 optional => 1,
496 type => 'string', format => 'pve-qm-numanode',
497 typetext => "cpus=<id[-id],memory=<mb>[[,hostnodes=<id[-id]>][,policy=<preferred|bind|interleave>]]",
498 description => "numa topology",
499};
500PVE::JSONSchema::register_standard_option("pve-qm-numanode", $numadesc);
501
502for (my $i = 0; $i < $MAX_NUMA; $i++) {
503 $confdesc->{"numa$i"} = $numadesc;
504}
1e3baf05
DM
505
506my $nic_model_list = ['rtl8139', 'ne2k_pci', 'e1000', 'pcnet', 'virtio',
e4c6e0b8 507 'ne2k_isa', 'i82551', 'i82557b', 'i82559er', 'vmxnet3'];
6b64503e 508my $nic_model_list_txt = join(' ', sort @$nic_model_list);
1e3baf05 509
1e3baf05
DM
510my $netdesc = {
511 optional => 1,
512 type => 'string', format => 'pve-qm-net',
a9410357 513 typetext => "MODEL=XX:XX:XX:XX:XX:XX [,bridge=<dev>][,queues=<nbqueues>][,rate=<mbps>][,tag=<vlanid>][,firewall=0|1]",
1e3baf05 514 description => <<EODESCR,
19672434 515Specify network devices.
1e3baf05
DM
516
517MODEL is one of: $nic_model_list_txt
518
19672434 519XX:XX:XX:XX:XX:XX should be an unique MAC address. This is
1e3baf05
DM
520automatically generated if not specified.
521
522The bridge parameter can be used to automatically add the interface to a bridge device. The Proxmox VE standard bridge is called 'vmbr0'.
523
524Option 'rate' is used to limit traffic bandwidth from and to this interface. It is specified as floating point number, unit is 'Megabytes per second'.
525
526If you specify no bridge, we create a kvm 'user' (NATed) network device, which provides DHCP and DNS services. The following addresses are used:
527
52810.0.2.2 Gateway
52910.0.2.3 DNS Server
53010.0.2.4 SMB Server
531
532The DHCP server assign addresses to the guest starting from 10.0.2.15.
533
534EODESCR
535};
536PVE::JSONSchema::register_standard_option("pve-qm-net", $netdesc);
537
538for (my $i = 0; $i < $MAX_NETS; $i++) {
539 $confdesc->{"net$i"} = $netdesc;
540}
541
542my $drivename_hash;
19672434 543
1e3baf05
DM
544my $idedesc = {
545 optional => 1,
546 type => 'string', format => 'pve-qm-drive',
8d87f8aa 547 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
3c770faa 548 description => "Use volume as IDE hard disk or CD-ROM (n is 0 to " .($MAX_IDE_DISKS -1) . ").",
1e3baf05
DM
549};
550PVE::JSONSchema::register_standard_option("pve-qm-ide", $idedesc);
551
552my $scsidesc = {
553 optional => 1,
554 type => 'string', format => 'pve-qm-drive',
8d87f8aa 555 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
3c770faa 556 description => "Use volume as SCSI hard disk or CD-ROM (n is 0 to " . ($MAX_SCSI_DISKS - 1) . ").",
1e3baf05
DM
557};
558PVE::JSONSchema::register_standard_option("pve-qm-scsi", $scsidesc);
559
cdb0931f
DA
560my $satadesc = {
561 optional => 1,
562 type => 'string', format => 'pve-qm-drive',
8d87f8aa 563 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
3c770faa 564 description => "Use volume as SATA hard disk or CD-ROM (n is 0 to " . ($MAX_SATA_DISKS - 1). ").",
cdb0931f
DA
565};
566PVE::JSONSchema::register_standard_option("pve-qm-sata", $satadesc);
567
1e3baf05
DM
568my $virtiodesc = {
569 optional => 1,
570 type => 'string', format => 'pve-qm-drive',
8d87f8aa 571 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
3c770faa 572 description => "Use volume as VIRTIO hard disk (n is 0 to " . ($MAX_VIRTIO_DISKS - 1) . ").",
1e3baf05
DM
573};
574PVE::JSONSchema::register_standard_option("pve-qm-virtio", $virtiodesc);
575
576my $usbdesc = {
577 optional => 1,
578 type => 'string', format => 'pve-qm-usb-device',
80401dd8 579 typetext => 'host=HOSTUSBDEVICE|spice',
1e3baf05 580 description => <<EODESCR,
2fe1a152 581Configure an USB device (n is 0 to 4). This can be used to
1e3baf05
DM
582pass-through usb devices to the guest. HOSTUSBDEVICE syntax is:
583
19672434 584'bus-port(.port)*' (decimal numbers) or
1e3baf05
DM
585'vendor_id:product_id' (hexadeciaml numbers)
586
19672434 587You can use the 'lsusb -t' command to list existing usb devices.
1e3baf05
DM
588
589Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
590
80401dd8
DM
591The value 'spice' can be used to add a usb redirection devices for spice.
592
1e3baf05
DM
593EODESCR
594};
595PVE::JSONSchema::register_standard_option("pve-qm-usb", $usbdesc);
596
040b06b7
DA
597my $hostpcidesc = {
598 optional => 1,
599 type => 'string', format => 'pve-qm-hostpci',
2e3b7e2a 600 typetext => "[host=]HOSTPCIDEVICE [,driver=kvm|vfio] [,rombar=on|off] [,pcie=0|1] [,x-vga=on|off]",
040b06b7
DA
601 description => <<EODESCR,
602Map host pci devices. HOSTPCIDEVICE syntax is:
603
604'bus:dev.func' (hexadecimal numbers)
605
606You can us the 'lspci' command to list existing pci devices.
607
0cea6a01
DM
608The 'rombar' option determines whether or not the device's ROM will be visible in the guest's memory map (default is 'on').
609
040b06b7
DA
610Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
611
612Experimental: user reported problems with this option.
613EODESCR
614};
615PVE::JSONSchema::register_standard_option("pve-qm-hostpci", $hostpcidesc);
616
bae179aa
DA
617my $serialdesc = {
618 optional => 1,
ca0cef26 619 type => 'string',
1b0b51ed 620 pattern => '(/dev/.+|socket)',
bae179aa 621 description => <<EODESCR,
1b0b51ed 622Create a serial device inside the VM (n is 0 to 3), and pass through a host serial device (i.e. /dev/ttyS0), or create a unix socket on the host side (use 'qm terminal' to open a terminal connection).
bae179aa
DA
623
624Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
625
626Experimental: user reported problems with this option.
627EODESCR
628};
bae179aa 629
1989a89c
DA
630my $paralleldesc= {
631 optional => 1,
ca0cef26 632 type => 'string',
9ecc8431 633 pattern => '/dev/parport\d+|/dev/usb/lp\d+',
1989a89c 634 description => <<EODESCR,
19672434 635Map host parallel devices (n is 0 to 2).
1989a89c
DA
636
637Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
638
639Experimental: user reported problems with this option.
640EODESCR
641};
1989a89c
DA
642
643for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
644 $confdesc->{"parallel$i"} = $paralleldesc;
645}
646
bae179aa
DA
647for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
648 $confdesc->{"serial$i"} = $serialdesc;
649}
650
040b06b7
DA
651for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
652 $confdesc->{"hostpci$i"} = $hostpcidesc;
653}
1e3baf05
DM
654
655for (my $i = 0; $i < $MAX_IDE_DISKS; $i++) {
656 $drivename_hash->{"ide$i"} = 1;
657 $confdesc->{"ide$i"} = $idedesc;
658}
659
cdb0931f
DA
660for (my $i = 0; $i < $MAX_SATA_DISKS; $i++) {
661 $drivename_hash->{"sata$i"} = 1;
662 $confdesc->{"sata$i"} = $satadesc;
663}
664
1e3baf05
DM
665for (my $i = 0; $i < $MAX_SCSI_DISKS; $i++) {
666 $drivename_hash->{"scsi$i"} = 1;
667 $confdesc->{"scsi$i"} = $scsidesc ;
668}
669
670for (my $i = 0; $i < $MAX_VIRTIO_DISKS; $i++) {
671 $drivename_hash->{"virtio$i"} = 1;
672 $confdesc->{"virtio$i"} = $virtiodesc;
673}
674
675for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
676 $confdesc->{"usb$i"} = $usbdesc;
677}
678
679my $unuseddesc = {
680 optional => 1,
681 type => 'string', format => 'pve-volume-id',
682 description => "Reference to unused volumes.",
683};
684
685for (my $i = 0; $i < $MAX_UNUSED_DISKS; $i++) {
686 $confdesc->{"unused$i"} = $unuseddesc;
687}
688
# Cached result of kvm_version(); 0 means "not determined yet".
my $kvm_api_version = 0;

# Return the value obtained from the KVM_GET_API_VERSION ioctl on /dev/kvm.
# A non-zero result is cached for later calls. Returns 0 when /dev/kvm
# cannot be opened or the ioctl yields a false value.
sub kvm_version {

    if (!$kvm_api_version) {
        my $fh = IO::File->new("</dev/kvm");
        return 0 if !$fh;

        my $v = $fh->ioctl(KVM_GET_API_VERSION(), 0);
        $kvm_api_version = $v if $v;

        $fh->close();
    }

    return $kvm_api_version;
}
706
# Cached result of kvm_user_version().
my $kvm_user_version;

# Return the version string parsed from the output of `kvm -help`, or the
# literal 'unknown' when the output does not start with the expected banner.
# The result (including 'unknown') is cached after the first call.
sub kvm_user_version {

    return $kvm_user_version if $kvm_user_version;

    my $help_output = `kvm -help 2>/dev/null`;

    # The second capture group holds the dotted version number.
    $kvm_user_version =
        ($help_output =~ m/^QEMU( PC)? emulator version (\d+\.\d+(\.\d+)?)[,\s]/)
        ? $2
        : 'unknown';

    return $kvm_user_version;
}
724
725my $kernel_has_vhost_net = -c '/dev/vhost-net';
726
# Return every valid drive option name ("ide0", "scsi3", ...).
# order is important - used to autoselect boot disk
sub disknames {
    # Expands one bus prefix into "<prefix>0" .. "<prefix><max-1>".
    my $series = sub {
        my ($prefix, $max) = @_;
        return map { "$prefix$_" } (0 .. ($max - 1));
    };

    return ($series->('ide', $MAX_IDE_DISKS),
            $series->('scsi', $MAX_SCSI_DISKS),
            $series->('virtio', $MAX_VIRTIO_DISKS),
            $series->('sata', $MAX_SATA_DISKS));
}
734
# True when $dev is one of the drive names registered in $drivename_hash
# (the ideN / sataN / scsiN / virtioN entries filled in at load time).
sub valid_drivename {
    my ($dev) = @_;

    my $entry = $drivename_hash->{$dev};

    return defined($entry);
}
740
# True when $key names an option described in $confdesc.
sub option_exists {
    my ($key) = @_;

    my $description = $confdesc->{$key};

    return defined($description);
}
1e3baf05
DM
745
# Accessor for the list of supported NIC model names.
# Returns the module's own array reference (not a copy).
sub nic_models {
    my $models = $nic_model_list;

    return $models;
}
749
# Return a hash reference mapping 'ostype' identifiers to human readable
# operating system names. A fresh hash is built on every call.
sub os_list_description {

    return {
        other => 'Other',
        wxp => 'Windows XP',
        w2k => 'Windows 2000',
        w2k3 => 'Windows 2003', # stray comma after '=>' removed
        w2k8 => 'Windows 2008',
        wvista => 'Windows Vista',
        win7 => 'Windows 7',
        win8 => 'Windows 8/2012',
        l24 => 'Linux 2.4',
        l26 => 'Linux 2.6',
    };
}
765
1e3baf05
DM
# Cached result of get_cdrom_path().
my $cdrom_path;

# Return the first of /dev/cdrom, /dev/cdrom1, /dev/cdrom2 that is a symbolic
# link, caching the answer for later calls. Returns undef when none of the
# candidates is a symlink (previously the sub fell off the end and returned
# the false value of the last file test).
sub get_cdrom_path {

    return $cdrom_path if $cdrom_path;

    foreach my $candidate ("/dev/cdrom", "/dev/cdrom1", "/dev/cdrom2") {
        return $cdrom_path = $candidate if -l $candidate;
    }

    return undef;
}
776
# Resolve a CD-ROM drive specification to a filesystem path:
#   'cdrom'            -> result of get_cdrom_path()
#   'none'             -> empty string
#   absolute path      -> returned unchanged
#   anything else      -> passed to PVE::Storage::path() with $storecfg
# $vmid is accepted but not used here.
sub get_iso_path {
    my ($storecfg, $vmid, $cdrom) = @_;

    return get_cdrom_path() if $cdrom eq 'cdrom';
    return '' if $cdrom eq 'none';
    return $cdrom if $cdrom =~ m|^/|;

    return PVE::Storage::path($storecfg, $cdrom);
}
790
# Try to convert old style file names to volume IDs.
#
# 'none', 'cdrom', '/dev/...' paths and anything already shaped like
# 'storage:volume' are returned untouched. A bare file name (no slash) is
# mapped onto the 'local' storage: 'local:iso/<file>' when $media is 'cdrom',
# otherwise 'local:<vmid>/<file>'. Any other name containing a slash cannot
# be converted and yields undef.
sub filename_to_volume_id {
    my ($vmid, $file, $media) = @_;

    # Nothing to convert for special names, device nodes and volume IDs.
    return $file if $file eq 'none' || $file eq 'cdrom';
    return $file if $file =~ m|^/dev/.+| || $file =~ m/^([^:]+):(.+)$/;

    return undef if $file =~ m|/|;

    my $is_cdrom = $media && $media eq 'cdrom';

    return $is_cdrom ? "local:iso/$file" : "local:$vmid/$file";
}
809
# Check that the storage content type $vtype matches what the drive's
# $media setting requires ('disk' -> 'images', 'cdrom' -> 'iso').
# Returns silently when $media is unset or the types agree, dies with
# "internal error" on an unknown media value, and raises a parameter
# exception keyed by $opt on a mismatch.
sub verify_media_type {
    my ($opt, $vtype, $media) = @_;

    return if !$media;

    my %expected_type_for = (
        disk => 'images',
        cdrom => 'iso',
    );

    my $etype = $expected_type_for{$media};
    die "internal error" if !defined($etype);

    if ($vtype ne $etype) {
        raise_param_exc({ $opt => "unexpected media type ($vtype != $etype)" });
    }

    return;
}
828
# Normalise $drive->{file} and $drive->{media} in place.
#
# A file value that is neither 'cdrom'/'none', a /dev/ path, a
# 'storage:volume' ID nor a plain number is treated as a filesystem path and
# translated via PVE::Storage::path_to_volume_id(); failure to translate
# raises a parameter exception keyed by $opt. Media defaults to 'cdrom' for
# iso volumes and for the special 'cdrom'/'none' files.
sub cleanup_drive_path {
    my ($opt, $storecfg, $drive) = @_;

    # try to convert filesystem paths to volume IDs
    my $file = $drive->{file};
    my $looks_like_path =
        $file !~ m/^(cdrom|none)$/ &&
        $file !~ m|^/dev/.+| &&
        $file !~ m/^([^:]+):(.+)$/ &&
        $file !~ m/^\d+$/;

    if ($looks_like_path) {
        my ($vtype, $volid) = PVE::Storage::path_to_volume_id($storecfg, $drive->{file});
        if (!$vtype) {
            raise_param_exc({ $opt => "unable to associate path '$drive->{file}' to any storage"});
        }
        if (!$drive->{media} && $vtype eq 'iso') {
            $drive->{media} = 'cdrom';
        }
        verify_media_type($opt, $vtype, $drive->{media});
        $drive->{file} = $volid;
    }

    $drive->{media} = 'cdrom' if !$drive->{media} && $drive->{file} =~ m/^(cdrom|none)$/;
}
# Write a fresh configuration file for $vmid from the $settings hash.
# Dies if the file already exists. Missing 'name' and 'memory' settings are
# filled in ($settings is modified in place). Only options known to
# $confdesc and carrying a true value are written, one "key: value" line
# each. No locking is done here.
sub create_conf_nolock {
    my ($vmid, $settings) = @_;

    my $filename = config_file($vmid);

    if (-f $filename) {
        die "configuration file '$filename' already exists\n";
    }

    my $defaults = load_defaults();

    $settings->{name} ||= "vm$vmid";
    $settings->{memory} ||= $defaults->{memory};

    # Keep known options with a true value, then render them as lines.
    my @lines =
        map { "$_: $settings->{$_}\n" }
        grep { $confdesc->{$_} && $settings->{$_} }
        keys %$settings;

    PVE::Tools::file_set_contents($filename, join('', @lines));
}
872
f36ed4f4
DM
# Parse a size string such as "512", "1.5M" or "4G" into a whole number.
# The optional suffix K, M or G multiplies by 1024, 1024^2 or 1024^3; the
# result is truncated with int(). Returns undef for anything that does not
# match that format.
my $parse_size = sub {
    my ($value) = @_;

    if ($value =~ m/^(\d+(\.\d+)?)([KMG])?$/) {
        my ($size, $unit) = ($1, $3);

        my %multiplier_for = (
            K => 1024,
            M => 1024 * 1024,
            G => 1024 * 1024 * 1024,
        );
        $size = $size * $multiplier_for{$unit} if $unit;

        return int($size);
    }

    return undef;
};
889
# Render a size with the largest of the K/M/G suffixes that divides it
# evenly by 1024 at every step. Sizes that are not a multiple of 1024 are
# returned as the plain integer; sizes divisible all the way (including 0)
# end up with the G suffix.
my $format_size = sub {
    my ($size) = @_;

    my $amount = int($size);
    my $suffix = '';

    foreach my $next_suffix (qw(K M G)) {
        my $scaled = int($amount / 1024);

        # Stop as soon as the next step would lose precision.
        if ($scaled * 1024 != $amount) {
            return $suffix ? "${amount}${suffix}" : $amount;
        }

        ($amount, $suffix) = ($scaled, $next_suffix);
    }

    return "${amount}${suffix}";
};
906
1e3baf05
DM
# ideX = [volume=]volume-id[,media=d][,cyls=c,heads=h,secs=s[,trans=t]]
#        [,snapshot=on|off][,cache=off|none|writethrough|writeback|unsafe|directsync]
#        [,format=f][,backup=yes|no]
#        [,rerror=ignore|report|stop][,werror=enospc|ignore|report|stop]
#        [,aio=native|threads][,discard=ignore|on]
#        [,mbps=n][,mbps_rd=n][,mbps_wr=n][,mbps_max=n][,mbps_rd_max=n][,mbps_wr_max=n]
#        [,iops=n][,iops_rd=n][,iops_wr=n][,iops_max=n][,iops_rd_max=n][,iops_wr_max=n]
#        [,size=n[K|M|G]]
#
# Parse a drive property string into a hash ref.
#
# $key  - option name such as 'ide0' (split into 'interface' and 'index'),
#         or undef when only the value is verified
# $data - comma separated drive description
#
# bps, bps_rd and bps_wr are accepted as input aliases and stored as
# mbps, mbps_rd and mbps_wr (value divided by 1024*1024, three decimals).
# 'size' is converted to an integer with $parse_size.
#
# Returns the hash ref, or undef if anything fails validation.
sub parse_drive {
    my ($key, $data) = @_;

    my $res = {};

    # $key may be undefined - used to verify JSON parameters
    if (!defined($key)) {
        $res->{interface} = 'unknown'; # should not harm when used to verify parameters
        $res->{index} = 0;
    } elsif ($key =~ m/^([^\d]+)(\d+)$/) {
        $res->{interface} = $1;
        $res->{index} = $2;
    } else {
        return undef;
    }

    foreach my $p (split (/,/, $data)) {
        next if $p =~ m/^\s*$/;

        if ($p =~ m/^(file|volume|cyls|heads|secs|trans|media|snapshot|cache|format|rerror|werror|backup|aio|bps|mbps|mbps_max|bps_rd|mbps_rd|mbps_rd_max|bps_wr|mbps_wr|mbps_wr_max|iops|iops_max|iops_rd|iops_rd_max|iops_wr|iops_wr_max|size|discard)=(.+)$/) {
            my ($k, $v) = ($1, $2);

            $k = 'file' if $k eq 'volume';

            if ($k eq 'bps' || $k eq 'bps_rd' || $k eq 'bps_wr') {
                # the value is used in arithmetic below, so it has to be
                # digits only (anchored at both ends)
                return undef if !$v || $v !~ m/^\d+$/;
                $k = "m$k";
                $v = sprintf("%.3f", $v / (1024*1024));
            }

            # checked after alias normalization so that e.g. 'mbps=..,bps=..'
            # is detected as a duplicate as well
            return undef if defined $res->{$k};

            $res->{$k} = $v;
        } else {
            # a single bare word (no '=') is taken as the volume
            if (!$res->{file} && $p !~ m/=/) {
                $res->{file} = $p;
            } else {
                return undef;
            }
        }
    }

    return undef if !$res->{file};

    # a known image file extension determines the format
    if ($res->{file} =~ m/\.(raw|cow|qcow|qcow2|vmdk|cloop)$/) {
        $res->{format} = $1;
    }

    my $uint = qr/^\d+$/;
    my $decimal = qr/^\d+(\.\d+)?$/;

    # allowed value pattern per option; only set (true) values are checked
    my %valid = (
        cache => qr/^(off|none|writethrough|writeback|unsafe|directsync)$/,
        snapshot => qr/^(on|off)$/,
        cyls => $uint,
        heads => $uint,
        secs => $uint,
        media => qr/^(disk|cdrom)$/,
        trans => qr/^(none|lba|auto)$/,
        format => qr/^(raw|cow|qcow|qcow2|vmdk|cloop)$/,
        rerror => qr/^(ignore|report|stop)$/,
        werror => qr/^(enospc|ignore|report|stop)$/,
        backup => qr/^(yes|no)$/,
        aio => qr/^(native|threads)$/,
        discard => qr/^(ignore|on)$/,
        mbps => $decimal,
        mbps_max => $decimal,
        mbps_rd => $decimal,
        mbps_rd_max => $decimal,
        mbps_wr => $decimal,
        mbps_wr_max => $decimal,
        iops => $uint,
        iops_max => $uint,
        iops_rd => $uint,
        iops_rd_max => $uint,
        iops_wr => $uint,
        iops_wr_max => $uint,
    );

    foreach my $opt (keys %valid) {
        return undef if $res->{$opt} && $res->{$opt} !~ $valid{$opt};
    }

    # a total limit excludes separate read/write limits
    return undef if $res->{mbps} && ($res->{mbps_rd} || $res->{mbps_wr});
    return undef if $res->{iops} && ($res->{iops_rd} || $res->{iops_wr});

    if ($res->{size}) {
        return undef if !defined($res->{size} = &$parse_size($res->{size}));
    }

    if ($res->{media} && ($res->{media} eq 'cdrom')) {
        return undef if $res->{snapshot} || $res->{trans} || $res->{format};
        return undef if $res->{heads} || $res->{secs} || $res->{cyls};
        return undef if $res->{interface} eq 'virtio';
    }

    # rerror does not work with scsi drives
    if ($res->{rerror}) {
        return undef if $res->{interface} eq 'scsi';
    }

    return $res;
}
1013
my @qemu_drive_options = qw(heads secs cyls trans media format cache snapshot rerror werror aio discard iops iops_rd iops_wr iops_max iops_rd_max iops_wr_max);

# Turn a parsed drive hash back into its property string: the volume,
# then every option with a true value as ",name=value", then the size
# formatted with $format_size. $vmid is accepted but not used here.
sub print_drive {
    my ($vmid, $drive) = @_;

    my @names = (@qemu_drive_options, 'mbps', 'mbps_rd', 'mbps_wr', 'mbps_max', 'mbps_rd_max', 'mbps_wr_max', 'backup');

    my $text = "$drive->{file}";
    $text .= join('', map { ",$_=$drive->{$_}" } grep { $drive->{$_} } @names);
    $text .= ",size=" . $format_size->($drive->{size}) if $drive->{size};

    return $text;
}
1030
28ef82d3
DM
# Query a device through the SCSI generic (sg) ioctl interface.
#
# $fh    - open file handle of the device
# $noerr - when true, return undef on failure instead of dying
#
# Returns a hash ref with 'vendor', 'product', 'revision' (taken from the
# 36 byte response buffer), 'removable' (bit 7 of response byte 1) and
# 'type' (low 5 bits of response byte 0).
sub scsi_inquiry {
    my($fh, $noerr) = @_;

    my $SG_IO = 0x2285;
    my $SG_GET_VERSION_NUM = 0x2282;

    my $versionbuf = "\x00" x 8;
    my $ret = ioctl($fh, $SG_GET_VERSION_NUM, $versionbuf);
    if (!$ret) {
        die "scsi ioctl SG_GET_VERSION_NUM failed - $!\n" if !$noerr;
        return undef;
    }
    my $version = unpack("I", $versionbuf);
    if ($version < 30000) {
        die "scsi generic interface too old\n" if !$noerr;
        return undef;
    }

    my $buf = "\x00" x 36;
    my $sensebuf = "\x00" x 8;
    # 6 byte command: opcode 0x12, allocation length 36 (size of $buf)
    my $cmd = pack("C x3 C x1", 0x12, 36);

    # see /usr/include/scsi/sg.h
    my $sg_io_hdr_t = "i i C C s I P P P I I i P C C C C S S i I I";

    # Only the leading fields are supplied. The 'P' entries pack pointers
    # to $buf, $cmd and $sensebuf, so the ioctl fills $buf in place.
    my $packet = pack($sg_io_hdr_t, ord('S'), -3, length($cmd),
                      length($sensebuf), 0, length($buf), $buf,
                      $cmd, $sensebuf, 6000);

    $ret = ioctl($fh, $SG_IO, $packet);
    if (!$ret) {
        die "scsi ioctl SG_IO failed - $!\n" if !$noerr;
        return undef;
    }

    # fields 17 and 18 are the two 'S' (unsigned short) status members of
    # the header template above; any non-zero value is treated as failure
    my @hdr = unpack($sg_io_hdr_t, $packet);
    if ($hdr[17] || $hdr[18]) {
        die "scsi ioctl SG_IO status error - $!\n" if !$noerr;
        return undef;
    }

    my $res = {};
    (my $byte0, my $byte1, $res->{vendor},
     $res->{product}, $res->{revision}) = unpack("C C x6 A8 A16 A4", $buf);

    $res->{removable} = $byte1 & 128 ? 1 : 0;
    $res->{type} = $byte0 & 31;

    return $res;
}
1081
# Open $path read/write and run scsi_inquiry() on it with errors
# suppressed. Returns the inquiry result hash, or undef when the path
# cannot be opened or the inquiry fails.
sub path_is_scsi {
    my ($path) = @_;

    # pass the mode separately so the path is never parsed as part of
    # the open mode string
    my $fh = IO::File->new($path, '+<') || return undef;
    my $res = scsi_inquiry($fh, 1);
    close($fh);

    return $res;
}
1091
db656e5f
DM
# Return 1 when the 'machine' setting of $conf contains "q35", else 0.
sub machine_type_is_q35 {
    my ($conf) = @_;

    my $machine = $conf->{machine};
    return 0 if !$machine;

    return ($machine =~ m/q35/) ? 1 : 0;
}
1097
# Build the usb-tablet device string. The tablet is attached to the ehci
# bus on q35 machines and to the uhci bus otherwise.
sub print_tabletdevice_full {
    my ($conf) = @_;

    # we use uhci for old VMs because tablet driver was buggy in older qemu
    my $usbbus = 'uhci';
    $usbbus = 'ehci' if machine_type_is_q35($conf);

    return join(',', 'usb-tablet', 'id=tablet', "bus=$usbbus.0", 'port=1');
}
1108
# Build the device description string for one drive, depending on its
# interface (virtio, scsi, ide or sata). Dies for 'usb' and for unknown
# interface types.
sub print_drivedevice_full {
    my ($storecfg, $conf, $vmid, $drive, $bridges) = @_;

    my $iface = $drive->{interface};
    my $index = $drive->{index};
    my $name = "$iface$index";
    # every variant ends with the same drive/id pair
    my $ident = "drive=drive-$name,id=$name";

    my $device = '';

    if ($iface eq 'virtio') {
        my $pciaddr = print_pci_addr($name, $bridges);
        $device = "virtio-blk-pci,$ident$pciaddr";
        $device .= ",iothread=iothread0" if $conf->{iothread};
    } elsif ($iface eq 'scsi') {
        # no scsihw setting means the same as an lsi controller here
        my $is_lsi = !$conf->{scsihw} || ($conf->{scsihw} =~ m/^lsi/);
        my $maxdev = $is_lsi ? 7 : 256;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;

        my $devicetype = 'hd';
        if (drive_is_cdrom($drive)) {
            $devicetype = 'cd';
        } else {
            my $path = '';
            if ($drive->{file} =~ m|^/|) {
                $path = $drive->{file};
            } else {
                $path = PVE::Storage::path($storecfg, $drive->{file});
            }

            if ($path =~ m/^iscsi\:\/\//) {
                $devicetype = 'generic';
            } elsif (my $info = path_is_scsi($path)) {
                if ($info->{type} == 0) {
                    $devicetype = 'block';
                } elsif ($info->{type} == 1) { # tape
                    $devicetype = 'generic';
                }
            }
        }

        my $bus = "scsi-$devicetype,bus=scsihw$controller.0";
        if ($is_lsi) {
            $device = "$bus,scsi-id=$unit,$ident";
        } else {
            $device = "$bus,channel=0,scsi-id=0,lun=$index,$ident";
        }
    } elsif ($iface eq 'ide') {
        my $maxdev = 2;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;
        my $devicetype = ($drive->{media} && $drive->{media} eq 'cdrom') ? "cd" : "hd";

        $device = "ide-$devicetype,bus=ide.$controller,unit=$unit,$ident";
    } elsif ($iface eq 'sata') {
        my $controller = int($index / $MAX_SATA_DISKS);
        my $unit = $index % $MAX_SATA_DISKS;
        $device = "ide-drive,bus=ahci$controller.$unit,$ident";
    } elsif ($iface eq 'usb') {
        die "implement me";
        # -device ide-drive,bus=ide.1,unit=0,drive=drive-ide0-1-0,id=ide0-1-0
    } else {
        die "unsupported interface type";
    }

    $device .= ",bootindex=$drive->{bootindex}" if $drive->{bootindex};

    return $device;
}
1175
# Read /etc/iscsi/initiatorname.iscsi and return the value of the first
# "InitiatorName = ..." line. Returns undef when the file cannot be
# opened or contains no such line.
sub get_initiator_name {
    my $fh = IO::File->new('/etc/iscsi/initiatorname.iscsi') || return undef;

    my $initiator;
    while (defined(my $line = <$fh>)) {
        if ($line =~ m/^\s*InitiatorName\s*=\s*([\.\-:\w]+)/) {
            $initiator = $1;
            last;
        }
    }
    $fh->close();

    return $initiator;
}
1189
1e3baf05
DM
# Build the drive definition string ("file=...,if=none,id=drive-...")
# for one drive. mbps* limits are converted to bps* values. aio=native is
# added when no aio is set. Non-cdrom drives get cache=none when no cache
# is set, plus a detect-zeroes setting.
sub print_drive_full {
    my ($storecfg, $vmid, $drive) = @_;

    my $is_cdrom = drive_is_cdrom($drive);

    my @opts;
    foreach my $o (@qemu_drive_options) {
        next if $o eq 'bootindex';
        push @opts, "$o=$drive->{$o}" if $drive->{$o};
    }

    foreach my $o (qw(bps bps_rd bps_wr)) {
        my $v = $drive->{"m$o"};
        push @opts, "$o=" . int($v*1024*1024) if $v;
    }

    # use linux-aio by default (qemu default is threads)
    push @opts, "aio=native" if !$drive->{aio};

    my $volid = $drive->{file};
    my $path;
    if ($is_cdrom) {
        $path = get_iso_path($storecfg, $vmid, $volid);
    } elsif ($volid =~ m|^/|) {
        $path = $volid;
    } else {
        $path = PVE::Storage::path($storecfg, $volid);
    }

    if (!$is_cdrom) {
        push @opts, "cache=none" if !$drive->{cache};
        push @opts, "detect-zeroes=" . ($drive->{discard} ? "unmap" : "on");
    }

    my $opts = join('', map { ",$_" } @opts);
    my $pathinfo = $path ? "file=$path," : '';

    return "${pathinfo}if=none,id=drive-$drive->{interface}$drive->{index}$opts";
}
1228
# Build the network device string for one network device. The 'virtio'
# model is mapped to 'virtio-net-pci'; other models are used as is.
sub print_netdevice_full {
    my ($vmid, $conf, $net, $netid, $bridges) = @_;

    my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};

    my $is_virtio = $net->{model} eq 'virtio';
    my $device = $is_virtio ? 'virtio-net-pci' : $net->{model};

    # qemu > 0.15 always try to boot from network - we disable that by
    # not loading the pxe rom file
    my $extra = ($bootorder !~ m/n/) ? "romfile=," : '';
    my $pciaddr = print_pci_addr("$netid", $bridges);

    my $tmpstr = "$device,${extra}mac=$net->{macaddr},netdev=$netid$pciaddr,id=$netid";

    if ($net->{queues} && $net->{queues} > 1 && $is_virtio) {
        #Consider we have N queues, the number of vectors needed is 2*N + 2 (plus one config interrupt and control vq)
        my $vectors = $net->{queues} * 2 + 2;
        $tmpstr .= ",vectors=$vectors,mq=on";
    }

    $tmpstr .= ",bootindex=$net->{bootindex}" if $net->{bootindex};

    return $tmpstr;
}
1252
# Build the netdev backend string for network device $netid ("netN").
#
# A tap backend is used when the device has a bridge, otherwise a user
# mode backend. vhost is enabled for virtio devices when
# $kernel_has_vhost_net is set, and 'queues' is passed on for virtio
# devices.
#
# Dies if $netid is not of the form netN with N below $MAX_NETS, or if the
# resulting tap interface name would be 16 characters or longer.
sub print_netdev_full {
    my ($vmid, $conf, $net, $netid) = @_;

    # $i stays undefined for ids that do not look like "netN", so those
    # are rejected too instead of slipping through a numeric comparison
    my $i;
    if ($netid =~ m/^net(\d+)$/) {
        $i = int($1);
    }

    die "got strange net id '$netid'\n" if !defined($i) || $i >= ${MAX_NETS};

    my $ifname = "tap${vmid}i$i";

    # kvm uses TUNSETIFF ioctl, and that limits ifname length
    die "interface name '$ifname' is too long (max 15 character)\n"
        if length($ifname) >= 16;

    my $vhostparam = '';
    $vhostparam = ',vhost=on' if $kernel_has_vhost_net && $net->{model} eq 'virtio';

    my $vmname = $conf->{name} || "vm$vmid";

    my $netdev = "";

    if ($net->{bridge}) {
        $netdev = "type=tap,id=$netid,ifname=${ifname},script=/var/lib/qemu-server/pve-bridge,downscript=/var/lib/qemu-server/pve-bridgedown$vhostparam";
    } else {
        $netdev = "type=user,id=$netid,hostname=$vmname";
    }

    $netdev .= ",queues=$net->{queues}" if ($net->{queues} && $net->{model} eq 'virtio');

    return $netdev;
}
1e3baf05
DM
1286
# True when $drive is set and its 'media' is 'cdrom'; false otherwise.
sub drive_is_cdrom {
    my ($drive) = @_;

    return $drive if !$drive;

    my $media = $drive->{media};
    return $media if !$media;

    return $media eq 'cdrom';
}
1293
2ed5d572
AD
# Parse a comma separated numa description into a hash ref with the keys
# 'memory', 'policy', 'cpus' and 'hostnodes'. The latter two hold a
# { start, end } pair, where 'end' is undef for a single number.
# Returns undef on any unknown or malformed element.
sub parse_numa {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        if ($kvp =~ m/^cpus=(\d+)(-(\d+))?$/) {
            my ($first, $last) = ($1, $3);
            $res->{cpus}->{start} = $first;
            $res->{cpus}->{end} = $last;
        } elsif ($kvp =~ m/^hostnodes=(\d+)(-(\d+))?$/) {
            my ($first, $last) = ($1, $3);
            $res->{hostnodes}->{start} = $first;
            $res->{hostnodes}->{end} = $last;
        } elsif ($kvp =~ m/^memory=(\S+)$/) {
            $res->{memory} = $1;
        } elsif ($kvp =~ m/^policy=(preferred|bind|interleave)$/) {
            $res->{policy} = $1;
        } else {
            return undef;
        }
    }

    return $res;
}
1318
040b06b7
DA
# Parse a hostpci property string. A PCI address with a function number
# ("00:1f.2") is pushed onto the 'pciid' list. An address without one is
# looked up through lspci() and the result replaces 'pciid'. driver,
# rombar, x-vga and pcie settings are stored. Unknown elements only
# produce a warning. Returns undef when the value is empty or contains no
# PCI address.
sub parse_hostpci {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};
    my $found;

    foreach my $kv (split(/,/, $value)) {
        if ($kv =~ m/^(host=)?([a-f0-9]{2}:[a-f0-9]{2})(\.([a-f0-9]))?$/) {
            my ($id, $function) = ($2, $4);
            $found = 1;
            if (defined($function)) {
                push @{$res->{pciid}}, { id => $id , function => $function };
            } else {
                my $pcidevices = lspci($id);
                $res->{pciid} = $pcidevices->{$id};
            }
        } elsif ($kv =~ m/^driver=(kvm|vfio)$/) {
            $res->{driver} = $1;
        } elsif ($kv =~ m/^rombar=(on|off)$/) {
            $res->{rombar} = $1;
        } elsif ($kv =~ m/^x-vga=(on|off)$/) {
            $res->{'x-vga'} = $1;
        } elsif ($kv =~ m/^pcie=(\d+)$/) {
            $res->{pcie} = 1 if $1 == 1;
        } else {
            warn "unknown hostpci setting '$kv'\n";
        }
    }

    return undef if !$found;

    return $res;
}
1357
1e3baf05
DM
1358# netX: e1000=XX:XX:XX:XX:XX:XX,bridge=vmbr0,rate=<mbps>
# Parse a network property string into a hash ref with 'model' and
# 'macaddr' plus the optional bridge, queues, rate, tag and firewall
# values. The model is lower-cased and the MAC upper-cased; a random MAC
# is generated when none is given. Returns undef on an unknown element or
# when no model is present.
sub parse_net {
    my ($data) = @_;

    my $res = {};

    # plain "name=value" options: result key and the pattern capturing the value
    my @plain_options = (
        [ bridge => qr/^bridge=(\S+)$/ ],
        [ queues => qr/^queues=(\d+)$/ ],
        [ rate => qr/^rate=(\d+(\.\d+)?)$/ ],
        [ tag => qr/^tag=(\d+)$/ ],
        [ firewall => qr/^firewall=(\d+)$/ ],
    );

    KVP: foreach my $kvp (split(/,/, $data)) {
        if ($kvp =~ m/^(ne2k_pci|e1000|rtl8139|pcnet|virtio|ne2k_isa|i82551|i82557b|i82559er|vmxnet3)(=([0-9a-f]{2}(:[0-9a-f]{2}){5}))?$/i) {
            my ($model, $mac) = ($1, $3);
            $res->{model} = lc($model);
            $res->{macaddr} = defined($mac) ? uc($mac) : PVE::Tools::random_ether_addr();
            next KVP;
        }

        foreach my $entry (@plain_options) {
            my ($name, $pattern) = @$entry;
            if ($kvp =~ $pattern) {
                $res->{$name} = $1;
                next KVP;
            }
        }

        return undef;
    }

    return undef if !$res->{model};

    return $res;
}
1391
# Turn a parsed network hash back into its property string:
# "model[=mac][,bridge=..][,rate=..][,tag=..][,firewall=..][,queues=..]".
# Only options with a true value are printed.
sub print_net {
    my $net = shift;

    my $res = "$net->{model}";
    $res .= "=$net->{macaddr}" if $net->{macaddr};
    $res .= ",bridge=$net->{bridge}" if $net->{bridge};
    $res .= ",rate=$net->{rate}" if $net->{rate};
    $res .= ",tag=$net->{tag}" if $net->{tag};
    $res .= ",firewall=$net->{firewall}" if $net->{firewall};
    # parse_net() accepts 'queues', so print it as well - otherwise the
    # setting is lost whenever a value is parsed and printed again
    $res .= ",queues=$net->{queues}" if $net->{queues};

    return $res;
}
1404
# Re-write every netN entry of $settings through parse_net()/print_net(),
# so that entries without a MAC address get the one parse_net() fills in.
# Entries that fail to parse are left untouched.
sub add_random_macs {
    my ($settings) = @_;

    foreach my $opt (grep { $_ =~ m/^net(\d+)$/ } keys %$settings) {
        my $net = parse_net($settings->{$opt});
        $settings->{$opt} = print_net($net) if $net;
    }
}
1415
# Record $volid under the lowest free "unusedN" key of $config.
#
# Returns the key used, or nothing when the volume is already listed
# under some unusedN key. Dies when all $MAX_UNUSED_DISKS slots are taken.
sub add_unused_volume {
    my ($config, $volid) = @_;

    my $key;
    # walk downwards so that $key ends up as the lowest free slot
    for (my $ind = $MAX_UNUSED_DISKS - 1; $ind >= 0; $ind--) {
        my $test = "unused$ind";
        if (my $vid = $config->{$test}) {
            return if $vid eq $volid; # do not add duplicates
        } else {
            $key = $test;
        }
    }

    die "Too many unused volumes - please delete them first.\n" if !$key;

    $config->{$key} = $volid;

    return $key;
}
1435
055d554d
DM
# Return 1 when PVE::Storage::path() reports $vmid as owner of $volid.
# Values starting with '/' are never looked up, and errors raised by the
# lookup are ignored. Returns undef in every other case.
sub vm_is_volid_owner {
    my ($storecfg, $vmid, $volid) = @_;

    return undef if $volid =~ m|^/|;

    my ($path, $owner);
    eval { ($path, $owner) = PVE::Storage::path($storecfg, $volid); };

    return 1 if $owner && ($owner == $vmid);

    return undef;
}
1449
# Mark option $key for deletion: drop any pending value for it and add
# it to the comma separated pending 'delete' list (without duplicates).
sub vmconfig_delete_pending_option {
    my ($conf, $key) = @_;

    delete $conf->{pending}->{$key};

    my %to_delete = map { $_ => 1 }
        ($key, PVE::Tools::split_list($conf->{pending}->{delete}));

    $conf->{pending}->{delete} = join(',', keys %to_delete);
}
1460
# Remove option $key from the pending 'delete' list. The list entry
# itself is removed when nothing is left in it.
sub vmconfig_undelete_pending_option {
    my ($conf, $key) = @_;

    my %to_delete = map { $_ => 1 }
        PVE::Tools::split_list($conf->{pending}->{delete});
    delete $to_delete{$key};

    if (%to_delete) {
        $conf->{pending}->{delete} = join(',', keys %to_delete);
    } else {
        delete $conf->{pending}->{delete};
    }
}
1477
# Register the volume of $drive as unused in $conf, but only when the
# drive is not a cdrom and vm_is_volid_owner() confirms that VM $vmid
# owns the volume.
sub vmconfig_register_unused_drive {
    my ($storecfg, $vmid, $conf, $drive) = @_;

    if (!drive_is_cdrom($drive)) {
        my $volid = $drive->{file};
        if (vm_is_volid_owner($storecfg, $vmid, $volid)) {
            # add_unused_volume() takes exactly ($config, $volid)
            add_unused_volume($conf, $volid);
        }
    }
}
1488
c750e90a
DM
# Drop pending entries that would not change anything: pending values
# equal to the current value, and pending deletes of options that are not
# set. Returns 1 when something was removed, undef otherwise.
sub vmconfig_cleanup_pending {
    my ($conf) = @_;

    my $changes;

    # remove pending changes when nothing changed
    foreach my $opt (keys %{$conf->{pending}}) {
        next if !defined($conf->{$opt});
        next if $conf->{pending}->{$opt} ne $conf->{$opt};

        $changes = 1;
        delete $conf->{pending}->{$opt};
    }

    # remove delete if option is not set
    my %still_set;
    foreach my $opt (PVE::Tools::split_list($conf->{pending}->{delete})) {
        if (!defined($conf->{$opt})) {
            $changes = 1;
            next;
        }
        $still_set{$opt} = 1;
    }

    if (%still_set) {
        $conf->{pending}->{delete} = join(',', keys %still_set);
    } else {
        delete $conf->{pending}->{delete};
    }

    return $changes;
}
1520
2796e7d5
DM
# allowed smbios (type 1) options and the pattern each value must match
my $valid_smbios1_options = {
    manufacturer => '\S+',
    product => '\S+',
    version => '\S+',
    serial => '\S+',
    uuid => '[a-fA-F0-9]{8}(?:-[a-fA-F0-9]{4}){3}-[a-fA-F0-9]{12}',
    sku => '\S+',
    family => '\S+',
};

# smbios: [manufacturer=str][,product=str][,version=str][,serial=str][,uuid=uuid][,sku=str][,family=str]
#
# Parse an smbios1 property string into a hash ref of option => value.
# Returns undef when an element is not of the form key=value, uses an
# unknown key, or has a value that does not match the pattern for its key.
sub parse_smbios1 {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        return undef if $kvp !~ m/^(\S+)=(.+)$/;
        # split at the first '=' only, so a value that itself contains
        # '=' is kept whole instead of being cut off
        my ($k, $v) = split(/=/, $kvp, 2);
        return undef if !defined($k) || !defined($v);
        return undef if !$valid_smbios1_options->{$k};
        return undef if $v !~ m/^$valid_smbios1_options->{$k}$/;
        $res->{$k} = $v;
    }

    return $res;
}
1548
cd11416f
DM
# Turn an smbios1 hash back into a "key=value,key=value" string.
# Undefined values and keys not listed in $valid_smbios1_options are
# skipped. Keys are printed in sorted order so that the same settings
# always produce the same string.
sub print_smbios1 {
    my ($smbios1) = @_;

    my @pairs;
    foreach my $k (sort keys %$smbios1) {
        next if !defined($smbios1->{$k});
        next if !$valid_smbios1_options->{$k};
        push @pairs, "$k=$smbios1->{$k}";
    }

    return join(',', @pairs);
}
1561
2796e7d5
DM
PVE::JSONSchema::register_format('pve-qm-smbios1', \&verify_smbios1);
# Format check for 'pve-qm-smbios1': returns $value when parse_smbios1()
# accepts it. Otherwise returns undef if $noerr is set, else dies.
sub verify_smbios1 {
    my ($value, $noerr) = @_;

    if (!parse_smbios1($value)) {
        return undef if $noerr;
        die "unable to parse smbios (type 1) options\n";
    }

    return $value;
}
1572
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-bootdisk', \&verify_bootdisk);
# Format check for 'pve-qm-bootdisk': returns $value when
# valid_drivename() accepts it. Otherwise returns undef if $noerr is set,
# else dies.
sub verify_bootdisk {
    my ($value, $noerr) = @_;

    if (!valid_drivename($value)) {
        return undef if $noerr;
        die "invalid boot disk '$value'\n";
    }

    return $value;
}
1583
2ed5d572
AD
PVE::JSONSchema::register_format('pve-qm-numanode', \&verify_numa);
# Format check for 'pve-qm-numanode': returns $value when parse_numa()
# accepts it. Otherwise returns undef if $noerr is set, else dies.
sub verify_numa {
    my ($value, $noerr) = @_;

    if (!parse_numa($value)) {
        return undef if $noerr;
        die "unable to parse numa options\n";
    }

    return $value;
}
1594
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-net', \&verify_net);
# Format check for 'pve-qm-net': returns $value when parse_net() accepts
# it. Otherwise returns undef if $noerr is set, else dies.
sub verify_net {
    my ($value, $noerr) = @_;

    if (!parse_net($value)) {
        return undef if $noerr;
        die "unable to parse network options\n";
    }

    return $value;
}
1605
PVE::JSONSchema::register_format('pve-qm-drive', \&verify_drive);
# Format check for 'pve-qm-drive': returns $value when parse_drive()
# (called without a key) accepts it. Otherwise returns undef if $noerr is
# set, else dies.
sub verify_drive {
    my ($value, $noerr) = @_;

    if (!parse_drive(undef, $value)) {
        return undef if $noerr;
        die "unable to parse drive options\n";
    }

    return $value;
}
1616
PVE::JSONSchema::register_format('pve-qm-hostpci', \&verify_hostpci);
# Format check for 'pve-qm-hostpci': returns $value when parse_hostpci()
# accepts it. Otherwise returns undef if $noerr is set, else dies.
sub verify_hostpci {
    my ($value, $noerr) = @_;

    if (!parse_hostpci($value)) {
        return undef if $noerr;
        die "unable to parse pci id\n";
    }

    return $value;
}
1627
0ea9541d
DM
PVE::JSONSchema::register_format('pve-qm-watchdog', \&verify_watchdog);
# Format check for 'pve-qm-watchdog': returns $value when
# parse_watchdog() accepts it. Otherwise returns undef if $noerr is set,
# else dies.
sub verify_watchdog {
    my ($value, $noerr) = @_;

    if (!parse_watchdog($value)) {
        return undef if $noerr;
        die "unable to parse watchdog options\n";
    }

    return $value;
}
1638
# Parse a watchdog property string ("[model=]<model>[,[action=]<action>]")
# into a hash ref with 'model' and/or 'action'. Returns undef for an
# empty value or when an element matches neither list.
sub parse_watchdog {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};

    foreach my $p (grep { $_ !~ m/^\s*$/ } split(/,/, $value)) {
        my ($name, $setting);
        if ($p =~ m/^(model=)?(i6300esb|ib700)$/) {
            ($name, $setting) = ('model', $2);
        } elsif ($p =~ m/^(action=)?(reset|shutdown|poweroff|pause|debug|none)$/) {
            ($name, $setting) = ('action', $2);
        }
        return undef if !defined($name);

        $res->{$name} = $setting;
    }

    return $res;
}
1660
59411c4e
DM
PVE::JSONSchema::register_format('pve-qm-startup', \&verify_startup);
# Format check for 'pve-qm-startup': returns $value when parse_startup()
# accepts it. Otherwise returns undef if $noerr is set, else dies.
sub verify_startup {
    my ($value, $noerr) = @_;

    if (!parse_startup($value)) {
        return undef if $noerr;
        die "unable to parse startup options\n";
    }

    return $value;
}
1671
# Parse a startup property string ("[order=]N[,up=N][,down=N]") into a
# hash ref with 'order', 'up' and/or 'down'. Returns undef for an empty
# value or when an element is malformed.
sub parse_startup {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};

    foreach my $p (grep { $_ !~ m/^\s*$/ } split(/,/, $value)) {
        my ($name, $number);
        if ($p =~ m/^(order=)?(\d+)$/) {
            ($name, $number) = ('order', $2);
        } elsif ($p =~ m/^up=(\d+)$/) {
            ($name, $number) = ('up', $1);
        } elsif ($p =~ m/^down=(\d+)$/) {
            ($name, $number) = ('down', $1);
        }
        return undef if !defined($name);

        $res->{$name} = $number;
    }

    return $res;
}
1695
1e3baf05
DM
# Parse a usb device property string. Accepted elements are
# "host=VVVV:PPPP" (hex ids, optional 0x prefix), "host=BUS-PORT[.PORT...]"
# and "spice". Returns a hash ref with vendorid/productid, hostbus/hostport
# and/or spice. Returns undef for an empty value, an unknown element, or
# when no element was found.
sub parse_usb_device {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};
    my $found;

    foreach my $v (split(/,/, $value)) {
        if (my @ids = $v =~ m/^host=(0x)?([0-9A-Fa-f]{4}):(0x)?([0-9A-Fa-f]{4})$/) {
            @$res{qw(vendorid productid)} = @ids[1, 3];
        } elsif (my @location = $v =~ m/^host=(\d+)\-(\d+(\.\d+)*)$/) {
            @$res{qw(hostbus hostport)} = @location[0, 1];
        } elsif ($v =~ m/^spice$/) {
            $res->{spice} = 1;
        } else {
            return undef;
        }
        $found = 1;
    }

    return undef if !$found;

    return $res;
}
19672434 1725
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-usb-device', \&verify_usb_device);
# Format check for 'pve-qm-usb-device': returns $value when
# parse_usb_device() accepts it. Otherwise returns undef if $noerr is set,
# else dies.
sub verify_usb_device {
    my ($value, $noerr) = @_;

    if (!parse_usb_device($value)) {
        return undef if $noerr;
        die "unable to parse usb device\n";
    }

    return $value;
}
1736
1e3baf05
DM
# add JSON properties for create and set function
#
# Copies every entry of $confdesc except 'parent', 'snaptime' and
# 'vmstate' into $prop and returns $prop.
sub json_config_properties {
    my $prop = shift;

    my %skipped = map { $_ => 1 } qw(parent snaptime vmstate);

    foreach my $opt (grep { !$skipped{$_} } keys %$confdesc) {
        $prop->{$opt} = $confdesc->{$opt};
    }

    return $prop;
}
1748
# Validate $value against the type that $confdesc declares for $key and
# return the normalized value: 1/0 for booleans, an integer for integers,
# and the value itself for numbers and strings. An unformatted string has
# one pair of enclosing double quotes stripped.
#
# Dies on unknown keys, undefined values, values containing a line feed
# or carriage return, and values that fail the check for their type.
sub check_type {
    my ($key, $value) = @_;

    my $desc = $confdesc->{$key};
    die "unknown setting '$key'\n" if !$desc;

    my $type = $desc->{type};

    die "got undefined value\n" if !defined($value);
    die "property contains a line feed\n" if $value =~ m/[\n\r]/;

    if ($type eq 'boolean') {
        return 1 if ($value eq '1') || ($value =~ m/^(on|yes|true)$/i);
        return 0 if ($value eq '0') || ($value =~ m/^(off|no|false)$/i);
        die "type check ('boolean') failed - got '$value'\n";
    }

    if ($type eq 'integer') {
        return int($1) if $value =~ m/^(\d+)$/;
        die "type check ('integer') failed - got '$value'\n";
    }

    if ($type eq 'number') {
        return $value if $value =~ m/^(\d+)(\.\d+)?$/;
        die "type check ('number') failed - got '$value'\n";
    }

    die "internal error" if $type ne 'string';

    my $fmt = $desc->{format};
    if (!$fmt) {
        $value =~ s/^\"(.*)\"$/$1/;
        return $value;
    }

    if ($fmt eq 'pve-qm-drive') {
        # special case - we need to pass $key to parse_drive()
        return $value if parse_drive($key, $value);
        die "unable to parse drive options\n";
    }

    PVE::JSONSchema::check_format($fmt, $value);
    return $value;
}
1791
191435c6
DM
# Call lock_file() on the lock file of VM $vmid, passing on $timeout,
# $code and @param. Re-throws any error left in $@, otherwise returns the
# result of lock_file().
sub lock_config_full {
    my ($vmid, $timeout, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);
    my $result = lock_file($lockfile, $timeout, $code, @param);

    die $@ if $@;

    return $result;
}
1803
4e4f83fe
DM
# Same as lock_config_full(), but goes through lock_file_full() and
# passes on the additional $shared flag.
sub lock_config_mode {
    my ($vmid, $timeout, $shared, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);
    my $result = lock_file_full($lockfile, $timeout, $shared, $code, @param);

    die $@ if $@;

    return $result;
}
1815
191435c6
DM
# lock_config_full() with a fixed timeout value of 10.
sub lock_config {
    my ($vmid, $code, @param) = @_;

    my $timeout = 10;

    return lock_config_full($vmid, $timeout, $code, @param);
}
1821
# Relative path of the config file of VM $vmid below
# "nodes/<node>/qemu-server/". $node defaults to $nodename.
sub cfs_config_path {
    my ($vmid, $node) = @_;

    $node ||= $nodename;

    return "nodes/${node}/qemu-server/${vmid}.conf";
}
1828
040b06b7
DA
# Placeholder: no check is performed yet, this always returns 1.
sub check_iommu_support {
    #fixme : need to check IOMMU support
    #http://www.linux-kvm.org/page/How_to_assign_devices_with_VT-d_in_KVM

    return 1;
}
1837
# Path of the config file of VM $vmid (optionally on $node) below
# /etc/pve.
sub config_file {
    my ($vmid, $node) = @_;

    return "/etc/pve/" . cfs_config_path($vmid, $node);
}
1844
# Path of the lock file used for the config of VM $vmid, inside $lock_dir.
sub config_file_lock {
    my ($vmid) = @_;

    return "${lock_dir}/lock-${vmid}.conf";
}
1850
# Set access and modification time of the VM's config file to "now"
# (utime with undef timestamps).
sub touch_config {
    my ($vmid) = @_;

    my $path = config_file($vmid);

    utime(undef, undef, $path);
}
1857
# Destroy VM $vmid: free every non-cdrom, storage-managed disk that the
# VM owns, then remove the config file (or replace it with a minimal one
# when $keep_empty_config is set), and finally free every volume that
# vdisk_list() still reports for the VM. Errors in the last step are
# only reported as warnings.
sub destroy_vm {
    my ($storecfg, $vmid, $keep_empty_config) = @_;

    my $conffile = config_file($vmid);
    my $conf = load_config($vmid);

    check_lock($conf);

    # only remove disks owned by this VM
    my $free_owned_disk = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};
        return if !$volid || $volid =~ m|^/|;

        my ($path, $owner) = PVE::Storage::path($storecfg, $volid);
        return if !$path || !$owner || ($owner != $vmid);

        PVE::Storage::vdisk_free($storecfg, $volid);
    };
    foreach_drive($conf, $free_owned_disk);

    if (!$keep_empty_config) {
        unlink $conffile;
    } else {
        PVE::Tools::file_set_contents($conffile, "memory: 128\n");
    }

    # also remove unused disk
    eval {
        my $dl = PVE::Storage::vdisk_list($storecfg, undef, $vmid);

        eval {
            PVE::Storage::foreach_volid($dl, sub {
                my ($volid, $sid, $volname, $d) = @_;
                PVE::Storage::vdisk_free($storecfg, $volid);
            });
        };
        warn $@ if $@;

    };
    warn $@ if $@;
}
1904
# Read the configuration of VM $vmid (optionally from $node) through
# PVE::Cluster::cfs_read_file(). Dies when no configuration is returned.
sub load_config {
    my ($vmid, $node) = @_;

    my $cfspath = cfs_config_path($vmid, $node);
    my $conf = PVE::Cluster::cfs_read_file($cfspath);

    if (!defined($conf)) {
        die "no such VM ('$vmid')\n";
    }

    return $conf;
}
1e3baf05
DM
1916
# Parse the raw text of a VM configuration file into a config hash.
#
# Parameters:
#   $filename - path of the file; must end in /qemu-server/<vmid>.conf
#   $raw      - file content; undef makes the function return undef
#
# Returns a hash reference holding the current settings at top level plus
#   digest    - SHA1 hex digest of $raw
#   snapshots - { <name> => { settings } }, one entry per [<name>] section
#   pending   - settings found in the [PENDING] section
#
# Dies if no VM id can be extracted from $filename. Values that fail
# validation are reported with warn and skipped; lines matching none of
# the known patterns are ignored silently.
sub parse_vm_config {
    my ($filename, $raw) = @_;

    return undef if !defined($raw);

    my $res = {
        digest => Digest::SHA::sha1_hex($raw),
        snapshots => {},
        pending => {},
    };

    $filename =~ m|/qemu-server/(\d+)\.conf$|
        || die "got strange filename '$filename'";

    my $vmid = $1;

    # $conf always points at the section currently being filled
    my $conf = $res;
    my $descr = '';
    my $section = '';

    my @lines = split(/\n/, $raw);
    foreach my $line (@lines) {
        next if $line =~ m/^\s*$/;

        if ($line =~ m/^\[PENDING\]\s*$/i) {
            $section = 'pending';
            # flush the description collected for the previous section
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{$section} = {};
            next;

        } elsif ($line =~ m/^\[([a-z][a-z0-9_\-]+)\]\s*$/i) {
            $section = $1;
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{snapshots}->{$section} = {};
            next;
        }

        # comment lines carry the (encoded) description text
        if ($line =~ m/^\#(.*)\s*$/) {
            $descr .= PVE::Tools::decode_text($1) . "\n";
            next;
        }

        if ($line =~ m/^(description):\s*(.*\S)\s*$/) {
            $descr .= PVE::Tools::decode_text($2);
        } elsif ($line =~ m/^snapstate:\s*(prepare|delete)\s*$/) {
            # anchored like every other key, so that e.g. 'xsnapstate: delete'
            # is not mistaken for a snapstate setting
            $conf->{snapstate} = $1;
        } elsif ($line =~ m/^(args):\s*(.*\S)\s*$/) {
            # 'args' may contain white space, so it is stored unchecked
            my $key = $1;
            my $value = $2;
            $conf->{$key} = $value;
        } elsif ($line =~ m/^delete:\s*(.*\S)\s*$/) {
            my $value = $1;
            if ($section eq 'pending') {
                $conf->{delete} = $value; # we parse this later
            } else {
                warn "vm $vmid - propertry 'delete' is only allowed in [PENDING]\n";
            }
        } elsif ($line =~ m/^([a-z][a-z_]*\d*):\s*(\S+)\s*$/) {
            my $key = $1;
            my $value = $2;
            eval { $value = check_type($key, $value); };
            if ($@) {
                warn "vm $vmid - unable to parse value of '$key' - $@";
            } else {
                my $fmt = $confdesc->{$key}->{format};
                if ($fmt && $fmt eq 'pve-qm-drive') {
                    # normalize the drive's file name to a volume id
                    my $v = parse_drive($key, $value);
                    if (my $volid = filename_to_volume_id($vmid, $v->{file}, $v->{media})) {
                        $v->{file} = $volid;
                        $value = print_drive($vmid, $v);
                    } else {
                        warn "vm $vmid - unable to parse value of '$key'\n";
                        next;
                    }
                }

                # legacy 'cdrom' option is stored as ide2
                if ($key eq 'cdrom') {
                    $conf->{ide2} = $value;
                } else {
                    $conf->{$key} = $value;
                }
            }
        }
    }

    # description of the last section
    $conf->{description} = $descr if $descr;

    delete $res->{snapstate}; # just to be sure

    return $res;
}
2010
1858638f
DM
# Turn a VM configuration hash into the text stored in the config file.
#
# $conf is normalized in place (legacy 'cdrom'/'smp' options are converted,
# values are replaced by what check_type() returns, 'unusedX' entries that
# point at a volume used by a drive are dropped). $filename is not used.
#
# Returns the raw text: current settings first, then an optional [PENDING]
# section, then one section per snapshot in sorted order.
# Dies on conflicting cdrom/ide2 options, on values check_type() rejects,
# on a 'delete' key outside of the pending section and on a snapshot that
# is named 'pending'.
sub write_vm_config {
    my ($filename, $conf) = @_;

    delete $conf->{snapstate}; # just to be sure

    # legacy 'cdrom' option is stored as ide2
    if ($conf->{cdrom}) {
        die "option ide2 conflicts with cdrom\n" if $conf->{ide2};
        $conf->{ide2} = delete $conf->{cdrom};
    }

    # we do not use 'smp' any longer
    if ($conf->{sockets}) {
        delete $conf->{smp};
    } elsif (my $smp = $conf->{smp}) {
        delete @$conf{qw(cores smp)};
        $conf->{sockets} = $smp;
    }

    delete $conf->{sockets} if $conf->{maxcpus} && $conf->{sockets};

    # volumes referenced by drives of the current or pending settings
    my $volumes_in_use = {};

    my %not_a_setting = map { $_ => 1 }
        qw(digest description snapshots snapstate pending);

    # validate all settings of one section and store the checked values
    my $check_section = sub {
        my ($settings, $is_pending, $snapname) = @_;

        foreach my $key (keys %$settings) {
            next if $not_a_setting{$key};

            if ($key eq 'delete') {
                die "propertry 'delete' is only allowed in [PENDING]\n"
                    if !$is_pending;
                # fixme: check syntax?
                next;
            }

            my $checked = eval { check_type($key, $settings->{$key}) };
            die "unable to parse value of '$key' - $@" if $@;

            $settings->{$key} = $checked;

            next if $snapname || !valid_drivename($key);

            my $drive = parse_drive($key, $checked);
            $volumes_in_use->{$drive->{file}} = 1 if $drive && $drive->{file};
        }
    };

    $check_section->($conf);

    $check_section->($conf->{pending}, 1);

    foreach my $snapname (keys %{$conf->{snapshots}}) {
        die "internal error" if $snapname eq 'pending';
        $check_section->($conf->{snapshots}->{$snapname}, undef, $snapname);
    }

    # remove 'unusedX' settings if we re-add a volume
    foreach my $key (grep { m/^unused/ } keys %$conf) {
        delete $conf->{$key} if $volumes_in_use->{$conf->{$key}};
    }

    my %not_printed = map { $_ => 1 } qw(digest description pending snapshots);

    # render one section: description as comment lines, then sorted settings
    my $render_section = sub {
        my ($settings) = @_;

        my $text = '';

        my $description = $settings->{description} || '';
        foreach my $comment (split(/\n/, $description)) {
            $text .= '#' . PVE::Tools::encode_text($comment) . "\n";
        }

        foreach my $key (sort keys %$settings) {
            next if $not_printed{$key};
            $text .= "$key: $settings->{$key}\n";
        }

        return $text;
    };

    my $raw = $render_section->($conf);

    if (scalar(keys %{$conf->{pending}})) {
        $raw .= "\n[PENDING]\n" . $render_section->($conf->{pending});
    }

    foreach my $snapname (sort keys %{$conf->{snapshots}}) {
        $raw .= "\n[$snapname]\n" . $render_section->($conf->{snapshots}->{$snapname});
    }

    return $raw;
}
1e3baf05 2111
1858638f
DM
# Write $conf as the configuration of VM $vmid without acquiring the
# config lock. Unless $skiplock is true, check_lock() is consulted first
# and dies when the configuration carries a 'lock' setting.
sub update_config_nolock {
    my ($vmid, $conf, $skiplock) = @_;

    unless ($skiplock) {
        check_lock($conf);
    }

    my $target = cfs_config_path($vmid);

    return PVE::Cluster::cfs_write_file($target, $conf);
}
1e3baf05 2121
1858638f
DM
# Write $conf as the configuration of VM $vmid via lock_config().
#
# Parameters are the same as for update_config_nolock(): $vmid, the config
# hash and the $skiplock flag.
# NOTE(review): lock_config() is defined outside this section; presumably it
# takes the config lock and then calls the code reference with the
# remaining arguments - confirm.
sub update_config {
    my ($vmid, $conf, $skiplock) = @_;

    # pass a reference: a bare '&update_config_nolock' would call the sub
    # right here with our @_ (before any lock is taken) and hand its return
    # value to lock_config() instead of a callback
    lock_config($vmid, \&update_config_nolock, $conf, $skiplock);
}
2127
# Build a hash of default settings: every option in $confdesc that declares
# a 'default', with 'keyboard' overridden by datacenter.cfg when set there.
sub load_defaults {

    my $defaults = {};

    # we use static defaults from our JSON schema configuration
    for my $option (keys %$confdesc) {
        my $value = $confdesc->{$option}->{default};
        next if !defined($value);
        $defaults->{$option} = $value;
    }

    my $dc_conf = PVE::Cluster::cfs_read_file('datacenter.cfg');
    if ($dc_conf->{keyboard}) {
        $defaults->{keyboard} = $dc_conf->{keyboard};
    }

    return $defaults;
}
2144
# Return { <vmid> => { exists => 1 } } for every entry of the cluster VM
# list whose node equals $nodename and whose type is 'qemu'.
sub config_list {
    my $vmlist = PVE::Cluster::get_vmlist();
    my $found = {};

    return $found if !$vmlist || !$vmlist->{ids};

    my $ids = $vmlist->{ids};

    for my $vmid (keys %$ids) {
        my $entry = $ids->{$vmid};

        my $on_this_node = $entry->{node} && $entry->{node} eq $nodename;
        next if !$on_this_node;

        my $is_qemu = $entry->{type} && $entry->{type} eq 'qemu';
        next if !$is_qemu;

        $found->{$vmid}->{exists} = 1;
    }

    return $found;
}
2159
64e13401
DM
# Tell whether the VM configuration references host-local resources
# (used to prevent migration).
#
# Local resources are the old style 'hostusb'/'hostpci' options and any
# usbN, hostpciN, serialN or parallelN entry, except usb entries whose
# value is 'spice'.
#
# Returns 1 or 0. Dies with "VM uses local resources" when a local
# resource is found and $noerr is not set.
sub check_local_resources {
    my ($conf, $noerr) = @_;

    # old syntax
    my $uses_local = ($conf->{hostusb} || $conf->{hostpci}) ? 1 : 0;

    my @local_keys = grep {
        !($_ =~ m/^usb/ && ($conf->{$_} eq 'spice'))
            && $_ =~ m/^(usb|hostpci|serial|parallel)\d+$/
    } keys %$conf;

    $uses_local = 1 if @local_keys;

    if ($uses_local && !$noerr) {
        die "VM uses local resources\n";
    }

    return $uses_local;
}
2178
# Run PVE::Storage::storage_check_node() for the storage of every drive
# volume, once without a node argument and once for $node (used by
# migrate). Drives without a file, or whose file does not parse as a
# storage volume id, are skipped.
sub check_storage_availability {
    my ($storecfg, $conf, $node) = @_;

    my $check_drive = sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file} or return;

        my ($storeid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        # check if storage is available on both nodes
        PVE::Storage::storage_check_node($storecfg, $storeid);
        PVE::Storage::storage_check_node($storecfg, $storeid, $node);
    };

    foreach_drive($conf, $check_drive);
}
2197
719893a9
DM
# Compute the set of nodes on which all VM images are available (used by
# the has_feature API).
#
# Starts with every cluster node and narrows the set per drive volume:
#   - storage disabled:          no node remains
#   - storage restricted to a
#     node list:                 only nodes in that list remain
#   - storage not shared:        only the local node remains
#
# Returns a hash reference { <node> => 1 }.
sub shared_nodes {
    my ($conf, $storecfg) = @_;

    my $nodelist = PVE::Cluster::get_nodelist();
    my $nodehash = { map { $_ => 1 } @$nodelist };
    my $nodename = PVE::INotify::nodename();

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($storeid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        my $scfg = PVE::Storage::storage_config($storecfg, $storeid);

        if ($scfg->{disable}) {
            $nodehash = {};
            return;
        }

        if (my $avail = $scfg->{nodes}) {
            my @missing = grep { !$avail->{$_} } keys %$nodehash;
            delete @$nodehash{@missing};
            return;
        }

        if (!$scfg->{shared}) {
            my @remote = grep { $_ ne $nodename } keys %$nodehash;
            delete @$nodehash{@remote};
        }
    });

    return $nodehash;
}
2231
1e3baf05
DM
# Die with "VM is locked (<lock>)" when the configuration has a true
# 'lock' setting.
sub check_lock {
    my ($conf) = @_;

    my $lock = $conf->{lock};

    die "VM is locked ($lock)\n" if $lock;
}
2237
# Verify via /proc/<pid>/cmdline that process $pid is a kvm /
# qemu-system-x86_64 binary that was started with '-pidfile $pidfile'.
#
# Returns 1 on a match and a false value otherwise (also when the cmdline
# file cannot be opened or is empty).
sub check_cmdline {
    my ($pidfile, $pid) = @_;

    my $fh = IO::File->new("/proc/$pid/cmdline", "r");
    return undef if !defined($fh);

    my $cmdline = <$fh>;
    $fh->close;
    return undef if !$cmdline;

    # arguments are separated by NUL bytes
    my @argv = split(/\0/, $cmdline);

    my $binary = $argv[0];
    return if !$binary;
    return if $binary !~ m|kvm$| && $binary !~ m|qemu-system-x86_64$|;

    for my $idx (0 .. $#argv) {
        my $arg = $argv[$idx];
        next if !$arg;
        next if $arg ne '-pidfile' && $arg ne '--pidfile';

        # only the first pidfile option is considered
        my $value = $argv[$idx + 1];
        return 1 if $value && ($value eq $pidfile);
        return undef;
    }

    return undef;
}
2263
# Determine whether VM $vmid is running.
#
# Parameters:
#   $vmid    - VM id
#   $nocheck - when true, a missing configuration file is not an error
#   $node    - passed on to config_file()
#
# Returns the pid read from the VM's pid file when check_cmdline() accepts
# that process and PVE::ProcFSTools::check_process_running() confirms it;
# returns undef otherwise.
# Dies if the configuration file does not exist and $nocheck is not set.
sub check_running {
    my ($vmid, $nocheck, $node) = @_;

    my $filename = config_file($vmid, $node);

    die "unable to find configuration file for VM $vmid - no such machine\n"
        if !$nocheck && ! -f $filename;

    my $pidfile = pidfile_name($vmid);

    # explicit read mode, same form as used in check_cmdline()
    my $fd = IO::File->new($pidfile, "r");
    return undef if !$fd;

    my $st = stat($fd);
    my $line = <$fd>;
    close($fd);

    # the time stamp checked here belongs to the pid file, so name that file
    my $mtime = $st->mtime;
    if ($mtime > time()) {
        warn "file '$pidfile' modified in future\n";
    }

    # an empty pid file yields no line at all
    if (defined($line) && $line =~ m/^(\d+)$/) {
        my $pid = $1;
        if (check_cmdline($pidfile, $pid)) {
            if (PVE::ProcFSTools::check_process_running($pid)) {
                return $pid;
            }
        }
    }

    return undef;
}
2296
# Return the hash from config_list() with a 'pid' entry added for every
# VM that has a <vmid>.pid file in $var_run_tmpdir and for which
# check_running() returns a pid. If the directory cannot be opened the
# list is returned without pid information.
sub vzlist {

    my $vms = config_list();

    my $dir = IO::Dir->new($var_run_tmpdir);
    return $vms if !$dir;

    while (defined(my $entry = $dir->read)) {
        next if $entry !~ m/^(\d+)\.pid$/;
        my $vmid = $1;

        next if !defined($vms->{$vmid});

        my $pid = check_running($vmid);
        $vms->{$vmid}->{pid} = $pid if $pid;
    }

    return $vms;
}
2314
1e3baf05
DM
# Return the 'size' property of the boot disk drive, or undef when the
# configuration has no usable boot disk: no 'bootdisk' setting, an invalid
# drive name, no such drive entry, an unparsable drive, a cdrom drive or a
# drive without file. $storecfg is not used.
sub disksize {
    my ($storecfg, $conf) = @_;

    my $bootdisk = $conf->{bootdisk};
    return undef
        if !$bootdisk || !valid_drivename($bootdisk) || !$conf->{$bootdisk};

    my $drive = parse_drive($bootdisk, $conf->{$bootdisk});
    return undef if !defined($drive) || drive_is_cdrom($drive);

    return undef if !$drive->{file};

    return $drive->{size};
}
2334
# CPU accounting per pid ({ time, used, cpu }), kept between vmstatus() calls.
my $last_proc_pid_stat;

# Collect status information for the VMs returned by vzlist().
#
# Parameters:
#   $opt_vmid - when set, only this VM gets an entry in the result
#   $full     - when true, running VMs are additionally queried over QMP
#               (query-status, query-blockstats, query-balloon); this can
#               be slow. Without it only the config, /proc data and the
#               network device counters are used.
#
# Returns { <vmid> => { pid, status, disk, maxdisk, cpus, name, maxmem,
# uptime, cpu, mem, netout, netin, diskread, diskwrite, template, ... } }.
sub vmstatus {
    my ($opt_vmid, $full) = @_;

    my $res = {};

    my $storecfg = PVE::Storage::config();

    my $list = vzlist();
    my ($uptime) = PVE::ProcFSTools::read_proc_uptime(1);

    my $cpucount = $cpuinfo->{cpus} || 1;

    # static information taken from the configuration
    for my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);

        my $cfspath = cfs_config_path($vmid);
        my $conf = PVE::Cluster::cfs_read_file($cfspath) || {};

        my $pid = $list->{$vmid}->{pid};

        my $size = disksize($storecfg, $conf);

        my $cpus = ($conf->{sockets} || 1) * ($conf->{cores} || 1);
        $cpus = $cpucount if $cpus > $cpucount;

        my $d = {
            pid => $pid,
            # fixme: better status?
            status => $pid ? 'running' : 'stopped',
            disk => 0, # no info available
            maxdisk => defined($size) ? $size : 0,
            cpus => $cpus,
            name => $conf->{name} || "VM $vmid",
            maxmem => $conf->{memory} ? $conf->{memory}*(1024*1024) : 0,
        };

        if ($conf->{balloon}) {
            $d->{balloon_min} = $conf->{balloon}*(1024*1024);
            $d->{shares} = defined($conf->{shares}) ? $conf->{shares} : 1000;
        }

        # counters start at zero and are filled in below
        $d->{$_} = 0 for qw(uptime cpu mem netout netin diskread diskwrite);

        $d->{template} = is_template($conf);

        $res->{$vmid} = $d;
    }

    # network counters of the tap<vmid>i<n> devices; what the device
    # receives is counted as netout, what it transmits as netin
    my $netdev = PVE::ProcFSTools::read_proc_net_dev();
    for my $dev (keys %$netdev) {
        next if $dev !~ m/^tap([1-9]\d*)i/;
        my $d = $res->{$1};
        next if !$d;

        my $counters = $netdev->{$dev};
        $d->{netout} += $counters->{receive};
        $d->{netin} += $counters->{transmit};
    }

    my $ctime = gettimeofday();

    # uptime, memory and cpu usage from /proc/<pid>/stat
    for my $vmid (keys %$list) {

        my $d = $res->{$vmid};
        my $pid = $d->{pid};
        next if !$pid;

        my $pstat = PVE::ProcFSTools::read_proc_pid_stat($pid);
        next if !$pstat; # not running

        my $used = $pstat->{utime} + $pstat->{stime};

        $d->{uptime} = int(($uptime - $pstat->{starttime})/$cpuinfo->{user_hz});

        if ($pstat->{vsize}) {
            $d->{mem} = int(($pstat->{rss}/$pstat->{vsize})*$d->{maxmem});
        }

        my $old = $last_proc_pid_stat->{$pid};
        if (!$old) {
            # first sample for this pid, no usage can be computed yet
            $last_proc_pid_stat->{$pid} = {
                time => $ctime,
                used => $used,
                cpu => 0,
            };
            next;
        }

        my $dtime = ($ctime - $old->{time}) * $cpucount * $cpuinfo->{user_hz};

        if ($dtime <= 1000) {
            # interval too short, report the previous value
            $d->{cpu} = $old->{cpu};
            next;
        }

        my $dutime = $used - $old->{used};

        $d->{cpu} = (($dutime/$dtime)* $cpucount) / $d->{cpus};
        $last_proc_pid_stat->{$pid} = {
            time => $ctime,
            used => $used,
            cpu => $d->{cpu},
        };
    }

    return $res if !$full;

    my $qmpclient = PVE::QMPClient->new();

    my $ballooncb = sub {
        my ($vmid, $resp) = @_;

        my $info = $resp->{'return'};
        return if !$info->{max_mem};

        my $d = $res->{$vmid};

        # use memory assigned to VM
        $d->{maxmem} = $info->{max_mem};
        $d->{balloon} = $info->{actual};

        if (defined($info->{total_mem}) && defined($info->{free_mem})) {
            $d->{mem} = $info->{total_mem} - $info->{free_mem};
            $d->{freemem} = $info->{free_mem};
        }

    };

    my $blockstatscb = sub {
        my ($vmid, $resp) = @_;

        my $stats = $resp->{'return'} || [];

        my ($rd_total, $wr_total) = (0, 0);
        foreach my $blockstat (@$stats) {
            $rd_total = $rd_total + $blockstat->{stats}->{rd_bytes};
            $wr_total = $wr_total + $blockstat->{stats}->{wr_bytes};
        }

        $res->{$vmid}->{diskread} = $rd_total;
        $res->{$vmid}->{diskwrite} = $wr_total;
    };

    my $statuscb = sub {
        my ($vmid, $resp) = @_;

        $qmpclient->queue_cmd($vmid, $blockstatscb, 'query-blockstats');
        # this fails if the balloon driver is not loaded, so this must be
        # the last command (following commands are aborted if this fails).
        $qmpclient->queue_cmd($vmid, $ballooncb, 'query-balloon');

        my $status = $resp->{'return'}->{status};
        if (!defined($status)) {
            warn "unable to get VM status\n";
            return;
        }

        $res->{$vmid}->{qmpstatus} = $resp->{'return'}->{status};
    };

    for my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        next if !$res->{$vmid}->{pid}; # not running
        $qmpclient->queue_cmd($vmid, $statuscb, 'query-status');
    }

    $qmpclient->queue_execute(undef, 1);

    # fall back to the process based status where QMP gave no answer
    for my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        my $d = $res->{$vmid};
        $d->{qmpstatus} = $d->{status} if !$d->{qmpstatus};
    }

    return $res;
}
2523
# Call $func->($drivename, $drive) for every key of $conf that is a valid
# drive name and whose value parse_drive() can parse.
sub foreach_drive {
    my ($conf, $func) = @_;

    for my $name (keys %$conf) {
        valid_drivename($name) or next;

        my $parsed = parse_drive($name, $conf->{$name});
        $parsed or next;

        $func->($name, $parsed);
    }
}
2536
d5769dc2
DM
# Call $func->($volid, $is_cdrom) once for every distinct volume referenced
# by the drives of $conf, by the drives of its snapshots and by the
# snapshots' 'vmstate' entries. When a volume is seen more than once, the
# flag of the occurrence recorded last is reported.
sub foreach_volid {
    my ($conf, $func) = @_;

    my %cdrom_flag_of;

    my $remember = sub {
        my ($volid, $is_cdrom) = @_;

        return if !$volid;

        $cdrom_flag_of{$volid} = $is_cdrom || 0;
    };

    my $remember_drive = sub {
        my ($ds, $drive) = @_;
        $remember->($drive->{file}, drive_is_cdrom($drive));
    };

    foreach_drive($conf, $remember_drive);

    for my $snapname (keys %{$conf->{snapshots}}) {
        my $snap = $conf->{snapshots}->{$snapname};
        $remember->($snap->{vmstate}, 0);
        foreach_drive($snap, $remember_drive);
    }

    for my $volid (keys %cdrom_flag_of) {
        $func->($volid, $cdrom_flag_of{$volid});
    }
}
2568
86b8228b
DM
# Map a 'vga' setting to the number of qxl (spice) displays it requests:
# 'qxl' gives 1, 'qxl2'..'qxl4' give 2..4, everything else gives 0.
sub vga_conf_has_spice {
    my ($vga) = @_;

    if ($vga && $vga =~ m/^qxl([234])?$/) {
        # no digit captured means a single display
        return $1 || 1;
    }

    return 0;
}
2576
1e3baf05 2577sub config_to_command {
952958bc 2578 my ($storecfg, $vmid, $conf, $defaults, $forcemachine) = @_;
1e3baf05
DM
2579
2580 my $cmd = [];
8c559505
DM
2581 my $globalFlags = [];
2582 my $machineFlags = [];
2583 my $rtcFlags = [];
519ed28c 2584 my $cpuFlags = [];
5bdcf937 2585 my $devices = [];
b78ebef7 2586 my $pciaddr = '';
5bdcf937 2587 my $bridges = {};
1e3baf05
DM
2588 my $kvmver = kvm_user_version();
2589 my $vernum = 0; # unknown
a3c52213
DM
2590 if ($kvmver =~ m/^(\d+)\.(\d+)$/) {
2591 $vernum = $1*1000000+$2*1000;
2592 } elsif ($kvmver =~ m/^(\d+)\.(\d+)\.(\d+)$/) {
1e3baf05
DM
2593 $vernum = $1*1000000+$2*1000+$3;
2594 }
2595
a3c52213 2596 die "detected old qemu-kvm binary ($kvmver)\n" if $vernum < 15000;
1e3baf05
DM
2597
2598 my $have_ovz = -f '/proc/vz/vestat';
2599
db656e5f
DM
2600 my $q35 = machine_type_is_q35($conf);
2601
1e3baf05
DM
2602 push @$cmd, '/usr/bin/kvm';
2603
2604 push @$cmd, '-id', $vmid;
2605
2606 my $use_virtio = 0;
2607
c971c4f2
AD
2608 my $qmpsocket = qmp_socket($vmid);
2609 push @$cmd, '-chardev', "socket,id=qmp,path=$qmpsocket,server,nowait";
2610 push @$cmd, '-mon', "chardev=qmp,mode=control";
2611
7b7c6d1b 2612 my $socket = vnc_socket($vmid);
1e3baf05
DM
2613 push @$cmd, '-vnc', "unix:$socket,x509,password";
2614
6b64503e 2615 push @$cmd, '-pidfile' , pidfile_name($vmid);
19672434 2616
1e3baf05
DM
2617 push @$cmd, '-daemonize';
2618
2796e7d5
DM
2619 if ($conf->{smbios1}) {
2620 push @$cmd, '-smbios', "type=1,$conf->{smbios1}";
2621 }
2622
7183bd9a
AD
2623 push @$cmd, '-object', "iothread,id=iothread0" if $conf->{iothread};
2624
db656e5f 2625 if ($q35) {
b467f79a 2626 # the q35 chipset support native usb2, so we enable usb controller
db656e5f 2627 # by default for this machine type
f8e83f05 2628 push @$devices, '-readconfig', '/usr/share/qemu-server/pve-q35.cfg';
db656e5f 2629 } else {
f8e83f05
AD
2630 $pciaddr = print_pci_addr("piix3", $bridges);
2631 push @$devices, '-device', "piix3-usb-uhci,id=uhci$pciaddr.0x2";
24f0d39a 2632
f8e83f05 2633 my $use_usb2 = 0;
db656e5f
DM
2634 for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
2635 next if !$conf->{"usb$i"};
2636 $use_usb2 = 1;
2637 }
2638 # include usb device config
2639 push @$devices, '-readconfig', '/usr/share/qemu-server/pve-usb.cfg' if $use_usb2;
fcc573ab 2640 }
19672434 2641
5acbfe9e 2642 my $vga = $conf->{vga};
2fa3151e 2643
590e698c
DM
2644 my $qxlnum = vga_conf_has_spice($vga);
2645 $vga = 'qxl' if $qxlnum;
2fa3151e 2646
5acbfe9e 2647 if (!$vga) {
264e519f
DM
2648 if ($conf->{ostype} && ($conf->{ostype} eq 'win8' ||
2649 $conf->{ostype} eq 'win7' ||
5acbfe9e
DM
2650 $conf->{ostype} eq 'w2k8')) {
2651 $vga = 'std';
2652 } else {
2653 $vga = 'cirrus';
2654 }
2655 }
2656
1e3baf05 2657 # enable absolute mouse coordinates (needed by vnc)
5acbfe9e
DM
2658 my $tablet;
2659 if (defined($conf->{tablet})) {
2660 $tablet = $conf->{tablet};
2661 } else {
2662 $tablet = $defaults->{tablet};
590e698c 2663 $tablet = 0 if $qxlnum; # disable for spice because it is not needed
ef5e2be2 2664 $tablet = 0 if $vga =~ m/^serial\d+$/; # disable if we use serial terminal (no vga card)
5acbfe9e
DM
2665 }
2666
db656e5f 2667 push @$devices, '-device', print_tabletdevice_full($conf) if $tablet;
b467f79a 2668
1e3baf05 2669 # host pci devices
040b06b7 2670 for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
2e3b7e2a
AD
2671 my $d = parse_hostpci($conf->{"hostpci$i"});
2672 next if !$d;
2673
2674 my $pcie = $d->{pcie};
2675 if($pcie){
2676 die "q35 machine model is not enabled" if !$q35;
2677 $pciaddr = print_pcie_addr("hostpci$i");
2678 }else{
2679 $pciaddr = print_pci_addr("hostpci$i", $bridges);
2680 }
2681
2682 my $rombar = $d->{rombar} && $d->{rombar} eq 'off' ? ",rombar=0" : "";
2683 my $driver = $d->{driver} && $d->{driver} eq 'vfio' ? "vfio-pci" : "pci-assign";
2684 my $xvga = $d->{'x-vga'} && $d->{'x-vga'} eq 'on' ? ",x-vga=on" : "";
137483c0
AD
2685 if ($xvga && $xvga ne '') {
2686 push @$cpuFlags, 'kvm=off';
2687 $vga = 'none';
2688 }
2e3b7e2a 2689 $driver = "vfio-pci" if $xvga ne '';
4543ecf0
AD
2690 my $pcidevices = $d->{pciid};
2691 my $multifunction = 1 if @$pcidevices > 1;
2e3b7e2a 2692
4543ecf0
AD
2693 my $j=0;
2694 foreach my $pcidevice (@$pcidevices) {
2e3b7e2a 2695
4543ecf0
AD
2696 my $id = "hostpci$i";
2697 $id .= ".$j" if $multifunction;
2698 my $addr = $pciaddr;
2699 $addr .= ".$j" if $multifunction;
2700 my $devicestr = "$driver,host=$pcidevice->{id}.$pcidevice->{function},id=$id$addr";
2701
2702 if($j == 0){
2703 $devicestr .= "$rombar$xvga";
2704 $devicestr .= ",multifunction=on" if $multifunction;
2705 }
2706
2707 push @$devices, '-device', $devicestr;
2708 $j++;
2709 }
1e3baf05
DM
2710 }
2711
2712 # usb devices
2713 for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
2714 my $d = parse_usb_device($conf->{"usb$i"});
2715 next if !$d;
2716 if ($d->{vendorid} && $d->{productid}) {
5bdcf937 2717 push @$devices, '-device', "usb-host,vendorid=0x$d->{vendorid},productid=0x$d->{productid}";
1e3baf05 2718 } elsif (defined($d->{hostbus}) && defined($d->{hostport})) {
5bdcf937 2719 push @$devices, '-device', "usb-host,hostbus=$d->{hostbus},hostport=$d->{hostport}";
80401dd8
DM
2720 } elsif ($d->{spice}) {
2721 # usb redir support for spice
2722 push @$devices, '-chardev', "spicevmc,id=usbredirchardev$i,name=usbredir";
2723 push @$devices, '-device', "usb-redir,chardev=usbredirchardev$i,id=usbredirdev$i,bus=ehci.0";
1e3baf05
DM
2724 }
2725 }
2726
1e3baf05 2727 # serial devices
bae179aa 2728 for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
34978be3 2729 if (my $path = $conf->{"serial$i"}) {
9f9d2fb2
DM
2730 if ($path eq 'socket') {
2731 my $socket = "/var/run/qemu-server/${vmid}.serial$i";
2732 push @$devices, '-chardev', "socket,id=serial$i,path=$socket,server,nowait";
2733 push @$devices, '-device', "isa-serial,chardev=serial$i";
2734 } else {
2735 die "no such serial device\n" if ! -c $path;
2736 push @$devices, '-chardev', "tty,id=serial$i,path=$path";
2737 push @$devices, '-device', "isa-serial,chardev=serial$i";
2738 }
34978be3 2739 }
1e3baf05
DM
2740 }
2741
2742 # parallel devices
1989a89c 2743 for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
34978be3 2744 if (my $path = $conf->{"parallel$i"}) {
19672434 2745 die "no such parallel device\n" if ! -c $path;
32e69805 2746 my $devtype = $path =~ m!^/dev/usb/lp! ? 'tty' : 'parport';
4c5dbaf6 2747 push @$devices, '-chardev', "$devtype,id=parallel$i,path=$path";
5bdcf937 2748 push @$devices, '-device', "isa-parallel,chardev=parallel$i";
34978be3 2749 }
1e3baf05
DM
2750 }
2751
2752 my $vmname = $conf->{name} || "vm$vmid";
2753
2754 push @$cmd, '-name', $vmname;
19672434 2755
1e3baf05
DM
2756 my $sockets = 1;
2757 $sockets = $conf->{smp} if $conf->{smp}; # old style - no longer iused
2758 $sockets = $conf->{sockets} if $conf->{sockets};
2759
2760 my $cores = $conf->{cores} || 1;
3bd18e48
AD
2761 my $maxcpus = $conf->{maxcpus} if $conf->{maxcpus};
2762
76267728
WL
2763 my $total_cores = $sockets * $cores;
2764 my $allowed_cores = $cpuinfo->{cpus};
2765
f34ebd52 2766 die "MAX $allowed_cores cores allowed per VM on this node\n"
76267728
WL
2767 if ($allowed_cores < $total_cores);
2768
264e519f 2769 if ($maxcpus) {
3bd18e48 2770 push @$cmd, '-smp', "cpus=$cores,maxcpus=$maxcpus";
264e519f 2771 } else {
3bd18e48
AD
2772 push @$cmd, '-smp', "sockets=$sockets,cores=$cores";
2773 }
1e3baf05 2774
1e3baf05
DM
2775 push @$cmd, '-nodefaults';
2776
32baffb4 2777 my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};
3b408e82 2778
0888fdce
DM
2779 my $bootindex_hash = {};
2780 my $i = 1;
2781 foreach my $o (split(//, $bootorder)) {
2782 $bootindex_hash->{$o} = $i*100;
2783 $i++;
afdb31d5 2784 }
3b408e82
DM
2785
2786 push @$cmd, '-boot', "menu=on";
1e3baf05 2787
6b64503e 2788 push @$cmd, '-no-acpi' if defined($conf->{acpi}) && $conf->{acpi} == 0;
1e3baf05 2789
6b64503e 2790 push @$cmd, '-no-reboot' if defined($conf->{reboot}) && $conf->{reboot} == 0;
1e3baf05 2791
ef5e2be2 2792 push @$cmd, '-vga', $vga if $vga && $vga !~ m/^serial\d+$/; # for kvm 77 and later
1e3baf05
DM
2793
2794 # time drift fix
6b64503e 2795 my $tdf = defined($conf->{tdf}) ? $conf->{tdf} : $defaults->{tdf};
1e3baf05 2796
6b64503e 2797 my $nokvm = defined($conf->{kvm}) && $conf->{kvm} == 0 ? 1 : 0;
8c559505 2798 my $useLocaltime = $conf->{localtime};
1e3baf05
DM
2799
2800 if (my $ost = $conf->{ostype}) {
6b9d84cf 2801 # other, wxp, w2k, w2k3, w2k8, wvista, win7, win8, l24, l26, solaris
1e3baf05
DM
2802
2803 if ($ost =~ m/^w/) { # windows
8c559505 2804 $useLocaltime = 1 if !defined($conf->{localtime});
1e3baf05 2805
8c559505 2806 # use time drift fix when acpi is enabled
6b64503e 2807 if (!(defined($conf->{acpi}) && $conf->{acpi} == 0)) {
8c559505 2808 $tdf = 1 if !defined($conf->{tdf});
1e3baf05
DM
2809 }
2810 }
2811
be190583 2812 if ($ost eq 'win7' || $ost eq 'win8' || $ost eq 'w2k8' ||
a70ebde3 2813 $ost eq 'wvista') {
8c559505 2814 push @$globalFlags, 'kvm-pit.lost_tick_policy=discard';
b7e0c8bf 2815 push @$cmd, '-no-hpet';
462e8d19
AD
2816 #push @$cpuFlags , 'hv_vapic" if !$nokvm; #fixme, my win2008R2 hang at boot with this
2817 push @$cpuFlags , 'hv_spinlocks=0xffff' if !$nokvm;
2818 }
2819
2820 if ($ost eq 'win7' || $ost eq 'win8') {
2821 push @$cpuFlags , 'hv_relaxed' if !$nokvm;
b7e0c8bf 2822 }
1e3baf05
DM
2823 }
2824
8c559505
DM
2825 push @$rtcFlags, 'driftfix=slew' if $tdf;
2826
7f0b5beb 2827 if ($nokvm) {
8c559505 2828 push @$machineFlags, 'accel=tcg';
7f0b5beb
DM
2829 } else {
2830 die "No accelerator found!\n" if !$cpuinfo->{hvm};
2831 }
1e3baf05 2832
952958bc
DM
2833 my $machine_type = $forcemachine || $conf->{machine};
2834 if ($machine_type) {
2835 push @$machineFlags, "type=${machine_type}";
3bafc510
DM
2836 }
2837
8c559505
DM
2838 if ($conf->{startdate}) {
2839 push @$rtcFlags, "base=$conf->{startdate}";
2840 } elsif ($useLocaltime) {
2841 push @$rtcFlags, 'base=localtime';
2842 }
1e3baf05 2843
519ed28c
AD
2844 my $cpu = $nokvm ? "qemu64" : "kvm64";
2845 $cpu = $conf->{cpu} if $conf->{cpu};
2846
4dc339e7
AD
2847 push @$cpuFlags , '+lahf_lm' if $cpu eq 'kvm64';
2848
6b9d84cf
AD
2849 push @$cpuFlags , '+x2apic' if !$nokvm && $conf->{ostype} ne 'solaris';
2850
2851 push @$cpuFlags , '-x2apic' if $conf->{ostype} eq 'solaris';
519ed28c 2852
2e1a5389
AD
2853 push @$cpuFlags, '+sep' if $cpu eq 'kvm64' || $cpu eq 'kvm32';
2854
be190583 2855 $cpu .= "," . join(',', @$cpuFlags) if scalar(@$cpuFlags);
519ed28c 2856
c0efd8cd
DM
2857 # Note: enforce needs kernel 3.10, so we do not use it for now
2858 # push @$cmd, '-cpu', "$cpu,enforce";
2859 push @$cmd, '-cpu', $cpu;
519ed28c 2860
67fb9de6 2861 my $memory = $conf->{memory} || $defaults->{memory};
8a010eae
AD
2862 push @$cmd, '-m', $memory;
2863
67fb9de6 2864 if ($conf->{numa}) {
8a010eae 2865
2ed5d572
AD
2866 my $numa_totalmemory = undef;
2867 for (my $i = 0; $i < $MAX_NUMA; $i++) {
2868 next if !$conf->{"numa$i"};
2869 my $numa = parse_numa($conf->{"numa$i"});
2870 next if !$numa;
67fb9de6
DM
2871 # memory
2872 die "missing numa node$i memory value\n" if !$numa->{memory};
2ed5d572
AD
2873 my $numa_memory = $numa->{memory};
2874 $numa_totalmemory += $numa_memory;
2875 my $numa_object = "memory-backend-ram,id=ram-node$i,size=$numa_memory"."M";
2876
67fb9de6 2877 # cpus
2ed5d572 2878 my $cpus_start = $numa->{cpus}->{start};
67fb9de6 2879 die "missing numa node$i cpus\n" if !defined($cpus_start);
2ed5d572
AD
2880 my $cpus_end = $numa->{cpus}->{end} if defined($numa->{cpus}->{end});
2881 my $cpus = $cpus_start;
2882 if (defined($cpus_end)) {
2883 $cpus .= "-$cpus_end";
67fb9de6 2884 die "numa node$i : cpu range $cpus is incorrect\n" if $cpus_end <= $cpus_start;
2ed5d572 2885 }
8a010eae 2886
67fb9de6 2887 # hostnodes
2ed5d572
AD
2888 my $hostnodes_start = $numa->{hostnodes}->{start};
2889 if (defined($hostnodes_start)) {
2890 my $hostnodes_end = $numa->{hostnodes}->{end} if defined($numa->{hostnodes}->{end});
2891 my $hostnodes = $hostnodes_start;
2892 if (defined($hostnodes_end)) {
2893 $hostnodes .= "-$hostnodes_end";
67fb9de6 2894 die "host node $hostnodes range is incorrect\n" if $hostnodes_end <= $hostnodes_start;
2ed5d572 2895 }
8a010eae 2896
2ed5d572
AD
2897 my $hostnodes_end_range = defined($hostnodes_end) ? $hostnodes_end : $hostnodes_start;
2898 for (my $i = $hostnodes_start; $i <= $hostnodes_end_range; $i++ ) {
67fb9de6 2899 die "host numa node$i don't exist\n" if ! -d "/sys/devices/system/node/node$i/";
2ed5d572 2900 }
8a010eae 2901
67fb9de6 2902 # policy
2ed5d572 2903 my $policy = $numa->{policy};
67fb9de6
DM
2904 die "you need to define a policy for hostnode $hostnodes\n" if !$policy;
2905 $numa_object .= ",host-nodes=$hostnodes,policy=$policy";
2ed5d572
AD
2906 }
2907
2908 push @$cmd, '-object', $numa_object;
8a010eae
AD
2909 push @$cmd, '-numa', "node,nodeid=$i,cpus=$cpus,memdev=ram-node$i";
2910 }
67fb9de6
DM
2911
2912 die "total memory for NUMA nodes must be equal to vm memory\n"
2913 if $numa_totalmemory && $numa_totalmemory != $memory;
2ed5d572
AD
2914
2915 #if no custom tology, we split memory and cores across numa nodes
2916 if(!$numa_totalmemory) {
2917
67fb9de6 2918 my $numa_memory = ($memory / $sockets) . "M";
2ed5d572
AD
2919
2920 for (my $i = 0; $i < $sockets; $i++) {
2921
2922 my $cpustart = ($cores * $i);
2923 my $cpuend = ($cpustart + $cores - 1) if $cores && $cores > 1;
2924 my $cpus = $cpustart;
2925 $cpus .= "-$cpuend" if $cpuend;
2926
2927 push @$cmd, '-object', "memory-backend-ram,size=$numa_memory,id=ram-node$i";
2928 push @$cmd, '-numa', "node,nodeid=$i,cpus=$cpus,memdev=ram-node$i";
2929 }
2930 }
8a010eae
AD
2931 }
2932
1e3baf05
DM
2933 push @$cmd, '-S' if $conf->{freeze};
2934
2935 # set keyboard layout
2936 my $kb = $conf->{keyboard} || $defaults->{keyboard};
2937 push @$cmd, '-k', $kb if $kb;
2938
2939 # enable sound
2940 #my $soundhw = $conf->{soundhw} || $defaults->{soundhw};
2941 #push @$cmd, '-soundhw', 'es1370';
2942 #push @$cmd, '-soundhw', $soundhw if $soundhw;
ab6a046f 2943
bc84dcca 2944 if($conf->{agent}) {
7a6c2150 2945 my $qgasocket = qmp_socket($vmid, 1);
ab6a046f
AD
2946 my $pciaddr = print_pci_addr("qga0", $bridges);
2947 push @$devices, '-chardev', "socket,path=$qgasocket,server,nowait,id=qga0";
2948 push @$devices, '-device', "virtio-serial,id=qga0$pciaddr";
2949 push @$devices, '-device', 'virtserialport,chardev=qga0,name=org.qemu.guest_agent.0';
2950 }
2951
1d794448 2952 my $spice_port;
2fa3151e 2953
590e698c
DM
2954 if ($qxlnum) {
2955 if ($qxlnum > 1) {
2956 if ($conf->{ostype} && $conf->{ostype} =~ m/^w/){
2957 for(my $i = 1; $i < $qxlnum; $i++){
2958 my $pciaddr = print_pci_addr("vga$i", $bridges);
2959 push @$cmd, '-device', "qxl,id=vga$i,ram_size=67108864,vram_size=33554432$pciaddr";
2960 }
2961 } else {
2962 # assume other OS works like Linux
2963 push @$cmd, '-global', 'qxl-vga.ram_size=134217728';
2964 push @$cmd, '-global', 'qxl-vga.vram_size=67108864';
2fa3151e
AD
2965 }
2966 }
2967
1011b570 2968 my $pciaddr = print_pci_addr("spice", $bridges);
95a4b4a9 2969
cd339d1f 2970 $spice_port = PVE::Tools::next_spice_port();
943340a6 2971
d2da6d9b 2972 push @$devices, '-spice', "tls-port=${spice_port},addr=127.0.0.1,tls-ciphers=DES-CBC3-SHA,seamless-migration=on";
1011b570 2973
d2da6d9b
AD
2974 push @$devices, '-device', "virtio-serial,id=spice$pciaddr";
2975 push @$devices, '-chardev', "spicevmc,id=vdagent,name=vdagent";
2976 push @$devices, '-device', "virtserialport,chardev=vdagent,name=com.redhat.spice.0";
1011b570
DM
2977 }
2978
8d9ae0d2
DM
2979 # enable balloon by default, unless explicitly disabled
2980 if (!defined($conf->{balloon}) || $conf->{balloon}) {
2981 $pciaddr = print_pci_addr("balloon0", $bridges);
2982 push @$devices, '-device', "virtio-balloon-pci,id=balloon0$pciaddr";
2983 }
1e3baf05 2984
0ea9541d
DM
2985 if ($conf->{watchdog}) {
2986 my $wdopts = parse_watchdog($conf->{watchdog});
5bdcf937 2987 $pciaddr = print_pci_addr("watchdog", $bridges);
0a40e8ea 2988 my $watchdog = $wdopts->{model} || 'i6300esb';
5bdcf937
AD
2989 push @$devices, '-device', "$watchdog$pciaddr";
2990 push @$devices, '-watchdog-action', $wdopts->{action} if $wdopts->{action};
0ea9541d
DM
2991 }
2992
1e3baf05 2993 my $vollist = [];
941e0c42 2994 my $scsicontroller = {};
26ee04b6 2995 my $ahcicontroller = {};
cdd20088 2996 my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : $defaults->{scsihw};
1e3baf05 2997
5881b913
DM
2998 # Add iscsi initiator name if available
2999 if (my $initiator = get_initiator_name()) {
3000 push @$devices, '-iscsi', "initiator-name=$initiator";
3001 }
3002
1e3baf05
DM
3003 foreach_drive($conf, sub {
3004 my ($ds, $drive) = @_;
3005
ff1a2432 3006 if (PVE::Storage::parse_volume_id($drive->{file}, 1)) {
1e3baf05 3007 push @$vollist, $drive->{file};
ff1a2432 3008 }
afdb31d5 3009
1e3baf05 3010 $use_virtio = 1 if $ds =~ m/^virtio/;
3b408e82
DM
3011
3012 if (drive_is_cdrom ($drive)) {
3013 if ($bootindex_hash->{d}) {
3014 $drive->{bootindex} = $bootindex_hash->{d};
3015 $bootindex_hash->{d} += 1;
3016 }
3017 } else {
3018 if ($bootindex_hash->{c}) {
3019 $drive->{bootindex} = $bootindex_hash->{c} if $conf->{bootdisk} && ($conf->{bootdisk} eq $ds);
3020 $bootindex_hash->{c} += 1;
3021 }
3022 }
3023
941e0c42 3024 if ($drive->{interface} eq 'scsi') {
cdd20088 3025
5b952ff5 3026 my $maxdev = ($scsihw !~ m/^lsi/) ? 256 : 7;
cdd20088 3027 my $controller = int($drive->{index} / $maxdev);
5bdcf937
AD
3028 $pciaddr = print_pci_addr("scsihw$controller", $bridges);
3029 push @$devices, '-device', "$scsihw,id=scsihw$controller$pciaddr" if !$scsicontroller->{$controller};
cdd20088 3030 $scsicontroller->{$controller}=1;
941e0c42 3031 }
3b408e82 3032
26ee04b6
DA
3033 if ($drive->{interface} eq 'sata') {
3034 my $controller = int($drive->{index} / $MAX_SATA_DISKS);
5bdcf937
AD
3035 $pciaddr = print_pci_addr("ahci$controller", $bridges);
3036 push @$devices, '-device', "ahci,id=ahci$controller,multifunction=on$pciaddr" if !$ahcicontroller->{$controller};
26ee04b6
DA
3037 $ahcicontroller->{$controller}=1;
3038 }
46f58b5f 3039
15b21acc
MR
3040 my $drive_cmd = print_drive_full($storecfg, $vmid, $drive);
3041 push @$devices, '-drive',$drive_cmd;
46f58b5f 3042 push @$devices, '-device', print_drivedevice_full($storecfg, $conf, $vmid, $drive, $bridges);
1e3baf05
DM
3043 });
3044
cc4d6182 3045 for (my $i = 0; $i < $MAX_NETS; $i++) {
5f0c4c32 3046 next if !$conf->{"net$i"};
cc4d6182
DA
3047 my $d = parse_net($conf->{"net$i"});
3048 next if !$d;
1e3baf05 3049
cc4d6182 3050 $use_virtio = 1 if $d->{model} eq 'virtio';
1e3baf05 3051
cc4d6182
DA
3052 if ($bootindex_hash->{n}) {
3053 $d->{bootindex} = $bootindex_hash->{n};
3054 $bootindex_hash->{n} += 1;
3055 }
1e3baf05 3056
cc4d6182 3057 my $netdevfull = print_netdev_full($vmid,$conf,$d,"net$i");
5bdcf937
AD
3058 push @$devices, '-netdev', $netdevfull;
3059
3060 my $netdevicefull = print_netdevice_full($vmid,$conf,$d,"net$i",$bridges);
3061 push @$devices, '-device', $netdevicefull;
3062 }
1e3baf05 3063
db656e5f
DM
3064 if (!$q35) {
3065 # add pci bridges
f8e83f05
AD
3066 while (my ($k, $v) = each %$bridges) {
3067 $pciaddr = print_pci_addr("pci.$k");
3068 unshift @$devices, '-device', "pci-bridge,id=pci.$k,chassis_nr=$k$pciaddr" if $k > 0;
3069 }
19672434
DM
3070 }
3071
1e3baf05
DM
3072 # hack: virtio with fairsched is unreliable, so we do not use fairsched
3073 # when the VM uses virtio devices.
19672434
DM
3074 if (!$use_virtio && $have_ovz) {
3075
6b64503e 3076 my $cpuunits = defined($conf->{cpuunits}) ?
1e3baf05
DM
3077 $conf->{cpuunits} : $defaults->{cpuunits};
3078
3079 push @$cmd, '-cpuunits', $cpuunits if $cpuunits;
3080
3081 # fixme: cpulimit is currently ignored
3082 #push @$cmd, '-cpulimit', $conf->{cpulimit} if $conf->{cpulimit};
3083 }
3084
3085 # add custom args
3086 if ($conf->{args}) {
3ada46c9 3087 my $aa = PVE::Tools::split_args($conf->{args});
1e3baf05
DM
3088 push @$cmd, @$aa;
3089 }
3090
5bdcf937 3091 push @$cmd, @$devices;
be190583 3092 push @$cmd, '-rtc', join(',', @$rtcFlags)
8c559505 3093 if scalar(@$rtcFlags);
be190583 3094 push @$cmd, '-machine', join(',', @$machineFlags)
8c559505
DM
3095 if scalar(@$machineFlags);
3096 push @$cmd, '-global', join(',', @$globalFlags)
3097 if scalar(@$globalFlags);
3098
1d794448 3099 return wantarray ? ($cmd, $vollist, $spice_port) : $cmd;
1e3baf05 3100}
19672434 3101
1e3baf05
DM
# Return the path of the VNC unix socket of VM $vmid, located below
# $var_run_tmpdir.
sub vnc_socket {
    my ($vmid) = @_;

    my $socket_path = $var_run_tmpdir . "/$vmid.vnc";

    return $socket_path;
}
3106
# Ask the running VM (QMP 'query-spice') for its SPICE port.
#
# The TLS port is preferred over the plain port. Dies with "no spice port"
# when neither is reported.
sub spice_port {
    my ($vmid) = @_;

    my $spice_info = vm_mon_cmd($vmid, 'query-spice');

    for my $key ('tls-port', 'port') {
        my $port = $spice_info->{$key};
        return $port if $port;
    }

    die "no spice port\n";
}
3114
# Return the path of a monitor socket of VM $vmid below $var_run_tmpdir.
#
# With a true $qga the '.qga' socket path is returned, otherwise the
# '.qmp' socket path.
sub qmp_socket {
    my ($vmid, $qga) = @_;

    my $suffix = 'qmp';
    $suffix = 'qga' if $qga;

    return $var_run_tmpdir . "/$vmid." . $suffix;
}
3120
1e3baf05
DM
# Return the path of the pid file of VM $vmid below $var_run_tmpdir.
sub pidfile_name {
    my ($vmid) = @_;

    my $pidfile = $var_run_tmpdir . "/$vmid.pid";

    return $pidfile;
}
3125
86fdcfb2
DA
# Collect the ids of the devices currently present in the running VM.
#
# Returns a hash reference (id => 1) built from three QMP queries:
#  - 'query-pci':   every PCI device that reports a 'qdev_id'
#  - 'query-block': every block device named 'drive-<id>' (stored as <id>)
#  - 'query-mice':  the key 'tablet' if a 'QEMU HID Tablet' is listed
sub vm_devices_list {
    my ($vmid) = @_;

    my %present;

    my $pci_buses = vm_mon_cmd($vmid, 'query-pci');
    for my $bus (@$pci_buses) {
        for my $pci_dev (@{$bus->{devices}}) {
            my $qdev_id = $pci_dev->{'qdev_id'};
            $present{$qdev_id} = 1 if $qdev_id;
        }
    }

    my $block_devs = vm_mon_cmd($vmid, 'query-block');
    for my $blk (@$block_devs) {
        if (my ($drive_id) = $blk->{device} =~ m/^drive-(\S+)/) {
            $present{$drive_id} = 1;
        }
    }

    my $mice = vm_mon_cmd($vmid, 'query-mice');
    $present{tablet} = 1
        if grep { $_->{name} eq 'QEMU HID Tablet' } @$mice;

    return \%present;
}
3155
# Hot-plug the device $deviceid into the running VM $vmid.
#
# $device is the parsed drive/net definition (unused for 'tablet',
# 'scsihwN' and 'pci.N'). Supported ids: 'tablet', 'virtioN', 'scsihwN',
# 'scsiN', 'netN' and (on non-q35 machines) 'pci.N'.
#
# Returns 1 on success, or if the device is already present. Dies if
# hotplug is not enabled in $conf, if the device id is not supported, or
# if plugging fails.
#
# For disks and NICs a backend (drive / netdev) is created first. If
# adding or verifying the frontend device fails, that backend is removed
# again so that a failed hotplug does not leave it behind.
sub vm_deviceplug {
    my ($storecfg, $conf, $vmid, $deviceid, $device) = @_;

    die "internal error" if !$conf->{hotplug};

    my $q35 = machine_type_is_q35($conf);

    my $devices_list = vm_devices_list($vmid);
    return 1 if defined($devices_list->{$deviceid});

    qemu_add_pci_bridge($storecfg, $conf, $vmid, $deviceid); # add PCI bridge if we need it for the device

    if ($deviceid eq 'tablet') {

        qemu_deviceadd($vmid, print_tabletdevice_full($conf));

    } elsif ($deviceid =~ m/^(virtio)(\d+)$/) {

        qemu_driveadd($storecfg, $vmid, $device);
        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);

        # device_add itself may fail, so it has to be covered by the
        # cleanup as well (same as for scsi disks below)
        eval {
            qemu_deviceadd($vmid, $devicefull);
            qemu_deviceaddverify($vmid, $deviceid);
        };
        if (my $err = $@) {
            eval { qemu_drivedel($vmid, $deviceid); };
            warn $@ if $@;
            die $err;
        }

    } elsif ($deviceid =~ m/^(scsihw)(\d+)$/) {

        my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : "lsi";
        my $pciaddr = print_pci_addr($deviceid);
        my $devicefull = "$scsihw,id=$deviceid$pciaddr";

        qemu_deviceadd($vmid, $devicefull);
        qemu_deviceaddverify($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        # make sure the controller this disk hangs off exists
        qemu_findorcreatescsihw($storecfg, $conf, $vmid, $device);
        qemu_driveadd($storecfg, $vmid, $device);

        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);
        eval { qemu_deviceadd($vmid, $devicefull); };
        if (my $err = $@) {
            eval { qemu_drivedel($vmid, $deviceid); };
            warn $@ if $@;
            die $err;
        }

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        return undef if !qemu_netdevadd($vmid, $conf, $device, $deviceid);
        my $netdevicefull = print_netdevice_full($vmid, $conf, $device, $deviceid);

        # device_add itself may fail, so it has to be covered by the
        # cleanup as well
        eval {
            qemu_deviceadd($vmid, $netdevicefull);
            qemu_deviceaddverify($vmid, $deviceid);
        };
        if (my $err = $@) {
            eval { qemu_netdevdel($vmid, $deviceid); };
            warn $@ if $@;
            die $err;
        }

    } elsif (!$q35 && $deviceid =~ m/^(pci\.)(\d+)$/) {

        my $bridgeid = $2;
        my $pciaddr = print_pci_addr($deviceid);
        my $devicefull = "pci-bridge,id=pci.$bridgeid,chassis_nr=$bridgeid$pciaddr";

        qemu_deviceadd($vmid, $devicefull);
        qemu_deviceaddverify($vmid, $deviceid);

    } else {
        die "can't hotplug device '$deviceid'\n";
    }

    return 1;
}
3234
# Hot-unplug the device $deviceid from the running VM $vmid.
#
# Supported ids: 'tablet', 'virtioN', 'scsiN', 'netN' and SCSI
# controllers. Controllers are plugged under the id 'scsihwN' (see
# vm_deviceplug and qemu_findorcreatescsihw), so that id is accepted here
# as well; the older 'lsiN' naming is still accepted.
#
# Returns 1 on success, or if the device is not present. Dies if hotplug
# is not enabled in $conf, if $deviceid is the configured boot disk, if
# the device id is not supported, or if a monitor command fails.
sub vm_deviceunplug {
    my ($vmid, $conf, $deviceid) = @_;

    die "internal error" if !$conf->{hotplug};

    my $devices_list = vm_devices_list($vmid);
    return 1 if !defined($devices_list->{$deviceid});

    die "can't unplug bootdisk" if $conf->{bootdisk} && $conf->{bootdisk} eq $deviceid;

    if ($deviceid eq 'tablet') {

        qemu_devicedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(virtio)(\d+)$/) {

        # device_del is asynchronous: wait until the frontend is gone
        # before the backing drive is removed
        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);
        qemu_drivedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(lsi|scsihw)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);
        qemu_drivedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);
        qemu_netdevdel($vmid, $deviceid);

    } else {
        die "can't unplug device '$deviceid'\n";
    }

    return 1;
}
3277
# Send a QMP 'device_add' for the device described by $devicefull.
#
# $devicefull is a '-device' style string ("<driver>,key=value,..."). It
# is prefixed with "driver=" and split on '=' and ',' into the argument
# hash passed to the monitor.
sub qemu_deviceadd {
    my ($vmid, $devicefull) = @_;

    my @key_value_list = split(/[=,]/, "driver=" . $devicefull);
    my %options = @key_value_list;

    return vm_mon_cmd($vmid, "device_add", %options);
}
afdb31d5 3286
# Send a QMP 'device_del' for the device with id $deviceid and return the
# monitor result.
sub qemu_devicedel {
    my ($vmid, $deviceid) = @_;

    my $result = vm_mon_cmd($vmid, "device_del", id => $deviceid);

    return $result;
}
3292
# Add the drive backend for $device to the running VM using the human
# monitor command 'drive_add auto <drive>'.
#
# Returns 1 if the monitor output contains "OK", dies otherwise.
sub qemu_driveadd {
    my ($storecfg, $vmid, $device) = @_;

    my $drive_spec = print_drive_full($storecfg, $vmid, $device);
    my $output = vm_human_monitor_command($vmid, "drive_add auto $drive_spec");

    # qemu prints "OK" when the command succeeded
    if ($output !~ m/OK/s) {
        die "adding drive failed: $output\n";
    }

    return 1;
}
afdb31d5 3304
5e5dcb73
DA
# Remove the drive backend 'drive-$deviceid' from the running VM using
# the human monitor command 'drive_del'.
#
# Returns 1 if the monitor prints nothing (ignoring leading whitespace)
# or reports that the device was not found; dies on any other output.
sub qemu_drivedel {
    my ($vmid, $deviceid) = @_;

    my $output = vm_human_monitor_command($vmid, "drive_del drive-$deviceid");
    $output =~ s/^\s+//;

    # NB: a "not found" answer means the drive was auto-deleted already,
    # which is as good as a successful removal
    my $removed = ($output eq "") || ($output =~ m/Device \'.*?\' not found/s);

    die "deleting drive $deviceid failed : $output\n" if !$removed;

    return 1;
}
f19d1c47 3318
# Wait until device $deviceid shows up in the device list of the VM.
#
# The list is polled up to six times, sleeping one second after each
# unsuccessful check. Returns 1 once the device is listed, dies otherwise.
sub qemu_deviceaddverify {
    my ($vmid, $deviceid) = @_;

    for my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if defined($present->{$deviceid});
        sleep 1;
    }

    die "error on hotplug device '$deviceid'\n";
}
afdb31d5 3330
5e5dcb73
DA
3331
# Wait until device $deviceid has vanished from the device list of the VM.
#
# device_del is asynchronous and its empty reply is not a reliable sign
# of success, so the list is polled up to six times, sleeping one second
# after each unsuccessful check. Returns 1 once the device is gone, dies
# otherwise.
sub qemu_devicedelverify {
    my ($vmid, $deviceid) = @_;

    for my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if !defined($present->{$deviceid});
        sleep 1;
    }

    die "error on hot-unplugging device '$deviceid'\n";
}
3346
# Make sure the SCSI controller needed by the scsi drive $device exists
# in the running VM, hot-plugging it if necessary.
#
# The controller number is the drive index divided by the number of
# devices per controller: 256 if $conf->{scsihw} is set and does not
# start with 'lsi', else 7. Always returns 1.
sub qemu_findorcreatescsihw {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $scsihw = $conf->{scsihw};
    my $devs_per_controller = 7;
    $devs_per_controller = 256 if $scsihw && ($scsihw !~ m/^lsi/);

    my $controller_id = "scsihw" . int($device->{index} / $devs_per_controller);

    my $present = vm_devices_list($vmid);
    vm_deviceplug($storecfg, $conf, $vmid, $controller_id)
        if !defined($present->{$controller_id});

    return 1;
}
3361
# Hot-plug the PCI bridge required by $device, if there is one and it is
# not present yet.
#
# print_pci_addr() is called with an empty hash to learn which bridge the
# device uses. Nothing is done when no bridge is recorded or its id is
# below 1. Always returns 1.
sub qemu_add_pci_bridge {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $used_bridges = {};
    print_pci_addr($device, $used_bridges);

    # keep the last key in hash iteration order
    my $bridge_nr;
    for my $nr (keys %$used_bridges) {
        $bridge_nr = $nr;
    }

    return 1 if !defined($bridge_nr);
    return 1 if $bridge_nr < 1;

    my $bridge_id = "pci.$bridge_nr";

    my $present = vm_devices_list($vmid);
    vm_deviceplug($storecfg, $conf, $vmid, $bridge_id)
        if !defined($present->{$bridge_id});

    return 1;
}
3385
2630d2a9
DA
# Add the network backend for NIC $deviceid to the running VM via QMP
# 'netdev_add'.
#
# The '-netdev' style string from print_netdev_full() is split on '='
# and ',' into the argument hash. Always returns 1.
sub qemu_netdevadd {
    my ($vmid, $conf, $device, $deviceid) = @_;

    my $netdev_spec = print_netdev_full($vmid, $conf, $device, $deviceid);

    my @key_value_list = split(/[=,]/, $netdev_spec);
    my %options = @key_value_list;

    vm_mon_cmd($vmid, "netdev_add", %options);

    return 1;
}
3395
# Remove the network backend with id $deviceid from the running VM via
# QMP 'netdev_del' and return the monitor result.
sub qemu_netdevdel {
    my ($vmid, $deviceid) = @_;

    my %args = (id => $deviceid);

    return vm_mon_cmd($vmid, "netdev_del", %args);
}
3401
838776ab
AD
# Bring the number of cores of the running VM up to $cores by sending a
# QMP 'cpu-add' for every missing core.
#
# Dies if more than one socket is configured, if 'maxcpus' is not set, if
# $cores exceeds 'maxcpus' or is lower than the configured core count, or
# if the number of CPUs reported by 'query-cpus' differs from the
# configuration.
sub qemu_cpu_hotplug {
    my ($vmid, $conf, $cores) = @_;

    my $socket_count = $conf->{sockets} || 1;
    if ($socket_count > 1) {
        die "cpu hotplug only works with one socket\n";
    }

    my $max_cpus = $conf->{maxcpus};
    if (!$max_cpus) {
        die "maxcpus is not defined\n";
    }
    if ($cores > $max_cpus) {
        die "you can't add more cores than maxcpus\n";
    }

    my $configured_cores = $conf->{cores} || 1;
    if ($cores < $configured_cores) {
        die "online cpu unplug is not yet possible\n";
    }

    my $running_cpus = vm_mon_cmd($vmid, "query-cpus");
    if (scalar(@$running_cpus) != $configured_cores) {
        die "cores number if running vm is different than configuration\n";
    }

    # cpu ids are zero based, so the first new one is $configured_cores
    for my $cpu_id ($configured_cores .. $cores - 1) {
        vm_mon_cmd($vmid, "cpu-add", id => int($cpu_id));
    }
}
3427
affd2f88
AD
# Apply I/O throttling limits to block device $deviceid of a running VM
# via QMP 'block_set_io_throttle'. Does nothing if the VM is not running.
#
# Parameters (positional):
#   $bps, $bps_rd, $bps_wr     - byte/s limits (total, read, write)
#   $iops, $iops_rd, $iops_wr  - operation/s limits (total, read, write)
#   $bps_max, $bps_rd_max, $bps_wr_max,
#   $iops_max, $iops_rd_max, $iops_wr_max
#                              - optional burst limits; each one is only
#                                sent to the monitor when it is defined
#
# vmconfig_update_disk passes the burst limits already; they used to be
# dropped here because only the first eight arguments were unpacked.
sub qemu_block_set_io_throttle {
    my ($vmid, $deviceid,
        $bps, $bps_rd, $bps_wr, $iops, $iops_rd, $iops_wr,
        $bps_max, $bps_rd_max, $bps_wr_max,
        $iops_max, $iops_rd_max, $iops_wr_max) = @_;

    return if !check_running($vmid);

    my %params = (
        device  => $deviceid,
        bps     => int($bps),
        bps_rd  => int($bps_rd),
        bps_wr  => int($bps_wr),
        iops    => int($iops),
        iops_rd => int($iops_rd),
        iops_wr => int($iops_wr),
    );

    my %burst = (
        bps_max     => $bps_max,
        bps_rd_max  => $bps_rd_max,
        bps_wr_max  => $bps_wr_max,
        iops_max    => $iops_max,
        iops_rd_max => $iops_rd_max,
        iops_wr_max => $iops_wr_max,
    );

    # callers using the old eight-argument form keep sending exactly the
    # same command as before
    for my $name (sort keys %burst) {
        next if !defined($burst{$name});
        $params{$name} = int($burst{$name});
    }

    vm_mon_cmd($vmid, "block_set_io_throttle", %params);
}
3436
# old code, only used to shutdown old VM after update
#
# Read from the monitor handle $fh until the "(qemu) " prompt ends a
# chunk, or until end of file.
#
# Each wait for readable data is limited to $timeout seconds. Returns the
# collected text without the trailing prompt. Dies with "monitor read
# timeout" if a wait times out, or with the system error if reading fails.
sub __read_avail {
    my ($fh, $timeout) = @_;

    my $select = IO::Select->new();
    $select->add($fh);

    my $output = '';
    my $timed_out = 0;

    while (1) {
        my @ready = $select->can_read($timeout);
        if (!scalar(@ready)) {
            $timed_out = 1;
            last;
        }

        my $chunk;
        my $nread = $fh->sysread($chunk, 8192);
        die "$!\n" if !defined($nread);
        last if !$nread; # end of file

        if ($chunk =~ /^(.*)\(qemu\) $/s) {
            # prompt seen: the answer is complete
            $output .= $1;
            last;
        }

        $output .= $chunk;
    }

    die "monitor read timeout\n" if $timed_out;

    return $output;
}
3469
# old code, only used to shutdown old VM after update
#
# Send $cmdstr to the human monitor socket ('<vmid>.mon' below
# $var_run_tmpdir) of VM $vmid and return the answer.
#
# The first line of the answer is dropped as command echo unless it
# starts with "unknown command"; line ends are normalized to "\n".
# Nothing is read back for 'q' / 'quit', in which case undef is returned.
# Any failure is written to syslog and re-thrown.
sub vm_monitor_command {
    my ($vmid, $cmdstr, $nocheck) = @_;

    my $answer;

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);

        my $socket_path = "${var_run_tmpdir}/$vmid.mon";

        my $sock = IO::Socket::UNIX->new( Peer => $socket_path ) ||
            die "unable to connect to VM $vmid socket - $!\n";

        # hack: migrate sometime blocks the monitor (when migrate_downtime
        # is set), so allow one hour for those commands
        my $is_migrate = ($cmdstr =~ m/^(info\s+migrate|migrate\s)/) ? 1 : 0;
        my $wait = $is_migrate ? 60*60 : 3;

        # read banner
        my $banner = __read_avail($sock, $wait);
        die "got unexpected qemu monitor banner\n"
            if $banner !~ m/^QEMU\s+(\S+)\s+monitor\s/;

        my $select = IO::Select->new();
        $select->add($sock);

        my @writable = $select->can_write($wait);
        die "monitor write error - timeout" if !scalar(@writable);

        my $fullcmd = "$cmdstr\r";

        # syslog('info', "VM $vmid monitor command: $cmdstr");

        my $written = $sock->syswrite($fullcmd);
        if (!$written || ($written != length($fullcmd))) {
            die "monitor write error - $!";
        }

        # qemu exits on quit, so there is no answer to wait for
        return if ($cmdstr eq 'q') || ($cmdstr eq 'quit');

        if ($is_migrate) {
            $wait = 60*60; # 1 hour
        } elsif ($cmdstr =~ m/^(eject|change)/) {
            $wait = 60; # note: cdrom mount command is slow
        } else {
            $wait = 20;
        }

        $answer = __read_avail($sock, $wait);
        if ($answer) {
            my @lines = split("\r?\n", $answer);

            shift @lines if $lines[0] !~ m/^unknown command/; # skip echo

            $answer = join("\n", @lines) . "\n";
        }
    };

    if (my $err = $@) {
        syslog("err", "VM $vmid monitor command failed - $err");
        die $err;
    }

    return $answer;
}
3544
c1175c92
AD
# Resize volume $volid to $size through the storage layer and, if the VM
# is running, tell qemu about the new size (QMP 'block_resize').
#
# Returns early without a value when PVE::Storage::volume_resize returns
# false or when the VM is not running.
sub qemu_block_resize {
    my ($vmid, $deviceid, $storecfg, $volid, $size) = @_;

    my $vm_is_running = check_running($vmid);

    my $need_qemu = PVE::Storage::volume_resize($storecfg, $volid, $size, $vm_is_running);
    return if !$need_qemu;

    return if !$vm_is_running;

    return vm_mon_cmd($vmid, "block_resize", device => $deviceid, size => int($size));
}
3557
1ab0057c
AD
# Create snapshot $snap of volume $volid through the storage layer and,
# if the VM is running, via QMP 'snapshot-drive'.
#
# Returns early without a value when PVE::Storage::volume_snapshot
# returns false or when the VM is not running.
sub qemu_volume_snapshot {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $vm_is_running = check_running($vmid);

    my $need_qemu = PVE::Storage::volume_snapshot($storecfg, $volid, $snap, $vm_is_running);
    return if !$need_qemu;

    return if !$vm_is_running;

    return vm_mon_cmd($vmid, "snapshot-drive", device => $deviceid, name => $snap);
}
3570
fc46aff9
AD
# Delete snapshot $snap of volume $volid through the storage layer and,
# if the VM is running, via QMP 'delete-drive-snapshot'.
#
# Returns early without a value when
# PVE::Storage::volume_snapshot_delete returns false or when the VM is
# not running.
sub qemu_volume_snapshot_delete {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $vm_is_running = check_running($vmid);

    my $need_qemu = PVE::Storage::volume_snapshot_delete($storecfg, $volid, $snap, $vm_is_running);
    return if !$need_qemu;

    return if !$vm_is_running;

    return vm_mon_cmd($vmid, "delete-drive-snapshot", device => $deviceid, name => $snap);
}
3582
264e519f
DM
# Set the migration capabilities of VM $vmid.
#
# Every capability reported by 'query-migrate-capabilities' is sent back
# with 'migrate-set-capabilities': switched on if it is marked with a
# true value in the table below, switched off otherwise (including
# capabilities that are not in the table).
sub set_migration_caps {
    my ($vmid) = @_;

    my %wanted = (
        "auto-converge" => 1,
        "xbzrle" => 0,
        "x-rdma-pin-all" => 0,
        "zero-blocks" => 0,
    );

    my $supported = vm_mon_cmd_nocheck($vmid, "query-migrate-capabilities");

    my @settings;
    foreach my $entry (@$supported) {
        my $name = $entry->{capability};
        my $setting = {
            capability => $name,
            state => $wanted{$name} ? JSON::true : JSON::false,
        };
        push @settings, $setting;
    }

    vm_mon_cmd_nocheck($vmid, "migrate-set-capabilities", capabilities => \@settings);
}
a89fded1 3606
3a11fadb
DM
# Apply the changes queued in the [PENDING] section of the configuration
# to the running VM.
#
#  $selection - optional hash; if given, only the listed options are
#               applied, for example { cores => 1 }
#  $errors    - hash reference receiving one message per option whose
#               hotplug failed
#
# After every successful step the configuration is written and read back,
# so a later failure does not undo earlier steps. Options that cannot be
# applied online are left pending without an error.
sub vmconfig_hotplug_pending {
    my ($vmid, $conf, $storecfg, $selection, $errors) = @_;

    my $defaults = load_defaults();

    my $record_error = sub {
        my ($key, $message) = @_;
        $errors->{$key} = "hotplug problem - $message";
    };

    # write the current state and continue with what is really on disk
    my $save_and_reload = sub {
        update_config_nolock($vmid, $conf, 1);
        $conf = load_config($vmid);
    };

    # Step 1: options without any impact on the running VM. They cannot
    # fail, so they are always committed, regardless of $selection.
    my $committed = 0;
    foreach my $opt (qw(name hotplug onboot shares)) {
        next if !exists($conf->{pending}->{$opt});
        $conf->{$opt} = delete $conf->{pending}->{$opt};
        $committed = 1;
    }
    &$save_and_reload() if $committed;

    my $hotplug = defined($conf->{hotplug}) ? $conf->{hotplug} : $defaults->{hotplug};

    # Step 2: options queued for removal
    my @to_delete = PVE::Tools::split_list($conf->{pending}->{delete});
    foreach my $opt (@to_delete) {
        next if $selection && !$selection->{$opt};

        eval {
            if ($opt eq 'tablet') {
                die "skip\n" if !$hotplug;
                # without the option the default decides about the tablet
                if ($defaults->{tablet}) {
                    vm_deviceplug($storecfg, $conf, $vmid, $opt);
                } else {
                    vm_deviceunplug($vmid, $conf, $opt);
                }
            } elsif ($opt eq 'cores') {
                die "skip\n" if !$hotplug;
                qemu_cpu_hotplug($vmid, $conf, 1);
            } elsif ($opt =~ m/^net(\d+)$/) {
                die "skip\n" if !$hotplug;
                vm_deviceunplug($vmid, $conf, $opt);
            } elsif (valid_drivename($opt)) {
                die "skip\n"; # we do not allow to hot-remove disk?
            } else {
                die "skip\n";
            }
        };
        my $err = $@;

        if (!$err) {
            # removal is live now, so drop the option for real
            delete $conf->{$opt};
            vmconfig_undelete_pending_option($conf, $opt);
            &$save_and_reload();
        } elsif ($err ne "skip\n") {
            &$record_error($opt, $err);
        }
    }

    # Step 3: options queued for add/change
    foreach my $opt (keys %{$conf->{pending}}) {
        next if $selection && !$selection->{$opt};

        my $value = $conf->{pending}->{$opt};

        eval {
            if ($opt eq 'tablet') {
                die "skip\n" if !$hotplug;
                if ($value == 1) {
                    vm_deviceplug($storecfg, $conf, $vmid, $opt);
                } elsif ($value == 0) {
                    vm_deviceunplug($vmid, $conf, $opt);
                }
            } elsif ($opt eq 'cores') {
                die "skip\n" if !$hotplug;
                qemu_cpu_hotplug($vmid, $conf, $value);
            } elsif ($opt eq 'balloon') {
                # manual ballooning is only allowed if shares is set to zero
                my $manual = defined($conf->{shares}) && ($conf->{shares} == 0);
                die "skip\n" if !$manual;
                my $balloon = $conf->{pending}->{balloon} || $conf->{memory} || $defaults->{memory};
                vm_mon_cmd($vmid, "balloon", value => $balloon*1024*1024);
            } elsif ($opt =~ m/^net(\d+)$/) {
                # some changes can be done without hotplug
                vmconfig_update_net($storecfg, $conf, $vmid, $opt, $value);
            } elsif (valid_drivename($opt)) {
                # some changes can be done without hotplug
                vmconfig_update_disk($storecfg, $conf, $vmid, $opt, $value, 1);
            } else {
                die "skip\n"; # skip non-hot-pluggable options
            }
        };
        my $err = $@;

        if (!$err) {
            # change is live now, so move it out of the pending section
            $conf->{$opt} = $value;
            delete $conf->{pending}->{$opt};
            &$save_and_reload();
        } elsif ($err ne "skip\n") {
            &$record_error($opt, $err);
        }
    }
}
055d554d
DM
3715
# Apply all pending changes directly to the configuration (cold plug).
#
# First the options queued for removal are dropped, then the queued
# values are copied into the configuration. A drive that is removed or
# replaced is handed to vmconfig_register_unused_drive. The configuration
# is re-read before and written after every single option.
sub vmconfig_apply_pending {
    my ($vmid, $conf, $storecfg) = @_;

    # removals
    my @to_delete = PVE::Tools::split_list($conf->{pending}->{delete});
    foreach my $opt (@to_delete) {
        die "internal error" if $opt =~ m/^unused/;

        $conf = load_config($vmid); # update/reload

        if (defined($conf->{$opt})) {
            if (valid_drivename($opt)) {
                my $old_drive = parse_drive($opt, $conf->{$opt});
                vmconfig_register_unused_drive($storecfg, $vmid, $conf, $old_drive);
            }
            vmconfig_undelete_pending_option($conf, $opt);
            delete $conf->{$opt};
        } else {
            # nothing to remove, just forget about the request
            vmconfig_undelete_pending_option($conf, $opt);
        }

        update_config_nolock($vmid, $conf, 1);
    }

    $conf = load_config($vmid); # update/reload

    # additions and changes
    foreach my $opt (keys %{$conf->{pending}}) {
        $conf = load_config($vmid); # update/reload

        my $new_value = $conf->{pending}->{$opt};
        my $unchanged = defined($conf->{$opt}) && ($conf->{$opt} eq $new_value);

        if (!$unchanged) {
            if (valid_drivename($opt) && defined($conf->{$opt})) {
                my $old_drive = parse_drive($opt, $conf->{$opt});
                vmconfig_register_unused_drive($storecfg, $vmid, $conf, $old_drive);
            }
            $conf->{$opt} = $new_value;
        }

        delete $conf->{pending}->{$opt};
        update_config_nolock($vmid, $conf, 1);
    }
}
3759
3eec5767
DM
# Numeric "not equal" that copes with undefined values: two undefined
# values are equal (returns 0), a defined and an undefined value differ
# (returns 1), two defined values are compared with '!='.
my $safe_num_ne = sub {
    my ($left, $right) = @_;

    if (defined($left) && defined($right)) {
        return $left != $right;
    }

    return (defined($left) || defined($right)) ? 1 : 0;
};
3769
# String "not equal" that copes with undefined values: two undefined
# values are equal (returns 0), a defined and an undefined value differ
# (returns 1), two defined values are compared with 'ne'.
my $safe_string_ne = sub {
    my ($left, $right) = @_;

    if (defined($left) && defined($right)) {
        return $left ne $right;
    }

    return (defined($left) || defined($right)) ? 1 : 0;
};
3779
# Apply the new definition $value of network device $opt ('netN') to the
# running VM.
#
# If the device exists in $conf and model, MAC address, queues or the
# bridge/NAT mode changed, the device is hot-unplugged and plugged again
# with the new settings. Otherwise rate limit, bridge, VLAN tag and
# firewall flag are changed online on the tap device.
#
# Dies with "skip\n" if a (re)plug is needed but hotplug is disabled in
# $conf. Online changes do not need hotplug: with hotplug disabled the
# sub returns 1 after applying them instead of running into
# vm_deviceplug(), which refuses to work without hotplug.
sub vmconfig_update_net {
    my ($storecfg, $conf, $vmid, $opt, $value) = @_;

    my $newnet = parse_net($value);

    if ($conf->{$opt}) {
        my $oldnet = parse_net($conf->{$opt});

        if (&$safe_string_ne($oldnet->{model}, $newnet->{model}) ||
            &$safe_string_ne($oldnet->{macaddr}, $newnet->{macaddr}) ||
            &$safe_num_ne($oldnet->{queues}, $newnet->{queues}) ||
            !($newnet->{bridge} && $oldnet->{bridge})) { # bridge/nat mode change

            # for non online change, we try to hot-unplug
            die "skip\n" if !$conf->{hotplug};
            vm_deviceunplug($vmid, $conf, $opt);
        } else {

            die "internal error" if $opt !~ m/net(\d+)/;
            my $iface = "tap${vmid}i$1";

            if (&$safe_num_ne($oldnet->{rate}, $newnet->{rate})) {
                PVE::Network::tap_rate_limit($iface, $newnet->{rate});
            }

            if (&$safe_string_ne($oldnet->{bridge}, $newnet->{bridge}) ||
                &$safe_num_ne($oldnet->{tag}, $newnet->{tag}) ||
                &$safe_num_ne($oldnet->{firewall}, $newnet->{firewall})) {
                PVE::Network::tap_unplug($iface);
                PVE::Network::tap_plug($iface, $newnet->{bridge}, $newnet->{tag}, $newnet->{firewall});
            }

            # the change is live already and must not be reported as a
            # failure just because hotplug is disabled
            return 1 if !$conf->{hotplug};
        }
    }

    # plugging a device needs hotplug, same as for disks
    die "skip\n" if !$conf->{hotplug};

    vm_deviceplug($storecfg, $conf, $vmid, $opt, $newnet);
}
3816
a05cff86
DM
# Apply the new definition $value of drive $opt to the running VM.
#
# For an existing non-cdrom drive:
#  - a different volume: the old disk is unplugged and registered as
#    unused, then the new one is plugged (needs hotplug)
#  - the same volume: I/O throttle changes are applied online and 1 is
#    returned; a changed 'discard' or 'cache' setting cannot be applied
#    online
# For a cdrom the medium is ejected and, unless the new file is 'none',
# replaced by the new image. A new disk is hot-plugged.
#
# Dies with "skip\n" when the change cannot be applied online, and with
# "unable to change media type" when disk and cdrom would be swapped.
sub vmconfig_update_disk {
    my ($storecfg, $conf, $vmid, $opt, $value, $force) = @_;

    # fixme: do we need force?

    my $drive = parse_drive($opt, $value);

    my $old_drive;
    $old_drive = parse_drive($opt, $conf->{$opt}) if $conf->{$opt};

    if ($old_drive) {
        my $new_media = $drive->{media} || 'disk';
        my $old_media = $old_drive->{media} || 'disk';
        die "unable to change media type\n" if $new_media ne $old_media;

        if (!drive_is_cdrom($old_drive)) {
            if ($drive->{file} eq $old_drive->{file}) {
                # same volume: update the existing disk in place

                # skip non hotpluggable value
                my $needs_restart =
                    &$safe_num_ne($drive->{discard}, $old_drive->{discard}) ||
                    &$safe_string_ne($drive->{cache}, $old_drive->{cache});
                die "skip\n" if $needs_restart;

                # apply throttle; the key order is the argument order of
                # qemu_block_set_io_throttle
                my @throttle_keys = qw(
                    mbps mbps_rd mbps_wr
                    iops iops_rd iops_wr
                    mbps_max mbps_rd_max mbps_wr_max
                    iops_max iops_rd_max iops_wr_max
                );

                my $throttle_changed = grep {
                    &$safe_num_ne($drive->{$_}, $old_drive->{$_})
                } @throttle_keys;

                if ($throttle_changed) {
                    my @limits;
                    foreach my $key (@throttle_keys) {
                        my $limit = $drive->{$key} || 0;
                        # mbps values are configured in MB/s, qemu wants bytes/s
                        $limit = $limit*1024*1024 if $key =~ m/^mbps/;
                        push @limits, $limit;
                    }
                    qemu_block_set_io_throttle($vmid, "drive-$opt", @limits);
                }

                return 1;
            }

            # different volume: needs a real unplug/plug cycle
            die "skip\n" if !$conf->{hotplug};

            # unplug and register as unused
            vm_deviceunplug($vmid, $conf, $opt);
            vmconfig_register_unused_drive($storecfg, $vmid, $conf, $old_drive);
        }
    }

    if (!drive_is_cdrom($drive)) {
        die "skip\n" if !$conf->{hotplug};
        # hotplug new disks
        return vm_deviceplug($storecfg, $conf, $vmid, $opt, $drive);
    }

    # cdrom
    my $qdev = "drive-$opt";

    if ($drive->{file} eq 'none') {
        vm_mon_cmd($vmid, "eject", force => JSON::true, device => $qdev);
    } else {
        # resolve the image first, so a bad path does not eject the medium
        my $path = get_iso_path($storecfg, $vmid, $drive->{file});
        vm_mon_cmd($vmid, "eject", force => JSON::true, device => $qdev); # force eject if locked
        vm_mon_cmd($vmid, "change", device => $qdev, target => "$path") if $path;
    }
}
3903
# Start VM $vmid while holding the config lock.
#
# Parameters:
#   $storecfg     - storage configuration
#   $statefile    - 'tcp' to wait for an incoming migration, any other
#                   true value is passed to '-loadstate'
#   $skiplock     - do not call check_lock()
#   $migratedfrom - source node of a migration (also exported as
#                   PVE_MIGRATED_FROM for the network script)
#   $paused       - start with '-S' when no state file is given
#   $forcemachine - passed through to config_to_command()
#   $spice_ticket - spice password to set after an incoming migration
#
# Dies if the VM is a template, is locked, is already running, a
# passed-through PCI device cannot be prepared, or the start command fails.
sub vm_start {
    my ($storecfg, $vmid, $statefile, $skiplock, $migratedfrom, $paused, $forcemachine, $spice_ticket) = @_;

    my $start_locked = sub {
        my $conf = load_config($vmid, $migratedfrom);

        die "you can't start a vm if it's a template\n" if is_template($conf);

        check_lock($conf) if !$skiplock;

        die "VM $vmid already running\n" if check_running($vmid, undef, $migratedfrom);

        # pending changes are applied first, unless we resume from a state
        if (!$statefile && scalar(keys %{$conf->{pending}})) {
            vmconfig_apply_pending($vmid, $conf, $storecfg);
            $conf = load_config($vmid); # update/reload
        }

        my $defaults = load_defaults();

        # set environment variable useful inside network script
        $ENV{PVE_MIGRATED_FROM} = $migratedfrom if $migratedfrom;

        my ($cmd, $vollist, $spice_port) =
            config_to_command($storecfg, $vmid, $conf, $defaults, $forcemachine);

        my $migrate_port = 0;
        my $migrate_uri;

        if ($statefile && $statefile eq 'tcp') {
            # incoming migration: listen on localhost unless the datacenter
            # config enables unsecure migration
            my $localip = "localhost";
            my $datacenterconf = PVE::Cluster::cfs_read_file('datacenter.cfg');
            if ($datacenterconf->{migration_unsecure}) {
                my $nodename = PVE::INotify::nodename();
                $localip = PVE::Cluster::remote_node_ip($nodename, 1);
            }
            $migrate_port = PVE::Tools::next_migrate_port();
            $migrate_uri = "tcp:${localip}:${migrate_port}";
            push @$cmd, '-incoming', $migrate_uri;
            push @$cmd, '-S';
        } elsif ($statefile) {
            push @$cmd, '-loadstate', $statefile;
        } elsif ($paused) {
            push @$cmd, '-S';
        }

        # host pci devices
        for my $i (0 .. $MAX_HOSTPCI_DEVICES - 1) {
            my $d = parse_hostpci($conf->{"hostpci$i"});
            next if !$d;

            my $use_vfio = $d->{driver} && $d->{driver} eq "vfio";

            foreach my $pcidevice (@{$d->{pciid}}) {
                my $pciid = "$pcidevice->{id}.$pcidevice->{function}";

                my $info = pci_device_info("0000:$pciid");
                die "IOMMU not present\n" if !check_iommu_support();
                die "no pci device info for device '$pciid'\n" if !$info;

                if ($use_vfio) {
                    die "can't unbind/bind pci group to vfio '$pciid'\n"
                        if !pci_dev_group_bind_to_vfio($pciid);
                } else {
                    die "can't unbind/bind to stub pci device '$pciid'\n"
                        if !pci_dev_bind_to_stub($info);
                }

                die "can't reset pci device '$pciid'\n"
                    if $info->{has_fl_reset} && !pci_dev_reset($info);
            }
        }

        PVE::Storage::activate_volumes($storecfg, $vollist);

        # no timeout when a state file is given, 30 otherwise
        eval {
            run_command($cmd, timeout => $statefile ? undef : 30, umask => 0077);
        };
        if (my $err = $@) {
            die "start failed: $err";
        }

        print "migration listens on $migrate_uri\n" if $migrate_uri;

        if ($statefile && $statefile ne 'tcp') {
            eval { vm_mon_cmd_nocheck($vmid, "cont"); };
            warn $@ if $@;
        }

        if ($migratedfrom) {

            eval { set_migration_caps($vmid); };
            warn $@ if $@;

            if ($spice_port) {
                print "spice listens on port $spice_port\n";
                if ($spice_ticket) {
                    vm_mon_cmd_nocheck($vmid, "set_password", protocol => 'spice', password => $spice_ticket);
                    vm_mon_cmd_nocheck($vmid, "expire_password", protocol => 'spice', time => "+30");
                }
            }

        } else {

            # balloon is configured unless it is explicitly set to 0
            if (!$statefile && (!defined($conf->{balloon}) || $conf->{balloon})) {
                vm_mon_cmd_nocheck($vmid, "balloon", value => $conf->{balloon}*1024*1024)
                    if $conf->{balloon};
                vm_mon_cmd_nocheck($vmid, 'qom-set',
                                   path => "machine/peripheral/balloon0",
                                   property => "guest-stats-polling-interval",
                                   value => 2);
            }
        }
    };

    lock_config($vmid, $start_locked);
}
4013
0eedc444
AD
# Run QMP command $execute with the named arguments %params on VM $vmid
# and return the result of vm_qmp_command().
sub vm_mon_cmd {
    my ($vmid, $execute, %params) = @_;

    return vm_qmp_command($vmid, { execute => $execute, arguments => \%params });
}
4020
# Same as vm_mon_cmd(), but passes a true $nocheck flag on to
# vm_qmp_command().
sub vm_mon_cmd_nocheck {
    my ($vmid, $execute, %params) = @_;

    return vm_qmp_command($vmid, { execute => $execute, arguments => \%params }, 1);
}
4027
# Send the QMP command $cmd ({ execute => ..., arguments => {...} }) to
# VM $vmid and return the client's result.
#
# A true 'timeout' entry inside the arguments is not sent to the VM; it is
# removed and used as the client timeout instead. $nocheck is passed on to
# check_running().
#
# If only the old '<vmid>.mon' monitor socket exists, commands without
# arguments are forwarded to vm_monitor_command(); commands with arguments
# are rejected.
#
# Any error is written to syslog and then re-thrown.
sub vm_qmp_command {
    my ($vmid, $cmd, $nocheck) = @_;

    my $res;

    my $timeout;
    if ($cmd->{arguments} && $cmd->{arguments}->{timeout}) {
        $timeout = delete $cmd->{arguments}->{timeout};
    }

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);
        my $sname = qmp_socket($vmid);
        if (-e $sname) { # test if VM is reasonably new and supports qmp/qga
            my $qmpclient = PVE::QMPClient->new();

            $res = $qmpclient->cmd($vmid, $cmd, $timeout);
        } elsif (-e "${var_run_tmpdir}/$vmid.mon") {
            # 'arguments' is optional - guard the dereference, otherwise a
            # command without arguments dies here with an unrelated
            # "undefined value as a HASH reference" error
            die "can't execute complex command on old monitor - stop/start your vm to fix the problem\n"
                if $cmd->{arguments} && scalar(%{$cmd->{arguments}});
            vm_monitor_command($vmid, $cmd->{execute}, $nocheck);
        } else {
            die "unable to open monitor socket\n";
        }
    };
    if (my $err = $@) {
        syslog("err", "VM $vmid qmp command failed - $err");
        die $err;
    }

    return $res;
}
4061
9df5cbcc
DM
# Execute the human monitor command line $cmdline on VM $vmid by wrapping
# it into the QMP 'human-monitor-command' command.
sub vm_human_monitor_command {
    my ($vmid, $cmdline) = @_;

    my %arguments = ('command-line' => $cmdline);

    return vm_qmp_command($vmid, {
        execute => 'human-monitor-command',
        arguments => \%arguments,
    });
}
4074
1e3baf05
DM
# Return the command line generated by config_to_command() for VM $vmid
# as a single string, arguments joined by one space.
sub vm_commandline {
    my ($storecfg, $vmid) = @_;

    my $conf = load_config($vmid);
    my $defaults = load_defaults();

    my $cmd = config_to_command($storecfg, $vmid, $conf, $defaults);

    return join(' ', @$cmd);
}
4086
# Send 'system_reset' to VM $vmid while holding the config lock.
# The config 'lock' setting is honoured unless $skiplock is set.
sub vm_reset {
    my ($vmid, $skiplock) = @_;

    my $reset_locked = sub {
        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        vm_mon_cmd($vmid, "system_reset");
    };

    lock_config($vmid, $reset_locked);
}
4099
# Return an array reference with all volume IDs used by $conf.
# Absolute paths and values that do not parse as a volume ID are left out.
sub get_vm_volumes {
    my ($conf) = @_;

    my @volids;

    foreach_volid($conf, sub {
        my ($volid, $is_cdrom) = @_;

        # absolute paths are not storage volumes
        return if $volid =~ m|^/|;

        my ($sid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        push @volids, $volid;
    });

    return \@volids;
}
4117
# Clean up after VM $vmid stopped: remove the fairsched group, deactivate
# the volumes of $conf (unless $keepActive is set) and unlink the runtime
# files below /var/run/qemu-server. Errors are only reported as warnings.
sub vm_stop_cleanup {
    my ($storecfg, $vmid, $conf, $keepActive) = @_;

    eval {
        fairsched_rmnod($vmid); # try to destroy group

        PVE::Storage::deactivate_volumes($storecfg, get_vm_volumes($conf))
            if !$keepActive;

        for my $suffix (qw(mon qmp pid vnc qga)) {
            unlink "/var/run/qemu-server/${vmid}.$suffix";
        }
    };
    warn $@ if $@; # avoid errors - just warn
}
4135
# Note: use $nocheck to skip tests if VM configuration file exists.
# We need that when migrating VMs to other nodes (files already moved)
# Note: we set $keepActive in vzdump stop mode - volumes need to stay active
#
# Stop VM $vmid. With $shutdown the guest is asked to power down
# ('guest-shutdown' if the agent is configured, else 'system_powerdown'),
# otherwise qemu is told to 'quit'. If the VM is still running after
# $timeout seconds (default: the 'down' value of the startup option for
# shutdowns, else 60) it is sent SIGTERM when $force is set, and SIGKILL
# after 10 more seconds; without $force the function dies instead.
# $force defaults to 1 for a plain stop.
#
# With $migratedfrom the process is simply sent SIGTERM (if running) and
# cleaned up, without taking the config lock.
sub vm_stop {
    my ($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive, $migratedfrom) = @_;

    $force = 1 if !defined($force) && !$shutdown;

    if ($migratedfrom) {
        my $pid = check_running($vmid, $nocheck, $migratedfrom);
        kill 15, $pid if $pid;
        my $conf = load_config($vmid, $migratedfrom);
        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive);
        return;
    }

    # Poll once per second until the VM is gone or $limit polls were done.
    # Returns true if the limit was reached.
    my $wait_timed_out = sub {
        my ($limit) = @_;

        my $elapsed = 0;
        while (($elapsed < $limit) && check_running($vmid, $nocheck)) {
            $elapsed++;
            sleep 1;
        }
        return $elapsed >= $limit;
    };

    lock_config($vmid, sub {

        my $pid = check_running($vmid, $nocheck);
        return if !$pid;

        my $conf;
        if (!$nocheck) {
            $conf = load_config($vmid);
            check_lock($conf) if !$skiplock;
            if (!defined($timeout) && $shutdown && $conf->{startup}) {
                my $opts = parse_startup($conf->{startup});
                $timeout = $opts->{down} if $opts->{down};
            }
        }

        $timeout = 60 if !defined($timeout);

        # select the QMP command used to stop the guest
        my $stop_cmd = "quit";
        if ($shutdown) {
            $stop_cmd = (!$nocheck && $conf->{agent}) ? "guest-shutdown" : "system_powerdown";
        }

        eval { vm_qmp_command($vmid, { execute => $stop_cmd }, $nocheck); };
        my $err = $@;

        if ($err) {
            die "VM quit/powerdown failed\n" if !$force;
            warn "VM quit/powerdown failed - terminating now with SIGTERM\n";
            kill 15, $pid;
        } elsif ($wait_timed_out->($timeout)) {
            die "VM quit/powerdown failed - got timeout\n" if !$force;
            warn "VM still running - terminating now with SIGTERM\n";
            kill 15, $pid;
        } else {
            # stopped within the timeout
            vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
            return;
        }

        # wait again
        if ($wait_timed_out->(10)) {
            warn "VM still running - terminating now with SIGKILL\n";
            kill 9, $pid;
            sleep 1;
        }

        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
    });
}
4227
# Pause VM $vmid (QMP 'stop') while holding the config lock.
# The config lock check is skipped with $skiplock or when the VM is
# locked for 'backup'.
sub vm_suspend {
    my ($vmid, $skiplock) = @_;

    my $suspend_locked = sub {
        my $conf = load_config($vmid);

        my $backup_locked = $conf->{lock} && $conf->{lock} eq 'backup';
        check_lock($conf) if !($skiplock || $backup_locked);

        vm_mon_cmd($vmid, "stop");
    };

    lock_config($vmid, $suspend_locked);
}
4240
# Resume VM $vmid (QMP 'cont') while holding the config lock.
# The config lock check is skipped with $skiplock or when the VM is
# locked for 'backup'.
sub vm_resume {
    my ($vmid, $skiplock) = @_;

    my $resume_locked = sub {
        my $conf = load_config($vmid);

        my $backup_locked = $conf->{lock} && $conf->{lock} eq 'backup';
        check_lock($conf) if !($skiplock || $backup_locked);

        vm_mon_cmd($vmid, "cont");
    };

    lock_config($vmid, $resume_locked);
}
4253
5fdbe4f0
DM
# Send key $key to VM $vmid while holding the config lock.
# $skiplock is accepted but not evaluated here.
sub vm_sendkey {
    my ($vmid, $skiplock, $key) = @_;

    my $sendkey_locked = sub {
        # the config is loaded but not inspected any further
        my $conf = load_config($vmid);

        # there is no qmp command, so we use the human monitor command
        vm_human_monitor_command($vmid, "sendkey $key");
    };

    lock_config($vmid, $sendkey_locked);
}
4265
# Destroy VM $vmid while holding the config lock.
# Dies if the VM is locked (unless $skiplock is set) or still running.
sub vm_destroy {
    my ($storecfg, $vmid, $skiplock) = @_;

    my $destroy_locked = sub {
        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        die "VM $vmid is running - destroy failed\n" if check_running($vmid);

        fairsched_rmnod($vmid); # try to destroy group
        destroy_vm($storecfg, $vmid);
    };

    lock_config($vmid, $destroy_locked);
}
4283
1e3baf05
DM
4284# pci helpers
4285
# Write $buf to $filename (opened in mode "w").
# Returns undef if the file cannot be opened, otherwise the result of
# the print call. The result of close() is not checked.
sub file_write {
    my ($filename, $buf) = @_;

    my $out = IO::File->new($filename, "w") or return undef;

    my $printed = print {$out} $buf;

    $out->close();

    return $printed;
}
4298
# Collect information about PCI device $name ('dddd:bb:ss.f', lower case
# hex) from sysfs.
#
# Returns a hash reference with the keys name, vendor, product (both
# without the leading '0x'), domain, bus, slot, func, irq and
# has_fl_reset, or undef if the name is malformed or one of the sysfs
# attributes cannot be read or has an unexpected format.
sub pci_device_info {
    my ($name) = @_;

    return undef if $name !~ m/^([a-f0-9]{4}):([a-f0-9]{2}):([a-f0-9]{2})\.([a-f0-9])$/;
    my ($domain, $bus, $slot, $func) = ($1, $2, $3, $4);

    my $sysdir = "$pcisysfs/devices/$name";

    my $irq = file_read_firstline("$sysdir/irq");
    return undef if !defined($irq) || $irq !~ m/^\d+$/;

    # the substitution strips the '0x' prefix and fails if it is missing
    my $vendor = file_read_firstline("$sysdir/vendor");
    return undef if !defined($vendor) || $vendor !~ s/^0x//;

    my $product = file_read_firstline("$sysdir/device");
    return undef if !defined($product) || $product !~ s/^0x//;

    return {
        name => $name,
        vendor => $vendor,
        product => $product,
        domain => $domain,
        bus => $bus,
        slot => $slot,
        func => $func,
        irq => $irq,
        has_fl_reset => -f "$sysdir/reset" || 0,
    };
}
4330
# Reset PCI device $dev (as returned by pci_device_info) by writing "1"
# to its sysfs 'reset' attribute. Returns the result of file_write().
sub pci_dev_reset {
    my ($dev) = @_;

    my $reset_attr = "$pcisysfs/devices/$dev->{name}/reset";

    return file_write($reset_attr, "1");
}
4340
# Bind PCI device $dev (as returned by pci_device_info) to the pci-stub
# driver. Returns true if the device shows up below the pci-stub driver
# directory afterwards (or was already there), undef on write failures.
sub pci_dev_bind_to_stub {
    my ($dev) = @_;

    my $name = $dev->{name};
    my $stub_dir = "$pcisysfs/drivers/pci-stub";

    # already bound?
    my $bound_dir = "$stub_dir/$name";
    return 1 if -d $bound_dir;

    # register the vendor/product id with pci-stub
    my $id = "$dev->{vendor} $dev->{product}";
    return undef if !file_write("$stub_dir/new_id", $id);

    # detach from the current driver; a failed write is only an error
    # if the unbind attribute exists
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    # bind explicitly if the device did not show up by itself
    return undef if !(-d $bound_dir) && !file_write("$stub_dir/bind", $name);

    return -d $bound_dir;
}
4364
000fc0a2
SP
# Bind PCI device $dev (as returned by pci_device_info) to the vfio-pci
# driver, trying to load the module first if its driver directory is
# missing. Returns true if the device shows up below the vfio-pci driver
# directory afterwards (or was already there), undef on write failures.
# Dies if the vfio-pci driver directory is not available.
sub pci_dev_bind_to_vfio {
    my ($dev) = @_;

    my $name = $dev->{name};
    my $vfio_dir = "$pcisysfs/drivers/vfio-pci";

    system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null") if !-d $vfio_dir;
    die "Cannot find vfio-pci module!\n" if !-d $vfio_dir;

    # already bound?
    my $bound_dir = "$vfio_dir/$name";
    return 1 if -d $bound_dir;

    # register the vendor/product id with vfio-pci
    my $id = "$dev->{vendor} $dev->{product}";
    return undef if !file_write("$vfio_dir/new_id", $id);

    # detach from the current driver; a failed write is only an error
    # if the unbind attribute exists
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    # bind explicitly if the device did not show up by itself
    return undef if !(-d $bound_dir) && !file_write("$vfio_dir/bind", $name);

    return -d $bound_dir;
}
4395
# Bind every device in the IOMMU group of PCI device $pciid ('bb:ss.f',
# domain 0000 is assumed) to the vfio-pci driver.
#
# Returns 1 on success. Dies if the vfio-pci driver directory is not
# available, the IOMMU group cannot be read, a group member has an invalid
# name, no device info can be read for it, or it cannot be bound.
sub pci_dev_group_bind_to_vfio {
    my ($pciid) = @_;

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    if (!-d $vfio_basedir) {
        system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null");
    }
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    # get IOMMU group devices
    opendir(my $D, "$pcisysfs/devices/0000:$pciid/iommu_group/devices/") || die "Cannot open iommu_group: $!\n";
    my @devs = grep /^0000:/, readdir($D);
    closedir($D);

    foreach my $member (@devs) {
        $member =~ m/^([:\.\da-f]+)$/ or die "PCI ID $member not valid!\n";
        my $info = pci_device_info($1);

        # Without this check an undef $info results in an empty device
        # name, and the "already bound" test in pci_dev_bind_to_vfio()
        # then matches the driver directory itself and reports success.
        die "no pci device info for device '$member'\n" if !$info;

        pci_dev_bind_to_vfio($info) || die "Cannot bind $member to vfio\n";
    }

    return 1;
}
4419
# Return the ",bus=pci.<bus>,addr=<hex addr>" option suffix for the
# device with the given $id, or an empty string for unknown ids.
# If $bridges is passed, the bus number used is recorded in that hash.
sub print_pci_addr {
    my ($id, $bridges) = @_;

    # fixed slot assignment: id => [bus, addr]
    my %slot_of = (
        piix3    => [0, 1],
        # addr 2 : first videocard
        balloon0 => [0, 3],
        watchdog => [0, 4],
        scsihw0  => [0, 5],
        scsihw1  => [0, 6],
        ahci0    => [0, 7],
        qga0     => [0, 8],
        spice    => [0, 9],
        hostpci0 => [0, 16],
        hostpci1 => [0, 17],
        hostpci2 => [0, 27],
        hostpci3 => [0, 28],
        # addr 29 : usb-host (pve-usb.cfg)
        'pci.1'  => [0, 30],
        'pci.2'  => [0, 31],
    );

    # numbered device families on bus 0
    $slot_of{"virtio$_"} = [0, 10 + $_] for 0 .. 5;   # addr 10-15
    $slot_of{"net$_"}    = [0, 18 + $_] for 0 .. 5;   # addr 18-23
    $slot_of{"vga$_"}    = [0, 23 + $_] for 1 .. 3;   # addr 24-26

    # remaining network devices on bus 1, virtio devices on bus 2
    $slot_of{"net$_"}    = [1, $_ - 5] for 6 .. 31;   # addr 1-26
    $slot_of{"virtio$_"} = [2, $_ - 5] for 6 .. 15;   # addr 1-10

    my $slot = $slot_of{$id};
    return '' if !$slot;

    my ($bus, $addr) = @$slot;
    $bridges->{$bus} = 1 if $bridges;

    return sprintf(",bus=pci.%s,addr=0x%x", $bus, $addr);
}
4503
2e3b7e2a
AD
# Return the ",bus=<pcie port>,addr=0x0" option suffix for the hostpci
# device with the given $id, or an empty string for unknown ids.
sub print_pcie_addr {
    my ($id) = @_;

    # each hostpci device gets its own PCIe root port, always at addr 0
    my %port_of = (
        hostpci0 => "ich9-pcie-port-1",
        hostpci1 => "ich9-pcie-port-2",
        hostpci2 => "ich9-pcie-port-3",
        hostpci3 => "ich9-pcie-port-4",
    );

    my $port = $port_of{$id};
    return '' if !defined($port);

    return sprintf(",bus=%s,addr=0x%x", $port, 0);
}
4523
3e16d5fc
DM
4524# vzdump restore implementation
4525
# Return the name of the first member of tar archive $archive.
#
# Runs 'tar tf' and reads only the first line of its output; the tar
# process is terminated afterwards. Dies if the archive does not exist,
# tar cannot be started, or no member name is read.
sub tar_archive_read_firstfile {
    my $archive = shift;

    die "ERROR: file '$archive' does not exist\n" if ! -f $archive;

    # try to detect archive type first
    # List-form pipe open: the archive name is passed to tar as a single
    # argument and never interpreted by a shell.
    my $pid = open(my $tar_fh, '-|', 'tar', 'tf', $archive) ||
        die "unable to open file '$archive'\n";
    my $firstfile = <$tar_fh>;
    kill 15, $pid; # we only need the first line
    close $tar_fh;

    die "ERROR: archive contaions no data\n" if !$firstfile;
    chomp $firstfile;

    return $firstfile;
}
4543
ed221350
DM
# Remove the temporary volumes recorded in $statfile after a failed
# restore.
#
# Every line matching 'vzdump:<name>:<volid>' names one volume: absolute
# paths are unlinked, everything else is freed with
# PVE::Storage::vdisk_free(). Progress and errors are reported on STDERR;
# a failure for one volume does not stop the cleanup of the others.
# Nothing happens if $statfile cannot be opened.
sub tar_restore_cleanup {
    my ($storecfg, $statfile) = @_;

    print STDERR "starting cleanup\n";

    if (my $fd = IO::File->new($statfile, "r")) {
        while (defined(my $line = <$fd>)) {
            if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                my $volid = $2;
                eval {
                    if ($volid =~ m|^/|) {
                        # parentheses are required: "unlink $volid || die"
                        # applies '||' to $volid and never reports a failure
                        unlink($volid) || die "unlink failed - $!\n";
                    } else {
                        PVE::Storage::vdisk_free($storecfg, $volid);
                    }
                    print STDERR "temporary volume '$volid' sucessfuly removed\n";
                };
                print STDERR "unable to cleanup '$volid' - $@" if $@;
            } else {
                print STDERR "unable to parse line in statfile - $line";
            }
        }
        $fd->close();
    }
}
4569
# Restore VM $vmid from $archive on behalf of $user.
#
# The archive format ('tar' or 'vma') is taken from $opts->{format} if
# set, otherwise it is derived from the file name extension, with 'vma'
# as the default. The compression ('gzip' or 'lzop') is always derived
# from the extension. 'tar' archives are handed to restore_tar_archive(),
# everything else to restore_vma_archive() together with the detected
# compression.
sub restore_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    my $format = $opts->{format};
    my $comp;

    if ($archive =~ m/\.tgz$/ || $archive =~ m/\.tar\.gz$/) {
        $format = 'tar' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.tar$/) {
        $format = 'tar' if !$format;
    } elsif ($archive =~ m/\.tar\.lzo$/) {
        # dots are escaped so that only a real '.tar.lzo' suffix matches
        $format = 'tar' if !$format;
        $comp = 'lzop';
    } elsif ($archive =~ m/\.vma$/) {
        $format = 'vma' if !$format;
    } elsif ($archive =~ m/\.vma\.gz$/) {
        $format = 'vma' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.vma\.lzo$/) {
        $format = 'vma' if !$format;
        $comp = 'lzop';
    } else {
        $format = 'vma' if !$format; # default
    }

    # try to detect archive format
    if ($format eq 'tar') {
        return restore_tar_archive($archive, $vmid, $user, $opts);
    } else {
        return restore_vma_archive($archive, $vmid, $user, $opts, $comp);
    }
}
4603
# Rewrite a single line of an archived VM config for the restored VM and
# print the result to $outfd.
#
#  - dump markers and 'lock', 'unusedN', 'parent' and 'template' entries
#    are dropped
#  - old 'vlanN' entries are converted to 'netN' entries, numbered by
#    $cookie->{netcount}
#  - with $unique, 'netN' entries get a new random MAC address
#  - drive entries containing 'backup=no' are commented out; drives
#    listed in $map are pointed at the mapped volume
#  - every other line is copied unchanged
sub restore_update_config_line {
    my ($outfd, $cookie, $vmid, $map, $line, $unique) = @_;

    # lines which never make it into the restored config
    return if $line =~ m/^\#qmdump\#/;
    return if $line =~ m/^\#vzdump\#/;
    foreach my $dropped (qr/^lock:/, qr/^unused\d+:/, qr/^parent:/) {
        return if $line =~ $dropped;
    }
    return if $line =~ m/^template:/; # restored VM is never a template

    if (($line =~ m/^(vlan(\d+)):\s*(\S+)\s*$/)) {
        # try to convert old 1.X settings
        my ($id, $ind, $ethcfg) = ($1, $2, $3);
        foreach my $devconfig (PVE::Tools::split_list($ethcfg)) {
            my ($model, $macaddr) = split(/\=/, $devconfig);
            $macaddr = PVE::Tools::random_ether_addr() if !$macaddr || $unique;

            my $netstr = print_net({
                model => $model,
                bridge => "vmbr$ind",
                macaddr => $macaddr,
            });

            print $outfd "net$cookie->{netcount}: $netstr\n";
            $cookie->{netcount}++;
        }
    } elsif (($line =~ m/^(net\d+):\s*(\S+)\s*$/) && $unique) {
        my ($id, $netstr) = ($1, $2);
        my $net = parse_net($netstr);
        $net->{macaddr} = PVE::Tools::random_ether_addr() if $net->{macaddr};
        $netstr = print_net($net);
        print $outfd "$id: $netstr\n";
    } elsif ($line =~ m/^((ide|scsi|virtio|sata)\d+):\s*(\S+)\s*$/) {
        my ($virtdev, $value) = ($1, $3);
        if ($line =~ m/backup=no/) {
            # drive was not part of the backup - keep it as comment only
            print $outfd "#$line";
        } elsif ($virtdev && $map->{$virtdev}) {
            my $di = parse_drive($virtdev, $value);
            delete $di->{format}; # format can change on restore
            $di->{file} = $map->{$virtdev};
            $value = print_drive($vmid, $di);
            print $outfd "$virtdev: $value\n";
        } else {
            print $outfd $line;
        }
    } else {
        print $outfd $line;
    }
}
4654
# List the volumes of VM $vmid on all storages of $cfg.
# Returns a hash reference mapping each volume ID to its vdisk_list()
# entry, extended by the volume's 'path'. Entries without volid or size
# are ignored.
sub scan_volids {
    my ($cfg, $vmid) = @_;

    my $info = PVE::Storage::vdisk_list($cfg, undef, $vmid);

    my %item_of;
    for my $volumes (values %$info) {
        for my $vol (@$volumes) {
            next if !($vol->{volid} && $vol->{size});
            $vol->{path} = PVE::Storage::path($cfg, $vol->{volid});
            $item_of{$vol->{volid}} = $vol;
        }
    }

    return \%item_of;
}
4671
a8e2f942
DM
# Count how often each disk path is referenced by the drives of $conf.
#
# Returns a hash reference mapping a path to its reference count. Cdrom
# drives are ignored, as are volumes whose storage is not configured.
# $skip_drive names a drive of the current config to leave out. With
# $scan_snapshots the drives of all snapshots are counted too (without
# skipping any drive).
sub get_used_paths {
    my ($vmid, $storecfg, $conf, $scan_snapshots, $skip_drive) = @_;

    my %refcount;

    my $count_drives = sub {
        my ($section, $snapname) = @_;

        foreach my $key (keys %$section) {
            next if !valid_drivename($key);
            next if $skip_drive && $key eq $skip_drive;

            my $drive = parse_drive($key, $section->{$key});
            next if !$drive || !$drive->{file} || drive_is_cdrom($drive);

            my $file = $drive->{file};
            if ($file =~ m!^/!) {
                # absolute path - used as is
                $refcount{$file}++;
                next;
            }

            my ($storeid, $volname) = PVE::Storage::parse_volume_id($file, 1);
            next if !$storeid;
            next if !PVE::Storage::storage_config($storecfg, $storeid, 1);

            my $path = PVE::Storage::path($storecfg, $file, $snapname);
            $refcount{$path}++;
        }
    };

    $count_drives->($conf);

    # the skipped drive only applies to the current config
    undef $skip_drive;

    if ($scan_snapshots) {
        foreach my $snapname (keys %{$conf->{snapshots}}) {
            $count_drives->($conf->{snapshots}->{$snapname}, $snapname);
        }
    }

    return \%refcount;
}
4712
91bd6c90
DM
# Synchronize the drive entries of $conf with the volumes found on the
# storages ($volid_hash, as returned by scan_volids).
#
#  - the 'size' of every non-cdrom drive with a known volume is updated
#  - 'unusedN' entries pointing to a volume that is in use are removed
#  - volumes not referenced by any drive are added as unused volumes
#    (VM state volumes are left out)
#
# $conf is modified in place. Returns 1 if anything changed, undef
# otherwise.
sub update_disksize {
    my ($vmid, $conf, $volid_hash) = @_;

    my $changes;

    my $used = {};

    # Note: it is allowed to define multiple storages with same path (alias), so
    # we need to check both 'volid' and real 'path' (two different volid can point
    # to the same path).

    my $usedpath = {};

    # update size info
    foreach my $opt (keys %$conf) {
        next if !valid_drivename($opt);

        my $drive = parse_drive($opt, $conf->{$opt});
        my $volid = $drive->{file};
        next if !$volid;

        $used->{$volid} = 1;
        if ($volid_hash->{$volid} &&
            (my $path = $volid_hash->{$volid}->{path})) {
            $usedpath->{$path} = 1;
        }

        next if drive_is_cdrom($drive);
        next if !$volid_hash->{$volid};

        $drive->{size} = $volid_hash->{$volid}->{size};
        my $new = print_drive($vmid, $drive);
        if ($new ne $conf->{$opt}) {
            $changes = 1;
            $conf->{$opt} = $new;
        }
    }

    # remove 'unusedX' entry if volume is used
    foreach my $opt (keys %$conf) {
        next if $opt !~ m/^unused\d+$/;
        my $volid = $conf->{$opt};

        # no "my ... if ...;" here - a conditionally executed 'my' has
        # undefined behaviour
        my $info = $volid_hash->{$volid};
        my $path = $info ? $info->{path} : undef;

        if ($used->{$volid} || ($path && $usedpath->{$path})) {
            $changes = 1;
            delete $conf->{$opt};
        }
    }

    # register volumes which are not referenced at all
    foreach my $volid (sort keys %$volid_hash) {
        next if $volid =~ m/vm-$vmid-state-/;
        next if $used->{$volid};
        my $path = $volid_hash->{$volid}->{path};
        next if !$path; # just to be sure
        next if $usedpath->{$path};
        $changes = 1;
        add_unused_volume($conf, $volid);
        $usedpath->{$path} = 1; # avoid to add more than once (aliases)
    }

    return $changes;
}
4775
# Rescan the storages and update disk sizes and unused volumes in the
# configuration of VM $vmid, or of all VMs if $vmid is undefined.
# The config lock is taken for each VM unless $nolock is set; a VM with
# a 'lock' setting makes check_lock() die.
sub rescan {
    my ($vmid, $nolock) = @_;

    my $cfg = PVE::Cluster::cfs_read_file("storage.cfg");

    my $volid_hash = scan_volids($cfg, $vmid);

    my $update_vm = sub {
        my ($id) = @_;

        my $conf = load_config($id);

        check_lock($conf);

        # only look at volumes owned by this VM
        my $vm_volids = {};
        foreach my $volid (keys %$volid_hash) {
            my $info = $volid_hash->{$volid};
            $vm_volids->{$volid} = $info if $info->{vmid} && $info->{vmid} == $id;
        }

        my $changes = update_disksize($id, $conf, $vm_volids);

        update_config_nolock($id, $conf, 1) if $changes;
    };

    my @vmids = defined($vmid) ? ($vmid) : keys %{config_list()};

    foreach my $id (@vmids) {
        if ($nolock) {
            $update_vm->($id);
        } else {
            lock_config($id, $update_vm, $id);
        }
    }
}
4818
# Restore VM $vmid from a VMA archive.
#
# Parameters:
#   $archive - path of the archive, or '-' to read it from STDIN
#   $vmid    - ID of the VM whose config/volumes get (re)created
#   $user    - user doing the restore; everybody except 'root@pam' needs
#              'Datastore.AllocateSpace' on each target storage
#   $opts    - hash ref; keys read here: storage, pool, unique
#   $comp    - optional archive compression, 'gzip' or 'lzop'
#
# Dies on error, after removing the temporary directory, the temporary
# config file and every volume that was already allocated for the restore.
sub restore_vma_archive {
    my ($archive, $vmid, $user, $opts, $comp) = @_;

    my $input = $archive eq '-' ? "<&STDIN" : undef;
    my $readfrom = $archive;

    my $uncomp = '';
    if ($comp) {
        # decompress through a pipe and let vma read from its STDIN
        $readfrom = '-';
        my $qarchive = PVE::Tools::shellquote($archive);
        if ($comp eq 'gzip') {
            $uncomp = "zcat $qarchive|";
        } elsif ($comp eq 'lzop') {
            $uncomp = "lzop -d -c $qarchive|";
        } else {
            die "unknown compression method '$comp'\n";
        }
    }

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    rmtree $tmpdir;

    # disable interrupts (always do cleanups)
    local $SIG{INT} = $SIG{TERM} = $SIG{QUIT} = $SIG{HUP} = sub {
        warn "got interrupt - ignored\n";
    };

    # fifo used to pass the device map to 'vma extract -r'
    my $mapfifo = "/var/tmp/vzdumptmp$$.fifo";
    POSIX::mkfifo($mapfifo, 0600);
    my $fifofh;

    my $openfifo = sub {
        open($fifofh, '>', $mapfifo) || die $!;
    };

    my $cmd = "${uncomp}vma extract -v -r $mapfifo $readfrom $tmpdir";

    my $oldtimeout;
    my $timeout = 5;

    # devname => { size, dev_id, ... }, filled from the 'DEV:' lines of vma
    my $devinfo = {};

    my $rpcenv = PVE::RPCEnvironment::get();

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # Note: $oldconf is undef if VM does not exists
    my $oldconf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid));

    # Reads the extracted qemu-server.conf, allocates the target volumes,
    # writes the device map to the fifo and creates the new temporary config.
    my $print_devmap = sub {
        my $virtdev_hash = {};

        my $cfgfn = "$tmpdir/qemu-server.conf";

        # we can read the config - that is already extracted
        my $fh = IO::File->new($cfgfn, "r") ||
            die "unable to read qemu-server.conf - $!\n";

        while (defined(my $line = <$fh>)) {
            if ($line =~ m/^\#qmdump\#map:(\S+):(\S+):(\S*):(\S*):$/) {
                my ($virtdev, $devname, $storeid, $format) = ($1, $2, $3, $4);
                die "archive does not contain data for drive '$virtdev'\n"
                    if !$devinfo->{$devname};
                if (defined($opts->{storage})) {
                    $storeid = $opts->{storage} || 'local';
                } elsif (!$storeid) {
                    $storeid = 'local';
                }
                $format = 'raw' if !$format;
                $devinfo->{$devname}->{devname} = $devname;
                $devinfo->{$devname}->{virtdev} = $virtdev;
                $devinfo->{$devname}->{format} = $format;
                $devinfo->{$devname}->{storeid} = $storeid;

                # check permission on storage
                my $pool = $opts->{pool}; # todo: do we need that?
                if ($user ne 'root@pam') {
                    $rpcenv->check($user, "/storage/$storeid", ['Datastore.AllocateSpace']);
                }

                $virtdev_hash->{$virtdev} = $devinfo->{$devname};
            }
        }

        foreach my $devname (keys %$devinfo) {
            die "found no device mapping information for device '$devname'\n"
                if !$devinfo->{$devname}->{virtdev};
        }

        my $cfg = cfs_read_file('storage.cfg');

        # create empty/temp config
        if ($oldconf) {
            PVE::Tools::file_set_contents($conffile, "memory: 128\n");
            foreach_drive($oldconf, sub {
                my ($ds, $drive) = @_;

                return if drive_is_cdrom($drive);

                my $volid = $drive->{file};

                return if !$volid || $volid =~ m|^/|;

                my ($path, $owner) = PVE::Storage::path($cfg, $volid);
                return if !$path || !$owner || ($owner != $vmid);

                # Note: only delete disk we want to restore
                # other volumes will become unused
                if ($virtdev_hash->{$ds}) {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
            });
        }

        my $map = {};
        foreach my $virtdev (sort keys %$virtdev_hash) {
            my $d = $virtdev_hash->{$virtdev};
            my $alloc_size = int(($d->{size} + 1024 - 1)/1024);
            my $scfg = PVE::Storage::storage_config($cfg, $d->{storeid});

            # test if requested format is supported
            my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($cfg, $d->{storeid});
            my $supported = grep { $_ eq $d->{format} } @$validFormats;
            $d->{format} = $defFormat if !$supported;

            my $volid = PVE::Storage::vdisk_alloc($cfg, $d->{storeid}, $vmid,
                                                  $d->{format}, undef, $alloc_size);
            print STDERR "new volume ID is '$volid'\n";
            # remembered so that the error path below can free the volume again
            $d->{volid} = $volid;
            my $path = PVE::Storage::path($cfg, $volid);

            my $write_zeros = 1;
            # fixme: what other storages types initialize volumes with zero?
            if ($scfg->{type} eq 'dir' || $scfg->{type} eq 'nfs' || $scfg->{type} eq 'glusterfs' ||
                $scfg->{type} eq 'sheepdog' || $scfg->{type} eq 'rbd') {
                $write_zeros = 0;
            }

            print $fifofh "${write_zeros}:$d->{devname}=$path\n";

            print "map '$d->{devname}' to '$path' (write zeros = ${write_zeros})\n";
            $map->{$virtdev} = $volid;
        }

        # second pass over the archived config: write the new VM config
        $fh->seek(0, 0) || die "seek failed - $!\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined(my $line = <$fh>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $fh->close();
        $outfd->close();
    };

    eval {
        # enable interrupts
        local $SIG{INT} = $SIG{TERM} = $SIG{QUIT} = $SIG{HUP} = $SIG{PIPE} = sub {
            die "interrupted by signal\n";
        };
        local $SIG{ALRM} = sub { die "got timeout\n"; };

        $oldtimeout = alarm($timeout);

        my $parser = sub {
            my $line = shift;

            print "$line\n";

            if ($line =~ m/^DEV:\sdev_id=(\d+)\ssize:\s(\d+)\sdevname:\s(\S+)$/) {
                my ($dev_id, $size, $devname) = ($1, $2, $3);
                $devinfo->{$devname} = { size => $size, dev_id => $dev_id };
            } elsif ($line =~ m/^CTIME: /) {
                # we correctly received the vma config, so we can disable
                # the timeout now for disk allocation (set to 10 minutes, so
                # that we always timeout if something goes wrong)
                alarm(600);
                $print_devmap->();
                print $fifofh "done\n";
                my $tmp = $oldtimeout || 0;
                $oldtimeout = undef;
                alarm($tmp);
                close($fifofh);
            }
        };

        print "restore vma archive: $cmd\n";
        run_command($cmd, input => $input, outfunc => $parser, afterfork => $openfifo);
    };
    my $err = $@;

    alarm($oldtimeout) if $oldtimeout;

    unlink $mapfifo;

    if ($err) {
        rmtree $tmpdir;
        unlink $tmpfn;

        # free everything we allocated so far
        my $cfg = cfs_read_file('storage.cfg');
        foreach my $devname (keys %$devinfo) {
            my $volid = $devinfo->{$devname}->{volid};
            next if !$volid;
            eval {
                if ($volid =~ m|^/|) {
                    # parenthesized so that '||' tests the result of unlink
                    unlink($volid) || die "unlink failed\n";
                } else {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
                print STDERR "temporary volume '$volid' sucessfuly removed\n";
            };
            print STDERR "unable to cleanup '$volid' - $@" if $@;
        }
        die $err;
    }

    rmtree $tmpdir;

    rename($tmpfn, $conffile) ||
        die "unable to commit configuration file '$conffile'\n";

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
5050
# Restore VM $vmid from a (legacy) tar based vzdump archive.
#
# Parameters:
#   $archive - path of the archive, or '-' to read it from STDIN
#   $vmid    - ID of the VM to restore
#   $user    - exported to the extract helper as VZDUMP_USER
#   $opts    - hash ref; keys read here: storage, pool, prealloc, info, unique
#
# The archive is unpacked with tar, which pipes every member to
# /usr/lib/qemu-server/qmextract. Dies on error after removing the temporary
# config file and calling tar_restore_cleanup() (skipped in info mode).
sub restore_tar_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    if ($archive ne '-') {
        my $firstfile = tar_archive_read_firstfile($archive);
        die "ERROR: file '$archive' does not look like a QemuServer vzdump backup\n"
            if $firstfile ne 'qemu-server.conf';
    }

    my $storecfg = cfs_read_file('storage.cfg');

    # destroy existing data - keep empty config
    my $vmcfgfn = config_file($vmid);
    destroy_vm($storecfg, $vmid, 1) if -f $vmcfgfn;

    my $tocmd = "/usr/lib/qemu-server/qmextract";

    $tocmd .= " --storage " . PVE::Tools::shellquote($opts->{storage}) if $opts->{storage};
    $tocmd .= " --pool " . PVE::Tools::shellquote($opts->{pool}) if $opts->{pool};
    $tocmd .= ' --prealloc' if $opts->{prealloc};
    $tocmd .= ' --info' if $opts->{info};

    # tar option "xf" does not autodetect compression when read from STDIN,
    # so we pipe to zcat
    my $cmd = "zcat -f|tar xf " . PVE::Tools::shellquote($archive) . " " .
        PVE::Tools::shellquote("--to-command=$tocmd");

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    mkpath $tmpdir;

    local $ENV{VZDUMP_TMPDIR} = $tmpdir;
    local $ENV{VZDUMP_VMID} = $vmid;
    local $ENV{VZDUMP_USER} = $user;

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # disable interrupts (always do cleanups)
    local $SIG{INT} = $SIG{TERM} = $SIG{QUIT} = $SIG{HUP} = sub {
        print STDERR "got interrupt - ignored\n";
    };

    eval {
        # enable interrupts
        local $SIG{INT} = $SIG{TERM} = $SIG{QUIT} = $SIG{HUP} = $SIG{PIPE} = sub {
            die "interrupted by signal\n";
        };

        if ($archive eq '-') {
            print "extracting archive from STDIN\n";
            run_command($cmd, input => "<&STDIN");
        } else {
            print "extracting archive '$archive'\n";
            run_command($cmd);
        }

        # info mode: nothing is restored, so no new config gets written
        return if $opts->{info};

        # read new mapping
        my $map = {};
        my $statfile = "$tmpdir/qmrestore.stat";
        if (my $fd = IO::File->new($statfile, "r")) {
            while (defined (my $line = <$fd>)) {
                if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                    $map->{$1} = $2 if $1;
                } else {
                    print STDERR "unable to parse line in statfile - $line\n";
                }
            }
            $fd->close();
        }

        my $confsrc = "$tmpdir/qemu-server.conf";

        my $srcfd = IO::File->new($confsrc, "r") ||
            die "unable to open file '$confsrc'\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined (my $line = <$srcfd>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $srcfd->close();
        $outfd->close();
    };
    my $err = $@;

    if ($err) {

        unlink $tmpfn;

        tar_restore_cleanup($storecfg, "$tmpdir/qmrestore.stat") if !$opts->{info};

        die $err;
    }

    rmtree $tmpdir;

    # In info mode the eval above returns before $tmpfn is written, so there
    # is nothing to commit. The parentheses are required: without them '||'
    # binds to $conffile and a failed rename goes unnoticed.
    if (!$opts->{info}) {
        rename($tmpfn, $conffile) ||
            die "unable to commit configuration file '$conffile'\n";
    }

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
5160
0d18dcfc
DM
5161
5162# Internal snapshots
5163
# NOTE: Snapshot create/delete involves several non-atomic
# actions, and can take a long time.
# So we try to avoid locking the file and use the 'lock' variable
# inside the config file instead.
5168
ef59d1ca
DM
# Copy all settings from $source into $dest (both hash refs), leaving out
# snapshot bookkeeping, lock, digest, description and unusedN entries.
my $snapshot_copy_config = sub {
    my ($source, $dest) = @_;

    my %skip = map { $_ => 1 }
        qw(snapshots snapstate snaptime vmstate lock digest description);

    foreach my $key (keys %$source) {
        next if $skip{$key} || $key =~ m/^unused\d+$/;

        $dest->{$key} = $source->{$key};
    }
};
5185
# Build and return a new config hash: the snapshot list, description and
# unusedN entries come from $conf, everything else is copied from $snap
# via $snapshot_copy_config.
my $snapshot_apply_config = sub {
    my ($conf, $snap) = @_;

    # copy snapshot list
    my $result = { snapshots => $conf->{snapshots} };

    # keep description and list of unused disks
    my @kept = grep { $_ =~ m/^unused\d+$/ || $_ eq 'description' } keys %$conf;
    foreach my $key (@kept) {
        $result->{$key} = $conf->{$key};
    }

    $snapshot_copy_config->($snap, $result);

    return $result;
};
5204
18bfb361
DM
# Call $func->($storeid) once for every storage referenced by a non-cdrom
# drive of $conf, in sorted storage ID order.
sub foreach_writable_storage {
    my ($conf, $func) = @_;

    my %seen;

    foreach my $key (keys %$conf) {
        next unless valid_drivename($key);

        my $drive = parse_drive($key, $conf->{$key});
        next if !$drive;
        next if drive_is_cdrom($drive);

        # second argument 1: as used by the original, presumably "no error" mode
        my ($storeid) = PVE::Storage::parse_volume_id($drive->{file}, 1);
        $seen{$storeid} = $storeid if $storeid;
    }

    foreach my $storeid (sort keys %seen) {
        $func->($storeid);
    }
}
5227
# Allocate a raw volume named "vm-$vmid-state-$snapname" to hold the VM state
# of a snapshot and return its volume ID.
my $alloc_vmstate_volid = sub {
    my ($storecfg, $vmid, $conf, $snapname) = @_;

    # Note: we try to be smart when selecting a $target storage

    my $target;

    # Scan the storages used by the VM disks; consider only shared ones when
    # $want_shared is true, only non-shared ones otherwise.
    my $search = sub {
        my ($want_shared) = @_;

        foreach_writable_storage($conf, sub {
            my ($sid) = @_;
            my $scfg = PVE::Storage::storage_config($storecfg, $sid);
            return if $want_shared ? !$scfg->{shared} : $scfg->{shared};

            # prefer file based storage
            $target = $sid if !$target || $scfg->{path};
        });
    };

    # search shared storage first
    $search->(1);

    # now search local storage
    $search->(0) if !$target;

    $target = 'local' if !$target;

    # Extra room for the driver state.
    # NOTE(review): the previous comment here said "assume 32MB is enough",
    # but the value is 500 - confirm which one is intended.
    my $driver_state_size = 500;
    # we abort live save after $conf->{memory}, so we need at max twice that space
    my $size = $conf->{memory}*2 + $driver_state_size;

    my $name = "vm-$vmid-state-$snapname";
    my $scfg = PVE::Storage::storage_config($storecfg, $target);
    $name .= ".raw" if $scfg->{path}; # add filename extension for file base storage

    return PVE::Storage::vdisk_alloc($storecfg, $target, $vmid, 'raw', $name, $size*1024);
};
5268
# First phase of snapshot creation: under the config lock, set lock
# 'snapshot', add a snapshot entry in state 'prepare' (optionally with a
# freshly allocated vmstate volume) and write the config.
# Returns the new snapshot entry (hash ref).
my $snapshot_prepare = sub {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap;

    my $prepare_locked = sub {

        my $conf = load_config($vmid);

        if (is_template($conf)) {
            die "you can't take a snapshot if it's a template\n";
        }

        check_lock($conf);

        $conf->{lock} = 'snapshot';

        if (defined($conf->{snapshots}->{$snapname})) {
            die "snapshot name '$snapname' already used\n";
        }

        my $storecfg = PVE::Storage::config();
        if (!has_feature('snapshot', $conf, $storecfg)) {
            die "snapshot feature is not available";
        }

        $snap = {};
        $conf->{snapshots}->{$snapname} = $snap;

        # the state volume is only allocated for a running VM
        if ($save_vmstate && check_running($vmid)) {
            $snap->{vmstate} = $alloc_vmstate_volid->($storecfg, $vmid, $conf, $snapname);
        }

        $snapshot_copy_config->($conf, $snap);

        $snap->{snapstate} = "prepare";
        $snap->{snaptime} = time();
        $snap->{description} = $comment if $comment;

        # always overwrite machine if we save vmstate. This makes sure we
        # can restore it later using correct machine type
        if ($snap->{vmstate}) {
            $snap->{machine} = get_current_qemu_machine($vmid);
        }

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $prepare_locked);

    return $snap;
};
5314
# Final phase of snapshot creation: under the config lock, verify the
# 'snapshot' lock and the 'prepare' state, clear both, and write a config
# built from the snapshot with 'parent' pointing to $snapname.
my $snapshot_commit = sub {
    my ($vmid, $snapname) = @_;

    my $commit_locked = sub {

        my $conf = load_config($vmid);

        my $lock = $conf->{lock};
        die "missing snapshot lock\n" if !($lock && $lock eq 'snapshot');

        # remember whether 'machine' was set before the snapshot was applied
        my $had_machine = defined($conf->{machine});

        my $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        my $state = $snap->{snapstate};
        die "wrong snapshot state\n" if !($state && $state eq "prepare");

        delete $snap->{snapstate};
        delete $conf->{lock};

        my $newconf = $snapshot_apply_config->($conf, $snap);

        delete $newconf->{machine} if !$had_machine;

        $newconf->{parent} = $snapname;

        update_config_nolock($vmid, $newconf, 1);
    };

    lock_config($vmid, $commit_locked);
};
5348
22c377f0
DM
# Roll VM $vmid back to snapshot $snapname.
#
# Runs in three steps: a locked "prepare" pass (stop the VM, set lock
# 'rollback'), the rollback of every non-cdrom volume of the snapshot, and
# a second locked pass that applies the snapshot config, removes the lock
# and - if the snapshot has a vmstate - starts the VM from it.
sub snapshot_rollback {
    my ($vmid, $snapname) = @_;

    my $snap;

    # toggled to 0 before the second locked pass
    my $prepare = 1;

    my $storecfg = PVE::Storage::config();

    my $updatefn = sub {

        my $conf = load_config($vmid);

        die "you can't rollback if vm is a template\n" if is_template($conf);

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        die "unable to rollback to incomplete snapshot (snapstate = $snap->{snapstate})\n"
            if $snap->{snapstate};

        if ($prepare) {
            check_lock($conf);
            vm_stop($storecfg, $vmid, undef, undef, 5, undef, undef);
        }

        die "unable to rollback vm $vmid: vm is running\n"
            if check_running($vmid);

        my $forcemachine;

        if ($prepare) {
            $conf->{lock} = 'rollback';
        } else {
            die "got wrong lock\n" if !($conf->{lock} && $conf->{lock} eq 'rollback');
            delete $conf->{lock};

            my $had_machine = defined($conf->{machine});

            # copy snapshot config to current config
            $conf = $snapshot_apply_config->($conf, $snap);
            $conf->{parent} = $snapname;

            # Note: old code did not store 'machine', so we try to be smart
            # and guess the snapshot was generated with kvm 1.4 (pc-i440fx-1.4).
            $forcemachine = $conf->{machine} || 'pc-i440fx-1.4';
            # we remove the 'machine' configuration if not explicitly specified
            # in the original config.
            delete $conf->{machine} if $snap->{vmstate} && !$had_machine;
        }

        update_config_nolock($vmid, $conf, 1);

        if (!$prepare && $snap->{vmstate}) {
            my $statefile = PVE::Storage::path($storecfg, $snap->{vmstate});
            vm_start($storecfg, $vmid, $statefile, undef, undef, undef, $forcemachine);
        }
    };

    # pass 1: prepare
    lock_config($vmid, $updatefn);

    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        PVE::Storage::volume_snapshot_rollback($storecfg, $drive->{file}, $snapname);
    });

    # pass 2: apply snapshot config
    $prepare = 0;
    lock_config($vmid, $updatefn);
}
5427
9dcf4909
DM
# Poll 'query-savevm' once per second until it reports status 'completed'.
# Dies if no status is reported or if the status is neither 'active' nor
# 'completed'.
my $savevm_wait = sub {
    my ($vmid) = @_;

    while (1) {
        my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");
        my $status = $stat->{status};

        die "savevm not active\n" if !$status;

        last if $status eq 'completed';

        die "query-savevm returned status '$stat->{status}'\n"
            if $status ne 'active';

        # still active - try again
        sleep(1);
    }
};
5445
# Create snapshot $snapname of VM $vmid.
#
# Prepares the snapshot entry, optionally freezes the guest file systems
# (running VM with 'agent' set and no vmstate), saves the VM state,
# snapshots every non-cdrom drive and finally commits the config. If
# anything fails, the drives snapshotted so far are cleaned up through
# snapshot_delete() and the error is re-thrown.
sub snapshot_create {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap = $snapshot_prepare->($vmid, $snapname, $save_vmstate, $comment);

    $save_vmstate = 0 if !$snap->{vmstate}; # vm is not running

    my $config = load_config($vmid);

    my $running = check_running($vmid);

    my $freezefs = $running && $config->{agent};
    $freezefs = 0 if $snap->{vmstate}; # not needed if we save RAM

    # drives that already got their snapshot (needed for cleanup)
    my $drivehash = {};

    if ($freezefs) {
        eval { vm_mon_cmd($vmid, "guest-fsfreeze-freeze"); };
        warn "guest-fsfreeze-freeze problems - $@" if $@;
    }

    eval {
        # create internal snapshots of all drives

        my $storecfg = PVE::Storage::config();

        if ($running) {
            if (my $vmstate = $snap->{vmstate}) {
                my $path = PVE::Storage::path($storecfg, $vmstate);
                vm_mon_cmd($vmid, "savevm-start", statefile => $path);
                $savevm_wait->($vmid);
            } else {
                vm_mon_cmd($vmid, "savevm-start");
            }
        }

        foreach_drive($snap, sub {
            my ($ds, $drive) = @_;

            return if drive_is_cdrom($drive);

            qemu_volume_snapshot($vmid, "drive-$ds", $storecfg, $drive->{file}, $snapname);
            $drivehash->{$ds} = 1;
        });
    };
    my $err = $@;

    if ($running) {
        eval { vm_mon_cmd($vmid, "savevm-end") };
        warn $@ if $@;

        if ($freezefs) {
            eval { vm_mon_cmd($vmid, "guest-fsfreeze-thaw"); };
            warn "guest-fsfreeze-thaw problems - $@" if $@;
        }

        # savevm-end is async, we need to wait
        while (1) {
            my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");
            last if !$stat->{bytes};

            print "savevm not yet finished\n";
            sleep(1);
        }
    }

    if ($err) {
        warn "snapshot create failed: starting cleanup\n";
        eval { snapshot_delete($vmid, $snapname, 0, $drivehash); };
        warn $@ if $@;
        die $err;
    }

    $snapshot_commit->($vmid, $snapname);
}
5527
3ee28e38 5528# Note: $drivehash is only set when called from snapshot_create.
sub snapshot_delete {
    my ($vmid, $snapname, $force, $drivehash) = @_;

    # 1 while volumes are being removed, 0 for the final config cleanup
    my $prepare = 1;

    my $snap;
    my $unused = [];

    # If $confref has $snapname as parent, re-link it to $new_parent
    # (or drop the parent entry when there is none).
    my $unlink_parent = sub {
        my ($confref, $new_parent) = @_;

        return if !($confref->{parent} && $confref->{parent} eq $snapname);

        if ($new_parent) {
            $confref->{parent} = $new_parent;
        } else {
            delete $confref->{parent};
        }
    };

    # Config update, always run under lock_config(). The optional argument
    # names a snapshot entry ('vmstate' or a drive) to remove from the snapshot.
    my $updatefn = sub {
        my ($remove_drive) = @_;

        my $conf = load_config($vmid);

        # these checks are skipped when called from snapshot_create
        if (!$drivehash) {
            check_lock($conf);
            die "you can't delete a snapshot if vm is a template\n"
                if is_template($conf);
        }

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        # remove parent refs
        if (!$prepare) {
            $unlink_parent->($conf, $snap->{parent});
            foreach my $other (keys %{$conf->{snapshots}}) {
                next if $other eq $snapname;
                $unlink_parent->($conf->{snapshots}->{$other}, $snap->{parent});
            }
        }

        if ($remove_drive) {
            if ($remove_drive eq 'vmstate') {
                delete $snap->{$remove_drive};
            } else {
                my $drive = parse_drive($remove_drive, $snap->{$remove_drive});
                my $volid = $drive->{file};
                delete $snap->{$remove_drive};
                add_unused_volume($conf, $volid);
            }
        }

        if ($prepare) {
            $snap->{snapstate} = 'delete';
        } else {
            delete $conf->{snapshots}->{$snapname};
            delete $conf->{lock} if $drivehash;
            add_unused_volume($conf, $_) foreach @$unused;
        }

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $updatefn);

    # now remove vmstate file

    my $storecfg = PVE::Storage::config();

    if ($snap->{vmstate}) {
        eval { PVE::Storage::vdisk_free($storecfg, $snap->{vmstate}); };
        if (my $err = $@) {
            die $err if !$force;
            warn $err;
        }
        # save changes (remove vmstate from snapshot)
        lock_config($vmid, $updatefn, 'vmstate') if !$force;
    }

    # now remove all internal snapshots
    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};

        # with a $drivehash, only drives listed there have a snapshot to remove
        if (!$drivehash || $drivehash->{$ds}) {
            eval { qemu_volume_snapshot_delete($vmid, "drive-$ds", $storecfg, $volid, $snapname); };
            if (my $err = $@) {
                die $err if !$force;
                warn $err;
            }
        }

        # save changes (remove drive from snapshot)
        lock_config($vmid, $updatefn, $ds) if !$force;
        push @$unused, $volid;
    });

    # now cleanup config
    $prepare = 0;
    lock_config($vmid, $updatefn);
}
5639
# Return 1 if PVE::Storage::volume_has_feature() reports $feature for every
# non-cdrom drive of $conf, 0 otherwise.
sub has_feature {
    my ($feature, $conf, $storecfg, $snapname, $running) = @_;

    my $missing = 0;

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $supported = PVE::Storage::volume_has_feature(
            $storecfg, $feature, $drive->{file}, $snapname, $running);
        $missing = 1 if !$supported;
    });

    return $missing ? 0 : 1;
}
04a69bb4
AD
5654
# Convert the disks of $conf into base volumes. When $disk is given only
# that drive is handled. Cdrom drives and volumes without the 'template'
# feature are skipped. The config is written after every converted drive.
sub template_create {
    my ($vmid, $conf, $disk) = @_;

    my $storecfg = PVE::Storage::config();

    my $convert = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);
        return if $disk && $ds ne $disk;

        my $volid = $drive->{file};
        return if !PVE::Storage::volume_has_feature($storecfg, 'template', $volid);

        $drive->{file} = PVE::Storage::vdisk_create_base($storecfg, $volid);
        $conf->{$ds} = print_drive($vmid, $drive);
        update_config_nolock($vmid, $conf, 1);
    };

    foreach_drive($conf, $convert);
}
5675
624361b3
AD
# Return 1 if the 'template' setting of $conf is defined and equals 1,
# 0 otherwise.
sub is_template {
    my ($conf) = @_;

    # explicit false value instead of the implicit result of a
    # statement-modifier 'return'
    return (defined($conf->{template}) && $conf->{template} == 1) ? 1 : 0;
}
5681
5133de42
AD
# Copy volume $src_volid (optionally its snapshot $snapname) onto the already
# existing volume $dst_volid using 'qemu-img convert'. $size is only used for
# the progress output. Nothing is done unless both volume IDs contain a
# storage ID. Dies with "copy failed: ..." if the command fails.
sub qemu_img_convert {
    my ($src_volid, $dst_volid, $size, $snapname) = @_;

    my $storecfg = PVE::Storage::config();
    my ($src_storeid, $src_volname) = PVE::Storage::parse_volume_id($src_volid, 1);
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid, 1);

    if ($src_storeid && $dst_storeid) {
        my $src_scfg = PVE::Storage::storage_config($storecfg, $src_storeid);
        my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

        my $src_format = qemu_img_format($src_scfg, $src_volname);
        my $dst_format = qemu_img_format($dst_scfg, $dst_volname);

        my $src_path = PVE::Storage::path($storecfg, $src_volid, $snapname);
        my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

        my @snapopt = ($snapname && $src_format eq "qcow2") ? ('-s', $snapname) : ();

        my $cmd = [
            '/usr/bin/qemu-img', 'convert', '-t', 'writeback', '-p', '-n',
            @snapopt,
            '-f', $src_format, '-O', $dst_format, $src_path, $dst_path,
        ];

        # turn the percentage printed by qemu-img into a progress line
        my $report_progress = sub {
            my $line = shift;

            return if $line !~ m/\((\S+)\/100\%\)/;

            my $percent = $1;
            my $transferred = int($size * $percent / 100);
            my $remaining = $size - $transferred;

            print "transferred: $transferred bytes remaining: $remaining bytes total: $size bytes progression: $percent %\n";
        };

        eval { run_command($cmd, timeout => undef, outfunc => $report_progress); };
        if (my $err = $@) {
            die "copy failed: $err";
        }
    }
}
5721
# Return the image format name for $volname on the storage described by
# $scfg: the file extension (raw, qcow2, qed or vmdk) if the storage has a
# 'path', "host_device" for storage type 'iscsi', "raw" for anything else.
sub qemu_img_format {
    my ($scfg, $volname) = @_;

    return $1 if $scfg->{path} && $volname =~ m/\.(raw|qcow2|qed|vmdk)$/;

    return "host_device" if $scfg->{type} eq 'iscsi';

    return "raw";
}
5733
# Mirror drive $drive of the running VM $vmid onto the existing volume
# $dst_volid using the 'drive-mirror' block job.
#
# If $vmiddst equals $vmid the VM is switched over to the new volume
# ('block-job-complete'), otherwise (clone for another VM) the job is
# cancelled once source and target are in sync. When the job does not
# settle within $maxwait polls after catching up, the VM is suspended so
# that the mirror can finish, and resumed afterwards.
#
# Dies with "mirroring error: ..." on failure, after trying to cancel the
# job and to resume a VM that was suspended here.
sub qemu_drive_mirror {
    my ($vmid, $drive, $dst_volid, $vmiddst) = @_;

    my $count = 0;
    my $frozen = undef;
    my $maxwait = 120;

    my $storecfg = PVE::Storage::config();
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid);

    # result is not used; the lookup is kept from the original code
    my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

    my $format;
    if ($dst_volname =~ m/\.(raw|qcow2)$/){
        $format = $1;
    }

    my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

    my $opts = { timeout => 10, device => "drive-$drive", mode => "existing", sync => "full", target => $dst_path };
    $opts->{format} = $format if $format;

    #fixme : sometime drive-mirror timeout, but works fine after.
    # (I have see the problem with big volume > 200GB), so we need to eval
    eval { vm_mon_cmd($vmid, "drive-mirror", %$opts); };
    # ignore errors here

    eval {
        while (1) {
            my $stats = vm_mon_cmd($vmid, "query-block-jobs");
            my $stat = @$stats[0];
            die "mirroring job seem to have die. Maybe do you have bad sectors?" if !$stat;
            die "error job is not mirroring" if $stat->{type} ne "mirror";

            my $busy = $stat->{busy};

            if (my $total = $stat->{len}) {
                my $transferred = $stat->{offset} || 0;
                my $remaining = $total - $transferred;
                my $percent = sprintf "%.2f", ($transferred * 100 / $total);

                print "transferred: $transferred bytes remaining: $remaining bytes total: $total bytes progression: $percent % busy: $busy\n";
            }

            if ($stat->{len} == $stat->{offset}) {
                # NOTE(review): assumes the monitor layer reports 'busy' as
                # the string 'false' - verify against the QMP client.
                if ($busy eq 'false') {

                    last if $vmiddst != $vmid;

                    # try to switch the disk if source and destination are on the same guest
                    eval { vm_mon_cmd($vmid, "block-job-complete", device => "drive-$drive") };
                    last if !$@;
                    die $@ if $@ !~ m/cannot be completed/;
                }

                if ($count > $maxwait) {
                    # if too much writes to disk occurs at the end of migration
                    #the disk needs to be freezed to be able to complete the migration
                    vm_suspend($vmid,1);
                    $frozen = 1;
                }
                $count ++
            }
            sleep 1;
        }

        if ($frozen) {
            vm_resume($vmid, 1);
            $frozen = undef;
        }
    };
    my $err = $@;

    my $cancel_job = sub {
        vm_mon_cmd($vmid, "block-job-cancel", device => "drive-$drive");
        # wait until the job has disappeared
        while (1) {
            my $stats = vm_mon_cmd($vmid, "query-block-jobs");
            my $stat = @$stats[0];
            last if !$stat;
            sleep 1;
        }
    };

    if ($err) {
        eval { $cancel_job->(); };

        # do not leave the guest suspended when mirroring failed after we
        # froze it
        if ($frozen) {
            eval { vm_resume($vmid, 1); };
            warn "unable to resume VM $vmid after mirroring error - $@" if $@;
        }

        die "mirroring error: $err";
    }

    if ($vmiddst != $vmid) {
        # if we clone a disk for a new target vm, we don't switch the disk
        $cancel_job->(); # so we call block-job-cancel
    }
}
5827
# Clone the volume of $drive for VM $newvmid and return the drive hash
# pointing to the new volume.
#
# With $full unset a linked clone is created. Otherwise a new volume is
# allocated (on $storage if given, else on the source storage; in $format
# if the storage supports it, else in the storage default format) and
# filled either offline with qemu_img_convert() or - for a running VM
# without $snapname - with qemu_drive_mirror(). Every new volume ID is
# pushed onto @$newvollist.
#
# Note: $drive itself is modified and returned (format, file, size).
sub clone_disk {
    my ($storecfg, $vmid, $running, $drivename, $drive, $snapname,
        $newvmid, $storage, $format, $full, $newvollist) = @_;

    my $newvolid;

    if ($full) {
        my ($storeid, $volname) = PVE::Storage::parse_volume_id($drive->{file});
        $storeid = $storage if $storage;

        my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($storecfg, $storeid);
        $format = $drive->{format} || $defFormat if !$format;

        # test if requested format is supported - else use default
        my $supported = grep { $_ eq $format } @$validFormats;
        $format = $defFormat if !$supported;

        my ($size) = PVE::Storage::volume_size_info($storecfg, $drive->{file}, 3);

        print "create full clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_alloc($storecfg, $storeid, $newvmid, $format, undef, ($size/1024));
        push @$newvollist, $newvolid;

        if ($running && !$snapname) {
            qemu_drive_mirror($vmid, $drivename, $newvolid, $newvmid);
        } else {
            qemu_img_convert($drive->{file}, $newvolid, $size, $snapname);
        }
    } else {
        print "create linked clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_clone($storecfg, $drive->{file}, $newvmid, $snapname);
        push @$newvollist, $newvolid;
    }

    my ($size) = PVE::Storage::volume_size_info($storecfg, $newvolid, 3);

    $drive->{format} = undef;
    $drive->{file} = $newvolid;
    $drive->{size} = $size;

    return $drive;
}
5873
ff556cf2
DM
5874# this only works if VM is running
# Ask the VM (QMP 'query-machines') for its machine type. Returns the name
# of the entry flagged 'is-current', else the one flagged 'is-default',
# else 'pc'.
sub get_current_qemu_machine {
    my ($vmid) = @_;

    my $machines = vm_qmp_command($vmid, { execute => 'query-machines', arguments => {} });

    my $current;
    my $default;
    foreach my $entry (@$machines) {
        $default = $entry->{name} if $entry->{'is-default'};
        $current = $entry->{name} if $entry->{'is-current'};
    }

    # fallback to the default machine if current is not supported by qemu
    return $current || $default || 'pc';
}
5890
4543ecf0
AD
# List the entries below "$pcisysfs/devices". Returns a hash ref mapping
# each ID captured by the pattern (first group) to an array ref of
# { id, function } hashes, one per matching entry.
sub lspci {

    my %by_id;

    my $collect = sub {
        my (undef, $id, $function) = @_;
        push @{$by_id{$id}}, { id => $id, function => $function };
    };

    dir_glob_foreach("$pcisysfs/devices", '[a-f0-9]{4}:([a-f0-9]{2}:[a-f0-9]{2})\.([0-9])', $collect);

    return \%by_id;
}
5903
1e3baf05 59041;