]> git.proxmox.com Git - qemu-server.git/blame - PVE/QemuServer.pm
remove unused code
[qemu-server.git] / PVE / QemuServer.pm
CommitLineData
1e3baf05
DM
1package PVE::QemuServer;
2
3use strict;
990fc5e2 4use warnings;
1e3baf05
DM
5use POSIX;
6use IO::Handle;
7use IO::Select;
8use IO::File;
9use IO::Dir;
10use IO::Socket::UNIX;
11use File::Basename;
12use File::Path;
13use File::stat;
14use Getopt::Long;
fc1ddcdc 15use Digest::SHA;
1e3baf05
DM
16use Fcntl ':flock';
17use Cwd 'abs_path';
18use IPC::Open3;
c971c4f2 19use JSON;
1e3baf05
DM
20use Fcntl;
21use PVE::SafeSyslog;
22use Storable qw(dclone);
23use PVE::Exception qw(raise raise_param_exc);
24use PVE::Storage;
4543ecf0 25use PVE::Tools qw(run_command lock_file lock_file_full file_read_firstline dir_glob_foreach);
b7ba6b79 26use PVE::JSONSchema qw(get_standard_option);
1e3baf05
DM
27use PVE::Cluster qw(cfs_register_file cfs_read_file cfs_write_file cfs_lock_file);
28use PVE::INotify;
29use PVE::ProcFSTools;
26f11676 30use PVE::QMPClient;
91bd6c90 31use PVE::RPCEnvironment;
6b64503e 32use Time::HiRes qw(gettimeofday);
1e3baf05 33
7f0b5beb 34my $cpuinfo = PVE::ProcFSTools::read_cpuinfo();
1e3baf05 35
19672434 36# Note about locking: we use flock on the config file to protect
1e3baf05
DM
37# against concurrent actions.
38# Additionally, we have a 'lock' setting in the config file. This
22c377f0 39# can be set to 'migrate', 'backup', 'snapshot' or 'rollback'. Most actions are not
1e3baf05
DM
40# allowed when such lock is set. But you can ignore this kind of
41# lock with the --skiplock flag.
42
97d62eb7 43cfs_register_file('/qemu-server/',
1858638f
DM
44 \&parse_vm_config,
45 \&write_vm_config);
1e3baf05 46
3ea94c60
DM
47PVE::JSONSchema::register_standard_option('skiplock', {
48 description => "Ignore locks - only root is allowed to use this option.",
afdb31d5 49 type => 'boolean',
3ea94c60
DM
50 optional => 1,
51});
52
53PVE::JSONSchema::register_standard_option('pve-qm-stateuri', {
54 description => "Some command save/restore state from this location.",
55 type => 'string',
56 maxLength => 128,
57 optional => 1,
58});
59
8abd398b
DM
60PVE::JSONSchema::register_standard_option('pve-snapshot-name', {
61 description => "The name of the snapshot.",
62 type => 'string', format => 'pve-configid',
63 maxLength => 40,
64});
65
1e3baf05
DM
66#no warnings 'redefine';
67
# Define the fairsched/luid syscall number constants and the KVM ioctl
# request constant, unless the _VZSYSCALLS_H_ marker sub shows that this
# was already done. Each constant is created only if no sub of that name
# exists yet. Dies on architectures other than x86_64 and i386.
unless (defined(&_VZSYSCALLS_H_)) {
    # No extra guard needed here: the enclosing test already proved the
    # marker is undefined.
    eval 'sub _VZSYSCALLS_H_ () {1;}';
    require 'sys/syscall.ph';
    if (defined(&__x86_64__)) {
        eval 'sub __NR_fairsched_vcpus () {499;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_fairsched_mknod () {504;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {505;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {506;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {507;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {508;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_setluid () {501;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {502;}' unless defined(&__NR_setublimit);
    } elsif (defined(&__i386__)) {
        eval 'sub __NR_fairsched_mknod () {500;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {501;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {502;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {503;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {504;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_fairsched_vcpus () {505;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_setluid () {511;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {512;}' unless defined(&__NR_setublimit);
    } else {
        die("no fairsched syscall for this arch");
    }
    require 'asm/ioctl.ph';
    # Request number written out in full (0x00) instead of a digit-less
    # hex literal; the value is unchanged (zero).
    eval 'sub KVM_GET_API_VERSION () { &_IO(0xAE, 0x00);}' unless defined(&KVM_GET_API_VERSION);
}
96
# Invoke the fairsched_mknod syscall with all three arguments coerced to
# integers and return the raw syscall() result.
sub fairsched_mknod {
    my ($parent, $weight, $desired) = @_;

    my @int_args = (int($parent), int($weight), int($desired));

    return syscall(__NR_fairsched_mknod(), @int_args);
}
102
# Invoke the fairsched_rmnod syscall for the given id (coerced to an
# integer) and return the raw syscall() result.
sub fairsched_rmnod {
    my ($id) = @_;

    my $node_id = int($id);

    return syscall(__NR_fairsched_rmnod(), $node_id);
}
108
# Invoke the fairsched_mvpr syscall with the pid and the new id (both
# coerced to integers) and return the raw syscall() result.
sub fairsched_mvpr {
    my ($pid, $newid) = @_;

    my @int_args = (int($pid), int($newid));

    return syscall(__NR_fairsched_mvpr(), @int_args);
}
114
# Invoke the fairsched_vcpus syscall with the id and vcpu count (both
# coerced to integers) and return the raw syscall() result.
sub fairsched_vcpus {
    my ($id, $vcpus) = @_;

    my @int_args = (int($id), int($vcpus));

    return syscall(__NR_fairsched_vcpus(), @int_args);
}
120
# Invoke the fairsched_rate syscall with the id, operation code and rate
# (all coerced to integers) and return the raw syscall() result.
sub fairsched_rate {
    my ($id, $op, $rate) = @_;

    my @int_args = (int($id), int($op), int($rate));

    return syscall(__NR_fairsched_rate(), @int_args);
}
126
127use constant FAIRSCHED_SET_RATE => 0;
128use constant FAIRSCHED_DROP_RATE => 1;
129use constant FAIRSCHED_GET_RATE => 2;
130
# Apply a CPU limit given in percent. The percentage is rescaled to units
# of 1/1024 and truncated; a non-zero result sets the rate, a zero result
# drops it. Returns whatever fairsched_rate() returns.
sub fairsched_cpulimit {
    my ($id, $limit) = @_;

    my $scaled_rate = int($limit * 1024 / 100);

    if ($scaled_rate) {
        return fairsched_rate($id, FAIRSCHED_SET_RATE, $scaled_rate);
    }

    return fairsched_rate($id, FAIRSCHED_DROP_RATE, $scaled_rate);
}
139
140my $nodename = PVE::INotify::nodename();
141
142mkdir "/etc/pve/nodes/$nodename";
143my $confdir = "/etc/pve/nodes/$nodename/qemu-server";
144mkdir $confdir;
145
146my $var_run_tmpdir = "/var/run/qemu-server";
147mkdir $var_run_tmpdir;
148
149my $lock_dir = "/var/lock/qemu-server";
150mkdir $lock_dir;
151
152my $pcisysfs = "/sys/bus/pci";
153
1e3baf05 154my $confdesc = {
7183bd9a
AD
155 iothread => {
156 optional => 1,
157 type => 'boolean',
158 description => "Enable iothread dataplane.",
159 default => 0,
160 },
1e3baf05
DM
161 onboot => {
162 optional => 1,
163 type => 'boolean',
164 description => "Specifies whether a VM will be started during system bootup.",
165 default => 0,
166 },
167 autostart => {
168 optional => 1,
169 type => 'boolean',
170 description => "Automatic restart after crash (currently ignored).",
171 default => 0,
172 },
2ff09f52
DA
173 hotplug => {
174 optional => 1,
e8b9c17c 175 type => 'boolean',
6c52b679 176 description => "Allow hotplug for disk and network device",
2dbe827e 177 default => 0,
2ff09f52 178 },
1e3baf05
DM
179 reboot => {
180 optional => 1,
181 type => 'boolean',
182 description => "Allow reboot. If set to '0' the VM exit on reboot.",
183 default => 1,
184 },
185 lock => {
186 optional => 1,
187 type => 'string',
188 description => "Lock/unlock the VM.",
22c377f0 189 enum => [qw(migrate backup snapshot rollback)],
1e3baf05
DM
190 },
191 cpulimit => {
192 optional => 1,
193 type => 'integer',
194 description => "Limit of CPU usage in per cent. Note if the computer has 2 CPUs, it has total of 200% CPU time. Value '0' indicates no CPU limit.\n\nNOTE: This option is currently ignored.",
195 minimum => 0,
196 default => 0,
197 },
198 cpuunits => {
199 optional => 1,
200 type => 'integer',
201 description => "CPU weight for a VM. Argument is used in the kernel fair scheduler. The larger the number is, the more CPU time this VM gets. Number is relative to weights of all the other running VMs.\n\nNOTE: You can disable fair-scheduler configuration by setting this to 0.",
202 minimum => 0,
203 maximum => 500000,
204 default => 1000,
205 },
206 memory => {
207 optional => 1,
208 type => 'integer',
7878afeb 209 description => "Amount of RAM for the VM in MB. This is the maximum available memory when you use the balloon device.",
1e3baf05
DM
210 minimum => 16,
211 default => 512,
212 },
13a48620
DA
213 balloon => {
214 optional => 1,
215 type => 'integer',
8b1accf7
DM
216 description => "Amount of target RAM for the VM in MB. Using zero disables the ballon driver.",
217 minimum => 0,
218 },
219 shares => {
220 optional => 1,
221 type => 'integer',
222 description => "Amount of memory shares for auto-ballooning. The larger the number is, the more memory this VM gets. Number is relative to weights of all other running VMs. Using zero disables auto-ballooning",
223 minimum => 0,
224 maximum => 50000,
225 default => 1000,
13a48620 226 },
1e3baf05
DM
227 keyboard => {
228 optional => 1,
229 type => 'string',
230 description => "Keybord layout for vnc server. Default is read from the datacenter configuration file.",
e95fe75f 231 enum => PVE::Tools::kvmkeymaplist(),
1e3baf05
DM
232 default => 'en-us',
233 },
234 name => {
235 optional => 1,
7fabe17d 236 type => 'string', format => 'dns-name',
1e3baf05
DM
237 description => "Set a name for the VM. Only used on the configuration web interface.",
238 },
cdd20088
AD
239 scsihw => {
240 optional => 1,
241 type => 'string',
242 description => "scsi controller model",
5b952ff5 243 enum => [qw(lsi lsi53c810 virtio-scsi-pci megasas pvscsi)],
cdd20088
AD
244 default => 'lsi',
245 },
1e3baf05
DM
246 description => {
247 optional => 1,
248 type => 'string',
0581fe4f 249 description => "Description for the VM. Only used on the configuration web interface. This is saved as comment inside the configuration file.",
1e3baf05
DM
250 },
251 ostype => {
252 optional => 1,
253 type => 'string',
6b9d84cf 254 enum => [qw(other wxp w2k w2k3 w2k8 wvista win7 win8 l24 l26 solaris)],
1e3baf05
DM
255 description => <<EODESC,
256Used to enable special optimization/features for specific
257operating systems:
258
259other => unspecified OS
260wxp => Microsoft Windows XP
261w2k => Microsoft Windows 2000
262w2k3 => Microsoft Windows 2003
263w2k8 => Microsoft Windows 2008
264wvista => Microsoft Windows Vista
265win7 => Microsoft Windows 7
a70ebde3 266win8 => Microsoft Windows 8/2012
1e3baf05
DM
267l24 => Linux 2.4 Kernel
268l26 => Linux 2.6/3.X Kernel
6b9d84cf 269solaris => solaris/opensolaris/openindiania kernel
1e3baf05 270
6b9d84cf 271other|l24|l26|solaris ... no special behaviour
a70ebde3 272wxp|w2k|w2k3|w2k8|wvista|win7|win8 ... use --localtime switch
1e3baf05
DM
273EODESC
274 },
275 boot => {
276 optional => 1,
277 type => 'string',
278 description => "Boot on floppy (a), hard disk (c), CD-ROM (d), or network (n).",
279 pattern => '[acdn]{1,4}',
32baffb4 280 default => 'cdn',
1e3baf05
DM
281 },
282 bootdisk => {
283 optional => 1,
284 type => 'string', format => 'pve-qm-bootdisk',
285 description => "Enable booting from specified disk.",
03e480fc 286 pattern => '(ide|sata|scsi|virtio)\d+',
1e3baf05
DM
287 },
288 smp => {
289 optional => 1,
290 type => 'integer',
291 description => "The number of CPUs. Please use option -sockets instead.",
292 minimum => 1,
293 default => 1,
294 },
295 sockets => {
296 optional => 1,
297 type => 'integer',
298 description => "The number of CPU sockets.",
299 minimum => 1,
300 default => 1,
301 },
302 cores => {
303 optional => 1,
304 type => 'integer',
305 description => "The number of cores per socket.",
306 minimum => 1,
307 default => 1,
308 },
8a010eae
AD
309 numa => {
310 optional => 1,
311 type => 'boolean',
312 description => "Enable/disable Numa.",
313 default => 0,
314 },
3bd18e48
AD
315 maxcpus => {
316 optional => 1,
317 type => 'integer',
318 description => "Maximum cpus for hotplug.",
319 minimum => 1,
320 default => 1,
321 },
1e3baf05
DM
322 acpi => {
323 optional => 1,
324 type => 'boolean',
325 description => "Enable/disable ACPI.",
326 default => 1,
327 },
bc84dcca 328 agent => {
ab6a046f
AD
329 optional => 1,
330 type => 'boolean',
331 description => "Enable/disable Qemu GuestAgent.",
be79c214 332 default => 0,
ab6a046f 333 },
1e3baf05
DM
334 kvm => {
335 optional => 1,
336 type => 'boolean',
337 description => "Enable/disable KVM hardware virtualization.",
338 default => 1,
339 },
340 tdf => {
341 optional => 1,
342 type => 'boolean',
8c559505
DM
343 description => "Enable/disable time drift fix.",
344 default => 0,
1e3baf05 345 },
19672434 346 localtime => {
1e3baf05
DM
347 optional => 1,
348 type => 'boolean',
349 description => "Set the real time clock to local time. This is enabled by default if ostype indicates a Microsoft OS.",
350 },
351 freeze => {
352 optional => 1,
353 type => 'boolean',
354 description => "Freeze CPU at startup (use 'c' monitor command to start execution).",
355 },
356 vga => {
357 optional => 1,
358 type => 'string',
ef5e2be2 359 description => "Select VGA type. If you want to use high resolution modes (>= 1280x1024x16) then you should use option 'std' or 'vmware'. Default is 'std' for win8/win7/w2k8, and 'cirrur' for other OS types. Option 'qxl' enables the SPICE display sever. You can also run without any graphic card using a serial devive as terminal.",
2fa3151e 360 enum => [qw(std cirrus vmware qxl serial0 serial1 serial2 serial3 qxl2 qxl3 qxl4)],
1e3baf05 361 },
0ea9541d
DM
362 watchdog => {
363 optional => 1,
364 type => 'string', format => 'pve-qm-watchdog',
365 typetext => '[[model=]i6300esb|ib700] [,[action=]reset|shutdown|poweroff|pause|debug|none]',
366 description => "Create a virtual hardware watchdog device. Once enabled (by a guest action), the watchdog must be periodically polled by an agent inside the guest or else the guest will be restarted (or execute the action specified)",
367 },
1e3baf05
DM
368 startdate => {
369 optional => 1,
19672434 370 type => 'string',
1e3baf05
DM
371 typetext => "(now | YYYY-MM-DD | YYYY-MM-DDTHH:MM:SS)",
372 description => "Set the initial date of the real time clock. Valid format for date are: 'now' or '2006-06-17T16:01:21' or '2006-06-17'.",
373 pattern => '(now|\d{4}-\d{1,2}-\d{1,2}(T\d{1,2}:\d{1,2}:\d{1,2})?)',
374 default => 'now',
375 },
59411c4e
DM
376 startup => {
377 optional => 1,
378 type => 'string', format => 'pve-qm-startup',
379 typetext => '[[order=]\d+] [,up=\d+] [,down=\d+] ',
380 description => "Startup and shutdown behavior. Order is a non-negative number defining the general startup order. Shutdown in done with reverse ordering. Additionally you can set the 'up' or 'down' delay in seconds, which specifies a delay to wait before the next VM is started or stopped.",
381 },
68eda3ab
AD
382 template => {
383 optional => 1,
384 type => 'boolean',
385 description => "Enable/disable Template.",
386 default => 0,
387 },
1e3baf05
DM
388 args => {
389 optional => 1,
390 type => 'string',
391 description => <<EODESCR,
392Note: this option is for experts only. It allows you to pass arbitrary arguments to kvm, for example:
393
394args: -no-reboot -no-hpet
395EODESCR
396 },
397 tablet => {
398 optional => 1,
399 type => 'boolean',
400 default => 1,
5acbfe9e 401 description => "Enable/disable the usb tablet device. This device is usually needed to allow absolute mouse positioning with VNC. Else the mouse runs out of sync with normal VNC clients. If you're running lots of console-only guests on one host, you may consider disabling this to save some context switches. This is turned of by default if you use spice (vga=qxl).",
1e3baf05
DM
402 },
403 migrate_speed => {
404 optional => 1,
405 type => 'integer',
406 description => "Set maximum speed (in MB/s) for migrations. Value 0 is no limit.",
407 minimum => 0,
408 default => 0,
409 },
410 migrate_downtime => {
411 optional => 1,
04432191 412 type => 'number',
1e3baf05
DM
413 description => "Set maximum tolerated downtime (in seconds) for migrations.",
414 minimum => 0,
04432191 415 default => 0.1,
1e3baf05
DM
416 },
417 cdrom => {
418 optional => 1,
419 type => 'string', format => 'pve-qm-drive',
420 typetext => 'volume',
421 description => "This is an alias for option -ide2",
422 },
423 cpu => {
424 optional => 1,
425 description => "Emulated CPU type.",
426 type => 'string',
3aefd6fd 427 enum => [ qw(486 athlon pentium pentium2 pentium3 coreduo core2duo kvm32 kvm64 qemu32 qemu64 phenom Conroe Penryn Nehalem Westmere SandyBridge Haswell Broadwell Opteron_G1 Opteron_G2 Opteron_G3 Opteron_G4 Opteron_G5 host) ],
eac6899d 428 default => 'kvm64',
1e3baf05 429 },
b7ba6b79
DM
430 parent => get_standard_option('pve-snapshot-name', {
431 optional => 1,
432 description => "Parent snapshot name. This is used internally, and should not be modified.",
433 }),
982c7f12
DM
434 snaptime => {
435 optional => 1,
436 description => "Timestamp for snapshots.",
437 type => 'integer',
438 minimum => 0,
439 },
18bfb361
DM
440 vmstate => {
441 optional => 1,
442 type => 'string', format => 'pve-volume-id',
443 description => "Reference to a volume which stores the VM state. This is used internally for snapshots.",
444 },
3bafc510
DM
445 machine => {
446 description => "Specific the Qemu machine type.",
447 type => 'string',
448 pattern => '(pc|pc(-i440fx)?-\d+\.\d+|q35|pc-q35-\d+\.\d+)',
449 maxLength => 40,
450 optional => 1,
451 },
2796e7d5
DM
452 smbios1 => {
453 description => "Specify SMBIOS type 1 fields.",
454 type => 'string', format => 'pve-qm-smbios1',
455 typetext => "[manufacturer=str][,product=str][,version=str][,serial=str] [,uuid=uuid][,sku=str][,family=str]",
456 maxLength => 256,
457 optional => 1,
458 },
1e3baf05
DM
459};
460
461# what about other qemu settings ?
462#cpu => 'string',
463#machine => 'string',
464#fda => 'file',
465#fdb => 'file',
466#mtdblock => 'file',
467#sd => 'file',
468#pflash => 'file',
469#snapshot => 'bool',
470#bootp => 'file',
471##tftp => 'dir',
472##smb => 'dir',
473#kernel => 'file',
474#append => 'string',
475#initrd => 'file',
476##soundhw => 'string',
477
478while (my ($k, $v) = each %$confdesc) {
479 PVE::JSONSchema::register_standard_option("pve-qm-$k", $v);
480}
481
482my $MAX_IDE_DISKS = 4;
f62db2a4 483my $MAX_SCSI_DISKS = 14;
a2650619 484my $MAX_VIRTIO_DISKS = 16;
cdb0931f 485my $MAX_SATA_DISKS = 6;
1e3baf05 486my $MAX_USB_DEVICES = 5;
5bdcf937 487my $MAX_NETS = 32;
1e3baf05 488my $MAX_UNUSED_DISKS = 8;
5cffb2d2 489my $MAX_HOSTPCI_DEVICES = 4;
bae179aa 490my $MAX_SERIAL_PORTS = 4;
1989a89c 491my $MAX_PARALLEL_PORTS = 3;
2ed5d572
AD
492my $MAX_NUMA = 8;
493
494my $numadesc = {
495 optional => 1,
496 type => 'string', format => 'pve-qm-numanode',
497 typetext => "cpus=<id[-id],memory=<mb>[[,hostnodes=<id[-id]>][,policy=<preferred|bind|interleave>]]",
498 description => "numa topology",
499};
500PVE::JSONSchema::register_standard_option("pve-qm-numanode", $numadesc);
501
502for (my $i = 0; $i < $MAX_NUMA; $i++) {
503 $confdesc->{"numa$i"} = $numadesc;
504}
1e3baf05
DM
505
506my $nic_model_list = ['rtl8139', 'ne2k_pci', 'e1000', 'pcnet', 'virtio',
e4c6e0b8 507 'ne2k_isa', 'i82551', 'i82557b', 'i82559er', 'vmxnet3'];
6b64503e 508my $nic_model_list_txt = join(' ', sort @$nic_model_list);
1e3baf05 509
1e3baf05
DM
510my $netdesc = {
511 optional => 1,
512 type => 'string', format => 'pve-qm-net',
a9410357 513 typetext => "MODEL=XX:XX:XX:XX:XX:XX [,bridge=<dev>][,queues=<nbqueues>][,rate=<mbps>][,tag=<vlanid>][,firewall=0|1]",
1e3baf05 514 description => <<EODESCR,
19672434 515Specify network devices.
1e3baf05
DM
516
517MODEL is one of: $nic_model_list_txt
518
19672434 519XX:XX:XX:XX:XX:XX should be an unique MAC address. This is
1e3baf05
DM
520automatically generated if not specified.
521
522The bridge parameter can be used to automatically add the interface to a bridge device. The Proxmox VE standard bridge is called 'vmbr0'.
523
524Option 'rate' is used to limit traffic bandwidth from and to this interface. It is specified as floating point number, unit is 'Megabytes per second'.
525
526If you specify no bridge, we create a kvm 'user' (NATed) network device, which provides DHCP and DNS services. The following addresses are used:
527
52810.0.2.2 Gateway
52910.0.2.3 DNS Server
53010.0.2.4 SMB Server
531
532The DHCP server assign addresses to the guest starting from 10.0.2.15.
533
534EODESCR
535};
536PVE::JSONSchema::register_standard_option("pve-qm-net", $netdesc);
537
538for (my $i = 0; $i < $MAX_NETS; $i++) {
539 $confdesc->{"net$i"} = $netdesc;
540}
541
542my $drivename_hash;
19672434 543
1e3baf05
DM
544my $idedesc = {
545 optional => 1,
546 type => 'string', format => 'pve-qm-drive',
8d87f8aa 547 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
3c770faa 548 description => "Use volume as IDE hard disk or CD-ROM (n is 0 to " .($MAX_IDE_DISKS -1) . ").",
1e3baf05
DM
549};
550PVE::JSONSchema::register_standard_option("pve-qm-ide", $idedesc);
551
552my $scsidesc = {
553 optional => 1,
554 type => 'string', format => 'pve-qm-drive',
8d87f8aa 555 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
3c770faa 556 description => "Use volume as SCSI hard disk or CD-ROM (n is 0 to " . ($MAX_SCSI_DISKS - 1) . ").",
1e3baf05
DM
557};
558PVE::JSONSchema::register_standard_option("pve-qm-scsi", $scsidesc);
559
cdb0931f
DA
560my $satadesc = {
561 optional => 1,
562 type => 'string', format => 'pve-qm-drive',
8d87f8aa 563 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
3c770faa 564 description => "Use volume as SATA hard disk or CD-ROM (n is 0 to " . ($MAX_SATA_DISKS - 1). ").",
cdb0931f
DA
565};
566PVE::JSONSchema::register_standard_option("pve-qm-sata", $satadesc);
567
1e3baf05
DM
568my $virtiodesc = {
569 optional => 1,
570 type => 'string', format => 'pve-qm-drive',
8d87f8aa 571 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
3c770faa 572 description => "Use volume as VIRTIO hard disk (n is 0 to " . ($MAX_VIRTIO_DISKS - 1) . ").",
1e3baf05
DM
573};
574PVE::JSONSchema::register_standard_option("pve-qm-virtio", $virtiodesc);
575
# Schema description for USB device options; also registered as the
# standard option 'pve-qm-usb'.
my $usbdesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-usb-device',
    typetext => 'host=HOSTUSBDEVICE|spice',
    description => <<EODESCR,
Configure an USB device (n is 0 to 4). This can be used to
pass-through usb devices to the guest. HOSTUSBDEVICE syntax is:

'bus-port(.port)*' (decimal numbers) or
'vendor_id:product_id' (hexadecimal numbers)

You can use the 'lsusb -t' command to list existing usb devices.

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

The value 'spice' can be used to add a usb redirection devices for spice.

EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-usb", $usbdesc);
596
040b06b7
DA
# Schema description for host PCI pass-through options; also registered as
# the standard option 'pve-qm-hostpci'.
my $hostpcidesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-hostpci',
    typetext => "[host=]HOSTPCIDEVICE [,driver=kvm|vfio] [,rombar=on|off] [,pcie=0|1] [,x-vga=on|off]",
    description => <<EODESCR,
Map host pci devices. HOSTPCIDEVICE syntax is:

'bus:dev.func' (hexadecimal numbers)

You can use the 'lspci' command to list existing pci devices.

The 'rombar' option determines whether or not the device's ROM will be visible in the guest's memory map (default is 'on').

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-hostpci", $hostpcidesc);
616
bae179aa
DA
617my $serialdesc = {
618 optional => 1,
ca0cef26 619 type => 'string',
1b0b51ed 620 pattern => '(/dev/.+|socket)',
bae179aa 621 description => <<EODESCR,
1b0b51ed 622Create a serial device inside the VM (n is 0 to 3), and pass through a host serial device (i.e. /dev/ttyS0), or create a unix socket on the host side (use 'qm terminal' to open a terminal connection).
bae179aa
DA
623
624Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
625
626Experimental: user reported problems with this option.
627EODESCR
628};
bae179aa 629
1989a89c
DA
630my $paralleldesc= {
631 optional => 1,
ca0cef26 632 type => 'string',
9ecc8431 633 pattern => '/dev/parport\d+|/dev/usb/lp\d+',
1989a89c 634 description => <<EODESCR,
19672434 635Map host parallel devices (n is 0 to 2).
1989a89c
DA
636
637Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
638
639Experimental: user reported problems with this option.
640EODESCR
641};
1989a89c
DA
642
643for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
644 $confdesc->{"parallel$i"} = $paralleldesc;
645}
646
bae179aa
DA
647for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
648 $confdesc->{"serial$i"} = $serialdesc;
649}
650
040b06b7
DA
651for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
652 $confdesc->{"hostpci$i"} = $hostpcidesc;
653}
1e3baf05
DM
654
655for (my $i = 0; $i < $MAX_IDE_DISKS; $i++) {
656 $drivename_hash->{"ide$i"} = 1;
657 $confdesc->{"ide$i"} = $idedesc;
658}
659
cdb0931f
DA
660for (my $i = 0; $i < $MAX_SATA_DISKS; $i++) {
661 $drivename_hash->{"sata$i"} = 1;
662 $confdesc->{"sata$i"} = $satadesc;
663}
664
1e3baf05
DM
665for (my $i = 0; $i < $MAX_SCSI_DISKS; $i++) {
666 $drivename_hash->{"scsi$i"} = 1;
667 $confdesc->{"scsi$i"} = $scsidesc ;
668}
669
670for (my $i = 0; $i < $MAX_VIRTIO_DISKS; $i++) {
671 $drivename_hash->{"virtio$i"} = 1;
672 $confdesc->{"virtio$i"} = $virtiodesc;
673}
674
675for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
676 $confdesc->{"usb$i"} = $usbdesc;
677}
678
679my $unuseddesc = {
680 optional => 1,
681 type => 'string', format => 'pve-volume-id',
682 description => "Reference to unused volumes.",
683};
684
685for (my $i = 0; $i < $MAX_UNUSED_DISKS; $i++) {
686 $confdesc->{"unused$i"} = $unuseddesc;
687}
688
# Cached result of the KVM_GET_API_VERSION ioctl (0 = not yet known).
my $kvm_api_version = 0;

# Return the value reported by the KVM_GET_API_VERSION ioctl on /dev/kvm.
# A true result is cached in $kvm_api_version for later calls. Returns 0
# when /dev/kvm cannot be opened.
sub kvm_version {

    if (!$kvm_api_version) {
        my $fh = IO::File->new("</dev/kvm");
        return 0 if !$fh;

        my $version = $fh->ioctl(KVM_GET_API_VERSION(), 0);
        $kvm_api_version = $version if $version;

        $fh->close();
    }

    return $kvm_api_version;
}
706
# Cached version string of the userspace 'kvm' binary.
my $kvm_user_version;

# Return the version printed in the first line of `kvm -help`, or the
# string 'unknown' when that output does not start with the expected
# banner. The result is cached after the first call.
sub kvm_user_version {

    unless ($kvm_user_version) {
        my $help_text = `kvm -help 2>/dev/null`;

        my $found = $help_text =~ m/^QEMU( PC)? emulator version (\d+\.\d+(\.\d+)?)[,\s]/;

        $kvm_user_version = $found ? $2 : 'unknown';
    }

    return $kvm_user_version;
}
724
725my $kernel_has_vhost_net = -c '/dev/vhost-net';
726
# Return the list of all possible drive option names, bus by bus:
# ide0.., scsi0.., virtio0.., sata0.. (each up to its $MAX_* limit).
sub disknames {
    # Expands a bus prefix into "<prefix>0" .. "<prefix>(count-1)".
    my $expand = sub {
        my ($prefix, $count) = @_;
        return map { "$prefix$_" } (0 .. ($count - 1));
    };

    # order is important - used to autoselect boot disk
    return ($expand->('ide', $MAX_IDE_DISKS),
            $expand->('scsi', $MAX_SCSI_DISKS),
            $expand->('virtio', $MAX_VIRTIO_DISKS),
            $expand->('sata', $MAX_SATA_DISKS));
}
734
# Return true if $dev is one of the drive names recorded in
# $drivename_hash (ideN, sataN, scsiN, virtioN).
sub valid_drivename {
    my ($dev) = @_;

    return defined $drivename_hash->{$dev};
}
740
# Return true if $key names an option described in $confdesc.
sub option_exists {
    my ($key) = @_;

    return defined $confdesc->{$key};
}
1e3baf05
DM
745
# Return the array reference holding the known NIC model names. This is
# the module-level list itself, not a copy.
sub nic_models {
    my $models = $nic_model_list;

    return $models;
}
749
# Return a hash reference mapping OS type identifiers to human-readable
# names. A fresh hash is built on every call.
sub os_list_description {

    return {
        other => 'Other',
        wxp => 'Windows XP',
        w2k => 'Windows 2000',
        w2k3 => 'Windows 2003',
        w2k8 => 'Windows 2008',
        wvista => 'Windows Vista',
        win7 => 'Windows 7',
        win8 => 'Windows 8/2012',
        l24 => 'Linux 2.4',
        l26 => 'Linux 2.6',
    };
}
765
1e3baf05
DM
# Cached path of the host CD-ROM device link, once one has been found.
my $cdrom_path;

# Return the first of /dev/cdrom, /dev/cdrom1, /dev/cdrom2 that exists as
# a symbolic link, caching the answer for later calls. Returns undef when
# none of them exists.
sub get_cdrom_path {

    return $cdrom_path if $cdrom_path;

    foreach my $candidate ("/dev/cdrom", "/dev/cdrom1", "/dev/cdrom2") {
        return $cdrom_path = $candidate if -l $candidate;
    }

    # Explicit "not found" result instead of the leftover value of a failed
    # statement modifier.
    return undef;
}
776
# Resolve a CD-ROM specification to a path:
#   'cdrom'        -> result of get_cdrom_path()
#   'none'         -> empty string
#   absolute path  -> returned unchanged
#   anything else  -> resolved through PVE::Storage::path()
sub get_iso_path {
    my ($storecfg, $vmid, $cdrom) = @_;

    return get_cdrom_path() if $cdrom eq 'cdrom';
    return '' if $cdrom eq 'none';
    return $cdrom if $cdrom =~ m|^/|;

    return PVE::Storage::path($storecfg, $cdrom);
}
790
# try to convert old style file names to volume IDs
#
# 'none', 'cdrom', /dev/... paths and anything already of the form
# "<store>:<name>" are returned unchanged. Any other name containing a
# slash yields undef. A bare file name becomes "local:iso/<file>" for
# cdrom media and "local:<vmid>/<file>" otherwise.
sub filename_to_volume_id {
    my ($vmid, $file, $media) = @_;

    return $file if $file eq 'none' || $file eq 'cdrom';
    return $file if $file =~ m|^/dev/.+|;
    return $file if $file =~ m/^([^:]+):(.+)$/;

    return undef if $file =~ m|/|;

    my $is_cdrom = $media && $media eq 'cdrom';

    return $is_cdrom ? "local:iso/$file" : "local:$vmid/$file";
}
809
# Check that the volume type $vtype fits the drive's media setting:
# 'disk' expects 'images', 'cdrom' expects 'iso'. Does nothing when
# $media is unset. Dies with "internal error" for any other media value
# and raises a parameter exception keyed by $opt on a mismatch.
sub verify_media_type {
    my ($opt, $vtype, $media) = @_;

    return if !$media;

    my %expected_type_for = (
        disk => 'images',
        cdrom => 'iso',
    );

    my $etype = $expected_type_for{$media};
    die "internal error" if !defined($etype);

    return if ($vtype eq $etype);

    raise_param_exc({ $opt => "unexpected media type ($vtype != $etype)" });
}
828
# Normalize $drive->{file} in place. A value that is not 'cdrom'/'none',
# a /dev/ path, a "<store>:<name>" volume ID or a plain number is treated
# as a filesystem path and translated via
# PVE::Storage::path_to_volume_id(); a parameter exception keyed by $opt
# is raised when no storage matches. The media defaults to 'cdrom' for
# iso volumes and for the special names 'cdrom'/'none'.
sub cleanup_drive_path {
    my ($opt, $storecfg, $drive) = @_;

    # try to convert filesystem paths to volume IDs

    my $file = $drive->{file};

    my $needs_no_lookup =
        $file =~ m/^(cdrom|none)$/ ||
        $file =~ m|^/dev/.+| ||
        $file =~ m/^([^:]+):(.+)$/ ||
        $file =~ m/^\d+$/;

    if (!$needs_no_lookup) {
        my ($vtype, $volid) = PVE::Storage::path_to_volume_id($storecfg, $file);
        raise_param_exc({ $opt => "unable to associate path '$file' to any storage"}) if !$vtype;
        $drive->{media} = 'cdrom' if !$drive->{media} && $vtype eq 'iso';
        verify_media_type($opt, $vtype, $drive->{media});
        $drive->{file} = $volid;
    }

    $drive->{media} = 'cdrom' if !$drive->{media} && $drive->{file} =~ m/^(cdrom|none)$/;
}
847
# Write a new configuration file for $vmid from $settings. Dies if the
# file already exists. Missing 'name' and 'memory' settings are filled in
# (in $settings itself) with "vm<vmid>" and the default memory size.
# Only options known to $confdesc that have a true value are written,
# one "key: value" line each.
sub create_conf_nolock {
    my ($vmid, $settings) = @_;

    my $filename = config_file($vmid);

    if (-f $filename) {
        die "configuration file '$filename' already exists\n";
    }

    my $defaults = load_defaults();

    $settings->{name} ||= "vm$vmid";
    $settings->{memory} ||= $defaults->{memory};

    my @config_lines =
        map { "$_: $settings->{$_}\n" }
        grep { $confdesc->{$_} && $settings->{$_} }
        keys %$settings;

    PVE::Tools::file_set_contents($filename, join('', @config_lines));
}
872
f36ed4f4
DM
# Convert a size string such as "512", "1.5M" or "2G" into a byte count.
# Accepts a decimal number with an optional K, M or G suffix (powers of
# 1024). The result is truncated to an integer; undef is returned when
# the string does not match.
my $parse_size = sub {
    my ($value) = @_;

    return undef if $value !~ m/^(\d+(\.\d+)?)([KMG])?$/;
    my ($number, $suffix) = ($1, $3);

    my %bytes_per_unit = (
        K => 1024,
        M => 1024 * 1024,
        G => 1024 * 1024 * 1024,
    );

    $number = $number * $bytes_per_unit{$suffix} if $suffix;

    return int($number);
};
889
# Render a byte count using the largest of the units K, M, G (powers of
# 1024) that divides it evenly; a value that is not a multiple of 1024 is
# returned as the plain integer. The input is truncated to an integer
# first.
my $format_size = sub {
    my ($size) = @_;

    my $amount = int($size);
    my $unit = '';

    foreach my $next_unit (qw(K M G)) {
        my $scaled = int($amount / 1024);
        # Stop as soon as the next larger unit would lose precision.
        last if $scaled * 1024 != $amount;
        ($amount, $unit) = ($scaled, $next_unit);
    }

    return $amount if $unit eq '';

    return "${amount}${unit}";
};
906
1e3baf05
DM
907# ideX = [volume=]volume-id[,media=d][,cyls=c,heads=h,secs=s[,trans=t]]
908# [,snapshot=on|off][,cache=on|off][,format=f][,backup=yes|no]
036e0e2b 909# [,rerror=ignore|report|stop][,werror=enospc|ignore|report|stop]
8d87f8aa 910# [,aio=native|threads][,discard=ignore|on]
1e3baf05
DM
911
# Parse a drive property string ("[volume=]volume-id,opt=value,...") into a
# hash ref.
#
# $key  - configuration key such as "ide0" or "virtio1"; it is split into
#         {interface} and {index}. May be undef when the string is only
#         verified, in which case interface is set to 'unknown'.
# $data - the property string
#
# Returns the hash ref, or undef if the key or any option is invalid.
# The byte based limits bps, bps_rd and bps_wr are stored converted to
# MB/s as mbps, mbps_rd and mbps_wr. {size} is stored as a byte count.
sub parse_drive {
    my ($key, $data) = @_;

    my $res = {};

    # $key may be undefined - used to verify JSON parameters
    if (!defined($key)) {
        $res->{interface} = 'unknown'; # should not harm when used to verify parameters
        $res->{index} = 0;
    } elsif ($key =~ m/^([^\d]+)(\d+)$/) {
        $res->{interface} = $1;
        $res->{index} = $2;
    } else {
        return undef;
    }

    foreach my $p (split (/,/, $data)) {
        next if $p =~ m/^\s*$/;

        if ($p =~ m/^(file|volume|cyls|heads|secs|trans|media|snapshot|cache|format|rerror|werror|backup|aio|bps|mbps|mbps_max|bps_rd|mbps_rd|mbps_rd_max|bps_wr|mbps_wr|mbps_wr_max|iops|iops_max|iops_rd|iops_rd_max|iops_wr|iops_wr_max|size|discard)=(.+)$/) {
            my ($k, $v) = ($1, $2);

            $k = 'file' if $k eq 'volume';

            return undef if defined $res->{$k};

            if ($k eq 'bps' || $k eq 'bps_rd' || $k eq 'bps_wr') {
                # the whole value has to be numeric, not only its beginning
                return undef if !$v || $v !~ m/^\d+(\.\d+)?$/;
                $k = "m$k";
                # do not silently overwrite an MB/s limit that was already parsed
                return undef if defined $res->{$k};
                $v = sprintf("%.3f", $v / (1024*1024));
            }
            $res->{$k} = $v;
        } else {
            # a single value without '=' is accepted as the volume
            if (!$res->{file} && $p !~ m/=/) {
                $res->{file} = $p;
            } else {
                return undef;
            }
        }
    }

    return undef if !$res->{file};

    # a known image extension of the volume determines the format
    if ($res->{file} =~ m/\.(raw|cow|qcow|qcow2|vmdk|cloop)$/) {
        $res->{format} = $1;
    }

    return undef if $res->{cache} &&
        $res->{cache} !~ m/^(off|none|writethrough|writeback|unsafe|directsync)$/;
    return undef if $res->{snapshot} && $res->{snapshot} !~ m/^(on|off)$/;
    return undef if $res->{cyls} && $res->{cyls} !~ m/^\d+$/;
    return undef if $res->{heads} && $res->{heads} !~ m/^\d+$/;
    return undef if $res->{secs} && $res->{secs} !~ m/^\d+$/;
    return undef if $res->{media} && $res->{media} !~ m/^(disk|cdrom)$/;
    return undef if $res->{trans} && $res->{trans} !~ m/^(none|lba|auto)$/;
    return undef if $res->{format} && $res->{format} !~ m/^(raw|cow|qcow|qcow2|vmdk|cloop)$/;
    return undef if $res->{rerror} && $res->{rerror} !~ m/^(ignore|report|stop)$/;
    return undef if $res->{werror} && $res->{werror} !~ m/^(enospc|ignore|report|stop)$/;
    return undef if $res->{backup} && $res->{backup} !~ m/^(yes|no)$/;
    return undef if $res->{aio} && $res->{aio} !~ m/^(native|threads)$/;
    return undef if $res->{discard} && $res->{discard} !~ m/^(ignore|on)$/;

    # a total limit cannot be combined with a separate read or write limit
    return undef if $res->{mbps_rd} && $res->{mbps};
    return undef if $res->{mbps_wr} && $res->{mbps};

    foreach my $o (qw(mbps mbps_max mbps_rd mbps_rd_max mbps_wr mbps_wr_max)) {
        return undef if $res->{$o} && $res->{$o} !~ m/^\d+(\.\d+)?$/;
    }

    return undef if $res->{iops_rd} && $res->{iops};
    return undef if $res->{iops_wr} && $res->{iops};

    foreach my $o (qw(iops iops_max iops_rd iops_rd_max iops_wr iops_wr_max)) {
        return undef if $res->{$o} && $res->{$o} !~ m/^\d+$/;
    }

    if ($res->{size}) {
        return undef if !defined($res->{size} = &$parse_size($res->{size}));
    }

    if ($res->{media} && ($res->{media} eq 'cdrom')) {
        return undef if $res->{snapshot} || $res->{trans} || $res->{format};
        return undef if $res->{heads} || $res->{secs} || $res->{cyls};
        return undef if $res->{interface} eq 'virtio';
    }

    # rerror does not work with scsi drives
    if ($res->{rerror}) {
        return undef if $res->{interface} eq 'scsi';
    }

    return $res;
}
1013
# Drive options that are written in the same "name=value" form both to the
# configuration and to the qemu -drive argument. The order determines the
# order in the generated strings.
my @qemu_drive_options = qw(
    heads secs cyls trans media format cache snapshot rerror werror aio discard
    iops iops_rd iops_wr iops_max iops_rd_max iops_wr_max
);

# Build the configuration file representation of a parsed drive: the
# volume followed by every option that has a true value, and the size in
# its short form.
sub print_drive {
    my ($vmid, $drive) = @_;

    my @config_only = qw(mbps mbps_rd mbps_wr mbps_max mbps_rd_max mbps_wr_max backup);

    my @set = grep { $drive->{$_} } (@qemu_drive_options, @config_only);
    my $opts = join('', map { ",$_=$drive->{$_}" } @set);

    $opts .= ",size=" . &$format_size($drive->{size}) if $drive->{size};

    return "$drive->{file}$opts";
}
1030
28ef82d3
DM
# Send a SCSI INQUIRY command through the SCSI generic (sg) ioctl interface.
#
# $fh    - open file handle of the device
# $noerr - when true, return undef on failure instead of dying
#
# Returns a hash ref with vendor, product, revision, removable (0 or 1)
# and type (lower five bits of the first response byte).
sub scsi_inquiry {
    my($fh, $noerr) = @_;

    my $SG_IO = 0x2285;
    my $SG_GET_VERSION_NUM = 0x2282;

    my $versionbuf = "\x00" x 8;
    my $ret = ioctl($fh, $SG_GET_VERSION_NUM, $versionbuf);
    if (!$ret) {
        die "scsi ioctl SG_GET_VERSION_NUM failed - $!\n" if !$noerr;
        return undef;
    }
    my $version = unpack("I", $versionbuf);
    if ($version < 30000) {
        die "scsi generic interface too old\n" if !$noerr;
        return undef;
    }

    my $buf = "\x00" x 36;
    my $sensebuf = "\x00" x 8;
    # 6 byte command: opcode 0x12, three zero bytes, response length, zero byte
    my $cmd = pack("C x3 C x1", 0x12, 36);

    # see /usr/include/scsi/sg.h
    my $sg_io_hdr_t = "i i C C s I P P P I I i P C C C C S S i I I";

    # only the leading header fields are supplied; the "P" fields carry
    # pointers to $buf, $cmd and $sensebuf
    my $packet = pack($sg_io_hdr_t, ord('S'), -3, length($cmd),
                      length($sensebuf), 0, length($buf), $buf,
                      $cmd, $sensebuf, 6000);

    $ret = ioctl($fh, $SG_IO, $packet);
    if (!$ret) {
        die "scsi ioctl SG_IO failed - $!\n" if !$noerr;
        return undef;
    }

    my @res = unpack($sg_io_hdr_t, $packet);
    # elements 17 and 18 are the two "S" status fields of the header
    if ($res[17] || $res[18]) {
        die "scsi ioctl SG_IO status error - $!\n" if !$noerr;
        return undef;
    }

    my $res = {};
    (my $byte0, my $byte1, $res->{vendor},
     $res->{product}, $res->{revision}) = unpack("C C x6 A8 A16 A4", $buf);

    $res->{removable} = $byte1 & 128 ? 1 : 0;
    $res->{type} = $byte0 & 31;

    return $res;
}
1081
# Open $path read/write and run a SCSI INQUIRY on it.
#
# Returns the hash ref from scsi_inquiry(), or undef if the path cannot be
# opened or the inquiry fails (errors are not raised).
sub path_is_scsi {
    my ($path) = @_;

    # pass the mode as a separate argument so that whitespace or special
    # characters in $path are never interpreted as part of the open mode
    my $fh = IO::File->new($path, '+<') || return undef;
    my $res = scsi_inquiry($fh, 1);
    close($fh);

    return $res;
}
1091
db656e5f
DM
# Return 1 if the 'machine' setting of $conf contains "q35", else 0.
sub machine_type_is_q35 {
    my ($conf) = @_;

    my $machine = $conf->{machine};
    return 0 if !$machine;

    return ($machine =~ m/q35/) ? 1 : 0;
}
1097
# Build the qemu -device argument for the USB tablet. q35 machines attach
# it to the ehci bus, all other machines to the uhci bus.
sub print_tabletdevice_full {
    my ($conf) = @_;

    # we use uhci for old VMs because tablet driver was buggy in older qemu
    my $bus_name = 'uhci';
    $bus_name = 'ehci' if machine_type_is_q35($conf);

    return "usb-tablet,id=tablet,bus=${bus_name}.0,port=1";
}
1108
# Build the qemu -device argument for a parsed drive.
#
# $storecfg - storage configuration, used to resolve volume IDs to paths
# $conf     - VM configuration (scsihw and iothread are read)
# $vmid     - VM ID (not used here)
# $drive    - parsed drive hash (interface, index, file, media, bootindex)
# $bridges  - passed through to print_pci_addr()
#
# Dies for the 'usb' interface and for unknown interface types.
sub print_drivedevice_full {
    my ($storecfg, $conf, $vmid, $drive, $bridges) = @_;

    my $iface = $drive->{interface};
    my $index = $drive->{index};
    my $drive_id = "$iface$index";
    # every device references its backend drive and carries the same id
    my $ids = "drive=drive-$drive_id,id=$drive_id";

    my $device = '';

    if ($iface eq 'virtio') {
        my $pciaddr = print_pci_addr($drive_id, $bridges);
        $device = "virtio-blk-pci,$ids$pciaddr";
        $device .= ",iothread=iothread0" if $conf->{iothread};
    } elsif ($iface eq 'scsi') {
        # lsi controllers (the default) take 7 devices, other types 256
        my $non_lsi = $conf->{scsihw} && ($conf->{scsihw} !~ m/^lsi/);
        my $maxdev = $non_lsi ? 256 : 7;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;

        my $devicetype = 'hd';
        if (drive_is_cdrom($drive)) {
            $devicetype = 'cd';
        } else {
            my $file = $drive->{file};
            my $path = ($file =~ m|^/|) ? $file : PVE::Storage::path($storecfg, $file);

            if ($path =~ m/^iscsi\:\/\//) {
                $devicetype = 'generic';
            } elsif (my $info = path_is_scsi($path)) {
                if ($info->{type} == 0) {
                    $devicetype = 'block';
                } elsif ($info->{type} == 1) { # tape
                    $devicetype = 'generic';
                }
            }
        }

        if ($non_lsi) {
            $device = "scsi-$devicetype,bus=scsihw$controller.0,channel=0,scsi-id=0,lun=$index,$ids";
        } else {
            $device = "scsi-$devicetype,bus=scsihw$controller.0,scsi-id=$unit,$ids";
        }
    } elsif ($iface eq 'ide') {
        my $maxdev = 2;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;
        my $devicetype = ($drive->{media} && $drive->{media} eq 'cdrom') ? "cd" : "hd";

        $device = "ide-$devicetype,bus=ide.$controller,unit=$unit,$ids";
    } elsif ($iface eq 'sata') {
        my $controller = int($index / $MAX_SATA_DISKS);
        my $unit = $index % $MAX_SATA_DISKS;
        $device = "ide-drive,bus=ahci$controller.$unit,$ids";
    } elsif ($iface eq 'usb') {
        die "implement me";
        # -device ide-drive,bus=ide.1,unit=0,drive=drive-ide0-1-0,id=ide0-1-0
    } else {
        die "unsupported interface type";
    }

    $device .= ",bootindex=$drive->{bootindex}" if $drive->{bootindex};

    return $device;
}
1175
# Read the iSCSI initiator name from /etc/iscsi/initiatorname.iscsi.
# Returns the value of the first "InitiatorName=" line, or undef if the
# file cannot be opened or contains no such line.
sub get_initiator_name {
    my $fh = IO::File->new('/etc/iscsi/initiatorname.iscsi') || return undef;

    my $name;
    while (defined(my $line = <$fh>)) {
        if ($line =~ m/^\s*InitiatorName\s*=\s*([\.\-:\w]+)/) {
            $name = $1;
            last;
        }
    }
    $fh->close();

    return $name;
}
1189
1e3baf05
DM
# Build the qemu -drive argument for a parsed drive.
#
# $storecfg - storage configuration, used to resolve volume IDs to paths
# $vmid     - VM ID, passed to get_iso_path() for cdrom drives
# $drive    - parsed drive hash
#
# Defaults added here: aio=native when no aio mode is set and, for
# non-cdrom drives, cache=none when no cache mode is set.
sub print_drive_full {
    my ($storecfg, $vmid, $drive) = @_;

    my $opts = '';
    foreach my $o (@qemu_drive_options) {
        $opts .= ",$o=$drive->{$o}" if $drive->{$o};
    }

    # limits are kept in MB/s in the configuration and passed on in bytes/s
    foreach my $o (qw(bps bps_rd bps_wr)) {
        my $v = $drive->{"m$o"};
        $opts .= ",$o=" . int($v*1024*1024) if $v;
    }

    # use linux-aio by default (qemu default is threads)
    $opts .= ",aio=native" if !$drive->{aio};

    my $is_cdrom = drive_is_cdrom($drive);

    my $path;
    my $volid = $drive->{file};
    if ($is_cdrom) {
        $path = get_iso_path($storecfg, $vmid, $volid);
    } else {
        if ($volid =~ m|^/|) {
            $path = $volid;
        } else {
            $path = PVE::Storage::path($storecfg, $volid);
        }
    }

    if (!$is_cdrom) {
        $opts .= ",cache=none" if !$drive->{cache};

        # 'unmap' is only valid when discard is really enabled; with
        # discard=ignore zero writes are still detected, but not unmapped
        my $discard_on = $drive->{discard} && $drive->{discard} eq 'on';
        my $detectzeroes = $discard_on ? "unmap" : "on";
        $opts .= ",detect-zeroes=$detectzeroes";
    }

    my $pathinfo = $path ? "file=$path," : '';

    return "${pathinfo}if=none,id=drive-$drive->{interface}$drive->{index}$opts";
}
1228
# Build the qemu -device argument for a network card.
#
# $vmid    - VM ID (not used here)
# $conf    - VM configuration; 'boot' decides whether the pxe rom is loaded
# $net     - parsed network hash (model, macaddr, queues, bootindex)
# $netid   - device id such as "net0"
# $bridges - passed through to print_pci_addr()
sub print_netdevice_full {
    my ($vmid, $conf, $net, $netid, $bridges) = @_;

    my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};

    my $is_virtio = $net->{model} eq 'virtio';
    my $device = $is_virtio ? 'virtio-net-pci' : $net->{model};

    # qemu > 0.15 always try to boot from network - we disable that by
    # not loading the pxe rom file
    my $extra = ($bootorder =~ m/n/) ? '' : "romfile=,";
    my $pciaddr = print_pci_addr("$netid", $bridges);

    my @parts = ("$device,${extra}mac=$net->{macaddr},netdev=$netid$pciaddr,id=$netid");

    if ($net->{queues} && $net->{queues} > 1 && $is_virtio) {
        #Consider we have N queues, the number of vectors needed is 2*N + 2 (plus one config interrupt and control vq)
        my $vectors = $net->{queues} * 2 + 2;
        push @parts, "vectors=$vectors,mq=on";
    }

    push @parts, "bootindex=$net->{bootindex}" if $net->{bootindex};

    return join(',', @parts);
}
1252
# Build the qemu -netdev argument for a network card.
#
# $vmid  - VM ID, part of the tap interface name
# $conf  - VM configuration; 'name' is used as hostname for user networking
# $net   - parsed network hash (bridge, model, queues)
# $netid - device id, has to look like "net<N>" with N below $MAX_NETS
#
# Dies if $netid is malformed or out of range, or if the resulting tap
# interface name is too long.
sub print_netdev_full {
    my ($vmid, $conf, $net, $netid) = @_;

    # reject ids without an index right away instead of generating an
    # interface name with an empty index
    die "got strange net id '$netid'\n" if $netid !~ m/^net(\d+)$/;
    my $i = int($1);

    die "got strange net id '$i'\n" if $i >= ${MAX_NETS};

    my $ifname = "tap${vmid}i$i";

    # kvm uses TUNSETIFF ioctl, and that limits ifname length
    die "interface name '$ifname' is too long (max 15 character)\n"
        if length($ifname) >= 16;

    my $vhostparam = '';
    $vhostparam = ',vhost=on' if $kernel_has_vhost_net && $net->{model} eq 'virtio';

    my $vmname = $conf->{name} || "vm$vmid";

    my $netdev = "";

    if ($net->{bridge}) {
        $netdev = "type=tap,id=$netid,ifname=${ifname},script=/var/lib/qemu-server/pve-bridge,downscript=/var/lib/qemu-server/pve-bridgedown$vhostparam";
    } else {
        $netdev = "type=user,id=$netid,hostname=$vmname";
    }

    $netdev .= ",queues=$net->{queues}" if ($net->{queues} && $net->{model} eq 'virtio');

    return $netdev;
}
1e3baf05
DM
1286
# True if $drive is defined and its media type is 'cdrom'.
sub drive_is_cdrom {
    my ($drive) = @_;

    my $media = $drive && $drive->{media};

    return $media && ($media eq 'cdrom');
}
1293
2ed5d572
AD
# Parse a numa property string with the options memory=<value>,
# policy=preferred|bind|interleave, cpus=<n>[-<m>] and hostnodes=<n>[-<m>].
#
# Returns a hash ref; cpus and hostnodes are stored as { start, end } with
# end left undef when no range was given. Returns undef on any other option.
sub parse_numa {
    my ($data) = @_;

    my $numa = {};

    for my $item (split(/,/, $data)) {
        if ($item =~ m/^memory=(\S+)$/) {
            $numa->{memory} = $1;
        } elsif ($item =~ m/^policy=(preferred|bind|interleave)$/) {
            $numa->{policy} = $1;
        } elsif ($item =~ m/^(cpus|hostnodes)=(\d+)(-(\d+))?$/) {
            $numa->{$1} = { start => $2, end => $4 };
        } else {
            return undef;
        }
    }

    return $numa;
}
1318
040b06b7
DA
# Parse a hostpci property string.
#
# Devices are given as "[host=]bus:slot[.function]". With a function the
# entry is appended to {pciid}; without one {pciid} is taken from the
# lspci() result for that address. Further options are driver=kvm|vfio,
# rombar=on|off, x-vga=on|off and pcie=<n> (only pcie=1 is stored).
# Unknown options only produce a warning.
#
# Returns the hash ref, or undef if the value is empty or names no device.
sub parse_hostpci {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};
    my $seen_device = 0;

    foreach my $kv (split(/,/, $value)) {
        if ($kv =~ m/^(host=)?([a-f0-9]{2}:[a-f0-9]{2})(\.([a-f0-9]))?$/) {
            my ($id, $function) = ($2, $4);
            $seen_device = 1;
            if (defined($function)) {
                push @{$res->{pciid}}, { id => $id, function => $function };
            } else {
                my $pcidevices = lspci($id);
                $res->{pciid} = $pcidevices->{$id};
            }
        } elsif ($kv =~ m/^(driver)=(kvm|vfio)$/ || $kv =~ m/^(rombar|x-vga)=(on|off)$/) {
            $res->{$1} = $2;
        } elsif ($kv =~ m/^pcie=(\d+)$/) {
            $res->{pcie} = 1 if $1 == 1;
        } else {
            warn "unknown hostpci setting '$kv'\n";
        }
    }

    return undef if !$seen_device;

    return $res;
}
1357
1e3baf05
DM
1358# netX: e1000=XX:XX:XX:XX:XX:XX,bridge=vmbr0,rate=<mbps>
# Parse a network property string: "<model>[=<mac>]" followed by the
# optional settings bridge, queues, rate, tag and firewall.
#
# The model is stored lower case and the MAC address upper case; a random
# MAC address is generated when none is given. Returns the hash ref, or
# undef if an option is invalid or no model was specified.
sub parse_net {
    my ($data) = @_;

    my $net = {};

    for my $item (split(/,/, $data)) {
        if ($item =~ m/^(ne2k_pci|e1000|rtl8139|pcnet|virtio|ne2k_isa|i82551|i82557b|i82559er|vmxnet3)(=([0-9a-f]{2}(:[0-9a-f]{2}){5}))?$/i) {
            $net->{model} = lc($1);
            $net->{macaddr} = defined($3) ? uc($3) : PVE::Tools::random_ether_addr();
        } elsif ($item =~ m/^(bridge)=(\S+)$/
                 || $item =~ m/^(queues|tag|firewall)=(\d+)$/
                 || $item =~ m/^(rate)=(\d+(\.\d+)?)$/) {
            # whichever pattern matched left the name in $1 and the value in $2
            $net->{$1} = $2;
        } else {
            return undef;
        }
    }

    return undef if !$net->{model};

    return $net;
}
1391
# Build the configuration file representation of a parsed network hash
# (the counterpart of parse_net). Only settings with a true value are
# written.
sub print_net {
    my $net = shift;

    my $res = "$net->{model}";
    $res .= "=$net->{macaddr}" if $net->{macaddr};
    $res .= ",bridge=$net->{bridge}" if $net->{bridge};
    $res .= ",rate=$net->{rate}" if $net->{rate};
    $res .= ",tag=$net->{tag}" if $net->{tag};
    $res .= ",firewall=$net->{firewall}" if $net->{firewall};
    # parse_net accepts 'queues', so it has to survive a parse/print round trip
    $res .= ",queues=$net->{queues}" if $net->{queues};

    return $res;
}
1404
# Rewrite every parsable net<N> entry of $settings (in place) through
# parse_net() and print_net(), which assigns a MAC address to entries that
# do not specify one. Entries that cannot be parsed are left untouched.
sub add_random_macs {
    my ($settings) = @_;

    my @net_opts = grep { m/^net(\d+)$/ } keys %$settings;

    foreach my $opt (@net_opts) {
        my $net = parse_net($settings->{$opt});
        $settings->{$opt} = print_net($net) if $net;
    }
}
1415
# Record $volid under the lowest free unused<N> key of $config.
#
# Returns the key that was used. Returns nothing (and changes nothing) if
# a slot examined during the search already holds $volid. Dies when all
# $MAX_UNUSED_DISKS slots are occupied.
sub add_unused_volume {
    my ($config, $volid) = @_;

    my $free_slot;
    # walk from the highest index down, so the last free slot seen is the lowest
    foreach my $idx (reverse(0 .. $MAX_UNUSED_DISKS - 1)) {
        my $slot = "unused$idx";
        my $existing = $config->{$slot};
        if (!$existing) {
            $free_slot = $slot;
            next;
        }
        return if $existing eq $volid; # do not add duplicates
    }

    die "To many unused volume - please delete them first.\n" if !$free_slot;

    $config->{$free_slot} = $volid;

    return $free_slot;
}
1435
055d554d
DM
# Return 1 if the storage layer reports $vmid as owner of volume $volid.
# Absolute paths are never owned; errors while resolving the volume are
# ignored and treated as "not owned". Returns undef otherwise.
sub vm_is_volid_owner {
    my ($storecfg, $vmid, $volid) = @_;

    return undef if $volid =~ m|^/|;

    my ($path, $owner);
    eval { ($path, $owner) = PVE::Storage::path($storecfg, $volid); };

    return 1 if $owner && ($owner == $vmid);

    return undef;
}
1449
# Mark option $key for deletion: drop a pending new value for it and add it
# to the comma separated list in $conf->{pending}->{delete} (each option is
# listed once).
sub vmconfig_delete_pending_option {
    my ($conf, $key) = @_;

    delete $conf->{pending}->{$key};

    my %to_delete = map { $_ => 1 }
        ($key, PVE::Tools::split_list($conf->{pending}->{delete}));

    $conf->{pending}->{delete} = join(',', keys %to_delete);
}
1460
# Remove option $key from the list in $conf->{pending}->{delete}. The
# 'delete' entry itself is removed when the list becomes empty.
sub vmconfig_undelete_pending_option {
    my ($conf, $key) = @_;

    my %remaining = map { $_ => 1 } PVE::Tools::split_list($conf->{pending}->{delete});
    delete $remaining{$key};

    my @keep = keys %remaining;
    if (@keep) {
        $conf->{pending}->{delete} = join(',', @keep);
    } else {
        delete $conf->{pending}->{delete};
    }
}
1477
# Add the volume of $drive to the unused<N> entries of $conf, provided the
# drive is not a cdrom and the volume is owned by VM $vmid.
sub vmconfig_register_unused_drive {
    my ($storecfg, $vmid, $conf, $drive) = @_;

    if (!drive_is_cdrom($drive)) {
        my $volume = $drive->{file};
        add_unused_volume($conf, $volume, $vmid)
            if vm_is_volid_owner($storecfg, $vmid, $volume);
    }
}
1488
c750e90a
DM
# Drop entries from $conf->{pending} that would not change anything:
# pending values equal to the current value, and pending deletions of
# options that are not set. Returns 1 if something was removed, else undef.
sub vmconfig_cleanup_pending {
    my ($conf) = @_;

    my $changes;

    # remove pending changes when nothing changed
    foreach my $opt (keys %{$conf->{pending}}) {
        next if !defined($conf->{$opt});
        next if $conf->{pending}->{$opt} ne $conf->{$opt};
        delete $conf->{pending}->{$opt};
        $changes = 1;
    }

    # remove delete if option is not set
    my %still_set;
    foreach my $opt (PVE::Tools::split_list($conf->{pending}->{delete})) {
        if (defined($conf->{$opt})) {
            $still_set{$opt} = 1;
        } else {
            $changes = 1;
        }
    }

    my @keylist = keys %still_set;
    if (@keylist) {
        $conf->{pending}->{delete} = join(',', @keylist);
    } else {
        delete $conf->{pending}->{delete};
    }

    return $changes;
}
1520
2796e7d5
DM
# Allowed smbios type 1 options, each mapped to the regular expression
# (as a string) that its complete value has to match.
my $valid_smbios1_options = {
    manufacturer => '\S+',
    product => '\S+',
    version => '\S+',
    serial => '\S+',
    uuid => '[a-fA-F0-9]{8}(?:-[a-fA-F0-9]{4}){3}-[a-fA-F0-9]{12}',
    sku => '\S+',
    family => '\S+',
};

# smbios: [manufacturer=str][,product=str][,version=str][,serial=str][,uuid=uuid][,sku=str][,family=str]
#
# Parse an smbios1 property string into a hash ref of option => value.
# Returns undef if an option is unknown or its value does not match the
# pattern in $valid_smbios1_options.
sub parse_smbios1 {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        return undef if $kvp !~ m/^(\S+)=(.+)$/;
        # split at the first '=' only, so that a value containing '=' is
        # kept complete instead of being cut off
        my ($k, $v) = split(/=/, $kvp, 2);
        return undef if !defined($k) || !defined($v);
        my $pattern = $valid_smbios1_options->{$k};
        return undef if !$pattern;
        return undef if $v !~ m/^$pattern$/;
        $res->{$k} = $v;
    }

    return $res;
}
1548
cd11416f
DM
# Build the smbios1 property string from a hash ref. Options with an
# undefined value and options not listed in $valid_smbios1_options are
# left out.
sub print_smbios1 {
    my ($smbios1) = @_;

    my @printable = grep {
        defined($smbios1->{$_}) && $valid_smbios1_options->{$_}
    } keys %$smbios1;

    return join(',', map { "$_=$smbios1->{$_}" } @printable);
}
1561
2796e7d5
DM
PVE::JSONSchema::register_format('pve-qm-smbios1', \&verify_smbios1);

# Format check for 'pve-qm-smbios1': returns $value if parse_smbios1()
# accepts it. Otherwise returns undef when $noerr is set, else dies.
sub verify_smbios1 {
    my ($value, $noerr) = @_;

    if (!parse_smbios1($value)) {
        return undef if $noerr;
        die "unable to parse smbios (type 1) options\n";
    }

    return $value;
}
1572
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-bootdisk', \&verify_bootdisk);

# Format check for 'pve-qm-bootdisk': returns $value if valid_drivename()
# accepts it. Otherwise returns undef when $noerr is set, else dies.
sub verify_bootdisk {
    my ($value, $noerr) = @_;

    if (!valid_drivename($value)) {
        return undef if $noerr;
        die "invalid boot disk '$value'\n";
    }

    return $value;
}
1583
2ed5d572
AD
PVE::JSONSchema::register_format('pve-qm-numanode', \&verify_numa);

# Format check for 'pve-qm-numanode': returns $value if parse_numa()
# accepts it. Otherwise returns undef when $noerr is set, else dies.
sub verify_numa {
    my ($value, $noerr) = @_;

    if (!parse_numa($value)) {
        return undef if $noerr;
        die "unable to parse numa options\n";
    }

    return $value;
}
1594
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-net', \&verify_net);

# Format check for 'pve-qm-net': returns $value if parse_net() accepts it.
# Otherwise returns undef when $noerr is set, else dies.
sub verify_net {
    my ($value, $noerr) = @_;

    if (!parse_net($value)) {
        return undef if $noerr;
        die "unable to parse network options\n";
    }

    return $value;
}
1605
PVE::JSONSchema::register_format('pve-qm-drive', \&verify_drive);

# Format check for 'pve-qm-drive': returns $value if parse_drive() accepts
# it (called without a key, as the option name is not known here).
# Otherwise returns undef when $noerr is set, else dies.
sub verify_drive {
    my ($value, $noerr) = @_;

    if (!parse_drive(undef, $value)) {
        return undef if $noerr;
        die "unable to parse drive options\n";
    }

    return $value;
}
1616
PVE::JSONSchema::register_format('pve-qm-hostpci', \&verify_hostpci);

# Format check for 'pve-qm-hostpci': returns $value if parse_hostpci()
# accepts it. Otherwise returns undef when $noerr is set, else dies.
sub verify_hostpci {
    my ($value, $noerr) = @_;

    if (!parse_hostpci($value)) {
        return undef if $noerr;
        die "unable to parse pci id\n";
    }

    return $value;
}
1627
0ea9541d
DM
PVE::JSONSchema::register_format('pve-qm-watchdog', \&verify_watchdog);

# Format check for 'pve-qm-watchdog': returns $value if parse_watchdog()
# accepts it. Otherwise returns undef when $noerr is set, else dies.
sub verify_watchdog {
    my ($value, $noerr) = @_;

    if (!parse_watchdog($value)) {
        return undef if $noerr;
        die "unable to parse watchdog options\n";
    }

    return $value;
}
1638
# Parse a watchdog property string: "[model=]i6300esb|ib700" and
# "[action=]reset|shutdown|poweroff|pause|debug|none", comma separated.
# Returns a hash ref with the keys found, or undef if the value is empty
# or contains anything else.
sub parse_watchdog {
    my ($value) = @_;

    return undef if !$value;

    my $watchdog = {};

    for my $part (split(/,/, $value)) {
        next if $part =~ m/^\s*$/;

        if ($part =~ m/^(?:model=)?(i6300esb|ib700)$/) {
            $watchdog->{model} = $1;
        } elsif ($part =~ m/^(?:action=)?(reset|shutdown|poweroff|pause|debug|none)$/) {
            $watchdog->{action} = $1;
        } else {
            return undef;
        }
    }

    return $watchdog;
}
1660
59411c4e
DM
PVE::JSONSchema::register_format('pve-qm-startup', \&verify_startup);

# Format check for 'pve-qm-startup': returns $value if parse_startup()
# accepts it. Otherwise returns undef when $noerr is set, else dies.
sub verify_startup {
    my ($value, $noerr) = @_;

    if (!parse_startup($value)) {
        return undef if $noerr;
        die "unable to parse startup options\n";
    }

    return $value;
}
1671
# Parse a startup property string: "[order=]<n>", "up=<n>" and "down=<n>",
# comma separated. Returns a hash ref with the keys found, or undef if the
# value is empty or contains anything else.
sub parse_startup {
    my ($value) = @_;

    return undef if !$value;

    my $startup = {};

    for my $part (split(/,/, $value)) {
        next if $part =~ m/^\s*$/;

        if ($part =~ m/^(?:order=)?(\d+)$/) {
            $startup->{order} = $1;
        } elsif ($part =~ m/^(up|down)=(\d+)$/) {
            $startup->{$1} = $2;
        } else {
            return undef;
        }
    }

    return $startup;
}
1695
1e3baf05
DM
# Parse a usb device property string. Accepted entries are
# "host=<vendorid>:<productid>" (four hex digits each, optional 0x prefix),
# "host=<bus>-<port>[.<port>...]" and "spice".
#
# Returns a hash ref with vendorid/productid, hostbus/hostport and/or
# spice, or undef if the value is empty or contains anything else.
sub parse_usb_device {
    my ($value) = @_;

    return undef if !$value;

    my $usb = {};
    my $seen_device = 0;

    for my $entry (split(/,/, $value)) {
        if ($entry =~ m/^host=(?:0x)?([0-9A-Fa-f]{4}):(?:0x)?([0-9A-Fa-f]{4})$/) {
            ($usb->{vendorid}, $usb->{productid}) = ($1, $2);
        } elsif ($entry =~ m/^host=(\d+)\-(\d+(\.\d+)*)$/) {
            ($usb->{hostbus}, $usb->{hostport}) = ($1, $2);
        } elsif ($entry =~ m/^spice$/) {
            $usb->{spice} = 1;
        } else {
            return undef;
        }
        $seen_device = 1;
    }

    return undef if !$seen_device;

    return $usb;
}
19672434 1725
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-usb-device', \&verify_usb_device);

# Format check for 'pve-qm-usb-device': returns $value if
# parse_usb_device() accepts it. Otherwise returns undef when $noerr is
# set, else dies.
sub verify_usb_device {
    my ($value, $noerr) = @_;

    if (!parse_usb_device($value)) {
        return undef if $noerr;
        die "unable to parse usb device\n";
    }

    return $value;
}
1736
1e3baf05
DM
1737# add JSON properties for create and set function
# Copy all option descriptions from $confdesc into the hash ref $prop,
# except 'parent', 'snaptime' and 'vmstate'. Returns $prop.
sub json_config_properties {
    my $prop = shift;

    my %skip = map { $_ => 1 } qw(parent snaptime vmstate);

    foreach my $opt (grep { !$skip{$_} } keys %$confdesc) {
        $prop->{$opt} = $confdesc->{$opt};
    }

    return $prop;
}
1748
# Check $value against the type (and, for strings, the format) declared
# for option $key in $confdesc and return the normalized value:
# booleans become 1 or 0, integers are numified, and plain strings lose
# one pair of surrounding double quotes.
#
# Dies for unknown options, undefined values, values containing a line
# break, and values that fail the type or format check.
sub check_type {
    my ($key, $value) = @_;

    my $desc = $confdesc->{$key};
    die "unknown setting '$key'\n" if !$desc;

    my $type = $desc->{type};

    die "got undefined value\n" if !defined($value);

    die "property contains a line feed\n" if $value =~ m/[\n\r]/;

    if ($type eq 'boolean') {
        return 1 if ($value eq '1') || ($value =~ m/^(on|yes|true)$/i);
        return 0 if ($value eq '0') || ($value =~ m/^(off|no|false)$/i);
        die "type check ('boolean') failed - got '$value'\n";
    }

    if ($type eq 'integer') {
        return int($1) if $value =~ m/^(\d+)$/;
        die "type check ('integer') failed - got '$value'\n";
    }

    if ($type eq 'number') {
        return $value if $value =~ m/^(\d+)(\.\d+)?$/;
        die "type check ('number') failed - got '$value'\n";
    }

    if ($type ne 'string') {
        die "internal error"
    }

    my $fmt = $desc->{format};
    if (!$fmt) {
        $value =~ s/^\"(.*)\"$/$1/;
        return $value;
    }

    if ($fmt eq 'pve-qm-drive') {
        # special case - we need to pass $key to parse_drive()
        return $value if parse_drive($key, $value);
        die "unable to parse drive options\n";
    }

    PVE::JSONSchema::check_format($fmt, $value);

    return $value;
}
1791
191435c6
DM
# Run $code with @param through lock_file() on the lock file of VM $vmid,
# using the given $timeout. Returns what lock_file() returned; an error
# left in $@ is thrown again.
sub lock_config_full {
    my ($vmid, $timeout, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);

    my $result = lock_file($lockfile, $timeout, $code, @param);

    if (my $err = $@) {
        die $err;
    }

    return $result;
}
1803
4e4f83fe
DM
# Like lock_config_full(), but uses lock_file_full() and passes the
# $shared flag on to it. Returns what lock_file_full() returned; an error
# left in $@ is thrown again.
sub lock_config_mode {
    my ($vmid, $timeout, $shared, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);

    my $result = lock_file_full($lockfile, $timeout, $shared, $code, @param);

    if (my $err = $@) {
        die $err;
    }

    return $result;
}
1815
191435c6
DM
# Run $code with @param under the config lock of VM $vmid, using a timeout
# value of 10.
sub lock_config {
    my ($vmid, $code, @param) = @_;

    my $timeout = 10;

    return lock_config_full($vmid, $timeout, $code, @param);
}
1821
# Return the cluster file system path (relative, without leading slash) of
# the configuration of VM $vmid on $node. $node defaults to $nodename.
sub cfs_config_path {
    my ($vmid, $node) = @_;

    $node ||= $nodename;

    return "nodes/$node/qemu-server/$vmid.conf";
}
1828
040b06b7
DA
# Placeholder: always reports IOMMU support (returns 1).
sub check_iommu_support{
    #fixme : need to check IOMMU support
    #http://www.linux-kvm.org/page/How_to_assign_devices_with_VT-d_in_KVM

    return 1;
}
1837
# Return the absolute path below /etc/pve of the configuration file of VM
# $vmid on $node (see cfs_config_path() for the default node).
sub config_file {
    my ($vmid, $node) = @_;

    return "/etc/pve/" . cfs_config_path($vmid, $node);
}
1844
# Return the path of the lock file for VM $vmid inside $lock_dir.
sub config_file_lock {
    my ($vmid) = @_;

    my $lockfile = "$lock_dir/lock-$vmid.conf";

    return $lockfile;
}
1850
# Set access and modification time of the configuration file of VM $vmid
# to the current time.
sub touch_config {
    my ($vmid) = @_;

    my $conf_path = config_file($vmid);

    utime(undef, undef, $conf_path);
}
1857
# Destroy VM $vmid: free its disks and remove its configuration file.
#
# $storecfg          - storage configuration
# $vmid              - ID of the VM
# $keep_empty_config - when true, the configuration file is replaced by a
#                      minimal one ("memory: 128") instead of being removed
#
# Dies if the configuration cannot be loaded, if check_lock() rejects it,
# or if freeing a configured disk fails. Errors while removing the
# remaining volumes afterwards are only reported as warnings.
sub destroy_vm {
    my ($storecfg, $vmid, $keep_empty_config) = @_;

    my $conffile = config_file($vmid);

    my $conf = load_config($vmid);

    check_lock($conf);

    # only remove disks owned by this VM
    my $free_owned_disk = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};

        # absolute paths are not managed by the storage layer
        return if !$volid || $volid =~ m|^/|;

        my ($path, $owner) = PVE::Storage::path($storecfg, $volid);
        return if !$path || !$owner || ($owner != $vmid);

        PVE::Storage::vdisk_free($storecfg, $volid);
    };
    foreach_drive($conf, $free_owned_disk);

    if ($keep_empty_config) {
        PVE::Tools::file_set_contents($conffile, "memory: 128\n");
    } else {
        unlink $conffile;
    }

    # also remove unused disk
    eval {
        my $dl = PVE::Storage::vdisk_list($storecfg, undef, $vmid);

        PVE::Storage::foreach_volid($dl, sub {
            my ($volid, $sid, $volname, $d) = @_;
            PVE::Storage::vdisk_free($storecfg, $volid);
        });
    };
    warn $@ if $@;
}
1904
# Read and return the configuration of VM $vmid on $node through
# PVE::Cluster::cfs_read_file(). Dies if no configuration is returned.
sub load_config {
    my ($vmid, $node) = @_;

    my $path = cfs_config_path($vmid, $node);

    my $conf = PVE::Cluster::cfs_read_file($path);

    if (!defined($conf)) {
        die "no such VM ('$vmid')\n";
    }

    return $conf;
}
1e3baf05
DM
1916
# Parse the raw text of a VM configuration file.
#
# Arguments:
#   $filename - path of the file; it must end in '/qemu-server/<vmid>.conf',
#               the VMID is extracted from it (dies otherwise)
#   $raw      - file content, or undef
#
# Returns undef if $raw is undef. Otherwise returns a hash with the settings
# of the leading (current) section at top level plus:
#   digest    - SHA1 hex digest of $raw
#   pending   - settings found in the [PENDING] section
#   snapshots - { <name> => settings } for every other [<name>] section
#
# Values that fail validation are reported with warn() and skipped; lines
# that match none of the known patterns are ignored silently.
sub parse_vm_config {
    my ($filename, $raw) = @_;

    return undef if !defined($raw);

    my $res = {
        digest => Digest::SHA::sha1_hex($raw),
        snapshots => {},
        pending => {},
    };

    $filename =~ m|/qemu-server/(\d+)\.conf$|
        || die "got strange filename '$filename'";

    my $vmid = $1;

    # $conf always points to the hash of the section currently being parsed
    my $conf = $res;
    my $descr = '';
    my $section = '';

    my @lines = split(/\n/, $raw);
    foreach my $line (@lines) {
        next if $line =~ m/^\s*$/;

        if ($line =~ m/^\[PENDING\]\s*$/i) {
            $section = 'pending';
            # a section header closes the previous section: flush its description
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{$section} = {};
            next;

        } elsif ($line =~ m/^\[([a-z][a-z0-9_\-]+)\]\s*$/i) {
            $section = $1;
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{snapshots}->{$section} = {};
            next;
        }

        # comment lines are collected as (multi line) description
        if ($line =~ m/^\#(.*)\s*$/) {
            $descr .= PVE::Tools::decode_text($1) . "\n";
            next;
        }

        if ($line =~ m/^(description):\s*(.*\S)\s*$/) {
            $descr .= PVE::Tools::decode_text($2);
        } elsif ($line =~ m/^snapstate:\s*(prepare|delete)\s*$/) {
            # Anchored at line start: without '^' an 'args:' line that merely
            # ends in "snapstate: delete" was taken for a snapstate setting
            # and the args value was lost.
            $conf->{snapstate} = $1;
        } elsif ($line =~ m/^(args):\s*(.*\S)\s*$/) {
            # args may contain white space, so it is stored unchecked
            my $key = $1;
            my $value = $2;
            $conf->{$key} = $value;
        } elsif ($line =~ m/^delete:\s*(.*\S)\s*$/) {
            my $value = $1;
            if ($section eq 'pending') {
                $conf->{delete} = $value; # we parse this later
            } else {
                warn "vm $vmid - propertry 'delete' is only allowed in [PENDING]\n";
            }
        } elsif ($line =~ m/^([a-z][a-z_]*\d*):\s*(\S+)\s*$/) {
            my $key = $1;
            my $value = $2;
            eval { $value = check_type($key, $value); };
            if ($@) {
                warn "vm $vmid - unable to parse value of '$key' - $@";
            } else {
                my $fmt = $confdesc->{$key}->{format};
                if ($fmt && $fmt eq 'pve-qm-drive') {
                    # normalize the drive's file name into a volume ID
                    my $v = parse_drive($key, $value);
                    if (my $volid = filename_to_volume_id($vmid, $v->{file}, $v->{media})) {
                        $v->{file} = $volid;
                        $value = print_drive($vmid, $v);
                    } else {
                        warn "vm $vmid - unable to parse value of '$key'\n";
                        next;
                    }
                }

                # 'cdrom' is stored as 'ide2'
                if ($key eq 'cdrom') {
                    $conf->{ide2} = $value;
                } else {
                    $conf->{$key} = $value;
                }
            }
        }
    }

    # flush the description of the last section
    $conf->{description} = $descr if $descr;

    delete $res->{snapstate}; # just to be sure

    return $res;
}
2010
1858638f
DM
# Turn the configuration hash $conf into the raw text of a VM config file.
#
# $filename is part of the writer interface but is not used here.
# $conf is normalized in place before it is serialized (legacy 'cdrom' and
# 'smp' keys are converted, values are replaced by their checked form and
# 'unusedX' entries for volumes that are in use again are dropped).
#
# Dies if a value does not pass check_type() or if 'delete' shows up outside
# of the pending section. Returns the generated text.
sub write_vm_config {
    my ($filename, $conf) = @_;

    delete $conf->{snapstate}; # just to be sure

    # legacy alias: 'cdrom' is written as 'ide2'
    if ($conf->{cdrom}) {
        die "option ide2 conflicts with cdrom\n" if $conf->{ide2};
        $conf->{ide2} = delete $conf->{cdrom};
    }

    # we do not use 'smp' any longer
    if (!$conf->{sockets} && $conf->{smp}) {
        $conf->{sockets} = $conf->{smp};
        delete $conf->{cores};
    }
    delete $conf->{smp} if $conf->{sockets};

    delete $conf->{sockets} if $conf->{maxcpus} && $conf->{sockets};

    # volumes referenced by drives of the current and the pending section
    my $used_volids = {};

    # keys which are no ordinary settings and are never type checked
    my %meta_key = map { $_ => 1 } qw(digest description snapshots snapstate pending);

    my $check_section = sub {
        my ($section, $is_pending, $snapname) = @_;

        foreach my $key (keys %$section) {
            next if $meta_key{$key};

            if ($key eq 'delete') {
                die "propertry 'delete' is only allowed in [PENDING]\n"
                    if !$is_pending;
                # fixme: check syntax?
                next;
            }

            my $value = $section->{$key};
            eval { $value = check_type($key, $value); };
            die "unable to parse value of '$key' - $@" if $@;

            $section->{$key} = $value;

            # drives inside snapshots do not count as "in use"
            next if $snapname || !valid_drivename($key);

            my $drive = parse_drive($key, $value);
            $used_volids->{$drive->{file}} = 1 if $drive && $drive->{file};
        }
    };

    $check_section->($conf);

    $check_section->($conf->{pending}, 1);

    foreach my $snapname (keys %{$conf->{snapshots}}) {
        die "internal error" if $snapname eq 'pending';
        $check_section->($conf->{snapshots}->{$snapname}, undef, $snapname);
    }

    # remove 'unusedX' settings if we re-add a volume
    my @readded = grep {
        $_ =~ m/^unused/ && $used_volids->{$conf->{$_}}
    } keys %$conf;
    delete @{$conf}{@readded};

    my $format_section = sub {
        my ($section) = @_;

        # the description goes to the top of the section, one comment per line
        my $descr = $section->{description} || '';
        my $text = join('', map {
            '#' . PVE::Tools::encode_text($_) . "\n"
        } split(/\n/, $descr));

        foreach my $key (sort keys %$section) {
            next if $key eq 'digest' || $key eq 'description' || $key eq 'pending' || $key eq 'snapshots';
            $text .= "$key: $section->{$key}\n";
        }

        return $text;
    };

    my $raw = $format_section->($conf);

    if (scalar(keys %{$conf->{pending}})) {
        $raw .= "\n[PENDING]\n";
        $raw .= $format_section->($conf->{pending});
    }

    foreach my $snapname (sort keys %{$conf->{snapshots}}) {
        $raw .= "\n[$snapname]\n";
        $raw .= $format_section->($conf->{snapshots}->{$snapname});
    }

    return $raw;
}
1e3baf05 2111
1858638f
DM
# Write $conf as the configuration of VM $vmid without taking the config
# file lock; the caller is expected to hold it. Unless $skiplock is set the
# 'lock' setting inside $conf is honored via check_lock().
sub update_config_nolock {
    my ($vmid, $conf, $skiplock) = @_;

    if (!$skiplock) {
        check_lock($conf);
    }

    my $path = cfs_config_path($vmid);

    PVE::Cluster::cfs_write_file($path, $conf);
}
1e3baf05 2121
1858638f
DM
# Write $conf as the configuration of VM $vmid while holding the config
# file lock. Unless $skiplock is set, a 'lock' setting in $conf aborts the
# update (see update_config_nolock).
sub update_config {
    my ($vmid, $conf, $skiplock) = @_;

    # Hand over a code reference. The former '&update_config_nolock' (no
    # backslash, no parentheses) called the function right away with our @_,
    # i.e. outside of the lock, and passed its return value to lock_config
    # as the code to run.
    lock_config($vmid, sub {
        update_config_nolock($vmid, $conf, $skiplock);
    });
}
2127
# Build a hash with the default value of every option that declares one in
# $confdesc. The keyboard layout is overridden by the 'keyboard' setting of
# datacenter.cfg when that is set.
sub load_defaults {

    my $res = {};

    # we use static defaults from our JSON schema configuration
    foreach my $key (keys %$confdesc) {
        my $default = $confdesc->{$key}->{default};
        next if !defined($default);
        $res->{$key} = $default;
    }

    my $dc_conf = PVE::Cluster::cfs_read_file('datacenter.cfg');
    if ($dc_conf->{keyboard}) {
        $res->{keyboard} = $dc_conf->{keyboard};
    }

    return $res;
}
2144
# Return { <vmid> => { exists => 1 } } for every entry of the cluster wide
# VM list which is of type 'qemu' and located on node $nodename.
sub config_list {
    my $vmlist = PVE::Cluster::get_vmlist();

    my $res = {};
    return $res if !$vmlist || !$vmlist->{ids};

    my $ids = $vmlist->{ids};

    foreach my $vmid (keys %$ids) {
        my $entry = $ids->{$vmid};

        my $on_this_node = $entry->{node} && $entry->{node} eq $nodename;
        next if !$on_this_node;

        my $is_qemu = $entry->{type} && $entry->{type} eq 'qemu';
        next if !$is_qemu;

        $res->{$vmid}->{exists} = 1;
    }

    return $res;
}
2159
64e13401
DM
# Test if the VM uses local resources (to prevent migration).
#
# Local resources are usbN (unless set to 'spice'), hostpciN, serialN and
# parallelN settings, plus the old style 'hostusb' and 'hostpci' keys.
# Returns 1 if such a resource is configured, else 0. Dies instead of
# returning 1 unless $noerr is set.
sub check_local_resources {
    my ($conf, $noerr) = @_;

    # old syntax
    my $loc_res = ($conf->{hostusb} || $conf->{hostpci}) ? 1 : 0;

    foreach my $key (keys %$conf) {
        # usb devices redirected through spice are not bound to this host
        next if $key =~ m/^usb/ && ($conf->{$key} eq 'spice');

        if ($key =~ m/^(usb|hostpci|serial|parallel)\d+$/) {
            $loc_res = 1;
        }
    }

    if ($loc_res && !$noerr) {
        die "VM uses local resources\n";
    }

    return $loc_res;
}
2178
# Check if the storages used by the VM are available on all nodes (used by
# migrate).
#
# For every drive of $conf whose file parses as a volume ID,
# PVE::Storage::storage_check_node() is called once without a node argument
# and once for $node. Drives without a storage ID are skipped. Nothing is
# caught here, so any error raised by those checks propagates to the caller.
sub check_storage_availability {
    my ($storecfg, $conf, $node) = @_;

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($sid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        # check if storage is available on both nodes; the results are not
        # needed, only a possible error matters
        PVE::Storage::storage_check_node($storecfg, $sid);
        PVE::Storage::storage_check_node($storecfg, $sid, $node);
    });
}
2197
719893a9
DM
# List nodes where all VM images are available (used by has_feature API).
#
# Starts with all cluster nodes and narrows the set down per drive: a
# disabled storage empties it, a storage restricted to certain nodes keeps
# only those, and a storage which is not shared keeps only the local node.
# Returns a hash { <node> => 1 }.
sub shared_nodes {
    my ($conf, $storecfg) = @_;

    my $nodelist = PVE::Cluster::get_nodelist();
    my $nodehash = { map { $_ => 1 } @$nodelist };
    my $nodename = PVE::INotify::nodename();

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($storeid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        my $scfg = PVE::Storage::storage_config($storecfg, $storeid);

        if ($scfg->{disable}) {
            $nodehash = {};
        } elsif (my $avail = $scfg->{nodes}) {
            my @gone = grep { !$avail->{$_} } keys %$nodehash;
            delete @{$nodehash}{@gone};
        } elsif (!$scfg->{shared}) {
            my @remote = grep { $_ ne $nodename } keys %$nodehash;
            delete @{$nodehash}{@remote};
        }
    });

    return $nodehash
}
2231
1e3baf05
DM
# Die if the configuration carries a (true) 'lock' setting.
sub check_lock {
    my ($conf) = @_;

    my $lock = $conf->{lock};

    die "VM is locked ($lock)\n" if $lock;
}
2237
# Verify that process $pid was started with '-pidfile $pidfile'.
#
# Reads /proc/$pid/cmdline. Returns 1 only if the command name ends in 'kvm'
# or 'qemu-system-x86_64' and the argument following the first
# '-pidfile'/'--pidfile' option equals $pidfile. Returns a false value in
# all other cases, including an unreadable cmdline file.
sub check_cmdline {
    my ($pidfile, $pid) = @_;

    my $fh = IO::File->new("/proc/$pid/cmdline", "r");
    return undef if !defined($fh);

    my $line = <$fh>;
    $fh->close;
    return undef if !$line;

    # arguments are separated by NUL bytes
    my @argv = split(/\0/, $line);

    my $cmd = $argv[0];
    return if !$cmd;
    return unless $cmd =~ m|kvm$| || $cmd =~ m|qemu-system-x86_64$|;

    foreach my $idx (0 .. $#argv) {
        my $arg = $argv[$idx];
        next if !$arg;
        next unless ($arg eq '-pidfile') || ($arg eq '--pidfile');

        # only the first pidfile option is considered
        my $value = $argv[$idx + 1];
        return ($value && ($value eq $pidfile)) ? 1 : undef;
    }

    return undef;
}
2263
# Test if VM $vmid is running.
#
# Arguments:
#   $vmid    - ID of the VM
#   $nocheck - if set, do not require the configuration file to exist
#   $node    - passed on to config_file() to locate the configuration
#
# Returns the process ID when the pid file of the VM names a process that
# passes check_cmdline() and PVE::ProcFSTools::check_process_running();
# returns undef otherwise. Dies if the configuration file is missing and
# $nocheck is not set.
sub check_running {
    my ($vmid, $nocheck, $node) = @_;

    my $filename = config_file($vmid, $node);

    die "unable to find configuration file for VM $vmid - no such machine\n"
        if !$nocheck && ! -f $filename;

    my $pidfile = pidfile_name($vmid);

    # explicit read mode, same calling style as in check_cmdline()
    my $fd = IO::File->new($pidfile, "r");
    return undef if !$fd;

    my $st = stat($fd);
    my $line = <$fd>;
    close($fd);

    # The time stamp belongs to the pid file, so name that file in the
    # warning (it used to name the configuration file).
    if ($st && $st->mtime > time()) {
        warn "file '$pidfile' modified in future\n";
    }

    # an empty pid file yields no line at all
    return undef if !defined($line) || $line !~ m/^(\d+)$/;
    my $pid = $1;

    # guard against stale pid files: the process must really be our kvm
    return undef if !check_cmdline($pidfile, $pid);
    return undef if !PVE::ProcFSTools::check_process_running($pid);

    return $pid;
}
2296
# Return the result of config_list() with a 'pid' entry added for every VM
# that has a '<vmid>.pid' file in $var_run_tmpdir and is reported as running
# by check_running(). If the directory cannot be opened the list is returned
# without any pid information.
sub vzlist {

    my $vzlist = config_list();

    my $dir = IO::Dir->new($var_run_tmpdir);
    return $vzlist if !$dir;

    while (defined(my $entry = $dir->read)) {
        next unless $entry =~ m/^(\d+)\.pid$/;
        my $vmid = $1;

        # ignore pid files of VMs we do not know
        next unless defined($vzlist->{$vmid});

        my $pid = check_running($vmid);
        $vzlist->{$vmid}->{pid} = $pid if $pid;
    }

    return $vzlist;
}
2314
1e3baf05
DM
# Return the 'size' property of the boot disk of $conf.
#
# Returns undef if no valid boot disk is configured, if its setting cannot
# be parsed, if it is a cdrom or if it has no file. $storecfg is accepted
# but not used.
sub disksize {
    my ($storecfg, $conf) = @_;

    my $bootdisk = $conf->{bootdisk};
    return undef if !$bootdisk
        || !valid_drivename($bootdisk)
        || !$conf->{$bootdisk};

    my $drive = parse_drive($bootdisk, $conf->{$bootdisk});
    return undef if !defined($drive)
        || drive_is_cdrom($drive)
        || !$drive->{file};

    return $drive->{size};
}
2334
# previous CPU usage sample per process ID, used by vmstatus() to compute
# the CPU load between two calls
my $last_proc_pid_stat;

# get VM status information
# This must be fast and should not block ($full == false)
# We only query KVM using QMP if $full == true (this can be slow)
#
# Returns a hash { <vmid> => { pid, status, cpu, mem, ... } }. If $opt_vmid
# is set, only that VM gets an entry.
sub vmstatus {
    my ($opt_vmid, $full) = @_;

    my $res = {};

    my $storecfg = PVE::Storage::config();

    my $list = vzlist();
    my ($uptime) = PVE::ProcFSTools::read_proc_uptime(1);

    my $cpucount = $cpuinfo->{cpus} || 1;

    # step 1: values which can be derived from the configuration
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);

        my $cfspath = cfs_config_path($vmid);
        my $conf = PVE::Cluster::cfs_read_file($cfspath) || {};

        my $pid = $list->{$vmid}->{pid};
        my $size = disksize($storecfg, $conf);

        # never report more CPUs than the host has
        my $cpus = ($conf->{sockets} || 1) * ($conf->{cores} || 1);
        $cpus = $cpucount if $cpus > $cpucount;

        my $d = {
            pid => $pid,
            # fixme: better status?
            status => $pid ? 'running' : 'stopped',
            disk => 0, # no info available
            maxdisk => defined($size) ? $size : 0,
            cpus => $cpus,
            name => $conf->{name} || "VM $vmid",
            maxmem => $conf->{memory} ? $conf->{memory}*(1024*1024) : 0,
        };

        if ($conf->{balloon}) {
            $d->{balloon_min} = $conf->{balloon}*(1024*1024);
            $d->{shares} = defined($conf->{shares}) ? $conf->{shares} : 1000;
        }

        # counters start at zero and are filled in below for running VMs
        foreach my $counter (qw(uptime cpu mem netout netin diskread diskwrite)) {
            $d->{$counter} = 0;
        }

        $d->{template} = is_template($conf);

        $res->{$vmid} = $d;
    }

    # step 2: network traffic, summed over the tap devices of each VM
    my $netdev = PVE::ProcFSTools::read_proc_net_dev();
    foreach my $dev (keys %$netdev) {
        next if $dev !~ m/^tap([1-9]\d*)i/;
        my $vmid = $1;

        my $d = $res->{$vmid};
        next if !$d;

        my $counters = $netdev->{$dev};
        $d->{netout} += $counters->{receive};
        $d->{netin} += $counters->{transmit};
    }

    # step 3: uptime, memory and CPU usage from /proc
    my $ctime = gettimeofday;

    foreach my $vmid (keys %$list) {

        my $d = $res->{$vmid};
        my $pid = $d->{pid};
        next if !$pid;

        my $pstat = PVE::ProcFSTools::read_proc_pid_stat($pid);
        next if !$pstat; # not running

        my $used = $pstat->{utime} + $pstat->{stime};

        $d->{uptime} = int(($uptime - $pstat->{starttime})/$cpuinfo->{user_hz});

        if ($pstat->{vsize}) {
            $d->{mem} = int(($pstat->{rss}/$pstat->{vsize})*$d->{maxmem});
        }

        my $sample = {
            time => $ctime,
            used => $used,
            cpu => 0,
        };

        my $old = $last_proc_pid_stat->{$pid};
        if (!$old) {
            # first sample for this process, no load can be computed yet
            $last_proc_pid_stat->{$pid} = $sample;
            next;
        }

        my $dtime = ($ctime - $old->{time}) * $cpucount * $cpuinfo->{user_hz};

        if ($dtime <= 1000) {
            # interval too short, reuse the previous value
            $d->{cpu} = $old->{cpu};
            next;
        }

        my $dutime = $used - $old->{used};

        $d->{cpu} = (($dutime/$dtime)* $cpucount) / $d->{cpus};
        $sample->{cpu} = $d->{cpu};
        $last_proc_pid_stat->{$pid} = $sample;
    }

    return $res if !$full;

    # step 4 ($full only): ask the running VMs using QMP
    my $qmpclient = PVE::QMPClient->new();

    my $ballooncb = sub {
        my ($vmid, $resp) = @_;

        my $info = $resp->{'return'};
        return if !$info->{max_mem};

        my $d = $res->{$vmid};

        # use memory assigned to VM
        $d->{maxmem} = $info->{max_mem};
        $d->{balloon} = $info->{actual};

        if (defined($info->{total_mem}) && defined($info->{free_mem})) {
            $d->{mem} = $info->{total_mem} - $info->{free_mem};
            $d->{freemem} = $info->{free_mem};
        }
    };

    my $blockstatscb = sub {
        my ($vmid, $resp) = @_;

        my $data = $resp->{'return'} || [];

        my $rd_total = 0;
        my $wr_total = 0;
        foreach my $blockstat (@$data) {
            $rd_total += $blockstat->{stats}->{rd_bytes};
            $wr_total += $blockstat->{stats}->{wr_bytes};
        }

        $res->{$vmid}->{diskread} = $rd_total;
        $res->{$vmid}->{diskwrite} = $wr_total;
    };

    my $statuscb = sub {
        my ($vmid, $resp) = @_;

        $qmpclient->queue_cmd($vmid, $blockstatscb, 'query-blockstats');
        # this fails if the balloon driver is not loaded, so this must be
        # the last command (following commands are aborted if this fails).
        $qmpclient->queue_cmd($vmid, $ballooncb, 'query-balloon');

        my $status = $resp->{'return'}->{status};
        if (!defined($status)) {
            warn "unable to get VM status\n";
            return;
        }

        $res->{$vmid}->{qmpstatus} = $status;
    };

    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        next if !$res->{$vmid}->{pid}; # not running
        $qmpclient->queue_cmd($vmid, $statuscb, 'query-status');
    }

    $qmpclient->queue_execute(undef, 1);

    # fall back to the process based status where QMP gave no answer
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        my $d = $res->{$vmid};
        $d->{qmpstatus} = $d->{status} if !$d->{qmpstatus};
    }

    return $res;
}
2523
# Call $func->($ds, $drive) for every key of $conf which is a valid drive
# name and whose value can be parsed by parse_drive(). $ds is the drive
# name, $drive the parsed drive.
sub foreach_drive {
    my ($conf, $func) = @_;

    foreach my $ds (keys %$conf) {
        next unless valid_drivename($ds);

        my $drive = parse_drive($ds, $conf->{$ds});
        if ($drive) {
            $func->($ds, $drive);
        }
    }
}
2536
d5769dc2
DM
# Call $func->($volid, $is_cdrom) once for every distinct volume referenced
# by $conf: the files of all drives of the current configuration and of all
# snapshots, plus the 'vmstate' volume of each snapshot.
sub foreach_volid {
    my ($conf, $func) = @_;

    # volid => cdrom flag; a later occurrence overwrites an earlier one
    my $seen = {};

    my $remember = sub {
        my ($volid, $is_cdrom) = @_;

        return if !$volid;

        $seen->{$volid} = $is_cdrom || 0;
    };

    my $visit_drive = sub {
        my ($ds, $drive) = @_;
        $remember->($drive->{file}, drive_is_cdrom($drive));
    };

    foreach_drive($conf, $visit_drive);

    foreach my $snapname (keys %{$conf->{snapshots}}) {
        my $snap = $conf->{snapshots}->{$snapname};
        $remember->($snap->{vmstate}, 0);
        foreach_drive($snap, $visit_drive);
    }

    foreach my $volid (keys %$seen) {
        $func->($volid, $seen->{$volid});
    }
}
2568
86b8228b
DM
# Inspect the 'vga' setting: returns 0 unless it is 'qxl', 'qxl2', 'qxl3'
# or 'qxl4'. Otherwise returns the number that follows 'qxl', or 1 for a
# plain 'qxl'.
sub vga_conf_has_spice {
    my ($vga) = @_;

    if ($vga && $vga =~ m/^qxl([234])?$/) {
        return $1 || 1;
    }

    return 0;
}
2576
1e3baf05 2577sub config_to_command {
952958bc 2578 my ($storecfg, $vmid, $conf, $defaults, $forcemachine) = @_;
1e3baf05
DM
2579
2580 my $cmd = [];
8c559505
DM
2581 my $globalFlags = [];
2582 my $machineFlags = [];
2583 my $rtcFlags = [];
519ed28c 2584 my $cpuFlags = [];
5bdcf937 2585 my $devices = [];
b78ebef7 2586 my $pciaddr = '';
5bdcf937 2587 my $bridges = {};
1e3baf05
DM
2588 my $kvmver = kvm_user_version();
2589 my $vernum = 0; # unknown
a3c52213
DM
2590 if ($kvmver =~ m/^(\d+)\.(\d+)$/) {
2591 $vernum = $1*1000000+$2*1000;
2592 } elsif ($kvmver =~ m/^(\d+)\.(\d+)\.(\d+)$/) {
1e3baf05
DM
2593 $vernum = $1*1000000+$2*1000+$3;
2594 }
2595
a3c52213 2596 die "detected old qemu-kvm binary ($kvmver)\n" if $vernum < 15000;
1e3baf05
DM
2597
2598 my $have_ovz = -f '/proc/vz/vestat';
2599
db656e5f
DM
2600 my $q35 = machine_type_is_q35($conf);
2601
1e3baf05
DM
2602 push @$cmd, '/usr/bin/kvm';
2603
2604 push @$cmd, '-id', $vmid;
2605
2606 my $use_virtio = 0;
2607
c971c4f2
AD
2608 my $qmpsocket = qmp_socket($vmid);
2609 push @$cmd, '-chardev', "socket,id=qmp,path=$qmpsocket,server,nowait";
2610 push @$cmd, '-mon', "chardev=qmp,mode=control";
2611
7b7c6d1b 2612 my $socket = vnc_socket($vmid);
1e3baf05
DM
2613 push @$cmd, '-vnc', "unix:$socket,x509,password";
2614
6b64503e 2615 push @$cmd, '-pidfile' , pidfile_name($vmid);
19672434 2616
1e3baf05
DM
2617 push @$cmd, '-daemonize';
2618
2796e7d5
DM
2619 if ($conf->{smbios1}) {
2620 push @$cmd, '-smbios', "type=1,$conf->{smbios1}";
2621 }
2622
7183bd9a
AD
2623 push @$cmd, '-object', "iothread,id=iothread0" if $conf->{iothread};
2624
db656e5f 2625 if ($q35) {
b467f79a 2626 # the q35 chipset support native usb2, so we enable usb controller
db656e5f 2627 # by default for this machine type
f8e83f05 2628 push @$devices, '-readconfig', '/usr/share/qemu-server/pve-q35.cfg';
db656e5f 2629 } else {
f8e83f05
AD
2630 $pciaddr = print_pci_addr("piix3", $bridges);
2631 push @$devices, '-device', "piix3-usb-uhci,id=uhci$pciaddr.0x2";
24f0d39a 2632
f8e83f05 2633 my $use_usb2 = 0;
db656e5f
DM
2634 for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
2635 next if !$conf->{"usb$i"};
2636 $use_usb2 = 1;
2637 }
2638 # include usb device config
2639 push @$devices, '-readconfig', '/usr/share/qemu-server/pve-usb.cfg' if $use_usb2;
fcc573ab 2640 }
19672434 2641
5acbfe9e 2642 my $vga = $conf->{vga};
2fa3151e 2643
590e698c
DM
2644 my $qxlnum = vga_conf_has_spice($vga);
2645 $vga = 'qxl' if $qxlnum;
2fa3151e 2646
5acbfe9e 2647 if (!$vga) {
264e519f
DM
2648 if ($conf->{ostype} && ($conf->{ostype} eq 'win8' ||
2649 $conf->{ostype} eq 'win7' ||
5acbfe9e
DM
2650 $conf->{ostype} eq 'w2k8')) {
2651 $vga = 'std';
2652 } else {
2653 $vga = 'cirrus';
2654 }
2655 }
2656
1e3baf05 2657 # enable absolute mouse coordinates (needed by vnc)
5acbfe9e
DM
2658 my $tablet;
2659 if (defined($conf->{tablet})) {
2660 $tablet = $conf->{tablet};
2661 } else {
2662 $tablet = $defaults->{tablet};
590e698c 2663 $tablet = 0 if $qxlnum; # disable for spice because it is not needed
ef5e2be2 2664 $tablet = 0 if $vga =~ m/^serial\d+$/; # disable if we use serial terminal (no vga card)
5acbfe9e
DM
2665 }
2666
db656e5f 2667 push @$devices, '-device', print_tabletdevice_full($conf) if $tablet;
b467f79a 2668
1e3baf05 2669 # host pci devices
040b06b7 2670 for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
2e3b7e2a
AD
2671 my $d = parse_hostpci($conf->{"hostpci$i"});
2672 next if !$d;
2673
2674 my $pcie = $d->{pcie};
2675 if($pcie){
2676 die "q35 machine model is not enabled" if !$q35;
2677 $pciaddr = print_pcie_addr("hostpci$i");
2678 }else{
2679 $pciaddr = print_pci_addr("hostpci$i", $bridges);
2680 }
2681
2682 my $rombar = $d->{rombar} && $d->{rombar} eq 'off' ? ",rombar=0" : "";
2683 my $driver = $d->{driver} && $d->{driver} eq 'vfio' ? "vfio-pci" : "pci-assign";
2684 my $xvga = $d->{'x-vga'} && $d->{'x-vga'} eq 'on' ? ",x-vga=on" : "";
137483c0
AD
2685 if ($xvga && $xvga ne '') {
2686 push @$cpuFlags, 'kvm=off';
2687 $vga = 'none';
2688 }
2e3b7e2a 2689 $driver = "vfio-pci" if $xvga ne '';
4543ecf0
AD
2690 my $pcidevices = $d->{pciid};
2691 my $multifunction = 1 if @$pcidevices > 1;
2e3b7e2a 2692
4543ecf0
AD
2693 my $j=0;
2694 foreach my $pcidevice (@$pcidevices) {
2e3b7e2a 2695
4543ecf0
AD
2696 my $id = "hostpci$i";
2697 $id .= ".$j" if $multifunction;
2698 my $addr = $pciaddr;
2699 $addr .= ".$j" if $multifunction;
2700 my $devicestr = "$driver,host=$pcidevice->{id}.$pcidevice->{function},id=$id$addr";
2701
2702 if($j == 0){
2703 $devicestr .= "$rombar$xvga";
2704 $devicestr .= ",multifunction=on" if $multifunction;
2705 }
2706
2707 push @$devices, '-device', $devicestr;
2708 $j++;
2709 }
1e3baf05
DM
2710 }
2711
2712 # usb devices
2713 for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
2714 my $d = parse_usb_device($conf->{"usb$i"});
2715 next if !$d;
2716 if ($d->{vendorid} && $d->{productid}) {
5bdcf937 2717 push @$devices, '-device', "usb-host,vendorid=0x$d->{vendorid},productid=0x$d->{productid}";
1e3baf05 2718 } elsif (defined($d->{hostbus}) && defined($d->{hostport})) {
5bdcf937 2719 push @$devices, '-device', "usb-host,hostbus=$d->{hostbus},hostport=$d->{hostport}";
80401dd8
DM
2720 } elsif ($d->{spice}) {
2721 # usb redir support for spice
2722 push @$devices, '-chardev', "spicevmc,id=usbredirchardev$i,name=usbredir";
2723 push @$devices, '-device', "usb-redir,chardev=usbredirchardev$i,id=usbredirdev$i,bus=ehci.0";
1e3baf05
DM
2724 }
2725 }
2726
1e3baf05 2727 # serial devices
bae179aa 2728 for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
34978be3 2729 if (my $path = $conf->{"serial$i"}) {
9f9d2fb2
DM
2730 if ($path eq 'socket') {
2731 my $socket = "/var/run/qemu-server/${vmid}.serial$i";
2732 push @$devices, '-chardev', "socket,id=serial$i,path=$socket,server,nowait";
2733 push @$devices, '-device', "isa-serial,chardev=serial$i";
2734 } else {
2735 die "no such serial device\n" if ! -c $path;
2736 push @$devices, '-chardev', "tty,id=serial$i,path=$path";
2737 push @$devices, '-device', "isa-serial,chardev=serial$i";
2738 }
34978be3 2739 }
1e3baf05
DM
2740 }
2741
2742 # parallel devices
1989a89c 2743 for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
34978be3 2744 if (my $path = $conf->{"parallel$i"}) {
19672434 2745 die "no such parallel device\n" if ! -c $path;
32e69805 2746 my $devtype = $path =~ m!^/dev/usb/lp! ? 'tty' : 'parport';
4c5dbaf6 2747 push @$devices, '-chardev', "$devtype,id=parallel$i,path=$path";
5bdcf937 2748 push @$devices, '-device', "isa-parallel,chardev=parallel$i";
34978be3 2749 }
1e3baf05
DM
2750 }
2751
2752 my $vmname = $conf->{name} || "vm$vmid";
2753
2754 push @$cmd, '-name', $vmname;
19672434 2755
1e3baf05
DM
2756 my $sockets = 1;
2757 $sockets = $conf->{smp} if $conf->{smp}; # old style - no longer iused
2758 $sockets = $conf->{sockets} if $conf->{sockets};
2759
2760 my $cores = $conf->{cores} || 1;
3bd18e48
AD
2761 my $maxcpus = $conf->{maxcpus} if $conf->{maxcpus};
2762
76267728
WL
2763 my $total_cores = $sockets * $cores;
2764 my $allowed_cores = $cpuinfo->{cpus};
2765
f34ebd52 2766 die "MAX $allowed_cores cores allowed per VM on this node\n"
76267728
WL
2767 if ($allowed_cores < $total_cores);
2768
264e519f 2769 if ($maxcpus) {
3bd18e48 2770 push @$cmd, '-smp', "cpus=$cores,maxcpus=$maxcpus";
264e519f 2771 } else {
3bd18e48
AD
2772 push @$cmd, '-smp', "sockets=$sockets,cores=$cores";
2773 }
1e3baf05 2774
1e3baf05
DM
2775 push @$cmd, '-nodefaults';
2776
32baffb4 2777 my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};
3b408e82 2778
0888fdce
DM
2779 my $bootindex_hash = {};
2780 my $i = 1;
2781 foreach my $o (split(//, $bootorder)) {
2782 $bootindex_hash->{$o} = $i*100;
2783 $i++;
afdb31d5 2784 }
3b408e82
DM
2785
2786 push @$cmd, '-boot', "menu=on";
1e3baf05 2787
6b64503e 2788 push @$cmd, '-no-acpi' if defined($conf->{acpi}) && $conf->{acpi} == 0;
1e3baf05 2789
6b64503e 2790 push @$cmd, '-no-reboot' if defined($conf->{reboot}) && $conf->{reboot} == 0;
1e3baf05 2791
ef5e2be2 2792 push @$cmd, '-vga', $vga if $vga && $vga !~ m/^serial\d+$/; # for kvm 77 and later
1e3baf05
DM
2793
2794 # time drift fix
6b64503e 2795 my $tdf = defined($conf->{tdf}) ? $conf->{tdf} : $defaults->{tdf};
1e3baf05 2796
6b64503e 2797 my $nokvm = defined($conf->{kvm}) && $conf->{kvm} == 0 ? 1 : 0;
8c559505 2798 my $useLocaltime = $conf->{localtime};
1e3baf05
DM
2799
2800 if (my $ost = $conf->{ostype}) {
6b9d84cf 2801 # other, wxp, w2k, w2k3, w2k8, wvista, win7, win8, l24, l26, solaris
1e3baf05
DM
2802
2803 if ($ost =~ m/^w/) { # windows
8c559505 2804 $useLocaltime = 1 if !defined($conf->{localtime});
1e3baf05 2805
8c559505 2806 # use time drift fix when acpi is enabled
6b64503e 2807 if (!(defined($conf->{acpi}) && $conf->{acpi} == 0)) {
8c559505 2808 $tdf = 1 if !defined($conf->{tdf});
1e3baf05
DM
2809 }
2810 }
2811
be190583 2812 if ($ost eq 'win7' || $ost eq 'win8' || $ost eq 'w2k8' ||
a70ebde3 2813 $ost eq 'wvista') {
8c559505 2814 push @$globalFlags, 'kvm-pit.lost_tick_policy=discard';
b7e0c8bf 2815 push @$cmd, '-no-hpet';
462e8d19
AD
2816 #push @$cpuFlags , 'hv_vapic" if !$nokvm; #fixme, my win2008R2 hang at boot with this
2817 push @$cpuFlags , 'hv_spinlocks=0xffff' if !$nokvm;
2818 }
2819
2820 if ($ost eq 'win7' || $ost eq 'win8') {
2821 push @$cpuFlags , 'hv_relaxed' if !$nokvm;
b7e0c8bf 2822 }
1e3baf05
DM
2823 }
2824
8c559505
DM
2825 push @$rtcFlags, 'driftfix=slew' if $tdf;
2826
7f0b5beb 2827 if ($nokvm) {
8c559505 2828 push @$machineFlags, 'accel=tcg';
7f0b5beb
DM
2829 } else {
2830 die "No accelerator found!\n" if !$cpuinfo->{hvm};
2831 }
1e3baf05 2832
952958bc
DM
2833 my $machine_type = $forcemachine || $conf->{machine};
2834 if ($machine_type) {
2835 push @$machineFlags, "type=${machine_type}";
3bafc510
DM
2836 }
2837
8c559505
DM
2838 if ($conf->{startdate}) {
2839 push @$rtcFlags, "base=$conf->{startdate}";
2840 } elsif ($useLocaltime) {
2841 push @$rtcFlags, 'base=localtime';
2842 }
1e3baf05 2843
519ed28c
AD
2844 my $cpu = $nokvm ? "qemu64" : "kvm64";
2845 $cpu = $conf->{cpu} if $conf->{cpu};
2846
4dc339e7
AD
2847 push @$cpuFlags , '+lahf_lm' if $cpu eq 'kvm64';
2848
6b9d84cf
AD
2849 push @$cpuFlags , '+x2apic' if !$nokvm && $conf->{ostype} ne 'solaris';
2850
2851 push @$cpuFlags , '-x2apic' if $conf->{ostype} eq 'solaris';
519ed28c 2852
2e1a5389
AD
2853 push @$cpuFlags, '+sep' if $cpu eq 'kvm64' || $cpu eq 'kvm32';
2854
be190583 2855 $cpu .= "," . join(',', @$cpuFlags) if scalar(@$cpuFlags);
519ed28c 2856
c0efd8cd
DM
2857 # Note: enforce needs kernel 3.10, so we do not use it for now
2858 # push @$cmd, '-cpu', "$cpu,enforce";
2859 push @$cmd, '-cpu', $cpu;
519ed28c 2860
67fb9de6 2861 my $memory = $conf->{memory} || $defaults->{memory};
8a010eae
AD
2862 push @$cmd, '-m', $memory;
2863
67fb9de6 2864 if ($conf->{numa}) {
8a010eae 2865
2ed5d572
AD
2866 my $numa_totalmemory = undef;
2867 for (my $i = 0; $i < $MAX_NUMA; $i++) {
2868 next if !$conf->{"numa$i"};
2869 my $numa = parse_numa($conf->{"numa$i"});
2870 next if !$numa;
67fb9de6
DM
2871 # memory
2872 die "missing numa node$i memory value\n" if !$numa->{memory};
2ed5d572
AD
2873 my $numa_memory = $numa->{memory};
2874 $numa_totalmemory += $numa_memory;
2875 my $numa_object = "memory-backend-ram,id=ram-node$i,size=$numa_memory"."M";
2876
67fb9de6 2877 # cpus
2ed5d572 2878 my $cpus_start = $numa->{cpus}->{start};
67fb9de6 2879 die "missing numa node$i cpus\n" if !defined($cpus_start);
2ed5d572
AD
2880 my $cpus_end = $numa->{cpus}->{end} if defined($numa->{cpus}->{end});
2881 my $cpus = $cpus_start;
2882 if (defined($cpus_end)) {
2883 $cpus .= "-$cpus_end";
67fb9de6 2884 die "numa node$i : cpu range $cpus is incorrect\n" if $cpus_end <= $cpus_start;
2ed5d572 2885 }
8a010eae 2886
67fb9de6 2887 # hostnodes
2ed5d572
AD
2888 my $hostnodes_start = $numa->{hostnodes}->{start};
2889 if (defined($hostnodes_start)) {
2890 my $hostnodes_end = $numa->{hostnodes}->{end} if defined($numa->{hostnodes}->{end});
2891 my $hostnodes = $hostnodes_start;
2892 if (defined($hostnodes_end)) {
2893 $hostnodes .= "-$hostnodes_end";
67fb9de6 2894 die "host node $hostnodes range is incorrect\n" if $hostnodes_end <= $hostnodes_start;
2ed5d572 2895 }
8a010eae 2896
2ed5d572
AD
2897 my $hostnodes_end_range = defined($hostnodes_end) ? $hostnodes_end : $hostnodes_start;
2898 for (my $i = $hostnodes_start; $i <= $hostnodes_end_range; $i++ ) {
67fb9de6 2899 die "host numa node$i don't exist\n" if ! -d "/sys/devices/system/node/node$i/";
2ed5d572 2900 }
8a010eae 2901
67fb9de6 2902 # policy
2ed5d572 2903 my $policy = $numa->{policy};
67fb9de6
DM
2904 die "you need to define a policy for hostnode $hostnodes\n" if !$policy;
2905 $numa_object .= ",host-nodes=$hostnodes,policy=$policy";
2ed5d572
AD
2906 }
2907
2908 push @$cmd, '-object', $numa_object;
8a010eae
AD
2909 push @$cmd, '-numa', "node,nodeid=$i,cpus=$cpus,memdev=ram-node$i";
2910 }
67fb9de6
DM
2911
2912 die "total memory for NUMA nodes must be equal to vm memory\n"
2913 if $numa_totalmemory && $numa_totalmemory != $memory;
2ed5d572
AD
2914
2915 #if no custom tology, we split memory and cores across numa nodes
2916 if(!$numa_totalmemory) {
2917
67fb9de6 2918 my $numa_memory = ($memory / $sockets) . "M";
2ed5d572
AD
2919
2920 for (my $i = 0; $i < $sockets; $i++) {
2921
2922 my $cpustart = ($cores * $i);
2923 my $cpuend = ($cpustart + $cores - 1) if $cores && $cores > 1;
2924 my $cpus = $cpustart;
2925 $cpus .= "-$cpuend" if $cpuend;
2926
2927 push @$cmd, '-object', "memory-backend-ram,size=$numa_memory,id=ram-node$i";
2928 push @$cmd, '-numa', "node,nodeid=$i,cpus=$cpus,memdev=ram-node$i";
2929 }
2930 }
8a010eae
AD
2931 }
2932
1e3baf05
DM
2933 push @$cmd, '-S' if $conf->{freeze};
2934
2935 # set keyboard layout
2936 my $kb = $conf->{keyboard} || $defaults->{keyboard};
2937 push @$cmd, '-k', $kb if $kb;
2938
2939 # enable sound
2940 #my $soundhw = $conf->{soundhw} || $defaults->{soundhw};
2941 #push @$cmd, '-soundhw', 'es1370';
2942 #push @$cmd, '-soundhw', $soundhw if $soundhw;
ab6a046f 2943
bc84dcca 2944 if($conf->{agent}) {
7a6c2150 2945 my $qgasocket = qmp_socket($vmid, 1);
ab6a046f
AD
2946 my $pciaddr = print_pci_addr("qga0", $bridges);
2947 push @$devices, '-chardev', "socket,path=$qgasocket,server,nowait,id=qga0";
2948 push @$devices, '-device', "virtio-serial,id=qga0$pciaddr";
2949 push @$devices, '-device', 'virtserialport,chardev=qga0,name=org.qemu.guest_agent.0';
2950 }
2951
1d794448 2952 my $spice_port;
2fa3151e 2953
590e698c
DM
2954 if ($qxlnum) {
2955 if ($qxlnum > 1) {
2956 if ($conf->{ostype} && $conf->{ostype} =~ m/^w/){
2957 for(my $i = 1; $i < $qxlnum; $i++){
2958 my $pciaddr = print_pci_addr("vga$i", $bridges);
2959 push @$cmd, '-device', "qxl,id=vga$i,ram_size=67108864,vram_size=33554432$pciaddr";
2960 }
2961 } else {
2962 # assume other OS works like Linux
2963 push @$cmd, '-global', 'qxl-vga.ram_size=134217728';
2964 push @$cmd, '-global', 'qxl-vga.vram_size=67108864';
2fa3151e
AD
2965 }
2966 }
2967
1011b570 2968 my $pciaddr = print_pci_addr("spice", $bridges);
95a4b4a9 2969
cd339d1f 2970 $spice_port = PVE::Tools::next_spice_port();
943340a6 2971
d2da6d9b 2972 push @$devices, '-spice', "tls-port=${spice_port},addr=127.0.0.1,tls-ciphers=DES-CBC3-SHA,seamless-migration=on";
1011b570 2973
d2da6d9b
AD
2974 push @$devices, '-device', "virtio-serial,id=spice$pciaddr";
2975 push @$devices, '-chardev', "spicevmc,id=vdagent,name=vdagent";
2976 push @$devices, '-device', "virtserialport,chardev=vdagent,name=com.redhat.spice.0";
1011b570
DM
2977 }
2978
8d9ae0d2
DM
2979 # enable balloon by default, unless explicitly disabled
2980 if (!defined($conf->{balloon}) || $conf->{balloon}) {
2981 $pciaddr = print_pci_addr("balloon0", $bridges);
2982 push @$devices, '-device', "virtio-balloon-pci,id=balloon0$pciaddr";
2983 }
1e3baf05 2984
0ea9541d
DM
2985 if ($conf->{watchdog}) {
2986 my $wdopts = parse_watchdog($conf->{watchdog});
5bdcf937 2987 $pciaddr = print_pci_addr("watchdog", $bridges);
0a40e8ea 2988 my $watchdog = $wdopts->{model} || 'i6300esb';
5bdcf937
AD
2989 push @$devices, '-device', "$watchdog$pciaddr";
2990 push @$devices, '-watchdog-action', $wdopts->{action} if $wdopts->{action};
0ea9541d
DM
2991 }
2992
1e3baf05 2993 my $vollist = [];
941e0c42 2994 my $scsicontroller = {};
26ee04b6 2995 my $ahcicontroller = {};
cdd20088 2996 my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : $defaults->{scsihw};
1e3baf05 2997
5881b913
DM
2998 # Add iscsi initiator name if available
2999 if (my $initiator = get_initiator_name()) {
3000 push @$devices, '-iscsi', "initiator-name=$initiator";
3001 }
3002
1e3baf05
DM
3003 foreach_drive($conf, sub {
3004 my ($ds, $drive) = @_;
3005
ff1a2432 3006 if (PVE::Storage::parse_volume_id($drive->{file}, 1)) {
1e3baf05 3007 push @$vollist, $drive->{file};
ff1a2432 3008 }
afdb31d5 3009
1e3baf05 3010 $use_virtio = 1 if $ds =~ m/^virtio/;
3b408e82
DM
3011
3012 if (drive_is_cdrom ($drive)) {
3013 if ($bootindex_hash->{d}) {
3014 $drive->{bootindex} = $bootindex_hash->{d};
3015 $bootindex_hash->{d} += 1;
3016 }
3017 } else {
3018 if ($bootindex_hash->{c}) {
3019 $drive->{bootindex} = $bootindex_hash->{c} if $conf->{bootdisk} && ($conf->{bootdisk} eq $ds);
3020 $bootindex_hash->{c} += 1;
3021 }
3022 }
3023
941e0c42 3024 if ($drive->{interface} eq 'scsi') {
cdd20088 3025
5b952ff5 3026 my $maxdev = ($scsihw !~ m/^lsi/) ? 256 : 7;
cdd20088 3027 my $controller = int($drive->{index} / $maxdev);
5bdcf937
AD
3028 $pciaddr = print_pci_addr("scsihw$controller", $bridges);
3029 push @$devices, '-device', "$scsihw,id=scsihw$controller$pciaddr" if !$scsicontroller->{$controller};
cdd20088 3030 $scsicontroller->{$controller}=1;
941e0c42 3031 }
3b408e82 3032
26ee04b6
DA
3033 if ($drive->{interface} eq 'sata') {
3034 my $controller = int($drive->{index} / $MAX_SATA_DISKS);
5bdcf937
AD
3035 $pciaddr = print_pci_addr("ahci$controller", $bridges);
3036 push @$devices, '-device', "ahci,id=ahci$controller,multifunction=on$pciaddr" if !$ahcicontroller->{$controller};
26ee04b6
DA
3037 $ahcicontroller->{$controller}=1;
3038 }
46f58b5f 3039
15b21acc
MR
3040 my $drive_cmd = print_drive_full($storecfg, $vmid, $drive);
3041 push @$devices, '-drive',$drive_cmd;
46f58b5f 3042 push @$devices, '-device', print_drivedevice_full($storecfg, $conf, $vmid, $drive, $bridges);
1e3baf05
DM
3043 });
3044
cc4d6182 3045 for (my $i = 0; $i < $MAX_NETS; $i++) {
5f0c4c32 3046 next if !$conf->{"net$i"};
cc4d6182
DA
3047 my $d = parse_net($conf->{"net$i"});
3048 next if !$d;
1e3baf05 3049
cc4d6182 3050 $use_virtio = 1 if $d->{model} eq 'virtio';
1e3baf05 3051
cc4d6182
DA
3052 if ($bootindex_hash->{n}) {
3053 $d->{bootindex} = $bootindex_hash->{n};
3054 $bootindex_hash->{n} += 1;
3055 }
1e3baf05 3056
cc4d6182 3057 my $netdevfull = print_netdev_full($vmid,$conf,$d,"net$i");
5bdcf937
AD
3058 push @$devices, '-netdev', $netdevfull;
3059
3060 my $netdevicefull = print_netdevice_full($vmid,$conf,$d,"net$i",$bridges);
3061 push @$devices, '-device', $netdevicefull;
3062 }
1e3baf05 3063
db656e5f
DM
3064 if (!$q35) {
3065 # add pci bridges
f8e83f05
AD
3066 while (my ($k, $v) = each %$bridges) {
3067 $pciaddr = print_pci_addr("pci.$k");
3068 unshift @$devices, '-device', "pci-bridge,id=pci.$k,chassis_nr=$k$pciaddr" if $k > 0;
3069 }
19672434
DM
3070 }
3071
1e3baf05
DM
3072 # hack: virtio with fairsched is unreliable, so we do not use fairsched
3073 # when the VM uses virtio devices.
19672434
DM
3074 if (!$use_virtio && $have_ovz) {
3075
6b64503e 3076 my $cpuunits = defined($conf->{cpuunits}) ?
1e3baf05
DM
3077 $conf->{cpuunits} : $defaults->{cpuunits};
3078
3079 push @$cmd, '-cpuunits', $cpuunits if $cpuunits;
3080
3081 # fixme: cpulimit is currently ignored
3082 #push @$cmd, '-cpulimit', $conf->{cpulimit} if $conf->{cpulimit};
3083 }
3084
3085 # add custom args
3086 if ($conf->{args}) {
3ada46c9 3087 my $aa = PVE::Tools::split_args($conf->{args});
1e3baf05
DM
3088 push @$cmd, @$aa;
3089 }
3090
5bdcf937 3091 push @$cmd, @$devices;
be190583 3092 push @$cmd, '-rtc', join(',', @$rtcFlags)
8c559505 3093 if scalar(@$rtcFlags);
be190583 3094 push @$cmd, '-machine', join(',', @$machineFlags)
8c559505
DM
3095 if scalar(@$machineFlags);
3096 push @$cmd, '-global', join(',', @$globalFlags)
3097 if scalar(@$globalFlags);
3098
1d794448 3099 return wantarray ? ($cmd, $vollist, $spice_port) : $cmd;
1e3baf05 3100}
19672434 3101
1e3baf05
DM
# Return the path of the VNC unix socket of VM $vmid
# (a '<vmid>.vnc' entry below $var_run_tmpdir).
sub vnc_socket {
    my $vmid = shift;

    return join('/', $var_run_tmpdir, "$vmid.vnc");
}
3106
# Ask the running VM $vmid (QMP 'query-spice') for its SPICE port.
# The TLS port is preferred over the plain port; dies with
# "no spice port\n" when neither is reported.
sub spice_port {
    my $vmid = shift;

    my $spice_info = vm_mon_cmd($vmid, 'query-spice');

    my $port = $spice_info->{'tls-port'} || $spice_info->{'port'};
    die "no spice port\n" if !$port;

    return $port;
}
3114
# Return the path of the monitor socket of VM $vmid below $var_run_tmpdir.
# With a true $qga the guest agent socket ('<vmid>.qga') is returned,
# otherwise the QMP socket ('<vmid>.qmp').
sub qmp_socket {
    my ($vmid, $qga) = @_;

    my $suffix = 'qmp';
    $suffix = 'qga' if $qga;

    return "${var_run_tmpdir}/${vmid}.${suffix}";
}
3120
1e3baf05
DM
# Return the path of the pid file of VM $vmid
# (a '<vmid>.pid' entry below $var_run_tmpdir).
sub pidfile_name {
    my $vmid = shift;

    return $var_run_tmpdir . "/$vmid.pid";
}
3125
86fdcfb2
DA
# Return a hash ref whose keys are the ids of the devices currently present
# in the running VM $vmid (every value is 1):
#  - the 'qdev_id' of each PCI device reported by 'query-pci', including
#    devices nested below a PCI bridge,
#  - the name (without the 'drive-' prefix) of each block device reported
#    by 'query-block',
#  - 'tablet' if 'query-mice' lists the 'QEMU HID Tablet'.
sub vm_devices_list {
    my ($vmid) = @_;

    my $devices = {};

    my $res = vm_mon_cmd($vmid, 'query-pci');

    # query-pci reports the devices on a bridge's secondary bus nested in
    # the bridge entry ('pci_bridge' => { devices => [...] }). Use a work
    # list so that devices plugged behind a bridge are found as well.
    my @todo;
    foreach my $pcibus (@$res) {
        push @todo, @{$pcibus->{devices} || []};
    }
    while (defined(my $device = shift @todo)) {
        $devices->{$device->{'qdev_id'}} = 1 if $device->{'qdev_id'};

        my $bridge = $device->{'pci_bridge'};
        push @todo, @{$bridge->{devices}} if $bridge && $bridge->{devices};
    }

    my $resblock = vm_mon_cmd($vmid, 'query-block');
    foreach my $block (@$resblock) {
        next if !defined($block->{device});
        if ($block->{device} =~ m/^drive-(\S+)/) {
            $devices->{$1} = 1;
        }
    }

    my $resmice = vm_mon_cmd($vmid, 'query-mice');
    foreach my $mice (@$resmice) {
        if (defined($mice->{name}) && $mice->{name} eq 'QEMU HID Tablet') {
            $devices->{tablet} = 1;
            last;
        }
    }

    return $devices;
}
3155
# Hot-plug device $deviceid into the running VM $vmid.
#
# $deviceid selects what is plugged: 'tablet', 'virtioN', 'scsihwN',
# 'scsiN', 'netN' or (on non-q35 machines) 'pci.N'. $device is the parsed
# drive/net description and is only needed for disks and network devices.
#
# Returns 1 on success or when the device is already present, undef when
# the netdev backend could not be added. Dies on errors, on unknown device
# ids, and with "internal error" when hotplug is not enabled in $conf.
sub vm_deviceplug {
    my ($storecfg, $conf, $vmid, $deviceid, $device) = @_;

    die "internal error" if !$conf->{hotplug};

    my $q35 = machine_type_is_q35($conf);

    my $devices_list = vm_devices_list($vmid);
    return 1 if defined($devices_list->{$deviceid});

    qemu_add_pci_bridge($storecfg, $conf, $vmid, $deviceid); # add PCI bridge if we need it for the device

    if ($deviceid eq 'tablet') {

        qemu_deviceadd($vmid, print_tabletdevice_full($conf));

    } elsif ($deviceid =~ m/^(virtio)(\d+)$/) {

        qemu_driveadd($storecfg, $vmid, $device);

        # device_add itself can fail too, so keep it inside the eval;
        # otherwise the drive backend added above would be left behind.
        eval {
            my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);
            qemu_deviceadd($vmid, $devicefull);
            qemu_deviceaddverify($vmid, $deviceid);
        };
        if (my $err = $@) {
            eval { qemu_drivedel($vmid, $deviceid); };
            warn $@ if $@;
            die $err;
        }

    } elsif ($deviceid =~ m/^(scsihw)(\d+)$/) {

        my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : "lsi";
        my $pciaddr = print_pci_addr($deviceid);
        my $devicefull = "$scsihw,id=$deviceid$pciaddr";

        qemu_deviceadd($vmid, $devicefull);
        qemu_deviceaddverify($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        qemu_findorcreatescsihw($storecfg, $conf, $vmid, $device);
        qemu_driveadd($storecfg, $vmid, $device);

        eval {
            my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);
            qemu_deviceadd($vmid, $devicefull);
        };
        if (my $err = $@) {
            eval { qemu_drivedel($vmid, $deviceid); };
            warn $@ if $@;
            die $err;
        }

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        return undef if !qemu_netdevadd($vmid, $conf, $device, $deviceid);

        # same as for virtio disks: remove the netdev backend again if
        # either device_add or the verification fails.
        eval {
            my $netdevicefull = print_netdevice_full($vmid, $conf, $device, $deviceid);
            qemu_deviceadd($vmid, $netdevicefull);
            qemu_deviceaddverify($vmid, $deviceid);
        };
        if (my $err = $@) {
            eval { qemu_netdevdel($vmid, $deviceid); };
            warn $@ if $@;
            die $err;
        }

    } elsif (!$q35 && $deviceid =~ m/^(pci\.)(\d+)$/) {

        my $bridgeid = $2;
        my $pciaddr = print_pci_addr($deviceid);
        my $devicefull = "pci-bridge,id=pci.$bridgeid,chassis_nr=$bridgeid$pciaddr";

        qemu_deviceadd($vmid, $devicefull);
        qemu_deviceaddverify($vmid, $deviceid);

    } else {
        die "can't hotplug device '$deviceid'\n";
    }

    return 1;
}
3234
# fixme: this should raise exceptions on error!
#
# Hot-unplug device $deviceid from the running VM $vmid.
#
# Supported ids are 'tablet', 'virtioN', SCSI controllers ('scsihwN', and
# the legacy 'lsiN' spelling), 'scsiN' and 'netN'. Returns 1 on success or
# when the device is not present. Dies for the boot disk, for unknown
# device ids, and with "internal error" when hotplug is not enabled.
sub vm_deviceunplug {
    my ($vmid, $conf, $deviceid) = @_;

    die "internal error" if !$conf->{hotplug};

    my $devices_list = vm_devices_list($vmid);
    return 1 if !defined($devices_list->{$deviceid});

    die "can't unplug bootdisk" if $conf->{bootdisk} && $conf->{bootdisk} eq $deviceid;

    if ($deviceid eq 'tablet') {

        qemu_devicedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(virtio)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);
        qemu_drivedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(lsi|scsihw)(\d+)$/) {

        # vm_deviceplug names SCSI controllers 'scsihwN'; 'lsiN' is kept
        # so that callers using the old id keep working.
        qemu_devicedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);
        qemu_drivedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);
        qemu_netdevdel($vmid, $deviceid);

    } else {
        die "can't unplug device '$deviceid'\n";
    }

    return 1;
}
3277
# Send a QMP 'device_add' for VM $vmid.
# $devicefull is a '<driver>,key=value,...' string; it is turned into the
# QMP argument list by prefixing 'driver=' and splitting on '=' and ','.
sub qemu_deviceadd {
    my ($vmid, $devicefull) = @_;

    my %qmp_args = split(/[=,]/, "driver=" . $devicefull);

    return vm_mon_cmd($vmid, "device_add", %qmp_args);
}
afdb31d5 3286
# Send a QMP 'device_del' for device $deviceid of VM $vmid and return
# the (scalar) reply of the monitor command.
sub qemu_devicedel {
    my ($vmid, $deviceid) = @_;

    return scalar(vm_mon_cmd($vmid, "device_del", id => $deviceid));
}
3292
# Add the drive backend described by $device to the running VM $vmid using
# the human monitor command 'drive_add'. Returns 1 on success, dies with
# the monitor reply otherwise.
sub qemu_driveadd {
    my ($storecfg, $vmid, $device) = @_;

    my $drive_spec = print_drive_full($storecfg, $vmid, $device);
    my $reply = vm_human_monitor_command($vmid, "drive_add auto $drive_spec");

    # qemu answers "OK" when the drive was added
    die "adding drive failed: $reply\n" if $reply !~ m/OK/s;

    return 1;
}
afdb31d5 3304
5e5dcb73
DA
# Remove the drive backend 'drive-$deviceid' from the running VM $vmid
# using the human monitor command 'drive_del'. Returns 1 on success,
# dies with the monitor reply otherwise.
sub qemu_drivedel {
    my ($vmid, $deviceid) = @_;

    (my $reply = vm_human_monitor_command($vmid, "drive_del drive-$deviceid")) =~ s/^\s+//;

    # An empty reply means success. A "not found" reply means the drive
    # was auto-deleted already, which is fine as well.
    if ($reply eq "" || $reply =~ m/Device \'.*?\' not found/s) {
        return 1;
    }

    die "deleting drive $deviceid failed : $reply\n";
}
f19d1c47 3318
# Poll the device list of VM $vmid until $deviceid shows up.
# Makes six attempts, sleeping one second after each unsuccessful one.
# Returns 1 once the device is present, dies otherwise.
sub qemu_deviceaddverify {
    my ($vmid, $deviceid) = @_;

    foreach my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        if (defined($present->{$deviceid})) {
            return 1;
        }
        sleep 1;
    }

    die "error on hotplug device '$deviceid'\n";
}
afdb31d5 3330
5e5dcb73
DA
3331
# Poll the device list of VM $vmid until $deviceid is gone.
# device_del is asynchronous and its empty reply is not reliable, so the
# removal has to be verified. Makes six attempts, sleeping one second
# after each unsuccessful one. Returns 1 once the device has disappeared,
# dies otherwise.
sub qemu_devicedelverify {
    my ($vmid, $deviceid) = @_;

    foreach my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        if (!defined($present->{$deviceid})) {
            return 1;
        }
        sleep 1;
    }

    die "error on hot-unplugging device '$deviceid'\n";
}
3346
# Make sure the SCSI controller needed for drive $device exists in the
# running VM $vmid, hot-plugging it if necessary. The controller number
# is the drive index divided by the number of devices per controller
# (7 for lsi controllers or when no scsihw is configured, 256 otherwise).
# Always returns 1.
sub qemu_findorcreatescsihw {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $hwtype = $conf->{scsihw};

    my $devs_per_controller = 7;
    $devs_per_controller = 256 if $hwtype && $hwtype !~ m/^lsi/;

    my $controller_id = "scsihw" . int($device->{index} / $devs_per_controller);

    my $present = vm_devices_list($vmid);
    vm_deviceplug($storecfg, $conf, $vmid, $controller_id)
        if !defined($present->{$controller_id});

    return 1;
}
3361
# Hot-plug the PCI bridge that device id $device is attached to, if it
# needs one and the bridge is not yet present in VM $vmid.
# print_pci_addr() records the required bridge number(s) as keys of the
# hash passed as its second argument; bridge numbers below 1 need no
# extra bridge device. Always returns 1.
sub qemu_add_pci_bridge {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $bridges = {};
    print_pci_addr($device, $bridges);

    # use the last key in hash iteration order (normally there is only one)
    my $bridgeid = (keys %$bridges)[-1];

    if (!defined($bridgeid) || $bridgeid < 1) {
        return 1;
    }

    my $bridge_dev = "pci.$bridgeid";
    my $present = vm_devices_list($vmid);

    vm_deviceplug($storecfg, $conf, $vmid, $bridge_dev)
        if !defined($present->{$bridge_dev});

    return 1;
}
3385
2630d2a9
DA
# Add the network backend for $deviceid to the running VM $vmid via QMP
# 'netdev_add'. The 'key=value,...' string produced by print_netdev_full()
# is split on '=' and ',' to build the QMP arguments. Returns 1.
sub qemu_netdevadd {
    my ($vmid, $conf, $device, $deviceid) = @_;

    my %qmp_args = split(/[=,]/, print_netdev_full($vmid, $conf, $device, $deviceid));

    vm_mon_cmd($vmid, "netdev_add", %qmp_args);

    return 1;
}
3395
# Remove the network backend $deviceid from the running VM $vmid via QMP
# 'netdev_del' and return the reply of the monitor command.
sub qemu_netdevdel {
    my ($vmid, $deviceid) = @_;

    return vm_mon_cmd($vmid, "netdev_del", id => $deviceid);
}
3401
838776ab
AD
# Raise the number of online cores of the running VM $vmid to $cores by
# issuing one QMP 'cpu-add' per additional core.
#
# Dies when the VM has more than one socket, when 'maxcpus' is not set,
# when $cores exceeds 'maxcpus', when $cores is lower than the configured
# core count, or when the number of CPUs reported by 'query-cpus' differs
# from the configured core count.
sub qemu_cpu_hotplug {
    my ($vmid, $conf, $cores) = @_;

    my $socket_count = $conf->{sockets} || 1;
    if ($socket_count > 1) {
        die "cpu hotplug only works with one socket\n";
    }

    if (!$conf->{maxcpus}) {
        die "maxcpus is not defined\n";
    }

    if ($cores > $conf->{maxcpus}) {
        die "you can't add more cores than maxcpus\n";
    }

    my $configured_cores = $conf->{cores} || 1;
    if ($cores < $configured_cores) {
        die "online cpu unplug is not yet possible\n";
    }

    my $running_cpus = vm_mon_cmd($vmid, "query-cpus");
    if (scalar(@{$running_cpus}) != $configured_cores) {
        die "cores number if running vm is different than configuration\n";
    }

    # cpu ids are zero based, so the first new cpu has id $configured_cores
    my $cpu_id = $configured_cores;
    while ($cpu_id < $cores) {
        vm_mon_cmd($vmid, "cpu-add", id => int($cpu_id));
        $cpu_id++;
    }
}
3427
affd2f88
AD
# Apply I/O throttling limits to block device $deviceid of VM $vmid via
# QMP 'block_set_io_throttle'. Does nothing if the VM is not running.
#
# $bps, $bps_rd, $bps_wr      - bandwidth limits (bytes per second)
# $iops, $iops_rd, $iops_wr   - operation limits (operations per second)
# $bps_max .. $iops_wr_max    - optional burst limits; vmconfig_update_disk
#                               passes them, previously they were silently
#                               dropped here.
#
# Burst limits are only sent when they are non-zero, so calls without
# bursts produce exactly the same QMP command as before.
# NOTE(review): this relies on qemu treating an omitted '*_max' argument
# as "no burst" - confirm against the QMP reference of the qemu in use.
sub qemu_block_set_io_throttle {
    my ($vmid, $deviceid, $bps, $bps_rd, $bps_wr, $iops, $iops_rd, $iops_wr,
        $bps_max, $bps_rd_max, $bps_wr_max, $iops_max, $iops_rd_max, $iops_wr_max) = @_;

    return if !check_running($vmid);

    my @qmp_args = (
        device => $deviceid,
        bps => int($bps),
        bps_rd => int($bps_rd),
        bps_wr => int($bps_wr),
        iops => int($iops),
        iops_rd => int($iops_rd),
        iops_wr => int($iops_wr),
    );

    my @burst = (
        bps_max => $bps_max,
        bps_rd_max => $bps_rd_max,
        bps_wr_max => $bps_wr_max,
        iops_max => $iops_max,
        iops_rd_max => $iops_rd_max,
        iops_wr_max => $iops_wr_max,
    );
    while (my ($key, $limit) = splice(@burst, 0, 2)) {
        push @qmp_args, $key => int($limit) if $limit;
    }

    return vm_mon_cmd($vmid, "block_set_io_throttle", @qmp_args);
}
3436
f5eb281a 3437# old code, only used to shutdown old VM after update
dab36e1e
DM
# Read from the monitor handle $fh until the "(qemu) " prompt terminates
# a chunk, EOF is reached, or no data arrives within $timeout seconds.
# Returns everything read so far with the trailing prompt removed.
# Dies with "monitor read timeout\n" on timeout and with the system error
# text when sysread fails.
sub __read_avail {
    my ($fh, $timeout) = @_;

    my $selector = IO::Select->new($fh);

    my $output = '';
    my @ready;

    while (@ready = $selector->can_read($timeout)) {
        my $chunk;
        my $nread = $fh->sysread($chunk, 8192);

        die "$!\n" if !defined($nread);
        last if !$nread; # EOF

        if ($chunk =~ /^(.*)\(qemu\) $/s) {
            # prompt seen - the reply is complete
            $output .= $1;
            last;
        }

        $output .= $chunk;
    }

    # the loop was left because can_read() returned nothing
    die "monitor read timeout\n" if !@ready;

    return $output;
}
3469
f5eb281a 3470# old code, only used to shutdown old VM after update
dab36e1e
DM
# Send the human monitor command $cmdstr to VM $vmid over the legacy
# '<vmid>.mon' unix socket and return the reply text (without the echoed
# command line). Returns undef for 'q'/'quit', which get no reply.
#
# $nocheck is passed through to check_running(). Any error is logged to
# syslog and re-thrown.
sub vm_monitor_command {
    my ($vmid, $cmdstr, $nocheck) = @_;

    my $res;

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);

        my $sname = "${var_run_tmpdir}/$vmid.mon";

        my $sock = IO::Socket::UNIX->new( Peer => $sname ) ||
            die "unable to connect to VM $vmid socket - $!\n";

        my $timeout = 3;

        # hack: migrate sometime blocks the monitor (when migrate_downtime
        # is set)
        if ($cmdstr =~ m/^(info\s+migrate|migrate\s)/) {
            $timeout = 60*60; # 1 hour
        }

        # read banner;
        my $data = __read_avail($sock, $timeout);

        if ($data !~ m/^QEMU\s+(\S+)\s+monitor\s/) {
            die "got unexpected qemu monitor banner\n";
        }

        my $sel = IO::Select->new($sock);

        if (!scalar(my @ready = $sel->can_write($timeout))) {
            die "monitor write error - timeout";
        }

        my $fullcmd = "$cmdstr\r";

        # syslog('info', "VM $vmid monitor command: $cmdstr");

        my $written;
        if (!($written = $sock->syswrite($fullcmd)) || ($written != length($fullcmd))) {
            die "monitor write error - $!";
        }

        # leaves the eval only; $res stays undef
        return if ($cmdstr eq 'q') || ($cmdstr eq 'quit');

        $timeout = 20;

        if ($cmdstr =~ m/^(info\s+migrate|migrate\s)/) {
            $timeout = 60*60; # 1 hour
        } elsif ($cmdstr =~ m/^(eject|change)/) {
            $timeout = 60; # note: cdrom mount command is slow
        }
        if ($res = __read_avail($sock, $timeout)) {

            my @lines = split("\r?\n", $res);

            # skip echo; guard against a reply consisting of newlines
            # only, which splits into an empty list
            shift @lines if @lines && $lines[0] !~ m/^unknown command/;

            $res = join("\n", @lines);
            $res .= "\n";
        }
    };

    my $err = $@;

    if ($err) {
        syslog("err", "VM $vmid monitor command failed - $err");
        die $err;
    }

    return $res;
}
3544
c1175c92
AD
# Resize volume $volid to $size through the storage layer and, if VM $vmid
# is running, tell qemu about the new size of $deviceid via QMP
# 'block_resize'. Returns early (empty) when the storage layer returns a
# false value or the VM is not running.
sub qemu_block_resize {
    my ($vmid, $deviceid, $storecfg, $volid, $size) = @_;

    my $is_running = check_running($vmid);

    my $done = PVE::Storage::volume_resize($storecfg, $volid, $size, $is_running);
    return if !($done && $is_running);

    return vm_mon_cmd($vmid, "block_resize", device => $deviceid, size => int($size));
}
3557
1ab0057c
AD
# Create snapshot $snap of volume $volid through the storage layer and, if
# VM $vmid is running, issue the 'snapshot-drive' monitor command for
# $deviceid. Returns early (empty) when the storage layer returns a false
# value or the VM is not running.
sub qemu_volume_snapshot {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $is_running = check_running($vmid);

    my $done = PVE::Storage::volume_snapshot($storecfg, $volid, $snap, $is_running);
    return if !($done && $is_running);

    return vm_mon_cmd($vmid, "snapshot-drive", device => $deviceid, name => $snap);
}
3570
fc46aff9
AD
# Delete snapshot $snap of volume $volid through the storage layer and, if
# VM $vmid is running, issue the 'delete-drive-snapshot' monitor command
# for $deviceid. Returns early (empty) when the storage layer returns a
# false value or the VM is not running.
sub qemu_volume_snapshot_delete {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $is_running = check_running($vmid);

    my $done = PVE::Storage::volume_snapshot_delete($storecfg, $volid, $snap, $is_running);
    return if !($done && $is_running);

    return vm_mon_cmd($vmid, "delete-drive-snapshot", device => $deviceid, name => $snap);
}
3582
264e519f
DM
# Configure the migration capabilities of VM $vmid.
# Every capability reported by 'query-migrate-capabilities' is set
# explicitly: those enabled in the table below are switched on, all
# others (including ones not listed) are switched off.
sub set_migration_caps {
    my ($vmid) = @_;

    my %wanted_state = (
        "auto-converge" => 1,
        "xbzrle" => 0,
        "x-rdma-pin-all" => 0,
        "zero-blocks" => 0,
    );

    my $supported = vm_mon_cmd_nocheck($vmid, "query-migrate-capabilities");

    my @settings;
    foreach my $entry (@$supported) {
        my $name = $entry->{capability};
        my $state = $wanted_state{$name} ? JSON::true : JSON::false;
        push @settings, { capability => $name, state => $state };
    }

    return vm_mon_cmd_nocheck($vmid, "migrate-set-capabilities", capabilities => \@settings);
}
a89fded1 3606
3a11fadb
DM
3607# hotplug changes in [PENDING]
3608# $selection hash can be used to only apply specified options, for
3609# example: { cores => 1 } (only apply changed 'cores')
3610# $errors ref is used to return error messages
# Try to apply the pending changes of $conf to the running VM $vmid.
#
# $selection - optional hash ref; when given, only the options that are
#              true in it are considered for hotplug
# $errors    - hash ref receiving "hotplug problem - ..." messages, keyed
#              by option name
#
# Each option that could be applied is moved out of the pending section
# and the configuration is written and re-read immediately. Options that
# cannot be hot-plugged are skipped silently and stay pending.
sub vmconfig_hotplug_pending {
    my ($vmid, $conf, $storecfg, $selection, $errors) = @_;

    my $defaults = load_defaults();

    my $add_error = sub {
        my ($opt, $msg) = @_;
        $errors->{$opt} = "hotplug problem - $msg";
    };

    # write the configuration and continue with the freshly loaded copy
    my $save_and_reload = sub {
        update_config_nolock($vmid, $conf, 1);
        $conf = load_config($vmid); # update/reload
    };

    # Commit values which do not have any impact on the running VM first.
    # Note: those options cannot raise errors, so we do not care about
    # $selection and always apply them.
    my %no_runtime_impact = map { $_ => 1 } qw(name hotplug onboot shares);

    my $changes = 0;
    for my $opt (keys %{$conf->{pending}}) { # add/change
        next if !$no_runtime_impact{$opt};

        $conf->{$opt} = $conf->{pending}->{$opt};
        delete $conf->{pending}->{$opt};
        $changes = 1;
    }

    $save_and_reload->() if $changes;

    my $hotplug = defined($conf->{hotplug}) ? $conf->{hotplug} : $defaults->{hotplug};

    # options scheduled for removal
    for my $opt (PVE::Tools::split_list($conf->{pending}->{delete})) {
        next if $selection && !$selection->{$opt};

        eval {
            if ($opt eq 'tablet' || $opt eq 'cores' || $opt =~ m/^net(\d+)$/) {
                die "skip\n" if !$hotplug;

                if ($opt eq 'tablet') {
                    # removing the option means "back to the default"
                    if ($defaults->{tablet}) {
                        vm_deviceplug($storecfg, $conf, $vmid, $opt);
                    } else {
                        vm_deviceunplug($vmid, $conf, $opt);
                    }
                } elsif ($opt eq 'cores') {
                    qemu_cpu_hotplug($vmid, $conf, 1);
                } else {
                    vm_deviceunplug($vmid, $conf, $opt);
                }
            } else {
                # disks are not hot-removed here, and nothing else is
                # hot-pluggable
                die "skip\n";
            }
        };

        if (my $err = $@) {
            $add_error->($opt, $err) if $err ne "skip\n";
            next;
        }

        # save new config if hotplug was successful
        delete $conf->{$opt};
        vmconfig_undelete_pending_option($conf, $opt);
        $save_and_reload->();
    }

    # options to add or change
    for my $opt (keys %{$conf->{pending}}) {
        next if $selection && !$selection->{$opt};

        my $value = $conf->{pending}->{$opt};

        eval {
            if ($opt eq 'tablet') {
                die "skip\n" if !$hotplug;
                if ($value == 1) {
                    vm_deviceplug($storecfg, $conf, $vmid, $opt);
                } elsif ($value == 0) {
                    vm_deviceunplug($vmid, $conf, $opt);
                }
            } elsif ($opt eq 'cores') {
                die "skip\n" if !$hotplug;
                qemu_cpu_hotplug($vmid, $conf, $value);
            } elsif ($opt eq 'balloon') {
                # allow manual ballooning if shares is set to zero
                die "skip\n" if !defined($conf->{shares}) || $conf->{shares} != 0;
                my $balloon = $conf->{pending}->{balloon} || $conf->{memory} || $defaults->{memory};
                vm_mon_cmd($vmid, "balloon", value => $balloon*1024*1024);
            } elsif ($opt =~ m/^net(\d+)$/) {
                # some changes can be done without hotplug
                vmconfig_update_net($storecfg, $conf, $vmid, $opt, $value);
            } elsif (valid_drivename($opt)) {
                # some changes can be done without hotplug
                vmconfig_update_disk($storecfg, $conf, $vmid, $opt, $value, 1);
            } else {
                die "skip\n"; # skip non-hot-pluggable options
            }
        };

        if (my $err = $@) {
            $add_error->($opt, $err) if $err ne "skip\n";
            next;
        }

        # save new config if hotplug was successful
        $conf->{$opt} = $value;
        delete $conf->{pending}->{$opt};
        $save_and_reload->();
    }
}
055d554d
DM
3715
# Apply all pending changes of VM $vmid to its configuration (cold plug).
# First the options listed in the pending 'delete' list are removed, then
# the pending values are copied into the configuration. Drives that get
# removed or replaced are registered as unused. The configuration is
# re-read before and written after every single option.
sub vmconfig_apply_pending {
    my ($vmid, $conf, $storecfg) = @_;

    # cold plug

    for my $opt (PVE::Tools::split_list($conf->{pending}->{delete})) { # delete
        die "internal error" if $opt =~ m/^unused/;

        $conf = load_config($vmid); # update/reload

        if (defined($conf->{$opt})) {
            if (valid_drivename($opt)) {
                vmconfig_register_unused_drive($storecfg, $vmid, $conf, parse_drive($opt, $conf->{$opt}));
            }
            vmconfig_undelete_pending_option($conf, $opt);
            delete $conf->{$opt};
        } else {
            # nothing to remove, just drop the option from the delete list
            vmconfig_undelete_pending_option($conf, $opt);
        }

        update_config_nolock($vmid, $conf, 1);
    }

    $conf = load_config($vmid); # update/reload

    for my $opt (keys %{$conf->{pending}}) { # add/change
        $conf = load_config($vmid); # update/reload

        my $current = $conf->{$opt};

        # nothing to do if the value did not change
        my $unchanged = defined($current) && ($current eq $conf->{pending}->{$opt});

        if (!$unchanged) {
            if (valid_drivename($opt) && defined($current)) {
                # the old volume of a replaced drive becomes unused
                vmconfig_register_unused_drive($storecfg, $vmid, $conf, parse_drive($opt, $current));
            }
            $conf->{$opt} = $conf->{pending}->{$opt};
        }

        delete $conf->{pending}->{$opt};
        update_config_nolock($vmid, $conf, 1);
    }
}
3759
3eec5767
DM
# Numeric "not equal" that tolerates undef: two undefined values are
# equal (returns 0), a defined and an undefined value differ (returns 1),
# two defined values are compared with '!='.
my $safe_num_ne = sub {
    my ($lhs, $rhs) = @_;

    if (defined($lhs) && defined($rhs)) {
        return $lhs != $rhs;
    }

    return (defined($lhs) || defined($rhs)) ? 1 : 0;
};
3769
# String "not equal" that tolerates undef: two undefined values are equal
# (returns 0), a defined and an undefined value differ (returns 1), two
# defined values are compared with 'ne'.
my $safe_string_ne = sub {
    my ($lhs, $rhs) = @_;

    if (defined($lhs) && defined($rhs)) {
        return $lhs ne $rhs;
    }

    return (defined($lhs) || defined($rhs)) ? 1 : 0;
};
3779
# Apply the new value $value of network option $opt ('netN') to the
# running VM $vmid.
#
# If the device exists and only rate, bridge, tag or firewall changed, the
# tap interface is reconfigured in place and 1 is returned. If model, MAC
# address or queues changed, or either side has no bridge, the old device
# is hot-unplugged and the new one hot-plugged. Dies with "skip\n" when
# that requires hotplug and hotplug is not enabled.
sub vmconfig_update_net {
    my ($storecfg, $conf, $vmid, $opt, $value) = @_;

    my $newnet = parse_net($value);

    if ($conf->{$opt}) {
        my $oldnet = parse_net($conf->{$opt});

        my $needs_replug =
            $safe_string_ne->($oldnet->{model}, $newnet->{model}) ||
            $safe_string_ne->($oldnet->{macaddr}, $newnet->{macaddr}) ||
            $safe_num_ne->($oldnet->{queues}, $newnet->{queues}) ||
            !($newnet->{bridge} && $oldnet->{bridge}); # bridge/nat mode change

        if (!$needs_replug) {
            # online change of the existing tap device

            die "internal error" if $opt !~ m/net(\d+)/;
            my $iface = "tap${vmid}i$1";

            if ($safe_num_ne->($oldnet->{rate}, $newnet->{rate})) {
                PVE::Network::tap_rate_limit($iface, $newnet->{rate});
            }

            my $replug_tap =
                $safe_string_ne->($oldnet->{bridge}, $newnet->{bridge}) ||
                $safe_num_ne->($oldnet->{tag}, $newnet->{tag}) ||
                $safe_num_ne->($oldnet->{firewall}, $newnet->{firewall});

            if ($replug_tap) {
                PVE::Network::tap_unplug($iface);
                PVE::Network::tap_plug($iface, $newnet->{bridge}, $newnet->{tag}, $newnet->{firewall});
            }

            return 1;
        }

        # for non online change, we try to hot-unplug
        die "skip\n" if !$conf->{hotplug};
        vm_deviceunplug($vmid, $conf, $opt);
    }

    die "skip\n" if !$conf->{hotplug};

    return vm_deviceplug($storecfg, $conf, $vmid, $opt, $newnet);
}
3822
a05cff86
DM
# Apply the new value $value of drive option $opt to the running VM $vmid.
#
# For an existing non-cdrom drive whose volume is unchanged, changed
# throttle limits are applied online and 1 is returned; a changed
# 'discard' or 'cache' setting dies with "skip\n". If the volume changed,
# the old disk is hot-unplugged and registered as unused before the new
# one is plugged. For cdrom drives the medium is ejected and, unless the
# new file is 'none', changed. Dies with "skip\n" when hotplug is needed
# but not enabled, and when the media type would change.
sub vmconfig_update_disk {
    my ($storecfg, $conf, $vmid, $opt, $value, $force) = @_;

    # fixme: do we need force?

    my $drive = parse_drive($opt, $value);

    my $old_drive;
    $old_drive = parse_drive($opt, $conf->{$opt}) if $conf->{$opt};

    if ($old_drive) {

        my $media = $drive->{media} || 'disk';
        my $oldmedia = $old_drive->{media} || 'disk';
        die "unable to change media type\n" if $media ne $oldmedia;

        if (!drive_is_cdrom($old_drive)) {

            if ($drive->{file} eq $old_drive->{file}) {
                # update existing disk

                # skip non hotpluggable value
                die "skip\n"
                    if $safe_num_ne->($drive->{discard}, $old_drive->{discard}) ||
                       $safe_string_ne->($drive->{cache}, $old_drive->{cache});

                # throttle settings, in the argument order expected by
                # qemu_block_set_io_throttle
                my @base_keys = qw(mbps mbps_rd mbps_wr iops iops_rd iops_wr);
                my @throttle_keys = (@base_keys, map { "${_}_max" } @base_keys);

                # apply throttle
                if (grep { $safe_num_ne->($drive->{$_}, $old_drive->{$_}) } @throttle_keys) {

                    my @limits = map {
                        my $limit = $drive->{$_} || 0;
                        # mbps values are given in megabytes
                        m/^mbps/ ? $limit*1024*1024 : $limit;
                    } @throttle_keys;

                    qemu_block_set_io_throttle($vmid, "drive-$opt", @limits);
                }

                return 1;
            }

            die "skip\n" if !$conf->{hotplug};

            # unplug and register as unused
            vm_deviceunplug($vmid, $conf, $opt);
            vmconfig_register_unused_drive($storecfg, $vmid, $conf, $old_drive);
        }
    }

    if (drive_is_cdrom($drive)) { # cdrom

        if ($drive->{file} eq 'none') {
            vm_mon_cmd($vmid, "eject", force => JSON::true, device => "drive-$opt");
        } else {
            my $path = get_iso_path($storecfg, $vmid, $drive->{file});
            vm_mon_cmd($vmid, "eject", force => JSON::true, device => "drive-$opt"); # force eject if locked
            vm_mon_cmd($vmid, "change", device => "drive-$opt", target => "$path") if $path;
        }

    } else {
        die "skip\n" if !$conf->{hotplug};
        # hotplug new disks
        vm_deviceplug($storecfg, $conf, $vmid, $opt, $drive);
    }
}
3909
# Start VM $vmid while holding the config lock.
#
# $statefile    - 'tcp' makes qemu listen for an incoming migration (and
#                 start stopped); any other true value is passed to
#                 '-loadstate' and the VM is continued after start
# $skiplock     - do not call check_lock()
# $migratedfrom - passed to load_config()/check_running(); also exported as
#                 PVE_MIGRATED_FROM for the network script
# $paused       - start the VM stopped ('-S') when no $statefile is given
# $forcemachine - passed through to config_to_command()
# $spice_ticket - password set on the spice server for a migrated VM
sub vm_start {
    my ($storecfg, $vmid, $statefile, $skiplock, $migratedfrom, $paused, $forcemachine, $spice_ticket) = @_;

    my $start_locked = sub {
        my $conf = load_config($vmid, $migratedfrom);

        die "you can't start a vm if it's a template\n" if is_template($conf);

        check_lock($conf) unless $skiplock;

        die "VM $vmid already running\n" if check_running($vmid, undef, $migratedfrom);

        # pending changes are applied only when not starting from a state file
        if (!$statefile && scalar(keys %{$conf->{pending}})) {
            vmconfig_apply_pending($vmid, $conf, $storecfg);
            $conf = load_config($vmid); # update/reload
        }

        my $defaults = load_defaults();

        # set environment variable useful inside network script
        $ENV{PVE_MIGRATED_FROM} = $migratedfrom if $migratedfrom;

        my ($cmd, $vollist, $spice_port) = config_to_command($storecfg, $vmid, $conf, $defaults, $forcemachine);

        my $migrate_uri;
        if (!$statefile) {
            push @$cmd, '-S' if $paused;
        } elsif ($statefile eq 'tcp') {
            my $localip = "localhost";
            my $datacenterconf = PVE::Cluster::cfs_read_file('datacenter.cfg');
            if ($datacenterconf->{migration_unsecure}) {
                my $nodename = PVE::INotify::nodename();
                $localip = PVE::Cluster::remote_node_ip($nodename, 1);
            }
            my $migrate_port = PVE::Tools::next_migrate_port();
            $migrate_uri = "tcp:${localip}:${migrate_port}";
            push @$cmd, '-incoming', $migrate_uri, '-S';
        } else {
            push @$cmd, '-loadstate', $statefile;
        }

        # host pci devices
        foreach my $i (0 .. $MAX_HOSTPCI_DEVICES - 1) {
            my $hostpci = parse_hostpci($conf->{"hostpci$i"});
            next if !$hostpci;

            my $use_vfio = $hostpci->{driver} && $hostpci->{driver} eq "vfio";

            foreach my $pcidevice (@{$hostpci->{pciid}}) {
                my $pciid = $pcidevice->{id}.".".$pcidevice->{function};

                my $info = pci_device_info("0000:$pciid");
                die "IOMMU not present\n" if !check_iommu_support();
                die "no pci device info for device '$pciid'\n" if !$info;

                if ($use_vfio) {
                    die "can't unbind/bind pci group to vfio '$pciid'\n" if !pci_dev_group_bind_to_vfio($pciid);
                } else {
                    die "can't unbind/bind to stub pci device '$pciid'\n" if !pci_dev_bind_to_stub($info);
                }

                die "can't reset pci device '$pciid'\n" if $info->{has_fl_reset} and !pci_dev_reset($info);
            }
        }

        PVE::Storage::activate_volumes($storecfg, $vollist);

        # no timeout when a state file is given, 30 seconds otherwise
        eval {
            run_command($cmd, timeout => $statefile ? undef : 30, umask => 0077);
        };
        if (my $err = $@) {
            die "start failed: $err";
        }

        print "migration listens on $migrate_uri\n" if $migrate_uri;

        if ($statefile && $statefile ne 'tcp') {
            eval { vm_mon_cmd_nocheck($vmid, "cont"); };
            warn $@ if $@;
        }

        if ($migratedfrom) {

            eval { set_migration_caps($vmid); };
            warn $@ if $@;

            if ($spice_port) {
                print "spice listens on port $spice_port\n";
                if ($spice_ticket) {
                    vm_mon_cmd_nocheck($vmid, "set_password", protocol => 'spice', password => $spice_ticket);
                    vm_mon_cmd_nocheck($vmid, "expire_password", protocol => 'spice', time => "+30");
                }
            }

        } else {

            # ballooning is set up unless explicitly disabled with 'balloon: 0'
            if (!$statefile && (!defined($conf->{balloon}) || $conf->{balloon})) {
                vm_mon_cmd_nocheck($vmid, "balloon", value => $conf->{balloon}*1024*1024)
                    if $conf->{balloon};
                vm_mon_cmd_nocheck($vmid, 'qom-set',
                                   path => "machine/peripheral/balloon0",
                                   property => "guest-stats-polling-interval",
                                   value => 2);
            }
        }
    };

    lock_config($vmid, $start_locked);
}
4019
0eedc444
AD
# Run the QMP command $execute with the named arguments %params on VM $vmid.
sub vm_mon_cmd {
    my ($vmid, $execute, %params) = @_;

    return vm_qmp_command($vmid, {
        execute => $execute,
        arguments => \%params,
    });
}
4026
# Same as vm_mon_cmd, but passes a true $nocheck flag on to vm_qmp_command.
sub vm_mon_cmd_nocheck {
    my ($vmid, $execute, %params) = @_;

    return vm_qmp_command($vmid, {
        execute => $execute,
        arguments => \%params,
    }, 1);
}
4033
# Send the command structure $cmd ({ execute => ..., arguments => {...} })
# to the monitor of VM $vmid and return the result of the QMP client.
#
# A 'timeout' entry inside the arguments is removed from $cmd and used as
# the client timeout instead of being sent to qemu. $nocheck is passed on to
# check_running(). Errors are written to syslog and re-thrown.
#
# Note: on the old (non-QMP) monitor path the command output is not
# returned; the function yields undef in that case.
sub vm_qmp_command {
    my ($vmid, $cmd, $nocheck) = @_;

    my $res;

    my $timeout;
    if ($cmd->{arguments} && $cmd->{arguments}->{timeout}) {
        $timeout = delete $cmd->{arguments}->{timeout};
    }

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);
        my $sname = qmp_socket($vmid);
        if (-e $sname) { # test if VM is reasonably new and supports qmp/qga
            my $qmpclient = PVE::QMPClient->new();

            $res = $qmpclient->cmd($vmid, $cmd, $timeout);
        } elsif (-e "${var_run_tmpdir}/$vmid.mon") {
            # 'arguments' is optional (callers may pass only 'execute'), so
            # guard the dereference - %{undef} is fatal under 'use strict'
            die "can't execute complex command on old monitor - stop/start your vm to fix the problem\n"
                if $cmd->{arguments} && scalar(%{$cmd->{arguments}});
            vm_monitor_command($vmid, $cmd->{execute}, $nocheck);
        } else {
            die "unable to open monitor socket\n";
        }
    };
    if (my $err = $@) {
        syslog("err", "VM $vmid qmp command failed - $err");
        die $err;
    }

    return $res;
}
4067
9df5cbcc
DM
# Execute the human monitor command line $cmdline on VM $vmid by wrapping it
# into the QMP 'human-monitor-command' and return the result of
# vm_qmp_command.
sub vm_human_monitor_command {
    my ($vmid, $cmdline) = @_;

    my $cmd = {
        execute => 'human-monitor-command',
        arguments => { 'command-line' => $cmdline },
    };

    return vm_qmp_command($vmid, $cmd);
}
4080
1e3baf05
DM
# Return the command line generated by config_to_command for the current
# configuration of VM $vmid, joined with single spaces.
sub vm_commandline {
    my ($storecfg, $vmid) = @_;

    my $vmconf = load_config($vmid);
    my $defaults = load_defaults();

    my $argv = config_to_command($storecfg, $vmid, $vmconf, $defaults);

    return join(' ', @$argv);
}
4092
# Send 'system_reset' to VM $vmid while holding the config lock.
# The config 'lock' setting is honoured unless $skiplock is set.
sub vm_reset {
    my ($vmid, $skiplock) = @_;

    my $reset = sub {
        my $conf = load_config($vmid);

        check_lock($conf) unless $skiplock;

        vm_mon_cmd($vmid, "system_reset");
    };

    lock_config($vmid, $reset);
}
4105
# Return an array reference with all volume IDs referenced by $conf.
# Absolute paths and values that parse_volume_id cannot resolve to a storage
# ID are left out.
sub get_vm_volumes {
    my ($conf) = @_;

    my @volumes;

    my $collect = sub {
        my ($volid, $is_cdrom) = @_;

        # absolute path, not a storage volume
        return if $volid =~ m|^/|;

        my ($sid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        push @volumes, $volid;
    };

    foreach_volid($conf, $collect);

    return \@volumes;
}
4123
# Best-effort cleanup after a VM has stopped: remove the fairsched group,
# deactivate the VM volumes (unless $keepActive is set) and delete the
# per-VM runtime files below /var/run/qemu-server. Errors only produce a
# warning.
sub vm_stop_cleanup {
    my ($storecfg, $vmid, $conf, $keepActive) = @_;

    eval {
        fairsched_rmnod($vmid); # try to destroy group

        unless ($keepActive) {
            my $volumes = get_vm_volumes($conf);
            PVE::Storage::deactivate_volumes($storecfg, $volumes);
        }

        for my $suffix (qw(mon qmp pid vnc qga)) {
            unlink "/var/run/qemu-server/${vmid}.$suffix";
        }
    };
    warn $@ if $@; # avoid errors - just warn
}
4141
e6c3b671 4142# Note: use $nocheck to skip tests if VM configuration file exists.
254575e9
DM
4143# We need that when migrating VMs to other nodes (files already moved)
4144# Note: we set $keepActive in vzdump stop mode - volumes need to stay active
# Stop VM $vmid.
#
# $skiplock     - do not call check_lock()
# $nocheck      - do not load the VM configuration (passed to check_running
#                 and vm_qmp_command); without a config no cleanup is done
# $timeout      - seconds to wait for the VM to stop; defaults to the 'down'
#                 value of the startup option on shutdown, else 60
# $shutdown     - request a guest shutdown (via agent if configured, else
#                 'system_powerdown') instead of sending 'quit'
# $force        - terminate with SIGTERM/SIGKILL if the VM does not stop;
#                 defaults to 1 when $shutdown is not set
# $keepActive   - passed to vm_stop_cleanup (volumes stay active)
# $migratedfrom - stop the target side of a migration: SIGTERM the process
#                 and clean up, without taking the config lock
#
# Whether the VM stopped in time is decided by asking check_running() again
# after the wait, not from the loop counter: a VM that exits during the last
# second of the timeout must not be reported as a timeout.
sub vm_stop {
    my ($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive, $migratedfrom) = @_;

    $force = 1 if !defined($force) && !$shutdown;

    if ($migratedfrom){
        my $pid = check_running($vmid, $nocheck, $migratedfrom);
        kill 15, $pid if $pid;
        my $conf = load_config($vmid, $migratedfrom);
        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive);
        return;
    }

    lock_config($vmid, sub {

        my $pid = check_running($vmid, $nocheck);
        return if !$pid;

        my $conf;
        if (!$nocheck) {
            $conf = load_config($vmid);
            check_lock($conf) if !$skiplock;
            if (!defined($timeout) && $shutdown && $conf->{startup}) {
                my $opts = parse_startup($conf->{startup});
                $timeout = $opts->{down} if $opts->{down};
            }
        }

        $timeout = 60 if !defined($timeout);

        # Poll once per second for up to $seconds; returns 1 if the VM is
        # still running afterwards, 0 as soon as it is gone.
        my $still_running_after = sub {
            my ($seconds) = @_;

            for (my $waited = 0; $waited < $seconds; $waited++) {
                return 0 if !check_running($vmid, $nocheck);
                sleep 1;
            }

            return check_running($vmid, $nocheck) ? 1 : 0;
        };

        eval {
            if ($shutdown) {
                if (!$nocheck && $conf->{agent}) {
                    vm_qmp_command($vmid, { execute => "guest-shutdown" }, $nocheck);
                } else {
                    vm_qmp_command($vmid, { execute => "system_powerdown" }, $nocheck);
                }
            } else {
                vm_qmp_command($vmid, { execute => "quit" }, $nocheck);
            }
        };
        my $err = $@;

        if (!$err) {
            if (!$still_running_after->($timeout)) {
                vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
                return;
            }

            if ($force) {
                warn "VM still running - terminating now with SIGTERM\n";
                kill 15, $pid;
            } else {
                die "VM quit/powerdown failed - got timeout\n";
            }
        } else {
            if ($force) {
                warn "VM quit/powerdown failed - terminating now with SIGTERM\n";
                kill 15, $pid;
            } else {
                die "VM quit/powerdown failed\n";
            }
        }

        # wait again, this time for the SIGTERM to take effect
        if ($still_running_after->(10)) {
            warn "VM still running - terminating now with SIGKILL\n";
            kill 9, $pid;
            sleep 1;
        }

        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
    });
}
4233
# Pause VM $vmid (monitor command 'stop') while holding the config lock.
# The config 'lock' setting is checked unless $skiplock is set or the lock
# is a 'backup' lock.
sub vm_suspend {
    my ($vmid, $skiplock) = @_;

    my $suspend = sub {
        my $conf = load_config($vmid);

        if (!$skiplock) {
            my $lock = $conf->{lock};
            check_lock($conf) unless $lock && $lock eq 'backup';
        }

        vm_mon_cmd($vmid, "stop");
    };

    lock_config($vmid, $suspend);
}
4246
# Resume VM $vmid (monitor command 'cont') while holding the config lock.
# The config 'lock' setting is checked unless $skiplock is set or the lock
# is a 'backup' lock.
sub vm_resume {
    my ($vmid, $skiplock) = @_;

    my $resume = sub {
        my $conf = load_config($vmid);

        if (!$skiplock) {
            my $lock = $conf->{lock};
            check_lock($conf) unless $lock && $lock eq 'backup';
        }

        vm_mon_cmd($vmid, "cont");
    };

    lock_config($vmid, $resume);
}
4259
5fdbe4f0
DM
# Send the key (combination) $key to VM $vmid while holding the config lock.
# $skiplock is accepted but not evaluated by this function.
sub vm_sendkey {
    my ($vmid, $skiplock, $key) = @_;

    my $send = sub {
        # the configuration is loaded, but its content is not used here
        my $conf = load_config($vmid);

        # there is no qmp command, so we use the human monitor command
        vm_human_monitor_command($vmid, "sendkey $key");
    };

    lock_config($vmid, $send);
}
4271
# Destroy VM $vmid while holding the config lock. Fails if the VM is still
# running; the config 'lock' setting is honoured unless $skiplock is set.
sub vm_destroy {
    my ($storecfg, $vmid, $skiplock) = @_;

    my $destroy = sub {
        my $conf = load_config($vmid);

        check_lock($conf) unless $skiplock;

        die "VM $vmid is running - destroy failed\n" if check_running($vmid);

        fairsched_rmnod($vmid); # try to destroy group
        destroy_vm($storecfg, $vmid);
    };

    lock_config($vmid, $destroy);
}
4289
1e3baf05
DM
4290# pci helpers
4291
# Write $buf to $filename (opened in "w" mode).
# Returns undef if the file cannot be opened, otherwise the result of the
# print call. The result of close() is not taken into account.
sub file_write {
    my ($filename, $buf) = @_;

    my $handle = IO::File->new($filename, "w")
        or return undef;

    my $written = print {$handle} $buf;

    $handle->close();

    return $written;
}
4304
# Collect information about the PCI device $name ("dddd:bb:ss.f", lower case
# hex) from sysfs.
#
# Returns undef if the name is malformed or if the irq, vendor or device
# attribute cannot be read in the expected format. Otherwise returns a hash
# reference with name, vendor and product (without the '0x' prefix), domain,
# bus, slot, func, irq and has_fl_reset (true if a 'reset' file exists).
sub pci_device_info {
    my ($name) = @_;

    my ($domain, $bus, $slot, $func) =
        $name =~ m/^([a-f0-9]{4}):([a-f0-9]{2}):([a-f0-9]{2})\.([a-f0-9])$/
        or return undef;

    my $sysdir = "$pcisysfs/devices/$name";

    my $irq = file_read_firstline("$sysdir/irq");
    return undef unless defined($irq) && $irq =~ m/^\d+$/;

    # the substitutions strip the '0x' prefix and fail if there is none
    my $vendor = file_read_firstline("$sysdir/vendor");
    return undef unless defined($vendor) && $vendor =~ s/^0x//;

    my $product = file_read_firstline("$sysdir/device");
    return undef unless defined($product) && $product =~ s/^0x//;

    return {
        name => $name,
        vendor => $vendor,
        product => $product,
        domain => $domain,
        bus => $bus,
        slot => $slot,
        func => $func,
        irq => $irq,
        has_fl_reset => (-f "$sysdir/reset") || 0,
    };
}
4336
# Write "1" to the sysfs 'reset' file of the device described by $dev
# (hash reference as returned by pci_device_info). Returns the result of
# file_write.
sub pci_dev_reset {
    my ($dev) = @_;

    my $reset_file = "$pcisysfs/devices/$dev->{name}/reset";

    return file_write($reset_file, "1");
}
4346
# Bind the device described by $dev (see pci_device_info) to the pci-stub
# driver. Returns 1 if it is already bound, undef if one of the required
# sysfs writes fails, otherwise whether the device shows up below the
# pci-stub driver directory afterwards.
sub pci_dev_bind_to_stub {
    my ($dev) = @_;

    my $name = $dev->{name};
    my $stubdir = "$pcisysfs/drivers/pci-stub";
    my $bound = "$stubdir/$name";

    return 1 if -d $bound;

    # register the vendor/product pair with the stub driver
    file_write("$stubdir/new_id", "$dev->{vendor} $dev->{product}")
        or return undef;

    # detach from the current driver; a failed write is only an error if the
    # unbind file exists
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    if (!-d $bound) {
        file_write("$stubdir/bind", $name) or return undef;
    }

    return -d $bound;
}
4370
000fc0a2
SP
# Bind the device described by $dev (see pci_device_info) to the vfio-pci
# driver, loading the module via modprobe if its sysfs directory is missing.
# Dies if the driver directory is still missing afterwards. Returns 1 if the
# device is already bound, undef if one of the required sysfs writes fails,
# otherwise whether the device shows up below the vfio-pci driver directory.
sub pci_dev_bind_to_vfio {
    my ($dev) = @_;

    my $name = $dev->{name};
    my $driverdir = "$pcisysfs/drivers/vfio-pci";

    system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null") unless -d $driverdir;
    die "Cannot find vfio-pci module!\n" unless -d $driverdir;

    my $bound = "$driverdir/$name";
    return 1 if -d $bound;

    # register the vendor/product pair with vfio-pci
    file_write("$driverdir/new_id", "$dev->{vendor} $dev->{product}")
        or return undef;

    # detach from the current driver; a failed write is only an error if the
    # unbind file exists
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    if (!-d $bound) {
        file_write("$driverdir/bind", $name) or return undef;
    }

    return -d $bound;
}
4401
# Bind every device of the IOMMU group of PCI device $pciid ("bb:ss.f",
# without domain) to vfio-pci. Returns 1 on success and dies on any error.
#
# A group member for which pci_device_info() returns nothing is treated as
# an error: handing undef to pci_dev_bind_to_vfio() would make it test the
# driver directory itself and report success without binding anything.
sub pci_dev_group_bind_to_vfio {
    my ($pciid) = @_;

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    if (!-d $vfio_basedir) {
        system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null");
    }
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    # get IOMMU group devices
    my $groupdir = "$pcisysfs/devices/0000:$pciid/iommu_group/devices/";
    opendir(my $D, $groupdir) || die "Cannot open iommu_group: $!\n";
    my @devs = grep /^0000:/, readdir($D);
    closedir($D);

    foreach my $devid (@devs) {
        # pass the captured value on instead of the raw directory entry
        $devid =~ m/^([:\.\da-f]+)$/ or die "PCI ID $devid not valid!\n";
        my $info = pci_device_info($1);
        die "no pci device info for device '$devid'\n" if !$info;
        pci_dev_bind_to_vfio($info) || die "Cannot bind $devid to vfio\n";
    }

    return 1;
}
4425
# Return the ",bus=pci.N,addr=0xNN" suffix for the device with the given $id,
# or an empty string if no fixed slot is assigned to that id.
# If $bridges (hash reference) is passed, the bus number in use is recorded
# there as key.
sub print_pci_addr {
    my ($id, $bridges) = @_;

    # id => [ bus, addr ]
    # On bus 0, addr 2 is the first videocard and addr 29 is usb-host
    # (pve-usb.cfg).
    my %slot_of = (
        piix3    => [0, 1],
        balloon0 => [0, 3],
        watchdog => [0, 4],
        scsihw0  => [0, 5],
        scsihw1  => [0, 6],
        ahci0    => [0, 7],
        qga0     => [0, 8],
        spice    => [0, 9],
        hostpci0 => [0, 16],
        hostpci1 => [0, 17],
        vga1     => [0, 24],
        vga2     => [0, 25],
        vga3     => [0, 26],
        hostpci2 => [0, 27],
        hostpci3 => [0, 28],
        'pci.1'  => [0, 30],
        'pci.2'  => [0, 31],
    );

    # virtio0-5 and net0-5 sit on bus 0; the remaining ones are numbered
    # from addr 1 on pci.2 (virtio) and pci.1 (net)
    $slot_of{"virtio$_"} = [0, 10 + $_] for 0 .. 5;
    $slot_of{"net$_"} = [0, 18 + $_] for 0 .. 5;
    $slot_of{"net$_"} = [1, $_ - 5] for 6 .. 31;
    $slot_of{"virtio$_"} = [2, $_ - 5] for 6 .. 15;

    my $slot = $slot_of{$id};
    return '' if !$slot;

    my ($bus, $addr) = @$slot;
    $bridges->{$bus} = 1 if $bridges;

    return sprintf(",bus=pci.%s,addr=0x%x", $bus, $addr);
}
4509
2e3b7e2a
AD
# Return the ",bus=ich9-pcie-port-N,addr=0x0" suffix for hostpci0..hostpci3,
# or an empty string for any other $id.
sub print_pcie_addr {
    my ($id) = @_;

    # hostpciN is attached to ich9-pcie-port-(N+1), always at addr 0
    my %port_of = map { ("hostpci$_" => 'ich9-pcie-port-' . ($_ + 1)) } 0 .. 3;

    my $bus = $port_of{$id};
    return '' if !defined($bus);

    return sprintf(",bus=%s,addr=0x%x", $bus, 0);
}
4529
3e16d5fc
DM
4530# vzdump restore implementation
4531
# Return the name of the first member of the tar archive $archive.
# Dies if the file does not exist, tar cannot be started or the listing is
# empty.
#
# tar is started with the list form of open, so the archive name is passed
# as a single argument and never interpreted by a shell.
sub tar_archive_read_firstfile {
    my $archive = shift;

    die "ERROR: file '$archive' does not exist\n" if ! -f $archive;

    # try to detect archive type first
    my $pid = open(my $fh, '-|', 'tar', 'tf', $archive) ||
        die "unable to open file '$archive'\n";
    my $firstfile = <$fh>;
    # only the first line is needed - stop tar instead of reading everything
    kill 15, $pid;
    close $fh;

    die "ERROR: archive contaions no data\n" if !$firstfile;
    chomp $firstfile;

    return $firstfile;
}
4549
ed221350
DM
# Remove the temporary volumes recorded in $statfile after a failed restore.
#
# Every line containing "vzdump:<dev>:<volid>" names one volume: absolute
# paths are unlinked, everything else is freed with vdisk_free. Progress
# and errors are reported on STDERR; an error for one volume does not stop
# the cleanup of the others. Nothing happens if $statfile cannot be opened.
sub tar_restore_cleanup {
    my ($storecfg, $statfile) = @_;

    print STDERR "starting cleanup\n";

    if (my $fd = IO::File->new($statfile, "r")) {
        while (defined(my $line = <$fd>)) {
            if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                my $volid = $2;
                eval {
                    if ($volid =~ m|^/|) {
                        # 'or' (not '||') so that the die belongs to unlink
                        unlink($volid) or die "unlink failed\n";
                    } else {
                        PVE::Storage::vdisk_free($storecfg, $volid);
                    }
                    print STDERR "temporary volume '$volid' sucessfuly removed\n";
                };
                print STDERR "unable to cleanup '$volid' - $@" if $@;
            } else {
                print STDERR "unable to parse line in statfile - $line";
            }
        }
        $fd->close();
    }
}
4575
# Restore VM $vmid from $archive.
#
# The archive format ('tar' or 'vma') is taken from $opts->{format} if set,
# otherwise it is derived from the file name; unknown names default to
# 'vma'. The compression ('gzip' or 'lzop') always follows from the file
# name. tar archives are passed to restore_tar_archive, everything else to
# restore_vma_archive.
sub restore_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    # [ file name pattern, format, compression ] - first match wins
    my @archive_types = (
        [ qr/\.tgz$/,      'tar', 'gzip' ],
        [ qr/\.tar\.gz$/,  'tar', 'gzip' ],
        [ qr/\.tar$/,      'tar', undef ],
        [ qr/\.tar\.lzo$/, 'tar', 'lzop' ],
        [ qr/\.vma$/,      'vma', undef ],
        [ qr/\.vma\.gz$/,  'vma', 'gzip' ],
        [ qr/\.vma\.lzo$/, 'vma', 'lzop' ],
    );

    my ($detected, $comp) = ('vma', undef); # default
    foreach my $type (@archive_types) {
        my ($pattern, $fmt, $compression) = @$type;
        next if $archive !~ $pattern;
        ($detected, $comp) = ($fmt, $compression);
        last;
    }

    # an explicitly requested format overrides the detected one
    my $format = $opts->{format} || $detected;

    if ($format eq 'tar') {
        return restore_tar_archive($archive, $vmid, $user, $opts);
    } else {
        return restore_vma_archive($archive, $vmid, $user, $opts, $comp);
    }
}
4609
# Write the config line $line of a backup to $outfd, adapted for the
# restored VM.
#
# - #qmdump#/#vzdump# markers and lock, unusedN, parent and template
#   settings are dropped
# - old style 'vlanN' lines are converted to 'netN' entries, numbered by
#   $cookie->{netcount}
# - with $unique set, an existing MAC address of a 'netN' line is replaced
#   by a random one
# - drive lines with 'backup=no' are commented out; drives listed in $map
#   get the mapped volume and lose their 'format' setting
# - everything else is copied unchanged
sub restore_update_config_line {
    my ($outfd, $cookie, $vmid, $map, $line, $unique) = @_;

    # 'template' is dropped because a restored VM is never a template
    return if $line =~ m/^(?:\#qmdump\#|\#vzdump\#|lock:|unused\d+:|parent:|template:)/;

    if ($line =~ m/^(vlan(\d+)):\s*(\S+)\s*$/) {
        # try to convert old 1.X settings
        my ($bridge_index, $ethcfg) = ($2, $3);
        foreach my $devconfig (PVE::Tools::split_list($ethcfg)) {
            my ($model, $macaddr) = split(/\=/, $devconfig);
            $macaddr = PVE::Tools::random_ether_addr() if !$macaddr || $unique;
            my $netstr = print_net({
                model => $model,
                bridge => "vmbr$bridge_index",
                macaddr => $macaddr,
            });

            print $outfd "net$cookie->{netcount}: $netstr\n";
            $cookie->{netcount}++;
        }
    } elsif (($line =~ m/^(net\d+):\s*(\S+)\s*$/) && $unique) {
        my ($netid, $netcfg) = ($1, $2);
        my $net = parse_net($netcfg);
        $net->{macaddr} = PVE::Tools::random_ether_addr() if $net->{macaddr};
        my $netstr = print_net($net);
        print $outfd "$netid: $netstr\n";
    } elsif ($line =~ m/^((ide|scsi|virtio|sata)\d+):\s*(\S+)\s*$/) {
        my ($virtdev, $value) = ($1, $3);
        if ($line =~ m/backup=no/) {
            print $outfd "#$line";
        } elsif ($virtdev && $map->{$virtdev}) {
            my $drive = parse_drive($virtdev, $value);
            delete $drive->{format}; # format can change on restore
            $drive->{file} = $map->{$virtdev};
            $value = print_drive($vmid, $drive);
            print $outfd "$virtdev: $value\n";
        } else {
            print $outfd $line;
        }
    } else {
        print $outfd $line;
    }
}
4660
# List the volumes reported by PVE::Storage::vdisk_list for $vmid and return
# them as a hash reference keyed by volume ID. Entries without volid or size
# are skipped; every returned entry is extended with its 'path'.
sub scan_volids {
    my ($cfg, $vmid) = @_;

    my $info = PVE::Storage::vdisk_list($cfg, undef, $vmid);

    my %item_of;
    foreach my $items (values %$info) {
        foreach my $item (@$items) {
            my $volid = $item->{volid};
            next unless $volid && $item->{size};
            $item->{path} = PVE::Storage::path($cfg, $volid);
            $item_of{$volid} = $item;
        }
    }

    return \%item_of;
}
4677
a8e2f942
DM
# Return a hash reference counting, per file system path, how often a path
# is referenced by the (non-cdrom) drives of $conf.
#
# $skip_drive names a drive that is ignored in the current configuration
# only. With $scan_snapshots set, the drives of all snapshots are counted
# as well.
sub get_used_paths {
    my ($vmid, $storecfg, $conf, $scan_snapshots, $skip_drive) = @_;

    my %refcount;

    my $count_drives = sub {
        my ($cref, $snapname) = @_;

        foreach my $key (keys %$cref) {
            next if !valid_drivename($key);
            next if $skip_drive && $key eq $skip_drive;

            my $drive = parse_drive($key, $cref->{$key});
            next if !$drive || !$drive->{file} || drive_is_cdrom($drive);

            my $file = $drive->{file};
            if ($file =~ m!^/!) {
                # absolute path, used as is
                $refcount{$file}++;
                next;
            }

            my ($storeid, $volname) = PVE::Storage::parse_volume_id($file, 1);
            next if !$storeid;
            my $scfg = PVE::Storage::storage_config($storecfg, $storeid, 1);
            next if !$scfg;
            my $path = PVE::Storage::path($storecfg, $file, $snapname);
            $refcount{$path}++;
        }
    };

    $count_drives->($conf);

    # the skipped drive only applies to the current config, not to snapshots
    $skip_drive = undef;

    if ($scan_snapshots) {
        foreach my $snapname (keys %{$conf->{snapshots}}) {
            $count_drives->($conf->{snapshots}->{$snapname}, $snapname);
        }
    }

    return \%refcount;
}
4718
91bd6c90
DM
# Synchronize the drive entries of $conf with the volumes found on the
# storages ($volid_hash as returned by scan_volids).
#
# - the 'size' of every non-cdrom drive with a known volume is refreshed
# - 'unusedN' entries whose volume (or its path) is used by a drive are
#   removed
# - volumes that are referenced nowhere are added as unused volumes; VM
#   state volumes ('vm-<vmid>-state-') are left out
#
# $conf is modified in place. Returns 1 if anything changed, else undef.
sub update_disksize {
    my ($vmid, $conf, $volid_hash) = @_;

    my $changes;

    my $used = {};

    # Note: it is allowed to define multiple storages with same path (alias), so
    # we need to check both 'volid' and real 'path' (two different volid can point
    # to the same path).

    my $usedpath = {};

    # update size info
    foreach my $opt (keys %$conf) {
        next if !valid_drivename($opt);

        my $drive = parse_drive($opt, $conf->{$opt});
        my $volid = $drive->{file};
        next if !$volid;

        $used->{$volid} = 1;
        if ($volid_hash->{$volid} &&
            (my $path = $volid_hash->{$volid}->{path})) {
            $usedpath->{$path} = 1;
        }

        next if drive_is_cdrom($drive);
        next if !$volid_hash->{$volid};

        $drive->{size} = $volid_hash->{$volid}->{size};
        my $new = print_drive($vmid, $drive);
        if ($new ne $conf->{$opt}) {
            $changes = 1;
            $conf->{$opt} = $new;
        }
    }

    # remove 'unusedX' entry if volume is used
    foreach my $opt (keys %$conf) {
        next if $opt !~ m/^unused\d+$/;
        my $volid = $conf->{$opt};
        # no 'my ... if ...' here: a conditionally executed 'my' has undefined
        # behaviour and may keep the value of the previous iteration
        my $path = $volid_hash->{$volid} ? $volid_hash->{$volid}->{path} : undef;
        if ($used->{$volid} || ($path && $usedpath->{$path})) {
            $changes = 1;
            delete $conf->{$opt};
        }
    }

    foreach my $volid (sort keys %$volid_hash) {
        next if $volid =~ m/vm-$vmid-state-/;
        next if $used->{$volid};
        my $path = $volid_hash->{$volid}->{path};
        next if !$path; # just to be sure
        next if $usedpath->{$path};
        $changes = 1;
        add_unused_volume($conf, $volid);
        $usedpath->{$path} = 1; # avoid to add more than once (aliases)
    }

    return $changes;
}
4781
# Rescan the storages and update disk sizes and unused volumes in the
# configuration of VM $vmid, or of all VMs from config_list() if $vmid is
# undefined. With $nolock set, the update runs without lock_config.
sub rescan {
    my ($vmid, $nolock) = @_;

    my $cfg = PVE::Cluster::cfs_read_file("storage.cfg");

    my $volid_hash = scan_volids($cfg, $vmid);

    my $updatefn = sub {
        my ($vmid) = @_;

        my $conf = load_config($vmid);

        check_lock($conf);

        # only look at the volumes owned by this VM
        my $vm_volids = {};
        foreach my $volid (keys %$volid_hash) {
            my $info = $volid_hash->{$volid};
            next unless $info->{vmid} && $info->{vmid} == $vmid;
            $vm_volids->{$volid} = $info;
        }

        my $changes = update_disksize($vmid, $conf, $vm_volids);

        update_config_nolock($vmid, $conf, 1) if $changes;
    };

    # run the update for one VM, with or without taking the config lock
    my $update_vm = sub {
        my ($id) = @_;

        return $nolock ? $updatefn->($id) : lock_config($id, $updatefn, $id);
    };

    if (defined($vmid)) {
        $update_vm->($vmid);
    } else {
        my $vmlist = config_list();
        foreach my $id (keys %$vmlist) {
            $update_vm->($id);
        }
    }
}
4824
# Restore a VM from a 'vma' backup archive.
#
# Parameters:
#   $archive - path of the archive, or '-' to read it from STDIN
#   $vmid    - ID of the VM that gets (re)created
#   $user    - user doing the restore; for everybody except 'root@pam' the
#              'Datastore.AllocateSpace' privilege is checked per storage
#   $opts    - hash ref; the keys read here are 'storage' and 'unique'
#   $comp    - optional archive compression, 'gzip' or 'lzop'
#
# The archive is unpacked by an external 'vma extract' process. Once that
# process has printed the device list and extracted the config, the volumes
# are allocated and the device-name => path mapping is sent to it through
# a fifo. Dies on error, after freeing the volumes allocated so far.
sub restore_vma_archive {
    my ($archive, $vmid, $user, $opts, $comp) = @_;

    my $input = $archive eq '-' ? "<&STDIN" : undef;
    my $readfrom = $archive;

    my $uncomp = '';
    if ($comp) {
        $readfrom = '-';
        my $qarchive = PVE::Tools::shellquote($archive);
        if ($comp eq 'gzip') {
            $uncomp = "zcat $qarchive|";
        } elsif ($comp eq 'lzop') {
            $uncomp = "lzop -d -c $qarchive|";
        } else {
            die "unknown compression method '$comp'\n";
        }
    }

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    rmtree $tmpdir;

    # disable interrupts (always do cleanups)
    # every handler is localised on its own, so all of them are restored
    # when this sub returns
    local $SIG{INT} =
        local $SIG{TERM} =
        local $SIG{QUIT} =
        local $SIG{HUP} = sub { warn "got interrupt - ignored\n"; };

    my $mapfifo = "/var/tmp/vzdumptmp$$.fifo";
    POSIX::mkfifo($mapfifo, 0600);
    my $fifofh;

    # runs as 'afterfork' hook of run_command, i.e. once the reader exists
    my $openfifo = sub {
        open($fifofh, '>', $mapfifo) || die $!;
    };

    my $cmd = "${uncomp}vma extract -v -r $mapfifo $readfrom $tmpdir";

    my $oldtimeout;
    my $timeout = 5;

    # devname => { size, dev_id, ... }, filled from the 'DEV:' output lines
    my $devinfo = {};

    my $rpcenv = PVE::RPCEnvironment::get();

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # Note: $oldconf is undef if VM does not exists
    my $oldconf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid));

    # Allocates the target volumes, tells 'vma' where to write each device
    # and writes the adapted VM config to $tmpfn.
    my $print_devmap = sub {
        my $virtdev_hash = {};

        my $cfgfn = "$tmpdir/qemu-server.conf";

        # we can read the config - that is already extracted
        my $fh = IO::File->new($cfgfn, "r") ||
            die "unable to read qemu-server.conf - $!\n";

        while (defined(my $line = <$fh>)) {
            if ($line =~ m/^\#qmdump\#map:(\S+):(\S+):(\S*):(\S*):$/) {
                my ($virtdev, $devname, $storeid, $format) = ($1, $2, $3, $4);
                die "archive does not contain data for drive '$virtdev'\n"
                    if !$devinfo->{$devname};
                if (defined($opts->{storage})) {
                    $storeid = $opts->{storage} || 'local';
                } elsif (!$storeid) {
                    $storeid = 'local';
                }
                $format = 'raw' if !$format;
                $devinfo->{$devname}->{devname} = $devname;
                $devinfo->{$devname}->{virtdev} = $virtdev;
                $devinfo->{$devname}->{format} = $format;
                $devinfo->{$devname}->{storeid} = $storeid;

                # check permission on storage
                # todo: do we need $opts->{pool} here?
                if ($user ne 'root@pam') {
                    $rpcenv->check($user, "/storage/$storeid", ['Datastore.AllocateSpace']);
                }

                $virtdev_hash->{$virtdev} = $devinfo->{$devname};
            }
        }

        foreach my $devname (keys %$devinfo) {
            die "found no device mapping information for device '$devname'\n"
                if !$devinfo->{$devname}->{virtdev};
        }

        my $cfg = cfs_read_file('storage.cfg');

        # create empty/temp config
        if ($oldconf) {
            PVE::Tools::file_set_contents($conffile, "memory: 128\n");
            foreach_drive($oldconf, sub {
                my ($ds, $drive) = @_;

                return if drive_is_cdrom($drive);

                my $volid = $drive->{file};

                return if !$volid || $volid =~ m|^/|;

                my ($path, $owner) = PVE::Storage::path($cfg, $volid);
                return if !$path || !$owner || ($owner != $vmid);

                # Note: only delete disk we want to restore
                # other volumes will become unused
                if ($virtdev_hash->{$ds}) {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
            });
        }

        my $map = {};
        foreach my $virtdev (sort keys %$virtdev_hash) {
            my $d = $virtdev_hash->{$virtdev};
            my $alloc_size = int(($d->{size} + 1024 - 1)/1024);
            my $scfg = PVE::Storage::storage_config($cfg, $d->{storeid});

            # test if requested format is supported
            my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($cfg, $d->{storeid});
            my $supported = grep { $_ eq $d->{format} } @$validFormats;
            $d->{format} = $defFormat if !$supported;

            my $volid = PVE::Storage::vdisk_alloc($cfg, $d->{storeid}, $vmid,
                                                  $d->{format}, undef, $alloc_size);
            print STDERR "new volume ID is '$volid'\n";
            # $d is the same hash as $devinfo->{...}, so the error cleanup
            # further down finds the volume through $devinfo
            $d->{volid} = $volid;
            my $path = PVE::Storage::path($cfg, $volid);

            my $write_zeros = 1;
            # fixme: what other storages types initialize volumes with zero?
            if ($scfg->{type} eq 'dir' || $scfg->{type} eq 'nfs' || $scfg->{type} eq 'glusterfs' ||
                $scfg->{type} eq 'sheepdog' || $scfg->{type} eq 'rbd') {
                $write_zeros = 0;
            }

            print $fifofh "${write_zeros}:$d->{devname}=$path\n";

            print "map '$d->{devname}' to '$path' (write zeros = ${write_zeros})\n";
            $map->{$virtdev} = $volid;
        }

        $fh->seek(0, 0) || die "seek failed - $!\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined(my $line = <$fh>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $fh->close();
        $outfd->close();
    };

    eval {
        # enable interrupts
        local $SIG{INT} =
            local $SIG{TERM} =
            local $SIG{QUIT} =
            local $SIG{HUP} =
            local $SIG{PIPE} = sub { die "interrupted by signal\n"; };
        local $SIG{ALRM} = sub { die "got timeout\n"; };

        $oldtimeout = alarm($timeout);

        my $parser = sub {
            my $line = shift;

            print "$line\n";

            if ($line =~ m/^DEV:\sdev_id=(\d+)\ssize:\s(\d+)\sdevname:\s(\S+)$/) {
                my ($dev_id, $size, $devname) = ($1, $2, $3);
                $devinfo->{$devname} = { size => $size, dev_id => $dev_id };
            } elsif ($line =~ m/^CTIME: /) {
                # we correctly received the vma config, so we can disable
                # the timeout now for disk allocation (set to 10 minutes, so
                # that we always timeout if something goes wrong)
                alarm(600);
                $print_devmap->();
                print $fifofh "done\n";
                my $tmp = $oldtimeout || 0;
                $oldtimeout = undef;
                alarm($tmp);
                close($fifofh);
            }
        };

        print "restore vma archive: $cmd\n";
        run_command($cmd, input => $input, outfunc => $parser, afterfork => $openfifo);
    };
    my $err = $@;

    alarm($oldtimeout) if $oldtimeout;

    unlink $mapfifo;

    if ($err) {
        rmtree $tmpdir;
        unlink $tmpfn;

        my $cfg = cfs_read_file('storage.cfg');
        foreach my $devname (keys %$devinfo) {
            my $volid = $devinfo->{$devname}->{volid};
            next if !$volid;
            eval {
                if ($volid =~ m|^/|) {
                    # parentheses are required: 'unlink $volid || die'
                    # would never evaluate the die
                    unlink($volid) || die "unlink failed\n";
                } else {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
                print STDERR "temporary volume '$volid' sucessfuly removed\n";
            };
            print STDERR "unable to cleanup '$volid' - $@" if $@;
        }
        die $err;
    }

    rmtree $tmpdir;

    rename($tmpfn, $conffile) ||
        die "unable to commit configuration file '$conffile'\n";

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
5056
# Restore a VM from a (legacy) tar based vzdump archive.
#
# Parameters:
#   $archive - path of the archive, or '-' to read it from STDIN
#   $vmid    - ID of the VM that gets (re)created
#   $user    - exported to the extract helper as VZDUMP_USER
#   $opts    - hash ref; the keys read here are 'storage', 'pool',
#              'prealloc', 'info' and 'unique'
#
# The archive members are piped through tar into the 'qmextract' helper,
# which records the new volumes in "$tmpdir/qmrestore.stat". That mapping is
# used to rewrite the archived config. Dies on error, after cleaning up.
sub restore_tar_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    if ($archive ne '-') {
        my $firstfile = tar_archive_read_firstfile($archive);
        die "ERROR: file '$archive' does not look like a QemuServer vzdump backup\n"
            if $firstfile ne 'qemu-server.conf';
    }

    my $storecfg = cfs_read_file('storage.cfg');

    # destroy existing data - keep empty config
    my $vmcfgfn = config_file($vmid);
    destroy_vm($storecfg, $vmid, 1) if -f $vmcfgfn;

    my $tocmd = "/usr/lib/qemu-server/qmextract";

    $tocmd .= " --storage " . PVE::Tools::shellquote($opts->{storage}) if $opts->{storage};
    $tocmd .= " --pool " . PVE::Tools::shellquote($opts->{pool}) if $opts->{pool};
    $tocmd .= ' --prealloc' if $opts->{prealloc};
    $tocmd .= ' --info' if $opts->{info};

    # tar option "xf" does not autodetect compression when read from STDIN,
    # so we pipe to zcat
    my $cmd = "zcat -f|tar xf " . PVE::Tools::shellquote($archive) . " " .
        PVE::Tools::shellquote("--to-command=$tocmd");

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    mkpath $tmpdir;

    local $ENV{VZDUMP_TMPDIR} = $tmpdir;
    local $ENV{VZDUMP_VMID} = $vmid;
    local $ENV{VZDUMP_USER} = $user;

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # disable interrupts (always do cleanups)
    # every handler is localised on its own, so all of them are restored
    # when this sub returns
    local $SIG{INT} =
        local $SIG{TERM} =
        local $SIG{QUIT} =
        local $SIG{HUP} = sub { print STDERR "got interrupt - ignored\n"; };

    eval {
        # enable interrupts
        local $SIG{INT} =
            local $SIG{TERM} =
            local $SIG{QUIT} =
            local $SIG{HUP} =
            local $SIG{PIPE} = sub { die "interrupted by signal\n"; };

        if ($archive eq '-') {
            print "extracting archive from STDIN\n";
            run_command($cmd, input => "<&STDIN");
        } else {
            print "extracting archive '$archive'\n";
            run_command($cmd);
        }

        # leaves the eval only - no config is written in 'info' mode
        return if $opts->{info};

        # read new mapping
        my $map = {};
        my $statfile = "$tmpdir/qmrestore.stat";
        if (my $fd = IO::File->new($statfile, "r")) {
            while (defined (my $line = <$fd>)) {
                if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                    $map->{$1} = $2 if $1;
                } else {
                    print STDERR "unable to parse line in statfile - $line\n";
                }
            }
            $fd->close();
        }

        my $confsrc = "$tmpdir/qemu-server.conf";

        my $srcfd = IO::File->new($confsrc, "r") ||
            die "unable to open file '$confsrc'\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined (my $line = <$srcfd>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $srcfd->close();
        $outfd->close();
    };
    my $err = $@;

    if ($err) {

        unlink $tmpfn;

        tar_restore_cleanup($storecfg, "$tmpdir/qmrestore.stat") if !$opts->{info};

        # the stat file is no longer needed, do not leak the directory
        rmtree $tmpdir;

        die $err;
    }

    rmtree $tmpdir;

    # 'info' mode wrote no $tmpfn, so there is nothing to commit.
    # The parentheses matter: 'rename $a, $b || die' never evaluates the die.
    if (!$opts->{info}) {
        rename($tmpfn, $conffile) ||
            die "unable to commit configuration file '$conffile'\n";
    }

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
5166
0d18dcfc
DM
5167
5168# Internal snapshots
5169
# NOTE: Snapshot create/delete involves several non-atomic
# actions, and can take a long time.
# So we try to avoid locking the file for the whole operation and use
# the 'lock' setting inside the config file instead.
5174
ef59d1ca
DM
# Copy all settings from $source to $dest, except snapshot bookkeeping
# ('snapshots', 'snapstate', 'snaptime', 'vmstate'), 'lock', 'digest',
# 'description' and the 'unusedN' entries. $dest is modified in place.
my $snapshot_copy_config = sub {
    my ($source, $dest) = @_;

    my %skip = map { $_ => 1 }
        qw(snapshots snapstate snaptime vmstate lock digest description);

    for my $key (keys %$source) {
        next if $skip{$key} || $key =~ m/^unused\d+$/;

        $dest->{$key} = $source->{$key};
    }
};
5191
# Build the config that results from applying snapshot $snap on top of
# $conf: the snapshot list, the description and the 'unusedN' entries come
# from $conf, everything else from $snap (via $snapshot_copy_config).
# Returns a new hash ref; $conf itself is not modified.
my $snapshot_apply_config = sub {
    my ($conf, $snap) = @_;

    # copy snapshot list
    my $newconf = { snapshots => $conf->{snapshots} };

    # keep description and list of unused disks
    my @kept = grep { $_ eq 'description' || m/^unused\d+$/ } keys %$conf;
    foreach my $key (@kept) {
        $newconf->{$key} = $conf->{$key};
    }

    $snapshot_copy_config->($snap, $newconf);

    return $newconf;
};
5210
18bfb361
DM
# Call $func->($storeid) once for every storage that holds a non-cdrom
# drive of $conf. Storages are visited in sorted order; drives whose volume
# ID has no storage part are ignored.
sub foreach_writable_storage {
    my ($conf, $func) = @_;

    my %seen;

    for my $key (keys %$conf) {
        next unless valid_drivename($key);

        my $drive = parse_drive($key, $conf->{$key});
        next if !$drive || drive_is_cdrom($drive);

        my ($sid) = PVE::Storage::parse_volume_id($drive->{file}, 1);
        $seen{$sid} = 1 if $sid;
    }

    for my $sid (sort keys %seen) {
        $func->($sid);
    }
}
5233
# Allocate the volume that stores the saved VM state of snapshot $snapname
# and return its volume ID.
#
# The target storage is picked from the storages the VM already uses:
# shared storages are tried first, then non-shared ones, falling back to
# 'local'. Within each group a storage with a 'path' (file based) wins.
my $alloc_vmstate_volid = sub {
    my ($storecfg, $vmid, $conf, $snapname) = @_;

    my $target;

    # scan the VM's storages, looking only at shared or only at
    # non-shared ones depending on $want_shared
    my $search = sub {
        my ($want_shared) = @_;

        foreach_writable_storage($conf, sub {
            my ($sid) = @_;
            my $scfg = PVE::Storage::storage_config($storecfg, $sid);
            return if $want_shared ? !$scfg->{shared} : $scfg->{shared};

            $target = $sid if !$target || $scfg->{path}; # prefer file based storage
        });
    };

    $search->(1);
    $search->(0) if !$target;
    $target ||= 'local';

    # extra room for the driver state, in the same unit as $conf->{memory}
    # (presumably MB - the sum is multiplied by 1024 for vdisk_alloc)
    my $driver_state_size = 500;
    # we abort live save after $conf->{memory}, so we need at max twice that space
    my $size = $conf->{memory}*2 + $driver_state_size;

    my $scfg = PVE::Storage::storage_config($storecfg, $target);
    my $name = "vm-$vmid-state-$snapname";
    $name .= ".raw" if $scfg->{path}; # add filename extension for file base storage

    return PVE::Storage::vdisk_alloc($storecfg, $target, $vmid, 'raw', $name, $size*1024);
};
5274
# First phase of snapshot creation: under the config file lock, set the
# 'snapshot' lock and add a snapshot entry in state 'prepare' that holds a
# copy of the current settings. When $save_vmstate is set and the VM runs,
# a state volume is allocated as well. Returns the new snapshot entry.
my $snapshot_prepare = sub {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap;

    my $updatefn = sub {
        my $conf = load_config($vmid);

        if (is_template($conf)) {
            die "you can't take a snapshot if it's a template\n";
        }

        check_lock($conf);

        $conf->{lock} = 'snapshot';

        if (defined($conf->{snapshots}->{$snapname})) {
            die "snapshot name '$snapname' already used\n";
        }

        my $storecfg = PVE::Storage::config();
        has_feature('snapshot', $conf, $storecfg)
            || die "snapshot feature is not available";

        $snap = $conf->{snapshots}->{$snapname} = {};

        if ($save_vmstate && check_running($vmid)) {
            $snap->{vmstate} = $alloc_vmstate_volid->($storecfg, $vmid, $conf, $snapname);
        }

        $snapshot_copy_config->($conf, $snap);

        $snap->{snapstate} = "prepare";
        $snap->{snaptime} = time();
        $snap->{description} = $comment if $comment;

        # always overwrite machine if we save vmstate. This makes sure we
        # can restore it later using correct machine type
        if ($snap->{vmstate}) {
            $snap->{machine} = get_current_qemu_machine($vmid);
        }

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $updatefn);

    return $snap;
};
5320
# Final phase of snapshot creation: under the config file lock, verify the
# 'snapshot' lock and the 'prepare' state, clear both, and make the
# snapshot the parent of the current config.
my $snapshot_commit = sub {
    my ($vmid, $snapname) = @_;

    my $updatefn = sub {
        my $conf = load_config($vmid);

        my $lock = $conf->{lock};
        die "missing snapshot lock\n"
            unless $lock && $lock eq 'snapshot';

        # remember whether 'machine' was set explicitly before the
        # snapshot settings are applied
        my $has_machine_config = defined($conf->{machine});

        my $snap = $conf->{snapshots}->{$snapname};
        die "snapshot '$snapname' does not exist\n" unless defined($snap);

        my $state = $snap->{snapstate};
        die "wrong snapshot state\n"
            unless $state && $state eq "prepare";

        delete $snap->{snapstate};
        delete $conf->{lock};

        my $newconf = $snapshot_apply_config->($conf, $snap);

        delete $newconf->{machine} unless $has_machine_config;

        $newconf->{parent} = $snapname;

        update_config_nolock($vmid, $newconf, 1);
    };

    lock_config($vmid, $updatefn);
};
5354
22c377f0
DM
# Roll VM $vmid back to snapshot $snapname.
#
# Works in three steps: (1) under the config lock, stop the VM and set the
# 'rollback' lock; (2) roll back every non-cdrom volume of the snapshot;
# (3) under the config lock again, replace the current settings with the
# snapshot's and, if the snapshot has a saved state, start the VM from it.
sub snapshot_rollback {
    my ($vmid, $snapname) = @_;

    my $snap;

    # the same update function runs twice; this flag selects the phase
    my $prepare = 1;

    my $storecfg = PVE::Storage::config();

    my $updatefn = sub {
        my $conf = load_config($vmid);

        die "you can't rollback if vm is a template\n" if is_template($conf);

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        die "unable to rollback to incomplete snapshot (snapstate = $snap->{snapstate})\n"
            if $snap->{snapstate};

        if ($prepare) {
            check_lock($conf);
            vm_stop($storecfg, $vmid, undef, undef, 5, undef, undef);
        }

        die "unable to rollback vm $vmid: vm is running\n"
            if check_running($vmid);

        my $forcemachine;

        if ($prepare) {
            $conf->{lock} = 'rollback';
        } else {
            die "got wrong lock\n" if !($conf->{lock} && $conf->{lock} eq 'rollback');
            delete $conf->{lock};

            my $has_machine_config = defined($conf->{machine});

            # copy snapshot config to current config
            $conf = $snapshot_apply_config->($conf, $snap);
            $conf->{parent} = $snapname;

            # Note: old code did not store 'machine', so we try to be smart
            # and guess the snapshot was generated with kvm 1.4 (pc-i440fx-1.4).
            $forcemachine = $conf->{machine} || 'pc-i440fx-1.4';
            # we remove the 'machine' configuration if not explicitly specified
            # in the original config.
            delete $conf->{machine} if $snap->{vmstate} && !$has_machine_config;
        }

        update_config_nolock($vmid, $conf, 1);

        if (!$prepare && $snap->{vmstate}) {
            my $statefile = PVE::Storage::path($storecfg, $snap->{vmstate});
            vm_start($storecfg, $vmid, $statefile, undef, undef, undef, $forcemachine);
        }
    };

    lock_config($vmid, $updatefn);

    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        PVE::Storage::volume_snapshot_rollback($storecfg, $drive->{file}, $snapname);
    });

    $prepare = 0;
    lock_config($vmid, $updatefn);
}
5433
9dcf4909
DM
# Poll 'query-savevm' once per second until the state save of VM $vmid
# reports 'completed'. Dies if no save is active or on any other status.
my $savevm_wait = sub {
    my ($vmid) = @_;

    while (1) {
        my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");
        my $status = $stat->{status};

        die "savevm not active\n" if !$status;

        last if $status eq 'completed';

        die "query-savevm returned status '$stat->{status}'\n"
            if $status ne 'active';

        sleep(1);
    }
};
5451
# Create snapshot $snapname of VM $vmid.
#
# Parameters:
#   $save_vmstate - also save the RAM/device state if the VM is running
#   $comment      - optional description stored with the snapshot
#
# If the VM runs with the guest agent enabled and no state is saved, the
# guest file systems are frozen while the volume snapshots are taken. On
# failure the snapshots taken so far are removed and the error is rethrown.
sub snapshot_create {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap = $snapshot_prepare->($vmid, $snapname, $save_vmstate, $comment);

    my $config = load_config($vmid);

    my $running = check_running($vmid);

    # freezing is not needed if we save RAM
    my $freezefs = $running && $config->{agent} && !$snap->{vmstate};

    # drives that already got a snapshot; needed for cleanup on error
    my $drivehash = {};

    if ($freezefs) {
        eval { vm_mon_cmd($vmid, "guest-fsfreeze-freeze"); };
        warn "guest-fsfreeze-freeze problems - $@" if $@;
    }

    eval {
        # create internal snapshots of all drives

        my $storecfg = PVE::Storage::config();

        if ($running && $snap->{vmstate}) {
            my $path = PVE::Storage::path($storecfg, $snap->{vmstate});
            vm_mon_cmd($vmid, "savevm-start", statefile => $path);
            $savevm_wait->($vmid);
        } elsif ($running) {
            vm_mon_cmd($vmid, "savevm-start");
        }

        foreach_drive($snap, sub {
            my ($ds, $drive) = @_;

            return if drive_is_cdrom($drive);

            qemu_volume_snapshot($vmid, "drive-$ds", $storecfg, $drive->{file}, $snapname);
            $drivehash->{$ds} = 1;
        });
    };
    my $err = $@;

    if ($running) {
        eval { vm_mon_cmd($vmid, "savevm-end") };
        warn $@ if $@;

        if ($freezefs) {
            eval { vm_mon_cmd($vmid, "guest-fsfreeze-thaw"); };
            warn "guest-fsfreeze-thaw problems - $@" if $@;
        }

        # savevm-end is async, we need to wait
        while (1) {
            my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");
            last if !$stat->{bytes};

            print "savevm not yet finished\n";
            sleep(1);
        }
    }

    if ($err) {
        warn "snapshot create failed: starting cleanup\n";
        eval { snapshot_delete($vmid, $snapname, 0, $drivehash); };
        warn $@ if $@;
        die $err;
    }

    $snapshot_commit->($vmid, $snapname);
}
5533
3ee28e38 5534# Note: $drivehash is only set when called from snapshot_create.
# Delete snapshot $snapname of VM $vmid.
#
# Parameters:
#   $force     - keep going (warn only) when removing a volume snapshot or
#                the state volume fails; the config is then only updated
#                in the final step
#   $drivehash - set by snapshot_create for cleanup: only the drives listed
#                there are touched, the lock/template checks are skipped,
#                and the config 'lock' is removed at the end
#
# The snapshot is first marked with snapstate 'delete', then the state
# volume and the per-drive snapshots are removed, and finally the entry is
# dropped from the config and parent references are re-linked.
sub snapshot_delete {
    my ($vmid, $snapname, $force, $drivehash) = @_;

    # the same update function runs several times; this flag is cleared
    # for the final run
    my $prepare = 1;

    my $snap;
    my $unused = [];

    # re-point (or drop) a 'parent' reference to the deleted snapshot
    my $unlink_parent = sub {
        my ($confref, $new_parent) = @_;

        if ($confref->{parent} && $confref->{parent} eq $snapname) {
            if ($new_parent) {
                $confref->{parent} = $new_parent;
            } else {
                delete $confref->{parent};
            }
        }
    };

    # run $code; rethrow its error unless $force is set, then only warn
    my $attempt = sub {
        my ($code) = @_;

        eval { $code->(); };
        if (my $err = $@) {
            die $err if !$force;
            warn $err;
        }
    };

    my $updatefn = sub {
        my ($remove_drive) = @_;

        my $conf = load_config($vmid);

        if (!$drivehash) {
            check_lock($conf);
            die "you can't delete a snapshot if vm is a template\n"
                if is_template($conf);
        }

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        # remove parent refs
        if (!$prepare) {
            $unlink_parent->($conf, $snap->{parent});
            foreach my $other (grep { $_ ne $snapname } keys %{$conf->{snapshots}}) {
                $unlink_parent->($conf->{snapshots}->{$other}, $snap->{parent});
            }
        }

        if ($remove_drive) {
            if ($remove_drive eq 'vmstate') {
                delete $snap->{$remove_drive};
            } else {
                my $drive = parse_drive($remove_drive, $snap->{$remove_drive});
                my $volid = $drive->{file};
                delete $snap->{$remove_drive};
                add_unused_volume($conf, $volid);
            }
        }

        if ($prepare) {
            $snap->{snapstate} = 'delete';
        } else {
            delete $conf->{snapshots}->{$snapname};
            delete $conf->{lock} if $drivehash;
            foreach my $volid (@$unused) {
                add_unused_volume($conf, $volid);
            }
        }

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $updatefn);

    # now remove vmstate file

    my $storecfg = PVE::Storage::config();

    if ($snap->{vmstate}) {
        $attempt->(sub { PVE::Storage::vdisk_free($storecfg, $snap->{vmstate}); });

        # save changes (remove vmstate from snapshot)
        lock_config($vmid, $updatefn, 'vmstate') if !$force;
    }

    # now remove all internal snapshots
    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};
        my $device = "drive-$ds";

        if (!$drivehash || $drivehash->{$ds}) {
            $attempt->(sub {
                qemu_volume_snapshot_delete($vmid, $device, $storecfg, $volid, $snapname);
            });
        }

        # save changes (remove drive from snapshot)
        lock_config($vmid, $updatefn, $ds) if !$force;
        push @$unused, $volid;
    });

    # now cleanup config
    $prepare = 0;
    lock_config($vmid, $updatefn);
}
5645
# Return 1 if every non-cdrom drive of $conf supports storage feature
# $feature (as reported by PVE::Storage::volume_has_feature), else 0.
# $snapname and $running are passed through to the storage layer.
sub has_feature {
    my ($feature, $conf, $storecfg, $snapname, $running) = @_;

    my $supported = 1;

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        $supported = 0
            if !PVE::Storage::volume_has_feature($storecfg, $feature, $drive->{file}, $snapname, $running);
    });

    return $supported;
}
04a69bb4
AD
5660
# Convert the disks of VM $vmid into base volumes. If $disk is given, only
# that drive is converted. Cdrom drives and volumes without the 'template'
# storage feature are skipped. The config is written after each converted
# drive.
sub template_create {
    my ($vmid, $conf, $disk) = @_;

    my $storecfg = PVE::Storage::config();

    my $convert = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);
        return if $disk && $ds ne $disk;

        my $volid = $drive->{file};
        return unless PVE::Storage::volume_has_feature($storecfg, 'template', $volid);

        $drive->{file} = PVE::Storage::vdisk_create_base($storecfg, $volid);
        $conf->{$ds} = print_drive($vmid, $drive);
        update_config_nolock($vmid, $conf, 1);
    };

    foreach_drive($conf, $convert);
}
5681
624361b3
AD
# Return 1 if the config hash $conf marks the VM as a template
# ('template' is defined and numerically equal to 1), else 0.
sub is_template {
    my ($conf) = @_;

    # explicit result for both cases instead of falling off the end
    return (defined($conf->{template}) && $conf->{template} == 1) ? 1 : 0;
}
5687
5133de42
AD
# Copy volume $src_volid (optionally its snapshot $snapname) onto the
# already allocated volume $dst_volid using 'qemu-img convert'.
# $size is only used for the progress output. Nothing happens unless both
# volume IDs contain a storage ID. Dies with "copy failed: ..." on error.
sub qemu_img_convert {
    my ($src_volid, $dst_volid, $size, $snapname) = @_;

    my $storecfg = PVE::Storage::config();
    my ($src_storeid, $src_volname) = PVE::Storage::parse_volume_id($src_volid, 1);
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid, 1);

    if ($src_storeid && $dst_storeid) {
        my $src_scfg = PVE::Storage::storage_config($storecfg, $src_storeid);
        my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

        my $src_format = qemu_img_format($src_scfg, $src_volname);
        my $dst_format = qemu_img_format($dst_scfg, $dst_volname);

        my $src_path = PVE::Storage::path($storecfg, $src_volid, $snapname);
        my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

        my @cmd = ('/usr/bin/qemu-img', 'convert', '-t', 'writeback', '-p', '-n');
        push @cmd, '-s', $snapname if $snapname && $src_format eq "qcow2";
        push @cmd, '-f', $src_format, '-O', $dst_format, $src_path, $dst_path;

        # turn the "(NN.NN/100%)" progress lines of qemu-img into our own format
        my $parser = sub {
            my ($line) = @_;

            return if $line !~ m/\((\S+)\/100\%\)/;

            my $percent = $1;
            my $transferred = int($size * $percent / 100);
            my $remaining = $size - $transferred;

            print "transferred: $transferred bytes remaining: $remaining bytes total: $size bytes progression: $percent %\n";
        };

        eval { run_command(\@cmd, timeout => undef, outfunc => $parser); };
        my $err = $@;
        die "copy failed: $err" if $err;
    }
}
5727
# Return the image format name used for volume $volname on the storage
# described by $scfg:
#   - the file extension (raw, qcow2, qed or vmdk) when the storage has a
#     'path' and the volume name ends in one of those extensions
#   - "host_device" for storages of type 'iscsi'
#   - "raw" in all other cases
sub qemu_img_format {
    my ($scfg, $volname) = @_;

    return $1 if $scfg->{path} && $volname =~ m/\.(raw|qcow2|qed|vmdk)$/;

    return "host_device" if $scfg->{type} eq 'iscsi';

    return "raw";
}
5739
# Mirror drive $drive of the running VM $vmid onto the already allocated
# volume $dst_volid using the QMP 'drive-mirror' block job.
#
# If $vmiddst equals $vmid, the VM is switched over to the new volume once
# the mirror is in sync ('block-job-complete'); otherwise the job is
# cancelled after the copy finished, leaving the source in use.
#
# If the job cannot be completed for more than $maxwait polls after source
# and target reached the same offset, the guest is suspended so that it
# stops writing. A suspended guest is always resumed again, also when
# mirroring fails. Dies with "mirroring error: ..." on failure.
sub qemu_drive_mirror {
    my ($vmid, $drive, $dst_volid, $vmiddst) = @_;

    my $count = 0;
    my $frozen = 0;
    my $maxwait = 120;

    my $storecfg = PVE::Storage::config();
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid);

    # NOTE(review): the result is not used; the call is kept because it
    # presumably rejects an unknown storage early - confirm
    PVE::Storage::storage_config($storecfg, $dst_storeid);

    my $format;
    if ($dst_volname =~ m/\.(raw|qcow2)$/) {
        $format = $1;
    }

    my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

    my $opts = { timeout => 10, device => "drive-$drive", mode => "existing", sync => "full", target => $dst_path };
    $opts->{format} = $format if $format;

    #fixme : sometime drive-mirror timeout, but works fine after.
    # (I have see the problem with big volume > 200GB), so we need to eval
    eval { vm_mon_cmd($vmid, "drive-mirror", %$opts); };
    # ignore errors here

    eval {
        while (1) {
            my $stats = vm_mon_cmd($vmid, "query-block-jobs");
            my $stat = $stats->[0];
            die "mirroring job seem to have die. Maybe do you have bad sectors?" if !$stat;
            die "error job is not mirroring" if $stat->{type} ne "mirror";

            my $busy = $stat->{busy};

            if (my $total = $stat->{len}) {
                my $transferred = $stat->{offset} || 0;
                my $remaining = $total - $transferred;
                my $percent = sprintf "%.2f", ($transferred * 100 / $total);

                print "transferred: $transferred bytes remaining: $remaining bytes total: $total bytes progression: $percent % busy: $busy\n";
            }

            if ($stat->{len} == $stat->{offset}) {
                if ($busy eq 'false') {

                    last if $vmiddst != $vmid;

                    # try to switch the disk if source and destination are on the same guest
                    eval { vm_mon_cmd($vmid, "block-job-complete", device => "drive-$drive") };
                    last if !$@;
                    die $@ if $@ !~ m/cannot be completed/;
                }

                if ($count > $maxwait) {
                    # if too much writes to disk occurs at the end of migration
                    # the disk needs to be freezed to be able to complete the migration
                    vm_suspend($vmid, 1);
                    $frozen = 1;
                }
                $count++;
            }
            sleep 1;
        }
    };
    my $err = $@;

    # resume outside of the eval above, so that the guest does not stay
    # suspended when the loop died after vm_suspend
    if ($frozen) {
        eval { vm_resume($vmid, 1); };
        if (my $resume_err = $@) {
            warn $resume_err if $err;
            $err ||= $resume_err;
        }
    }

    # cancel the block job and wait until it is gone
    my $cancel_job = sub {
        vm_mon_cmd($vmid, "block-job-cancel", device => "drive-$drive");
        while (1) {
            my $stats = vm_mon_cmd($vmid, "query-block-jobs");
            last if !$stats->[0];
            sleep 1;
        }
    };

    if ($err) {
        eval { $cancel_job->(); };
        die "mirroring error: $err";
    }

    if ($vmiddst != $vmid) {
        # if we clone a disk for a new target vm, we don't switch the disk
        $cancel_job->(); # so we call block-job-cancel
    }
}
5833
# Clone one drive of VM $vmid for VM $newvmid and return the drive hash
# describing the new volume.
#
# Parameters:
#   $running    - source VM is running (a full clone then uses drive-mirror
#                 unless a snapshot is cloned)
#   $drivename  - drive key (only used for output and drive-mirror)
#   $drive      - parsed drive hash; it is modified and returned
#   $snapname   - optional snapshot to clone from
#   $storage    - optional target storage for a full clone
#   $format     - optional target format for a full clone; replaced by the
#                 storage default if the storage does not support it
#   $full       - full copy if true, linked clone otherwise
#   $newvollist - array ref; the new volume ID is appended to it
sub clone_disk {
    my ($storecfg, $vmid, $running, $drivename, $drive, $snapname,
        $newvmid, $storage, $format, $full, $newvollist) = @_;

    my $newvolid;

    if ($full) {
        my ($storeid, $volname) = PVE::Storage::parse_volume_id($drive->{file});
        $storeid = $storage if $storage;

        my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($storecfg, $storeid);
        $format ||= $drive->{format} || $defFormat;

        # test if requested format is supported - else use default
        $format = $defFormat unless grep { $_ eq $format } @$validFormats;

        my ($size) = PVE::Storage::volume_size_info($storecfg, $drive->{file}, 3);

        print "create full clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_alloc($storecfg, $storeid, $newvmid, $format, undef, ($size/1024));
        push @$newvollist, $newvolid;

        if ($running && !$snapname) {
            qemu_drive_mirror($vmid, $drivename, $newvolid, $newvmid);
        } else {
            qemu_img_convert($drive->{file}, $newvolid, $size, $snapname);
        }
    } else {
        print "create linked clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_clone($storecfg, $drive->{file}, $newvmid, $snapname);
        push @$newvollist, $newvolid;
    }

    my ($size) = PVE::Storage::volume_size_info($storecfg, $newvolid, 3);

    # note: this is the caller's hash, not a copy
    my $disk = $drive;
    $disk->{format} = undef;
    $disk->{file} = $newvolid;
    $disk->{size} = $size;

    return $disk;
}
5879
ff556cf2
DM
5880# this only works if VM is running
# Ask the running VM $vmid (QMP 'query-machines') for its machine type.
# Returns the name of the entry flagged 'is-current', else the one flagged
# 'is-default', else 'pc'.
sub get_current_qemu_machine {
    my ($vmid) = @_;

    my $res = vm_qmp_command($vmid, { execute => 'query-machines', arguments => {} });

    my ($current, $default);
    for my $machine (@$res) {
        $default = $machine->{name} if $machine->{'is-default'};
        $current = $machine->{name} if $machine->{'is-current'};
    }

    # fallback to the default machine if current is not supported by qemu
    return $current || $default || 'pc';
}
5896
4543ecf0
AD
# List the PCI devices found below "$pcisysfs/devices".
# Returns a hash ref mapping "bus:slot" (e.g. "00:1f") to an array ref with
# one { id => ..., function => ... } entry per function of that device.
sub lspci {

    my $devices = {};

    my $collect = sub {
        my (undef, $id, $function) = @_;

        push @{$devices->{$id}}, { id => $id, function => $function };
    };

    dir_glob_foreach("$pcisysfs/devices", '[a-f0-9]{4}:([a-f0-9]{2}:[a-f0-9]{2})\.([0-9])', $collect);

    return $devices;
}
5909
1e3baf05 59101;