]> git.proxmox.com Git - qemu-server.git/blame - PVE/QemuServer.pm
add optionnal current param to config api
[qemu-server.git] / PVE / QemuServer.pm
CommitLineData
1e3baf05
DM
1package PVE::QemuServer;
2
3use strict;
990fc5e2 4use warnings;
1e3baf05
DM
5use POSIX;
6use IO::Handle;
7use IO::Select;
8use IO::File;
9use IO::Dir;
10use IO::Socket::UNIX;
11use File::Basename;
12use File::Path;
13use File::stat;
14use Getopt::Long;
fc1ddcdc 15use Digest::SHA;
1e3baf05
DM
16use Fcntl ':flock';
17use Cwd 'abs_path';
18use IPC::Open3;
c971c4f2 19use JSON;
1e3baf05
DM
20use Fcntl;
21use PVE::SafeSyslog;
22use Storable qw(dclone);
23use PVE::Exception qw(raise raise_param_exc);
24use PVE::Storage;
4543ecf0 25use PVE::Tools qw(run_command lock_file lock_file_full file_read_firstline dir_glob_foreach);
b7ba6b79 26use PVE::JSONSchema qw(get_standard_option);
1e3baf05
DM
27use PVE::Cluster qw(cfs_register_file cfs_read_file cfs_write_file cfs_lock_file);
28use PVE::INotify;
29use PVE::ProcFSTools;
26f11676 30use PVE::QMPClient;
91bd6c90 31use PVE::RPCEnvironment;
6b64503e 32use Time::HiRes qw(gettimeofday);
1e3baf05 33
7f0b5beb 34my $cpuinfo = PVE::ProcFSTools::read_cpuinfo();
1e3baf05 35
# Note about locking: we use flock on the config file to protect
# against concurrent actions.
# Additionally, we have a 'lock' setting in the config file. This
# can be set to 'migrate', 'backup', 'snapshot' or 'rollback'. Most actions are not
# allowed when such a lock is set. But you can ignore this kind of
# lock with the --skiplock flag.
42
97d62eb7 43cfs_register_file('/qemu-server/',
1858638f
DM
44 \&parse_vm_config,
45 \&write_vm_config);
1e3baf05 46
3ea94c60
DM
47PVE::JSONSchema::register_standard_option('skiplock', {
48 description => "Ignore locks - only root is allowed to use this option.",
afdb31d5 49 type => 'boolean',
3ea94c60
DM
50 optional => 1,
51});
52
53PVE::JSONSchema::register_standard_option('pve-qm-stateuri', {
54 description => "Some command save/restore state from this location.",
55 type => 'string',
56 maxLength => 128,
57 optional => 1,
58});
59
8abd398b
DM
60PVE::JSONSchema::register_standard_option('pve-snapshot-name', {
61 description => "The name of the snapshot.",
62 type => 'string', format => 'pve-configid',
63 maxLength => 40,
64});
65
1e3baf05
DM
66#no warnings 'redefine';
67
# Define the fairsched/setluid/setublimit syscall numbers and the
# KVM_GET_API_VERSION ioctl request as constant subs, unless something else
# already defined them. The whole block is skipped when _VZSYSCALLS_H_ exists.
#
# The architecture is selected by testing for the __x86_64__ / __i386__ subs
# (presumably provided by the required sys/syscall.ph - confirm on the target
# system); any other architecture is a fatal error.
unless(defined(&_VZSYSCALLS_H_)) {
    eval 'sub _VZSYSCALLS_H_ () {1;}' unless defined(&_VZSYSCALLS_H_);
    require 'sys/syscall.ph';
    if(defined(&__x86_64__)) {
        eval 'sub __NR_fairsched_vcpus () {499;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_fairsched_mknod () {504;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {505;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {506;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {507;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {508;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_setluid () {501;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {502;}' unless defined(&__NR_setublimit);
    }
    elsif(defined( &__i386__) ) {
        eval 'sub __NR_fairsched_mknod () {500;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {501;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {502;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {503;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {504;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_fairsched_vcpus () {505;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_setluid () {511;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {512;}' unless defined(&__NR_setublimit);
    } else {
        die("no fairsched syscall for this arch");
    }
    require 'asm/ioctl.ph';
    # The request number is written out as 0x00 instead of the digit-less
    # literal '0x'; the _IO() helper is expected to come from asm/ioctl.ph.
    eval 'sub KVM_GET_API_VERSION () { &_IO(0xAE, 0x00);}' unless defined(&KVM_GET_API_VERSION);
}
96
# Invoke the fairsched_mknod syscall. All three arguments are truncated to
# integers first; the value returned by syscall() is handed back unchanged.
sub fairsched_mknod {
    my ($parent, $weight, $desired) = @_;

    my @int_args = map { int($_) } ($parent, $weight, $desired);

    return syscall(&__NR_fairsched_mknod, @int_args);
}
102
# Invoke the fairsched_rmnod syscall for the given node id (truncated to an
# integer) and return the result of syscall().
sub fairsched_rmnod {
    my ($id) = @_;

    my $node_id = int($id);

    return syscall(&__NR_fairsched_rmnod, $node_id);
}
108
# Invoke the fairsched_mvpr syscall with the process id and the new node id,
# both truncated to integers, and return the result of syscall().
sub fairsched_mvpr {
    my ($pid, $newid) = @_;

    my $int_pid = int($pid);
    my $int_newid = int($newid);

    return syscall(&__NR_fairsched_mvpr, $int_pid, $int_newid);
}
114
# Invoke the fairsched_vcpus syscall with the node id and the vcpu count,
# both truncated to integers, and return the result of syscall().
sub fairsched_vcpus {
    my ($id, $vcpus) = @_;

    my @int_args = (int($id), int($vcpus));

    return syscall(&__NR_fairsched_vcpus, @int_args);
}
120
# Invoke the fairsched_rate syscall. $op is expected to be one of the
# FAIRSCHED_*_RATE constants; all arguments are truncated to integers and the
# result of syscall() is returned.
sub fairsched_rate {
    my ($id, $op, $rate) = @_;

    my @int_args = map { int($_) } ($id, $op, $rate);

    return syscall(&__NR_fairsched_rate, @int_args);
}
126
127use constant FAIRSCHED_SET_RATE => 0;
128use constant FAIRSCHED_DROP_RATE => 1;
129use constant FAIRSCHED_GET_RATE => 2;
130
# Apply a CPU limit to a fairsched node.
#
# $limit is scaled by 1024/100 and truncated to an integer. A non-zero result
# is set via FAIRSCHED_SET_RATE; a zero result drops the rate limit via
# FAIRSCHED_DROP_RATE. Returns whatever fairsched_rate() returns.
sub fairsched_cpulimit {
    my ($id, $limit) = @_;

    my $scaled_limit = int($limit * 1024 / 100);

    if ($scaled_limit) {
        return fairsched_rate($id, FAIRSCHED_SET_RATE, $scaled_limit);
    }

    return fairsched_rate($id, FAIRSCHED_DROP_RATE, $scaled_limit);
}
139
140my $nodename = PVE::INotify::nodename();
141
142mkdir "/etc/pve/nodes/$nodename";
143my $confdir = "/etc/pve/nodes/$nodename/qemu-server";
144mkdir $confdir;
145
146my $var_run_tmpdir = "/var/run/qemu-server";
147mkdir $var_run_tmpdir;
148
149my $lock_dir = "/var/lock/qemu-server";
150mkdir $lock_dir;
151
152my $pcisysfs = "/sys/bus/pci";
153
1e3baf05 154my $confdesc = {
7183bd9a
AD
155 iothread => {
156 optional => 1,
157 type => 'boolean',
158 description => "Enable iothread dataplane.",
159 default => 0,
160 },
1e3baf05
DM
161 onboot => {
162 optional => 1,
163 type => 'boolean',
164 description => "Specifies whether a VM will be started during system bootup.",
165 default => 0,
166 },
167 autostart => {
168 optional => 1,
169 type => 'boolean',
170 description => "Automatic restart after crash (currently ignored).",
171 default => 0,
172 },
2ff09f52
DA
173 hotplug => {
174 optional => 1,
e8b9c17c 175 type => 'boolean',
6c52b679 176 description => "Allow hotplug for disk and network device",
2dbe827e 177 default => 0,
2ff09f52 178 },
1e3baf05
DM
179 reboot => {
180 optional => 1,
181 type => 'boolean',
182 description => "Allow reboot. If set to '0' the VM exit on reboot.",
183 default => 1,
184 },
185 lock => {
186 optional => 1,
187 type => 'string',
188 description => "Lock/unlock the VM.",
22c377f0 189 enum => [qw(migrate backup snapshot rollback)],
1e3baf05
DM
190 },
191 cpulimit => {
192 optional => 1,
193 type => 'integer',
194 description => "Limit of CPU usage in per cent. Note if the computer has 2 CPUs, it has total of 200% CPU time. Value '0' indicates no CPU limit.\n\nNOTE: This option is currently ignored.",
195 minimum => 0,
196 default => 0,
197 },
198 cpuunits => {
199 optional => 1,
200 type => 'integer',
201 description => "CPU weight for a VM. Argument is used in the kernel fair scheduler. The larger the number is, the more CPU time this VM gets. Number is relative to weights of all the other running VMs.\n\nNOTE: You can disable fair-scheduler configuration by setting this to 0.",
202 minimum => 0,
203 maximum => 500000,
204 default => 1000,
205 },
206 memory => {
207 optional => 1,
208 type => 'integer',
7878afeb 209 description => "Amount of RAM for the VM in MB. This is the maximum available memory when you use the balloon device.",
1e3baf05
DM
210 minimum => 16,
211 default => 512,
212 },
13a48620
DA
213 balloon => {
214 optional => 1,
215 type => 'integer',
8b1accf7
DM
216 description => "Amount of target RAM for the VM in MB. Using zero disables the ballon driver.",
217 minimum => 0,
218 },
219 shares => {
220 optional => 1,
221 type => 'integer',
222 description => "Amount of memory shares for auto-ballooning. The larger the number is, the more memory this VM gets. Number is relative to weights of all other running VMs. Using zero disables auto-ballooning",
223 minimum => 0,
224 maximum => 50000,
225 default => 1000,
13a48620 226 },
1e3baf05
DM
227 keyboard => {
228 optional => 1,
229 type => 'string',
230 description => "Keybord layout for vnc server. Default is read from the datacenter configuration file.",
e95fe75f 231 enum => PVE::Tools::kvmkeymaplist(),
1e3baf05
DM
232 default => 'en-us',
233 },
234 name => {
235 optional => 1,
7fabe17d 236 type => 'string', format => 'dns-name',
1e3baf05
DM
237 description => "Set a name for the VM. Only used on the configuration web interface.",
238 },
cdd20088
AD
239 scsihw => {
240 optional => 1,
241 type => 'string',
242 description => "scsi controller model",
5b952ff5 243 enum => [qw(lsi lsi53c810 virtio-scsi-pci megasas pvscsi)],
cdd20088
AD
244 default => 'lsi',
245 },
1e3baf05
DM
246 description => {
247 optional => 1,
248 type => 'string',
0581fe4f 249 description => "Description for the VM. Only used on the configuration web interface. This is saved as comment inside the configuration file.",
1e3baf05
DM
250 },
251 ostype => {
252 optional => 1,
253 type => 'string',
6b9d84cf 254 enum => [qw(other wxp w2k w2k3 w2k8 wvista win7 win8 l24 l26 solaris)],
1e3baf05
DM
255 description => <<EODESC,
256Used to enable special optimization/features for specific
257operating systems:
258
259other => unspecified OS
260wxp => Microsoft Windows XP
261w2k => Microsoft Windows 2000
262w2k3 => Microsoft Windows 2003
263w2k8 => Microsoft Windows 2008
264wvista => Microsoft Windows Vista
265win7 => Microsoft Windows 7
a70ebde3 266win8 => Microsoft Windows 8/2012
1e3baf05
DM
267l24 => Linux 2.4 Kernel
268l26 => Linux 2.6/3.X Kernel
6b9d84cf 269solaris => solaris/opensolaris/openindiania kernel
1e3baf05 270
6b9d84cf 271other|l24|l26|solaris ... no special behaviour
a70ebde3 272wxp|w2k|w2k3|w2k8|wvista|win7|win8 ... use --localtime switch
1e3baf05
DM
273EODESC
274 },
275 boot => {
276 optional => 1,
277 type => 'string',
278 description => "Boot on floppy (a), hard disk (c), CD-ROM (d), or network (n).",
279 pattern => '[acdn]{1,4}',
32baffb4 280 default => 'cdn',
1e3baf05
DM
281 },
282 bootdisk => {
283 optional => 1,
284 type => 'string', format => 'pve-qm-bootdisk',
285 description => "Enable booting from specified disk.",
03e480fc 286 pattern => '(ide|sata|scsi|virtio)\d+',
1e3baf05
DM
287 },
288 smp => {
289 optional => 1,
290 type => 'integer',
291 description => "The number of CPUs. Please use option -sockets instead.",
292 minimum => 1,
293 default => 1,
294 },
295 sockets => {
296 optional => 1,
297 type => 'integer',
298 description => "The number of CPU sockets.",
299 minimum => 1,
300 default => 1,
301 },
302 cores => {
303 optional => 1,
304 type => 'integer',
305 description => "The number of cores per socket.",
306 minimum => 1,
307 default => 1,
308 },
8a010eae
AD
309 numa => {
310 optional => 1,
311 type => 'boolean',
312 description => "Enable/disable Numa.",
313 default => 0,
314 },
3bd18e48
AD
315 maxcpus => {
316 optional => 1,
317 type => 'integer',
318 description => "Maximum cpus for hotplug.",
319 minimum => 1,
320 default => 1,
321 },
1e3baf05
DM
322 acpi => {
323 optional => 1,
324 type => 'boolean',
325 description => "Enable/disable ACPI.",
326 default => 1,
327 },
bc84dcca 328 agent => {
ab6a046f
AD
329 optional => 1,
330 type => 'boolean',
331 description => "Enable/disable Qemu GuestAgent.",
be79c214 332 default => 0,
ab6a046f 333 },
1e3baf05
DM
334 kvm => {
335 optional => 1,
336 type => 'boolean',
337 description => "Enable/disable KVM hardware virtualization.",
338 default => 1,
339 },
340 tdf => {
341 optional => 1,
342 type => 'boolean',
8c559505
DM
343 description => "Enable/disable time drift fix.",
344 default => 0,
1e3baf05 345 },
19672434 346 localtime => {
1e3baf05
DM
347 optional => 1,
348 type => 'boolean',
349 description => "Set the real time clock to local time. This is enabled by default if ostype indicates a Microsoft OS.",
350 },
351 freeze => {
352 optional => 1,
353 type => 'boolean',
354 description => "Freeze CPU at startup (use 'c' monitor command to start execution).",
355 },
356 vga => {
357 optional => 1,
358 type => 'string',
ef5e2be2 359 description => "Select VGA type. If you want to use high resolution modes (>= 1280x1024x16) then you should use option 'std' or 'vmware'. Default is 'std' for win8/win7/w2k8, and 'cirrur' for other OS types. Option 'qxl' enables the SPICE display sever. You can also run without any graphic card using a serial devive as terminal.",
2fa3151e 360 enum => [qw(std cirrus vmware qxl serial0 serial1 serial2 serial3 qxl2 qxl3 qxl4)],
1e3baf05 361 },
0ea9541d
DM
362 watchdog => {
363 optional => 1,
364 type => 'string', format => 'pve-qm-watchdog',
365 typetext => '[[model=]i6300esb|ib700] [,[action=]reset|shutdown|poweroff|pause|debug|none]',
366 description => "Create a virtual hardware watchdog device. Once enabled (by a guest action), the watchdog must be periodically polled by an agent inside the guest or else the guest will be restarted (or execute the action specified)",
367 },
1e3baf05
DM
368 startdate => {
369 optional => 1,
19672434 370 type => 'string',
1e3baf05
DM
371 typetext => "(now | YYYY-MM-DD | YYYY-MM-DDTHH:MM:SS)",
372 description => "Set the initial date of the real time clock. Valid format for date are: 'now' or '2006-06-17T16:01:21' or '2006-06-17'.",
373 pattern => '(now|\d{4}-\d{1,2}-\d{1,2}(T\d{1,2}:\d{1,2}:\d{1,2})?)',
374 default => 'now',
375 },
59411c4e
DM
376 startup => {
377 optional => 1,
378 type => 'string', format => 'pve-qm-startup',
379 typetext => '[[order=]\d+] [,up=\d+] [,down=\d+] ',
380 description => "Startup and shutdown behavior. Order is a non-negative number defining the general startup order. Shutdown in done with reverse ordering. Additionally you can set the 'up' or 'down' delay in seconds, which specifies a delay to wait before the next VM is started or stopped.",
381 },
68eda3ab
AD
382 template => {
383 optional => 1,
384 type => 'boolean',
385 description => "Enable/disable Template.",
386 default => 0,
387 },
1e3baf05
DM
388 args => {
389 optional => 1,
390 type => 'string',
391 description => <<EODESCR,
392Note: this option is for experts only. It allows you to pass arbitrary arguments to kvm, for example:
393
394args: -no-reboot -no-hpet
395EODESCR
396 },
397 tablet => {
398 optional => 1,
399 type => 'boolean',
400 default => 1,
5acbfe9e 401 description => "Enable/disable the usb tablet device. This device is usually needed to allow absolute mouse positioning with VNC. Else the mouse runs out of sync with normal VNC clients. If you're running lots of console-only guests on one host, you may consider disabling this to save some context switches. This is turned of by default if you use spice (vga=qxl).",
1e3baf05
DM
402 },
403 migrate_speed => {
404 optional => 1,
405 type => 'integer',
406 description => "Set maximum speed (in MB/s) for migrations. Value 0 is no limit.",
407 minimum => 0,
408 default => 0,
409 },
410 migrate_downtime => {
411 optional => 1,
04432191 412 type => 'number',
1e3baf05
DM
413 description => "Set maximum tolerated downtime (in seconds) for migrations.",
414 minimum => 0,
04432191 415 default => 0.1,
1e3baf05
DM
416 },
417 cdrom => {
418 optional => 1,
419 type => 'string', format => 'pve-qm-drive',
420 typetext => 'volume',
421 description => "This is an alias for option -ide2",
422 },
423 cpu => {
424 optional => 1,
425 description => "Emulated CPU type.",
426 type => 'string',
3aefd6fd 427 enum => [ qw(486 athlon pentium pentium2 pentium3 coreduo core2duo kvm32 kvm64 qemu32 qemu64 phenom Conroe Penryn Nehalem Westmere SandyBridge Haswell Broadwell Opteron_G1 Opteron_G2 Opteron_G3 Opteron_G4 Opteron_G5 host) ],
eac6899d 428 default => 'kvm64',
1e3baf05 429 },
b7ba6b79
DM
430 parent => get_standard_option('pve-snapshot-name', {
431 optional => 1,
432 description => "Parent snapshot name. This is used internally, and should not be modified.",
433 }),
982c7f12
DM
434 snaptime => {
435 optional => 1,
436 description => "Timestamp for snapshots.",
437 type => 'integer',
438 minimum => 0,
439 },
18bfb361
DM
440 vmstate => {
441 optional => 1,
442 type => 'string', format => 'pve-volume-id',
443 description => "Reference to a volume which stores the VM state. This is used internally for snapshots.",
444 },
3bafc510
DM
445 machine => {
446 description => "Specific the Qemu machine type.",
447 type => 'string',
448 pattern => '(pc|pc(-i440fx)?-\d+\.\d+|q35|pc-q35-\d+\.\d+)',
449 maxLength => 40,
450 optional => 1,
451 },
2796e7d5
DM
452 smbios1 => {
453 description => "Specify SMBIOS type 1 fields.",
454 type => 'string', format => 'pve-qm-smbios1',
455 typetext => "[manufacturer=str][,product=str][,version=str][,serial=str] [,uuid=uuid][,sku=str][,family=str]",
456 maxLength => 256,
457 optional => 1,
458 },
1e3baf05
DM
459};
460
461# what about other qemu settings ?
462#cpu => 'string',
463#machine => 'string',
464#fda => 'file',
465#fdb => 'file',
466#mtdblock => 'file',
467#sd => 'file',
468#pflash => 'file',
469#snapshot => 'bool',
470#bootp => 'file',
471##tftp => 'dir',
472##smb => 'dir',
473#kernel => 'file',
474#append => 'string',
475#initrd => 'file',
476##soundhw => 'string',
477
# Publish every option currently present in $confdesc as a JSON schema
# standard option named "pve-qm-<option>".
foreach my $optname (keys %$confdesc) {
    PVE::JSONSchema::register_standard_option("pve-qm-$optname", $confdesc->{$optname});
}
481
482my $MAX_IDE_DISKS = 4;
f62db2a4 483my $MAX_SCSI_DISKS = 14;
a2650619 484my $MAX_VIRTIO_DISKS = 16;
cdb0931f 485my $MAX_SATA_DISKS = 6;
1e3baf05 486my $MAX_USB_DEVICES = 5;
5bdcf937 487my $MAX_NETS = 32;
1e3baf05 488my $MAX_UNUSED_DISKS = 8;
5cffb2d2 489my $MAX_HOSTPCI_DEVICES = 4;
bae179aa 490my $MAX_SERIAL_PORTS = 4;
1989a89c 491my $MAX_PARALLEL_PORTS = 3;
2ed5d572
AD
492my $MAX_NUMA = 8;
493
494my $numadesc = {
495 optional => 1,
496 type => 'string', format => 'pve-qm-numanode',
497 typetext => "cpus=<id[-id],memory=<mb>[[,hostnodes=<id[-id]>][,policy=<preferred|bind|interleave>]]",
498 description => "numa topology",
499};
500PVE::JSONSchema::register_standard_option("pve-qm-numanode", $numadesc);
501
502for (my $i = 0; $i < $MAX_NUMA; $i++) {
503 $confdesc->{"numa$i"} = $numadesc;
504}
1e3baf05
DM
505
506my $nic_model_list = ['rtl8139', 'ne2k_pci', 'e1000', 'pcnet', 'virtio',
e4c6e0b8 507 'ne2k_isa', 'i82551', 'i82557b', 'i82559er', 'vmxnet3'];
6b64503e 508my $nic_model_list_txt = join(' ', sort @$nic_model_list);
1e3baf05 509
1e3baf05
DM
510my $netdesc = {
511 optional => 1,
512 type => 'string', format => 'pve-qm-net',
a9410357 513 typetext => "MODEL=XX:XX:XX:XX:XX:XX [,bridge=<dev>][,queues=<nbqueues>][,rate=<mbps>][,tag=<vlanid>][,firewall=0|1]",
1e3baf05 514 description => <<EODESCR,
19672434 515Specify network devices.
1e3baf05
DM
516
517MODEL is one of: $nic_model_list_txt
518
19672434 519XX:XX:XX:XX:XX:XX should be an unique MAC address. This is
1e3baf05
DM
520automatically generated if not specified.
521
522The bridge parameter can be used to automatically add the interface to a bridge device. The Proxmox VE standard bridge is called 'vmbr0'.
523
524Option 'rate' is used to limit traffic bandwidth from and to this interface. It is specified as floating point number, unit is 'Megabytes per second'.
525
526If you specify no bridge, we create a kvm 'user' (NATed) network device, which provides DHCP and DNS services. The following addresses are used:
527
52810.0.2.2 Gateway
52910.0.2.3 DNS Server
53010.0.2.4 SMB Server
531
532The DHCP server assign addresses to the guest starting from 10.0.2.15.
533
534EODESCR
535};
536PVE::JSONSchema::register_standard_option("pve-qm-net", $netdesc);
537
538for (my $i = 0; $i < $MAX_NETS; $i++) {
539 $confdesc->{"net$i"} = $netdesc;
540}
541
542my $drivename_hash;
19672434 543
1e3baf05
DM
544my $idedesc = {
545 optional => 1,
546 type => 'string', format => 'pve-qm-drive',
8d87f8aa 547 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
3c770faa 548 description => "Use volume as IDE hard disk or CD-ROM (n is 0 to " .($MAX_IDE_DISKS -1) . ").",
1e3baf05
DM
549};
550PVE::JSONSchema::register_standard_option("pve-qm-ide", $idedesc);
551
552my $scsidesc = {
553 optional => 1,
554 type => 'string', format => 'pve-qm-drive',
8d87f8aa 555 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
3c770faa 556 description => "Use volume as SCSI hard disk or CD-ROM (n is 0 to " . ($MAX_SCSI_DISKS - 1) . ").",
1e3baf05
DM
557};
558PVE::JSONSchema::register_standard_option("pve-qm-scsi", $scsidesc);
559
cdb0931f
DA
560my $satadesc = {
561 optional => 1,
562 type => 'string', format => 'pve-qm-drive',
8d87f8aa 563 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
3c770faa 564 description => "Use volume as SATA hard disk or CD-ROM (n is 0 to " . ($MAX_SATA_DISKS - 1). ").",
cdb0931f
DA
565};
566PVE::JSONSchema::register_standard_option("pve-qm-sata", $satadesc);
567
1e3baf05
DM
568my $virtiodesc = {
569 optional => 1,
570 type => 'string', format => 'pve-qm-drive',
8d87f8aa 571 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
3c770faa 572 description => "Use volume as VIRTIO hard disk (n is 0 to " . ($MAX_VIRTIO_DISKS - 1) . ").",
1e3baf05
DM
573};
574PVE::JSONSchema::register_standard_option("pve-qm-virtio", $virtiodesc);
575
576my $usbdesc = {
577 optional => 1,
578 type => 'string', format => 'pve-qm-usb-device',
80401dd8 579 typetext => 'host=HOSTUSBDEVICE|spice',
1e3baf05 580 description => <<EODESCR,
2fe1a152 581Configure an USB device (n is 0 to 4). This can be used to
1e3baf05
DM
582pass-through usb devices to the guest. HOSTUSBDEVICE syntax is:
583
19672434 584'bus-port(.port)*' (decimal numbers) or
1e3baf05
DM
585'vendor_id:product_id' (hexadeciaml numbers)
586
19672434 587You can use the 'lsusb -t' command to list existing usb devices.
1e3baf05
DM
588
589Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
590
80401dd8
DM
591The value 'spice' can be used to add a usb redirection devices for spice.
592
1e3baf05
DM
593EODESCR
594};
595PVE::JSONSchema::register_standard_option("pve-qm-usb", $usbdesc);
596
040b06b7
DA
597my $hostpcidesc = {
598 optional => 1,
599 type => 'string', format => 'pve-qm-hostpci',
2e3b7e2a 600 typetext => "[host=]HOSTPCIDEVICE [,driver=kvm|vfio] [,rombar=on|off] [,pcie=0|1] [,x-vga=on|off]",
040b06b7
DA
601 description => <<EODESCR,
602Map host pci devices. HOSTPCIDEVICE syntax is:
603
604'bus:dev.func' (hexadecimal numbers)
605
606You can us the 'lspci' command to list existing pci devices.
607
0cea6a01
DM
608The 'rombar' option determines whether or not the device's ROM will be visible in the guest's memory map (default is 'on').
609
040b06b7
DA
610Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
611
612Experimental: user reported problems with this option.
613EODESCR
614};
615PVE::JSONSchema::register_standard_option("pve-qm-hostpci", $hostpcidesc);
616
bae179aa
DA
617my $serialdesc = {
618 optional => 1,
ca0cef26 619 type => 'string',
1b0b51ed 620 pattern => '(/dev/.+|socket)',
bae179aa 621 description => <<EODESCR,
1b0b51ed 622Create a serial device inside the VM (n is 0 to 3), and pass through a host serial device (i.e. /dev/ttyS0), or create a unix socket on the host side (use 'qm terminal' to open a terminal connection).
bae179aa
DA
623
624Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
625
626Experimental: user reported problems with this option.
627EODESCR
628};
bae179aa 629
1989a89c
DA
630my $paralleldesc= {
631 optional => 1,
ca0cef26 632 type => 'string',
9ecc8431 633 pattern => '/dev/parport\d+|/dev/usb/lp\d+',
1989a89c 634 description => <<EODESCR,
19672434 635Map host parallel devices (n is 0 to 2).
1989a89c
DA
636
637Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
638
639Experimental: user reported problems with this option.
640EODESCR
641};
1989a89c
DA
642
# Register the numbered per-slot options (parallelN, serialN, hostpciN, ...)
# in $confdesc. All slots of one kind share the same description hash.
foreach my $slot (0 .. $MAX_PARALLEL_PORTS - 1) {
    $confdesc->{"parallel$slot"} = $paralleldesc;
}

foreach my $slot (0 .. $MAX_SERIAL_PORTS - 1) {
    $confdesc->{"serial$slot"} = $serialdesc;
}

foreach my $slot (0 .. $MAX_HOSTPCI_DEVICES - 1) {
    $confdesc->{"hostpci$slot"} = $hostpcidesc;
}

# Drive buses are additionally recorded in $drivename_hash, which is what
# valid_drivename() consults.
foreach my $bus (
    ['ide', $MAX_IDE_DISKS, $idedesc],
    ['sata', $MAX_SATA_DISKS, $satadesc],
    ['scsi', $MAX_SCSI_DISKS, $scsidesc],
    ['virtio', $MAX_VIRTIO_DISKS, $virtiodesc],
) {
    my ($prefix, $count, $desc) = @$bus;
    foreach my $slot (0 .. $count - 1) {
        $drivename_hash->{"$prefix$slot"} = 1;
        $confdesc->{"$prefix$slot"} = $desc;
    }
}

foreach my $slot (0 .. $MAX_USB_DEVICES - 1) {
    $confdesc->{"usb$slot"} = $usbdesc;
}

my $unuseddesc = {
    optional => 1,
    type => 'string', format => 'pve-volume-id',
    description => "Reference to unused volumes.",
};

foreach my $slot (0 .. $MAX_UNUSED_DISKS - 1) {
    $confdesc->{"unused$slot"} = $unuseddesc;
}
688
# Cached result of the KVM_GET_API_VERSION ioctl (0 = not yet determined).
my $kvm_api_version = 0;

# Return the KVM API version obtained from /dev/kvm via ioctl.
#
# A true result is cached in $kvm_api_version for later calls. Returns 0 when
# /dev/kvm cannot be opened; if the ioctl yields a false value the cached
# value (initially 0) is returned.
sub kvm_version {

    if (!$kvm_api_version) {
        my $kvm_dev = IO::File->new("</dev/kvm");
        return 0 if !$kvm_dev;

        my $version = $kvm_dev->ioctl(KVM_GET_API_VERSION(), 0);
        $kvm_api_version = $version if $version;

        $kvm_dev->close();
    }

    return $kvm_api_version;
}
706
# Cached version string of the userspace kvm binary.
my $kvm_user_version;

# Return the version of the 'kvm' binary, parsed from the output of
# `kvm -help`, or the string 'unknown' when no version line is recognized.
# The result is cached after the first call.
sub kvm_user_version {

    return $kvm_user_version if $kvm_user_version;

    my $help_text = `kvm -help 2>/dev/null`;

    if ($help_text =~ m/^QEMU( PC)? emulator version (\d+\.\d+(\.\d+)?)[,\s]/) {
        $kvm_user_version = $2;
    } else {
        $kvm_user_version = 'unknown';
    }

    return $kvm_user_version;
}
724
725my $kernel_has_vhost_net = -c '/dev/vhost-net';
726
# Return the list of all valid drive names (ide0.., scsi0.., virtio0..,
# sata0..), bounded by the respective $MAX_*_DISKS limits.
sub disknames {
    my $names_for = sub {
        my ($bus, $count) = @_;
        return map { "$bus$_" } (0 .. ($count - 1));
    };

    # order is important - used to autoselect boot disk
    return ($names_for->('ide', $MAX_IDE_DISKS),
            $names_for->('scsi', $MAX_SCSI_DISKS),
            $names_for->('virtio', $MAX_VIRTIO_DISKS),
            $names_for->('sata', $MAX_SATA_DISKS));
}
734
# Return true if $dev is one of the drive names registered in
# $drivename_hash (e.g. "ide0", "virtio3").
sub valid_drivename {
    my ($dev) = @_;

    return defined($drivename_hash->{$dev});
}
740
# Return true if $key is a known VM configuration option, i.e. it has an
# entry in $confdesc.
sub option_exists {
    my ($key) = @_;

    return defined($confdesc->{$key});
}
1e3baf05
DM
745
# Return the array reference holding the supported NIC model names.
# Note that this is the shared list itself, not a copy.
sub nic_models {
    return $nic_model_list;
}
749
# Return a hash reference mapping each 'ostype' identifier to a short,
# human-readable operating system name.
#
# Every value of the ostype enum has an entry, including 'solaris'.
sub os_list_description {

    return {
        other => 'Other',
        wxp => 'Windows XP',
        w2k => 'Windows 2000',
        w2k3 => 'Windows 2003',
        w2k8 => 'Windows 2008',
        wvista => 'Windows Vista',
        win7 => 'Windows 7',
        win8 => 'Windows 8/2012',
        l24 => 'Linux 2.4',
        l26 => 'Linux 2.6',
        solaris => 'Solaris/OpenSolaris/OpenIndiana',
    };
}
765
1e3baf05
DM
# Cached path of the host CD-ROM device symlink, once one has been found.
my $cdrom_path;

# Return the first of /dev/cdrom, /dev/cdrom1, /dev/cdrom2 that exists as a
# symbolic link, caching a successful lookup. Returns undef explicitly when
# none of them is a symlink, rather than leaking the result of the last
# file test as the implicit return value.
sub get_cdrom_path {

    return $cdrom_path if $cdrom_path;

    foreach my $candidate (qw(/dev/cdrom /dev/cdrom1 /dev/cdrom2)) {
        return $cdrom_path = $candidate if -l $candidate;
    }

    return undef;
}
776
# Resolve a cdrom drive specification to a path:
#   'cdrom'          -> result of get_cdrom_path()
#   'none'           -> empty string
#   absolute path    -> returned unchanged
#   anything else    -> resolved through PVE::Storage::path()
# $vmid is accepted but not used here.
sub get_iso_path {
    my ($storecfg, $vmid, $cdrom) = @_;

    return get_cdrom_path() if $cdrom eq 'cdrom';
    return '' if $cdrom eq 'none';
    return $cdrom if $cdrom =~ m|^/|;

    return PVE::Storage::path($storecfg, $cdrom);
}
790
# Try to convert old style file names to volume IDs.
#
# 'none', 'cdrom', /dev/ paths and values that already look like
# "storage:volume" are returned unchanged. Any other value containing a '/'
# yields undef. A bare file name is mapped to "local:iso/<file>" for cdrom
# media and to "local:<vmid>/<file>" otherwise.
sub filename_to_volume_id {
    my ($vmid, $file, $media) = @_;

    return $file if $file eq 'none' || $file eq 'cdrom';
    return $file if $file =~ m|^/dev/.+|;
    return $file if $file =~ m/^([^:]+):(.+)$/;

    return undef if $file =~ m|/|;

    my $is_cdrom = $media && $media eq 'cdrom';

    return $is_cdrom ? "local:iso/$file" : "local:$vmid/$file";
}
809
# Check that the storage content type $vtype matches the drive's media
# setting: 'disk' expects 'images', 'cdrom' expects 'iso'.
#
# Returns silently when $media is unset or the types agree. Dies with
# "internal error" for any other media value and raises a parameter
# exception keyed by $opt on a mismatch.
sub verify_media_type {
    my ($opt, $vtype, $media) = @_;

    return if !$media;

    my %expected_type_for = (
        disk => 'images',
        cdrom => 'iso',
    );

    my $etype = $expected_type_for{$media};
    die "internal error" if !defined($etype);

    return if ($vtype eq $etype);

    raise_param_exc({ $opt => "unexpected media type ($vtype != $etype)" });
}
828
# Normalize the 'file' entry of a parsed drive hash in place.
#
# Values that are neither 'cdrom'/'none', a /dev/ path, a "storage:volume"
# ID nor purely numeric are treated as filesystem paths and converted to a
# volume ID through PVE::Storage::path_to_volume_id(); a parameter exception
# keyed by $opt is raised when no storage matches. The media type defaults to
# 'cdrom' for iso volumes and for the 'cdrom'/'none' placeholders.
sub cleanup_drive_path {
    my ($opt, $storecfg, $drive) = @_;

    my $path = $drive->{file};

    my $already_normalized =
        $path =~ m/^(cdrom|none)$/ ||
        $path =~ m|^/dev/.+| ||
        $path =~ m/^([^:]+):(.+)$/ ||
        $path =~ m/^\d+$/;

    # try to convert filesystem paths to volume IDs
    if (!$already_normalized) {
        my ($vtype, $volid) = PVE::Storage::path_to_volume_id($storecfg, $drive->{file});
        raise_param_exc({ $opt => "unable to associate path '$drive->{file}' to any storage"}) if !$vtype;
        $drive->{media} = 'cdrom' if !$drive->{media} && $vtype eq 'iso';
        verify_media_type($opt, $vtype, $drive->{media});
        $drive->{file} = $volid;
    }

    $drive->{media} = 'cdrom' if !$drive->{media} && $drive->{file} =~ m/^(cdrom|none)$/;
}
847
# Write a fresh configuration file for VM $vmid from the $settings hash,
# without taking any lock (as the name says, locking is left to the caller).
#
# Dies if the configuration file already exists. Missing 'name' and 'memory'
# settings are filled in ("vm<vmid>" and the default memory size); note that
# this modifies the caller's $settings hash. Only keys known to $confdesc are
# written, one "key: value" line each, in sorted key order.
sub create_conf_nolock {
    my ($vmid, $settings) = @_;

    my $filename = config_file($vmid);

    die "configuration file '$filename' already exists\n" if -f $filename;

    my $defaults = load_defaults();

    $settings->{name} = "vm$vmid" if !$settings->{name};
    $settings->{memory} = $defaults->{memory} if !$settings->{memory};

    my $data = '';
    foreach my $opt (sort keys %$settings) {
        next if !$confdesc->{$opt};

        my $value = $settings->{$opt};
        # Skip only unset/empty values. An explicit 0 is meaningful (for
        # example acpi => 0 or balloon => 0) and must reach the file,
        # otherwise the option silently falls back to its default.
        next if !defined($value) || $value eq '';

        $data .= "$opt: $value\n";
    }

    PVE::Tools::file_set_contents($filename, $data);
}
872
f36ed4f4
DM
# Parse a size string such as "1024", "1.5M" or "32G" into an integer.
# An optional K, M or G suffix multiplies by 1024, 1024^2 or 1024^3; the
# result is truncated to an integer. Returns undef for unrecognized input.
my $parse_size = sub {
    my ($value) = @_;

    return undef if $value !~ m/^(\d+(\.\d+)?)([KMG])?$/;
    my ($size, $unit) = ($1, $3);

    my %multiplier_for = (
        K => 1024,
        M => 1024 * 1024,
        G => 1024 * 1024 * 1024,
    );

    $size = $size * $multiplier_for{$unit} if $unit;

    return int($size);
};
889
# Format an integer size using the largest of the K/M/G suffixes (powers of
# 1024) that divides it evenly. Values not divisible by 1024 are returned as
# a plain number without suffix.
my $format_size = sub {
    my ($size) = @_;

    my $amount = int($size);
    my $suffix = '';

    foreach my $next_suffix (qw(K M G)) {
        my $scaled = int($amount / 1024);
        last if $scaled * 1024 != $amount;
        ($amount, $suffix) = ($scaled, $next_suffix);
    }

    return $suffix ? "$amount$suffix" : $amount;
};
906
1e3baf05
DM
# ideX = [volume=]volume-id[,media=disk|cdrom][,cyls=c,heads=h,secs=s[,trans=none|lba|auto]]
#        [,snapshot=on|off][,cache=off|none|writethrough|writeback|unsafe|directsync]
#        [,format=f][,backup=yes|no][,size=<n>[K|M|G]]
#        [,rerror=ignore|report|stop][,werror=enospc|ignore|report|stop]
#        [,aio=native|threads][,discard=ignore|on]
#        [,mbps[_rd|_wr][_max]=<float>][,bps[_rd|_wr]=<int>]
#        [,iops[_rd|_wr][_max]=<int>]
#
# Parse a drive property string into a hash reference.
#
# $key is the config key (e.g. 'ide0'); it provides {interface} and {index}.
# It may be undef when only the option string has to be verified.
# $data is the comma separated option string.
#
# Returns the parsed hash, or undef when the key or any option is invalid.
# bps/bps_rd/bps_wr are stored as mbps/mbps_rd/mbps_wr (megabytes, 3 decimals).
sub parse_drive {
    my ($key, $data) = @_;

    my $res = {};

    # $key may be undefined - used to verify JSON parameters
    if (!defined($key)) {
        $res->{interface} = 'unknown'; # should not harm when used to verify parameters
        $res->{index} = 0;
    } elsif ($key =~ m/^([^\d]+)(\d+)$/) {
        $res->{interface} = $1;
        $res->{index} = $2;
    } else {
        return undef;
    }

    foreach my $p (split (/,/, $data)) {
        next if $p =~ m/^\s*$/;

        if ($p =~ m/^(file|volume|cyls|heads|secs|trans|media|snapshot|cache|format|rerror|werror|backup|aio|bps|mbps|mbps_max|bps_rd|mbps_rd|mbps_rd_max|bps_wr|mbps_wr|mbps_wr_max|iops|iops_max|iops_rd|iops_rd_max|iops_wr|iops_wr_max|size|discard)=(.+)$/) {
            my ($k, $v) = ($1, $2);

            $k = 'file' if $k eq 'volume';

            if ($k eq 'bps' || $k eq 'bps_rd' || $k eq 'bps_wr') {
                # the whole value must be an integer byte rate
                return undef if !$v || $v !~ m/^\d+$/;
                $k = "m$k";
                $v = sprintf("%.3f", $v / (1024*1024));
            }

            # reject duplicates after normalisation, so that e.g.
            # 'mbps=..,bps=..' can not silently overwrite each other
            return undef if defined $res->{$k};

            $res->{$k} = $v;
        } else {
            # a single bare value (without '=') is taken as the volume
            if (!$res->{file} && $p !~ m/=/) {
                $res->{file} = $p;
            } else {
                return undef;
            }
        }
    }

    return undef if !$res->{file};

    # a known image extension on the volume name determines the format
    if ($res->{file} =~ m/\.(raw|cow|qcow|qcow2|vmdk|cloop)$/) {
        $res->{format} = $1;
    }

    return undef if $res->{cache} &&
        $res->{cache} !~ m/^(off|none|writethrough|writeback|unsafe|directsync)$/;
    return undef if $res->{snapshot} && $res->{snapshot} !~ m/^(on|off)$/;
    return undef if $res->{cyls} && $res->{cyls} !~ m/^\d+$/;
    return undef if $res->{heads} && $res->{heads} !~ m/^\d+$/;
    return undef if $res->{secs} && $res->{secs} !~ m/^\d+$/;
    return undef if $res->{media} && $res->{media} !~ m/^(disk|cdrom)$/;
    return undef if $res->{trans} && $res->{trans} !~ m/^(none|lba|auto)$/;
    return undef if $res->{format} && $res->{format} !~ m/^(raw|cow|qcow|qcow2|vmdk|cloop)$/;
    return undef if $res->{rerror} && $res->{rerror} !~ m/^(ignore|report|stop)$/;
    return undef if $res->{werror} && $res->{werror} !~ m/^(enospc|ignore|report|stop)$/;
    return undef if $res->{backup} && $res->{backup} !~ m/^(yes|no)$/;
    return undef if $res->{aio} && $res->{aio} !~ m/^(native|threads)$/;
    return undef if $res->{discard} && $res->{discard} !~ m/^(ignore|on)$/;

    # a total limit excludes separate read/write limits
    return undef if $res->{mbps_rd} && $res->{mbps};
    return undef if $res->{mbps_wr} && $res->{mbps};

    return undef if $res->{mbps} && $res->{mbps} !~ m/^\d+(\.\d+)?$/;
    return undef if $res->{mbps_max} && $res->{mbps_max} !~ m/^\d+(\.\d+)?$/;
    return undef if $res->{mbps_rd} && $res->{mbps_rd} !~ m/^\d+(\.\d+)?$/;
    return undef if $res->{mbps_rd_max} && $res->{mbps_rd_max} !~ m/^\d+(\.\d+)?$/;
    return undef if $res->{mbps_wr} && $res->{mbps_wr} !~ m/^\d+(\.\d+)?$/;
    return undef if $res->{mbps_wr_max} && $res->{mbps_wr_max} !~ m/^\d+(\.\d+)?$/;

    return undef if $res->{iops_rd} && $res->{iops};
    return undef if $res->{iops_wr} && $res->{iops};

    return undef if $res->{iops} && $res->{iops} !~ m/^\d+$/;
    return undef if $res->{iops_max} && $res->{iops_max} !~ m/^\d+$/;
    return undef if $res->{iops_rd} && $res->{iops_rd} !~ m/^\d+$/;
    return undef if $res->{iops_rd_max} && $res->{iops_rd_max} !~ m/^\d+$/;
    return undef if $res->{iops_wr} && $res->{iops_wr} !~ m/^\d+$/;
    return undef if $res->{iops_wr_max} && $res->{iops_wr_max} !~ m/^\d+$/;

    # size is stored as an integer number of bytes
    if ($res->{size}) {
        return undef if !defined($res->{size} = &$parse_size($res->{size}));
    }

    if ($res->{media} && ($res->{media} eq 'cdrom')) {
        return undef if $res->{snapshot} || $res->{trans} || $res->{format};
        return undef if $res->{heads} || $res->{secs} || $res->{cyls};
        return undef if $res->{interface} eq 'virtio';
    }

    # rerror does not work with scsi drives
    if ($res->{rerror}) {
        return undef if $res->{interface} eq 'scsi';
    }

    return $res;
}
1013
# drive options that are copied by name when building option strings
my @qemu_drive_options = qw(
    heads secs cyls trans media format cache snapshot
    rerror werror aio discard
    iops iops_rd iops_wr iops_max iops_rd_max iops_wr_max
);
1e3baf05
DM
1015
# Serialise a parsed drive hash back into its config string:
# the volume first, then every option with a true value, then the size.
sub print_drive {
    my ($vmid, $drive) = @_;

    my @names = (
        @qemu_drive_options,
        qw(mbps mbps_rd mbps_wr mbps_max mbps_rd_max mbps_wr_max backup),
    );

    my $text = "$drive->{file}";
    $text .= join('', map { ",$_=$drive->{$_}" } grep { $drive->{$_} } @names);
    $text .= ",size=" . &$format_size($drive->{size}) if $drive->{size};

    return $text;
}
1030
28ef82d3
DM
# Send a SCSI INQUIRY to an open device handle through the Linux sg
# (SG_IO) ioctl interface.
#
# $fh    - open file handle of the device
# $noerr - when true, return undef on failure instead of dying
#
# Returns a hash reference with vendor, product, revision, removable (0/1)
# and type (low five bits of the first INQUIRY response byte).
sub scsi_inquiry {
    my($fh, $noerr) = @_;

    # ioctl request numbers, see /usr/include/scsi/sg.h
    my $SG_IO = 0x2285;
    my $SG_GET_VERSION_NUM = 0x2282;

    my $versionbuf = "\x00" x 8;
    my $ret = ioctl($fh, $SG_GET_VERSION_NUM, $versionbuf);
    if (!$ret) {
        die "scsi ioctl SG_GET_VERSION_NUM failed - $!\n" if !$noerr;
        return undef;
    }
    my $version = unpack("I", $versionbuf);
    if ($version < 30000) {
        die "scsi generic interface too old\n" if !$noerr;
        return undef;
    }

    my $buf = "\x00" x 36;
    my $sensebuf = "\x00" x 8;
    # 6 byte command block: opcode 0x12 (INQUIRY), allocation length 36
    my $cmd = pack("C x3 C x1", 0x12, 36);

    # see /usr/include/scsi/sg.h
    my $sg_io_hdr_t = "i i C C s I P P P I I i P C C C C S S i I I";

    # -3 is presumably SG_DXFER_FROM_DEV and 6000 the timeout in
    # milliseconds - verify against sg.h
    my $packet = pack($sg_io_hdr_t, ord('S'), -3, length($cmd),
                      length($sensebuf), 0, length($buf), $buf,
                      $cmd, $sensebuf, 6000);

    $ret = ioctl($fh, $SG_IO, $packet);
    if (!$ret) {
        die "scsi ioctl SG_IO failed - $!\n" if !$noerr;
        return undef;
    }

    # fields 17 and 18 of the header are checked as status words
    # (host_status/driver_status in sg.h - verify)
    my @res = unpack($sg_io_hdr_t, $packet);
    if ($res[17] || $res[18]) {
        die "scsi ioctl SG_IO status error - $!\n" if !$noerr;
        return undef;
    }

    my $res = {};
    (my $byte0, my $byte1, $res->{vendor},
     $res->{product}, $res->{revision}) = unpack("C C x6 A8 A16 A4", $buf);

    $res->{removable} = $byte1 & 128 ? 1 : 0;
    $res->{type} = $byte0 & 31;

    return $res;
}
1081
# Open $path read/write and run a SCSI INQUIRY on it.
# Returns the scsi_inquiry() result, or undef when the path can not be
# opened or the inquiry fails (errors are suppressed).
sub path_is_scsi {
    my ($path) = @_;

    # pass the mode separately, so that $path is never parsed as part of
    # an open mode string
    my $fh = IO::File->new($path, '+<') || return undef;
    my $res = scsi_inquiry($fh, 1);
    close($fh);

    return $res;
}
1091
db656e5f
DM
# Return 1 when the configured machine type contains 'q35', else 0.
sub machine_type_is_q35 {
    my ($conf) = @_;

    my $machine = $conf->{machine};
    return 0 if !$machine;

    return ($machine =~ m/q35/) ? 1 : 0;
}
1097
# Build the device string for the USB tablet, attached to the ehci bus
# on q35 machines and to the uhci bus otherwise.
sub print_tabletdevice_full {
    my ($conf) = @_;

    # we use uhci for old VMs because tablet driver was buggy in older qemu
    my $usbbus = machine_type_is_q35($conf) ? "ehci" : "uhci";

    return "usb-tablet,id=tablet,bus=$usbbus.0,port=1";
}
1108
# Build the device string for one drive, depending on its interface
# (virtio, scsi, ide or sata). Dies for usb and for unknown interfaces.
sub print_drivedevice_full {
    my ($storecfg, $conf, $vmid, $drive, $bridges) = @_;

    my $iface = $drive->{interface};
    my $index = $drive->{index};
    my $id = "$iface$index";
    my $ids = "drive=drive-$id,id=$id";

    my $device = '';

    if ($iface eq 'virtio') {
        my $pciaddr = print_pci_addr($id, $bridges);
        $device = "virtio-blk-pci,$ids$pciaddr";
        $device .= ",iothread=iothread0" if $conf->{iothread};
    } elsif ($iface eq 'scsi') {
        # no scsihw setting, or an lsi* controller: 7 units per controller
        my $is_lsi = !$conf->{scsihw} || ($conf->{scsihw} =~ m/^lsi/);
        my $maxdev = $is_lsi ? 7 : 256;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;

        my $devicetype = 'hd';
        if (drive_is_cdrom($drive)) {
            $devicetype = 'cd';
        } else {
            my $path = '';
            if ($drive->{file} =~ m|^/|) {
                $path = $drive->{file};
            } else {
                $path = PVE::Storage::path($storecfg, $drive->{file});
            }

            if ($path =~ m/^iscsi\:\/\//) {
                $devicetype = 'generic';
            } elsif (my $info = path_is_scsi($path)) {
                if ($info->{type} == 0) {
                    $devicetype = 'block';
                } elsif ($info->{type} == 1) { # tape
                    $devicetype = 'generic';
                }
            }
        }

        my $bus = "scsi-$devicetype,bus=scsihw$controller.0";
        if ($is_lsi) {
            $device = "$bus,scsi-id=$unit,$ids";
        } else {
            $device = "$bus,channel=0,scsi-id=0,lun=$index,$ids";
        }
    } elsif ($iface eq 'ide') {
        my $maxdev = 2;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;
        my $devicetype = ($drive->{media} && $drive->{media} eq 'cdrom') ? "cd" : "hd";

        $device = "ide-$devicetype,bus=ide.$controller,unit=$unit,$ids";
    } elsif ($iface eq 'sata') {
        my $controller = int($index / $MAX_SATA_DISKS);
        my $unit = $index % $MAX_SATA_DISKS;
        $device = "ide-drive,bus=ahci$controller.$unit,$ids";
    } elsif ($iface eq 'usb') {
        die "implement me";
        # -device ide-drive,bus=ide.1,unit=0,drive=drive-ide0-1-0,id=ide0-1-0
    } else {
        die "unsupported interface type";
    }

    $device .= ",bootindex=$drive->{bootindex}" if $drive->{bootindex};

    return $device;
}
1175
# Read the first InitiatorName from /etc/iscsi/initiatorname.iscsi.
# Returns undef when the file can not be opened or has no such entry.
sub get_initiator_name {
    my $fh = IO::File->new('/etc/iscsi/initiatorname.iscsi') || return undef;

    my $initiator;
    while (defined(my $line = <$fh>)) {
        if ($line =~ m/^\s*InitiatorName\s*=\s*([\.\-:\w]+)/) {
            $initiator = $1;
            last;
        }
    }
    $fh->close();

    return $initiator;
}
1189
1e3baf05
DM
# Build the drive definition string (file, if=none, id and options) for a
# parsed drive. Throttle limits stored in megabytes are emitted as bps*.
sub print_drive_full {
    my ($storecfg, $vmid, $drive) = @_;

    my $is_cdrom = drive_is_cdrom($drive);

    my @opts;
    foreach my $name (@qemu_drive_options) {
        next if $name eq 'bootindex';
        push @opts, "$name=$drive->{$name}" if $drive->{$name};
    }

    foreach my $name (qw(bps bps_rd bps_wr)) {
        my $mbytes = $drive->{"m$name"};
        push @opts, "$name=" . int($mbytes*1024*1024) if $mbytes;
    }

    # use linux-aio by default (qemu default is threads)
    push @opts, "aio=native" if !$drive->{aio};

    my $volid = $drive->{file};
    my $path;
    if ($is_cdrom) {
        $path = get_iso_path($storecfg, $vmid, $volid);
    } elsif ($volid =~ m|^/|) {
        $path = $volid;
    } else {
        $path = PVE::Storage::path($storecfg, $volid);
    }

    if (!$is_cdrom) {
        push @opts, "cache=none" if !$drive->{cache};
        push @opts, "detect-zeroes=" . ($drive->{discard} ? "unmap" : "on");
    }

    my $pathinfo = $path ? "file=$path," : '';
    my $optstr = join('', map { ",$_" } @opts);

    return "${pathinfo}if=none,id=drive-$drive->{interface}$drive->{index}$optstr";
}
1228
# Build the device string for a network interface.
sub print_netdevice_full {
    my ($vmid, $conf, $net, $netid, $bridges) = @_;

    my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};

    my $model = $net->{model};
    my $device = ($model eq 'virtio') ? 'virtio-net-pci' : $model;

    # qemu > 0.15 always try to boot from network - we disable that by
    # not loading the pxe rom file
    my $extra = ($bootorder =~ m/n/) ? '' : "romfile=,";
    my $pciaddr = print_pci_addr("$netid", $bridges);

    my @parts = ("$device,${extra}mac=$net->{macaddr},netdev=$netid$pciaddr,id=$netid");

    if ($net->{queues} && $net->{queues} > 1 && $model eq 'virtio') {
        # Consider we have N queues, the number of vectors needed is 2*N + 2
        # (plus one config interrupt and control vq)
        my $vectors = $net->{queues} * 2 + 2;
        push @parts, "vectors=$vectors,mq=on";
    }

    push @parts, "bootindex=$net->{bootindex}" if $net->{bootindex};

    return join(',', @parts);
}
1252
# Build the netdev string for a network interface.
#
# $netid must have the form 'net<N>' with N below $MAX_NETS; anything else
# is rejected. A configured bridge yields a tap device, otherwise user mode
# networking is used.
sub print_netdev_full {
    my ($vmid, $conf, $net, $netid) = @_;

    # an id that is not 'net<N>' must not silently produce a tap name
    # without an index
    die "got strange net id '$netid'\n" if $netid !~ m/^net(\d+)$/;
    my $i = int($1);

    die "got strange net id '$i'\n" if $i >= ${MAX_NETS};

    my $ifname = "tap${vmid}i$i";

    # kvm uses TUNSETIFF ioctl, and that limits ifname length
    die "interface name '$ifname' is too long (max 15 character)\n"
        if length($ifname) >= 16;

    my $vhostparam = '';
    $vhostparam = ',vhost=on' if $kernel_has_vhost_net && $net->{model} eq 'virtio';

    my $vmname = $conf->{name} || "vm$vmid";

    my $netdev = "";

    if ($net->{bridge}) {
        $netdev = "type=tap,id=$netid,ifname=${ifname},script=/var/lib/qemu-server/pve-bridge,downscript=/var/lib/qemu-server/pve-bridgedown$vhostparam";
    } else {
        $netdev = "type=user,id=$netid,hostname=$vmname";
    }

    $netdev .= ",queues=$net->{queues}" if ($net->{queues} && $net->{model} eq 'virtio');

    return $netdev;
}
1e3baf05
DM
1286
# True when $drive is set and its media is 'cdrom'.
sub drive_is_cdrom {
    my ($drive) = @_;

    return $drive if !$drive;

    my $media = $drive->{media};
    return $media if !$media;

    return $media eq 'cdrom';
}
1293
2ed5d572
AD
# Parse a numa property string (memory=, policy=, cpus=a[-b],
# hostnodes=a[-b]) into a hash reference. Ranges are stored as
# { start => a, end => b } with end undef for a single value.
# Returns undef on any unknown or malformed entry.
sub parse_numa {
    my ($data) = @_;

    my $res = {};

    for my $entry (split(/,/, $data)) {
        if ($entry =~ m/^memory=(\S+)$/) {
            $res->{memory} = $1;
        } elsif ($entry =~ m/^policy=(preferred|bind|interleave)$/) {
            $res->{policy} = $1;
        } elsif ($entry =~ m/^(cpus|hostnodes)=(\d+)(-(\d+))?$/) {
            $res->{$1} = { start => $2, end => $4 };
        } else {
            return undef;
        }
    }

    return $res;
}
1318
040b06b7
DA
# Parse a hostpci property string into a hash reference.
# An address with a function ('bb:dd.f') is appended to {pciid}; an address
# without one is looked up through lspci(). Unknown entries only produce a
# warning. Returns undef for an empty value or when no address was given.
sub parse_hostpci {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};
    my $found;

    foreach my $kv (split(/,/, $value)) {
        if ($kv =~ m/^(host=)?([a-f0-9]{2}:[a-f0-9]{2})(\.([a-f0-9]))?$/) {
            my ($id, $function) = ($2, $4);
            $found = 1;
            if (defined($function)) {
                push @{$res->{pciid}}, { id => $id , function => $function };
            } else {
                my $pcidevices = lspci($id);
                $res->{pciid} = $pcidevices->{$id};
            }
        } elsif ($kv =~ m/^driver=(kvm|vfio)$/) {
            $res->{driver} = $1;
        } elsif ($kv =~ m/^(rombar|x-vga)=(on|off)$/) {
            $res->{$1} = $2;
        } elsif ($kv =~ m/^pcie=(\d+)$/) {
            $res->{pcie} = 1 if $1 == 1;
        } else {
            warn "unknown hostpci setting '$kv'\n";
        }
    }

    return undef if !$found;

    return $res;
}
1357
1e3baf05
DM
# netX: e1000=XX:XX:XX:XX:XX:XX,bridge=vmbr0,rate=<mbps>
#
# Parse a network property string into a hash reference (model, macaddr,
# bridge, queues, rate, tag, firewall). A model without an address gets a
# random one. Returns undef on unknown entries or when no model is given.
sub parse_net {
    my ($data) = @_;

    my $res = {};

    for my $entry (split(/,/, $data)) {
        if ($entry =~ m/^(ne2k_pci|e1000|rtl8139|pcnet|virtio|ne2k_isa|i82551|i82557b|i82559er|vmxnet3)(=([0-9a-f]{2}(:[0-9a-f]{2}){5}))?$/i) {
            my ($model, $mac) = ($1, $3);
            $res->{model} = lc($model);
            $res->{macaddr} = defined($mac) ? uc($mac) : PVE::Tools::random_ether_addr();
        } elsif ($entry =~ m/^bridge=(\S+)$/) {
            $res->{bridge} = $1;
        } elsif ($entry =~ m/^rate=(\d+(\.\d+)?)$/) {
            $res->{rate} = $1;
        } elsif ($entry =~ m/^(queues|tag|firewall)=(\d+)$/) {
            $res->{$1} = $2;
        } else {
            return undef;
        }
    }

    return undef if !$res->{model};

    return $res;
}
1391
# Serialise a parsed network hash back into its config string.
# Every option that parse_net() accepts is written out, including
# 'queues', so that a parse/print round trip does not lose settings.
sub print_net {
    my $net = shift;

    my $res = "$net->{model}";
    $res .= "=$net->{macaddr}" if $net->{macaddr};
    $res .= ",bridge=$net->{bridge}" if $net->{bridge};
    $res .= ",rate=$net->{rate}" if $net->{rate};
    $res .= ",tag=$net->{tag}" if $net->{tag};
    $res .= ",firewall=$net->{firewall}" if $net->{firewall};
    $res .= ",queues=$net->{queues}" if $net->{queues};

    return $res;
}
1404
# Re-serialise every parsable netN entry of $settings, so that entries
# given without an address end up with the one parse_net() assigned.
sub add_random_macs {
    my ($settings) = @_;

    foreach my $opt (grep { m/^net(\d+)$/ } keys %$settings) {
        my $net = parse_net($settings->{$opt});
        $settings->{$opt} = print_net($net) if $net;
    }
}
1415
# Record $volid under the lowest free 'unusedN' key of $config and return
# that key. Returns nothing when the volume is already listed; dies when
# all slots are taken.
sub add_unused_volume {
    my ($config, $volid) = @_;

    my $free_key;
    # walk downwards, so the last free slot seen is the lowest one
    foreach my $ind (reverse(0 .. $MAX_UNUSED_DISKS - 1)) {
        my $candidate = "unused$ind";
        my $existing = $config->{$candidate};
        if (!$existing) {
            $free_key = $candidate;
        } elsif ($existing eq $volid) {
            return; # do not add duplicates
        }
    }

    die "To many unused volume - please delete them first.\n" if !$free_key;

    $config->{$free_key} = $volid;

    return $free_key;
}
1435
055d554d
DM
# Return 1 when the storage layer reports $vmid as owner of $volid.
# Absolute paths and volumes that can not be resolved yield undef.
sub vm_is_volid_owner {
    my ($storecfg, $vmid, $volid) = @_;

    return undef if $volid =~ m|^/|;

    my ($path, $owner);
    # lookup errors are ignored on purpose - unknown means "not owner"
    eval { ($path, $owner) = PVE::Storage::path($storecfg, $volid); };

    return 1 if $owner && ($owner == $vmid);

    return undef;
}
1449
# Drop a pending value for $key and add $key to the pending delete list.
sub vmconfig_delete_pending_option {
    my ($conf, $key) = @_;

    delete $conf->{pending}->{$key};

    # a hash keeps the list free of duplicates
    my $to_delete = {
        map { $_ => 1 } ($key, PVE::Tools::split_list($conf->{pending}->{delete}))
    };

    $conf->{pending}->{delete} = join(',', keys %$to_delete);
}
1460
# Remove $key from the pending delete list; the list entry itself is
# removed once it becomes empty.
sub vmconfig_undelete_pending_option {
    my ($conf, $key) = @_;

    my $to_delete = {
        map { $_ => 1 } PVE::Tools::split_list($conf->{pending}->{delete})
    };
    delete $to_delete->{$key};

    my @remaining = keys %$to_delete;
    if (!@remaining) {
        delete $conf->{pending}->{delete};
    } else {
        $conf->{pending}->{delete} = join(',', @remaining);
    }
}
1477
# Add the volume of a non-cdrom drive to the unused volume list of $conf,
# but only when the volume is owned by this VM.
sub vmconfig_register_unused_drive {
    my ($storecfg, $vmid, $conf, $drive) = @_;

    return if drive_is_cdrom($drive);

    my $volid = $drive->{file};
    if (vm_is_volid_owner($storecfg, $vmid, $volid)) {
        # add_unused_volume() takes exactly ($config, $volid)
        add_unused_volume($conf, $volid);
    }
}
1488
c750e90a
DM
# Drop pending entries that would not change anything: pending values equal
# to the current value, and pending deletes of options that are not set.
# Returns a true value when something was removed.
sub vmconfig_cleanup_pending {
    my ($conf) = @_;

    my $changes;

    # remove pending changes when nothing changed
    foreach my $opt (keys %{$conf->{pending}}) {
        next if !defined($conf->{$opt});
        next if $conf->{pending}->{$opt} ne $conf->{$opt};
        $changes = 1;
        delete $conf->{pending}->{$opt};
    }

    # remove delete if option is not set
    my $still_pending = {};
    foreach my $opt (PVE::Tools::split_list($conf->{pending}->{delete})) {
        if (!defined($conf->{$opt})) {
            $changes = 1;
            next;
        }
        $still_pending->{$opt} = 1;
    }

    my @remaining = keys %$still_pending;
    if (!@remaining) {
        delete $conf->{pending}->{delete};
    } else {
        $conf->{pending}->{delete} = join(',', @remaining);
    }

    return $changes;
}
1520
2796e7d5
DM
# allowed smbios (type 1) keys, each with the pattern its value must match
my $valid_smbios1_options = {
    manufacturer => '\S+',
    product => '\S+',
    version => '\S+',
    serial => '\S+',
    uuid => '[a-fA-F0-9]{8}(?:-[a-fA-F0-9]{4}){3}-[a-fA-F0-9]{12}',
    sku => '\S+',
    family => '\S+',
};

# smbios: [manufacturer=str][,product=str][,version=str][,serial=str][,uuid=uuid][,sku=str][,family=str]
#
# Parse an smbios1 property string into a hash reference.
# Returns undef when an entry is malformed, uses an unknown key, or has a
# value that does not match the pattern for its key.
sub parse_smbios1 {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        return undef if $kvp !~ m/^(\S+)=(.+)$/;
        # split on the first '=' only - the value may contain '=' itself
        my ($k, $v) = split(/=/, $kvp, 2);
        return undef if !defined($k) || !defined($v);
        return undef if !$valid_smbios1_options->{$k};
        return undef if $v !~ m/^$valid_smbios1_options->{$k}$/;
        $res->{$k} = $v;
    }

    return $res;
}
1548
cd11416f
DM
# Serialise an smbios1 hash into 'key=value' pairs joined by commas,
# skipping undefined values and unknown keys.
sub print_smbios1 {
    my ($smbios1) = @_;

    my @pairs = map { "$_=$smbios1->{$_}" }
        grep { defined($smbios1->{$_}) && $valid_smbios1_options->{$_} }
        keys %$smbios1;

    return join(',', @pairs);
}
1561
2796e7d5
DM
1562PVE::JSONSchema::register_format('pve-qm-smbios1', \&verify_smbios1);
# Format check: returns $value when parse_smbios1() accepts it; otherwise
# returns undef if $noerr is set, or dies.
sub verify_smbios1 {
    my ($value, $noerr) = @_;

    if (parse_smbios1($value)) {
        return $value;
    }

    die "unable to parse smbios (type 1) options\n" if !$noerr;

    return undef;
}
1572
1e3baf05
DM
1573PVE::JSONSchema::register_format('pve-qm-bootdisk', \&verify_bootdisk);
# Format check: returns $value when valid_drivename() accepts it; otherwise
# returns undef if $noerr is set, or dies.
sub verify_bootdisk {
    my ($value, $noerr) = @_;

    if (valid_drivename($value)) {
        return $value;
    }

    die "invalid boot disk '$value'\n" if !$noerr;

    return undef;
}
1583
2ed5d572
AD
1584PVE::JSONSchema::register_format('pve-qm-numanode', \&verify_numa);
# Format check: returns $value when parse_numa() accepts it; otherwise
# returns undef if $noerr is set, or dies.
sub verify_numa {
    my ($value, $noerr) = @_;

    if (parse_numa($value)) {
        return $value;
    }

    die "unable to parse numa options\n" if !$noerr;

    return undef;
}
1594
1e3baf05
DM
1595PVE::JSONSchema::register_format('pve-qm-net', \&verify_net);
# Format check: returns $value when parse_net() accepts it; otherwise
# returns undef if $noerr is set, or dies.
sub verify_net {
    my ($value, $noerr) = @_;

    if (parse_net($value)) {
        return $value;
    }

    die "unable to parse network options\n" if !$noerr;

    return undef;
}
1605
1606PVE::JSONSchema::register_format('pve-qm-drive', \&verify_drive);
# Format check: returns $value when parse_drive() accepts it (without a
# config key); otherwise returns undef if $noerr is set, or dies.
sub verify_drive {
    my ($value, $noerr) = @_;

    if (parse_drive(undef, $value)) {
        return $value;
    }

    die "unable to parse drive options\n" if !$noerr;

    return undef;
}
1616
1617PVE::JSONSchema::register_format('pve-qm-hostpci', \&verify_hostpci);
# Format check: returns $value when parse_hostpci() accepts it; otherwise
# returns undef if $noerr is set, or dies.
sub verify_hostpci {
    my ($value, $noerr) = @_;

    if (parse_hostpci($value)) {
        return $value;
    }

    die "unable to parse pci id\n" if !$noerr;

    return undef;
}
1627
0ea9541d
DM
1628PVE::JSONSchema::register_format('pve-qm-watchdog', \&verify_watchdog);
# Format check: returns $value when parse_watchdog() accepts it; otherwise
# returns undef if $noerr is set, or dies.
sub verify_watchdog {
    my ($value, $noerr) = @_;

    if (parse_watchdog($value)) {
        return $value;
    }

    die "unable to parse watchdog options\n" if !$noerr;

    return undef;
}
1638
# Parse a watchdog property string ([model=]<model>[,[action=]<action>])
# into a hash reference. Returns undef for an empty value or an unknown
# entry.
sub parse_watchdog {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};

    # blank entries are skipped
    foreach my $part (grep { $_ !~ m/^\s*$/ } split(/,/, $value)) {
        if ($part =~ m/^(?:model=)?(i6300esb|ib700)$/) {
            $res->{model} = $1;
        } elsif ($part =~ m/^(?:action=)?(reset|shutdown|poweroff|pause|debug|none)$/) {
            $res->{action} = $1;
        } else {
            return undef;
        }
    }

    return $res;
}
1660
59411c4e
DM
1661PVE::JSONSchema::register_format('pve-qm-startup', \&verify_startup);
# Format check: returns $value when parse_startup() accepts it; otherwise
# returns undef if $noerr is set, or dies.
sub verify_startup {
    my ($value, $noerr) = @_;

    if (parse_startup($value)) {
        return $value;
    }

    die "unable to parse startup options\n" if !$noerr;

    return undef;
}
1671
# Parse a startup property string ([order=]<n>[,up=<n>][,down=<n>]) into a
# hash reference. Returns undef for an empty value or an unknown entry.
sub parse_startup {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};

    # blank entries are skipped
    foreach my $part (grep { $_ !~ m/^\s*$/ } split(/,/, $value)) {
        if ($part =~ m/^(?:order=)?(\d+)$/) {
            $res->{order} = $1;
        } elsif ($part =~ m/^(up|down)=(\d+)$/) {
            $res->{$1} = $2;
        } else {
            return undef;
        }
    }

    return $res;
}
1695
1e3baf05
DM
# Parse a usb property string into a hash reference. Accepted entries are
# host=<vendor>:<product> (hex, optional 0x prefix), host=<bus>-<port> and
# 'spice'. Returns undef for an empty value or an unknown entry.
sub parse_usb_device {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};
    my $found;

    foreach my $entry (split(/,/, $value)) {
        if ($entry =~ m/^host=(0x)?([0-9A-Fa-f]{4}):(0x)?([0-9A-Fa-f]{4})$/) {
            @$res{qw(vendorid productid)} = ($2, $4);
        } elsif ($entry =~ m/^host=(\d+)\-(\d+(\.\d+)*)$/) {
            @$res{qw(hostbus hostport)} = ($1, $2);
        } elsif ($entry =~ m/^spice$/) {
            $res->{spice} = 1;
        } else {
            return undef;
        }
        $found = 1;
    }

    return undef if !$found;

    return $res;
}
19672434 1725
1e3baf05
DM
1726PVE::JSONSchema::register_format('pve-qm-usb-device', \&verify_usb_device);
# Format check: returns $value when parse_usb_device() accepts it;
# otherwise returns undef if $noerr is set, or dies.
sub verify_usb_device {
    my ($value, $noerr) = @_;

    if (parse_usb_device($value)) {
        return $value;
    }

    die "unable to parse usb device\n" if !$noerr;

    return undef;
}
1736
1e3baf05
DM
# add JSON properties for create and set function
#
# Copies every $confdesc entry except 'parent', 'snaptime' and 'vmstate'
# into $prop and returns $prop.
sub json_config_properties {
    my $prop = shift;

    my %skip = map { $_ => 1 } qw(parent snaptime vmstate);

    foreach my $opt (grep { !$skip{$_} } keys %$confdesc) {
        $prop->{$opt} = $confdesc->{$opt};
    }

    return $prop;
}
1748
# Validate $value against the type (and, for strings, the format) that
# $confdesc declares for $key. Returns the normalised value: 0/1 for
# booleans, an integer for integers, the unchanged value for numbers and
# formatted strings, and the value without surrounding double quotes for
# plain strings. Dies on unknown keys and on values that fail the check.
sub check_type {
    my ($key, $value) = @_;

    my $desc = $confdesc->{$key};
    die "unknown setting '$key'\n" if !$desc;

    my $type = $desc->{type};

    die "got undefined value\n" if !defined($value);
    die "property contains a line feed\n" if $value =~ m/[\n\r]/;

    if ($type eq 'boolean') {
        return 1 if ($value eq '1') || ($value =~ m/^(on|yes|true)$/i);
        return 0 if ($value eq '0') || ($value =~ m/^(off|no|false)$/i);
        die "type check ('boolean') failed - got '$value'\n";
    }

    if ($type eq 'integer') {
        return int($1) if $value =~ m/^(\d+)$/;
        die "type check ('integer') failed - got '$value'\n";
    }

    if ($type eq 'number') {
        return $value if $value =~ m/^(\d+)(\.\d+)?$/;
        die "type check ('number') failed - got '$value'\n";
    }

    if ($type eq 'string') {
        my $fmt = $desc->{format};
        if (!$fmt) {
            $value =~ s/^\"(.*)\"$/$1/;
            return $value;
        }
        if ($fmt eq 'pve-qm-drive') {
            # special case - we need to pass $key to parse_drive()
            return $value if parse_drive($key, $value);
            die "unable to parse drive options\n";
        }
        PVE::JSONSchema::check_format($fmt, $value);
        return $value;
    }

    die "internal error"
}
1791
191435c6
DM
# Run $code (with @param) through lock_file() on the lock file of $vmid,
# using $timeout. Re-throws any error left in $@, otherwise returns the
# result of lock_file().
sub lock_config_full {
    my ($vmid, $timeout, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);
    my $result = lock_file($lockfile, $timeout, $code, @param);

    if ($@) {
        die $@;
    }

    return $result;
}
1803
4e4f83fe
DM
# Like lock_config_full(), but goes through lock_file_full() and passes
# the $shared flag along.
sub lock_config_mode {
    my ($vmid, $timeout, $shared, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);
    my $result = lock_file_full($lockfile, $timeout, $shared, $code, @param);

    if ($@) {
        die $@;
    }

    return $result;
}
1815
191435c6
DM
# Run $code under the config lock of $vmid with a timeout value of 10.
sub lock_config {
    my ($vmid, $code, @param) = @_;

    my $timeout = 10;

    return lock_config_full($vmid, $timeout, $code, @param);
}
1821
# Path of the config file of $vmid relative to the cluster file system
# root. $node defaults to $nodename.
sub cfs_config_path {
    my ($vmid, $node) = @_;

    $node ||= $nodename;

    return "nodes/$node/qemu-server/$vmid.conf";
}
1828
040b06b7
DA
# Placeholder: always reports IOMMU support as available.
sub check_iommu_support {
    #fixme : need to check IOMMU support
    #http://www.linux-kvm.org/page/How_to_assign_devices_with_VT-d_in_KVM

    return 1;
}
1837
# Absolute path of the config file of $vmid (optionally on $node)
# below /etc/pve.
sub config_file {
    my ($vmid, $node) = @_;

    return "/etc/pve/" . cfs_config_path($vmid, $node);
}
1844
# Path of the lock file used for the config of $vmid.
sub config_file_lock {
    my ($vmid) = @_;

    return join('/', $lock_dir, "lock-$vmid.conf");
}
1850
# Set access and modification time of the config file of $vmid to now.
sub touch_config {
    my ($vmid) = @_;

    my $conffile = config_file($vmid);

    utime(undef, undef, $conffile);
}
1857
# Destroy the VM $vmid: free all disks owned by it, remove its config file
# (or reset it to a minimal one when $keep_empty_config is set), then free
# any volumes the storage layer still lists for this VM. Errors in that
# last step are only reported as warnings.
sub destroy_vm {
    my ($storecfg, $vmid, $keep_empty_config) = @_;

    my $conffile = config_file($vmid);
    my $conf = load_config($vmid);

    check_lock($conf);

    # only remove disks owned by this VM
    my $free_owned_disk = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};
        return if !$volid || $volid =~ m|^/|;

        my ($path, $owner) = PVE::Storage::path($storecfg, $volid);
        return if !$path || !$owner || ($owner != $vmid);

        PVE::Storage::vdisk_free($storecfg, $volid);
    };
    foreach_drive($conf, $free_owned_disk);

    if (!$keep_empty_config) {
        unlink $conffile;
    } else {
        PVE::Tools::file_set_contents($conffile, "memory: 128\n");
    }

    # also remove unused disk
    eval {
        my $dl = PVE::Storage::vdisk_list($storecfg, undef, $vmid);

        my $free_volume = sub {
            my ($volid, $sid, $volname, $d) = @_;
            PVE::Storage::vdisk_free($storecfg, $volid);
        };

        eval { PVE::Storage::foreach_volid($dl, $free_volume); };
        warn $@ if $@;
    };
    warn $@ if $@;
}
1904
# Read the configuration of $vmid (optionally from $node) through the
# cluster file system. Dies when no configuration is returned.
sub load_config {
    my ($vmid, $node) = @_;

    my $cfspath = cfs_config_path($vmid, $node);
    my $conf = PVE::Cluster::cfs_read_file($cfspath);

    if (!defined($conf)) {
        die "no such VM ('$vmid')\n";
    }

    return $conf;
}
1e3baf05
DM
1916
# Parse the raw text of a VM configuration file into a hash reference.
#
# $filename must end in '/qemu-server/<vmid>.conf'; the VMID taken from it
# is used in warnings and when normalizing drive volume names.
# Returns undef when $raw is undefined. Otherwise the result holds the
# top-level options plus:
#   digest    - SHA1 hex digest of $raw
#   snapshots - one option hash per "[name]" section
#   pending   - option hash of the "[PENDING]" section
# Lines starting with '#' are collected as the description of the section
# they appear in. Values that fail validation are skipped with a warning.
sub parse_vm_config {
    my ($filename, $raw) = @_;

    return undef if !defined($raw);

    my $res = {
        digest => Digest::SHA::sha1_hex($raw),
        snapshots => {},
        pending => {},
    };

    $filename =~ m|/qemu-server/(\d+)\.conf$|
        || die "got strange filename '$filename'";

    my $vmid = $1;

    # $conf always points at the hash of the section currently being parsed
    my $conf = $res;
    my $descr = '';
    my $section = '';

    my @lines = split(/\n/, $raw);
    foreach my $line (@lines) {
        next if $line =~ m/^\s*$/;

        if ($line =~ m/^\[PENDING\]\s*$/i) {
            $section = 'pending';
            # flush the description collected for the previous section
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{$section} = {};
            next;

        } elsif ($line =~ m/^\[([a-z][a-z0-9_\-]+)\]\s*$/i) {
            $section = $1;
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{snapshots}->{$section} = {};
            next;
        }

        if ($line =~ m/^\#(.*)\s*$/) {
            $descr .= PVE::Tools::decode_text($1) . "\n";
            next;
        }

        if ($line =~ m/^(description):\s*(.*\S)\s*$/) {
            $descr .= PVE::Tools::decode_text($2);
        } elsif ($line =~ m/^snapstate:\s*(prepare|delete)\s*$/) {
            # anchored like every other key, so that a line which merely
            # ends in "snapstate: ..." is not mistaken for this setting
            $conf->{snapstate} = $1;
        } elsif ($line =~ m/^(args):\s*(.*\S)\s*$/) {
            # 'args' may contain spaces, so it is stored verbatim
            my $key = $1;
            my $value = $2;
            $conf->{$key} = $value;
        } elsif ($line =~ m/^delete:\s*(.*\S)\s*$/) {
            my $value = $1;
            if ($section eq 'pending') {
                $conf->{delete} = $value; # we parse this later
            } else {
                warn "vm $vmid - propertry 'delete' is only allowed in [PENDING]\n";
            }
        } elsif ($line =~ m/^([a-z][a-z_]*\d*):\s*(\S+)\s*$/) {
            my $key = $1;
            my $value = $2;
            eval { $value = check_type($key, $value); };
            if ($@) {
                warn "vm $vmid - unable to parse value of '$key' - $@";
            } else {
                my $fmt = $confdesc->{$key}->{format};
                if ($fmt && $fmt eq 'pve-qm-drive') {
                    # normalize the drive's file name to a volume ID
                    my $v = parse_drive($key, $value);
                    if (my $volid = filename_to_volume_id($vmid, $v->{file}, $v->{media})) {
                        $v->{file} = $volid;
                        $value = print_drive($vmid, $v);
                    } else {
                        warn "vm $vmid - unable to parse value of '$key'\n";
                        next;
                    }
                }

                # 'cdrom' is stored under 'ide2'
                if ($key eq 'cdrom') {
                    $conf->{ide2} = $value;
                } else {
                    $conf->{$key} = $value;
                }
            }
        }
    }

    $conf->{description} = $descr if $descr;

    delete $res->{snapstate}; # just to be sure

    return $res;
}
2010
1858638f
DM
# Serialize a VM configuration hash into the text of a config file.
#
# Note that $conf is modified in place: 'snapstate' is dropped, 'cdrom'
# is folded into 'ide2', the obsolete 'smp' option is converted to
# 'sockets', 'sockets' is dropped when 'maxcpus' is set, all values are
# replaced by what check_type() returns, and 'unusedX' entries that refer
# to a volume used by a drive are removed. Dies on invalid values.
# $filename is not used by this sub.
sub write_vm_config {
    my ($filename, $conf) = @_;

    delete $conf->{snapstate}; # just to be sure

    if ($conf->{cdrom}) {
        die "option ide2 conflicts with cdrom\n" if $conf->{ide2};
        $conf->{ide2} = delete $conf->{cdrom};
    }

    # we do not use 'smp' any longer
    if ($conf->{sockets}) {
        delete $conf->{smp};
    } elsif ($conf->{smp}) {
        $conf->{sockets} = $conf->{smp};
        delete $conf->{cores};
        delete $conf->{smp};
    }

    delete $conf->{sockets} if $conf->{maxcpus} && $conf->{sockets};

    # volumes referenced by drives of the current and the pending config
    my $used_volids = {};

    # keys that are structural and never validated as options
    my %is_meta = map { $_ => 1 } qw(digest description snapshots snapstate pending);

    # validate all options of one section, storing the checked values back
    my $cleanup_config = sub {
        my ($cref, $pending, $snapname) = @_;

        foreach my $opt (keys %$cref) {
            next if $is_meta{$opt};

            if ($opt eq 'delete') {
                die "propertry 'delete' is only allowed in [PENDING]\n"
                    if !$pending;
                # fixme: check syntax?
                next;
            }

            my $checked = $cref->{$opt};
            eval { $checked = check_type($opt, $checked); };
            die "unable to parse value of '$opt' - $@" if $@;

            $cref->{$opt} = $checked;

            next if $snapname;
            next if !valid_drivename($opt);

            my $drive = parse_drive($opt, $checked);
            $used_volids->{$drive->{file}} = 1 if $drive && $drive->{file};
        }
    };

    $cleanup_config->($conf);

    $cleanup_config->($conf->{pending}, 1);

    foreach my $snapname (keys %{$conf->{snapshots}}) {
        die "internal error" if $snapname eq 'pending';
        $cleanup_config->($conf->{snapshots}->{$snapname}, undef, $snapname);
    }

    # remove 'unusedX' settings if we re-add a volume
    foreach my $opt (keys %$conf) {
        my $current = $conf->{$opt};
        delete $conf->{$opt} if $opt =~ m/^unused/ && $used_volids->{$current};
    }

    # render one section: description as leading comment, then sorted options
    my $generate_raw_config = sub {
        my ($sect) = @_;

        my $text = '';

        # add description as comment to top of file
        my $descr = $sect->{description} || '';
        foreach my $cl (split(/\n/, $descr)) {
            $text .= '#' . PVE::Tools::encode_text($cl) . "\n";
        }

        foreach my $opt (sort keys %$sect) {
            next if $opt eq 'digest' || $opt eq 'description';
            next if $opt eq 'pending' || $opt eq 'snapshots';
            $text .= "$opt: $sect->{$opt}\n";
        }

        return $text;
    };

    my $raw = $generate_raw_config->($conf);

    if (scalar(keys %{$conf->{pending}})) {
        $raw .= "\n[PENDING]\n";
        $raw .= $generate_raw_config->($conf->{pending});
    }

    foreach my $snapname (sort keys %{$conf->{snapshots}}) {
        $raw .= "\n[$snapname]\n";
        $raw .= $generate_raw_config->($conf->{snapshots}->{$snapname});
    }

    return $raw;
}
1e3baf05 2111
1858638f
DM
# Write $conf as the configuration of VM $vmid without taking the config
# file lock itself. Unless $skiplock is set, check_lock() is consulted
# first and dies if the config carries a 'lock' setting.
sub update_config_nolock {
    my ($vmid, $conf, $skiplock) = @_;

    if (!$skiplock) {
        check_lock($conf);
    }

    my $target = cfs_config_path($vmid);

    PVE::Cluster::cfs_write_file($target, $conf);
}
1e3baf05 2121
1858638f
DM
# Write $conf as the configuration of VM $vmid while holding the config
# lock obtained through lock_config().
#
# The write is wrapped in a closure. A bare '&update_config_nolock'
# (no parentheses, no backslash) would call the sub right away with this
# sub's @_, i.e. before the lock is taken, and hand its return value to
# lock_config() instead of a code reference.
# NOTE(review): assumes lock_config() invokes its second argument as the
# code to run under the lock - confirm against its definition.
sub update_config {
    my ($vmid, $conf, $skiplock) = @_;

    lock_config($vmid, sub {
        update_config_nolock($vmid, $conf, $skiplock);
    });
}
2127
# Build a hash of default option values.
#
# Every option in $confdesc that declares a 'default' contributes it;
# a 'keyboard' setting found in datacenter.cfg overrides the static one.
sub load_defaults {

    my %defaults;

    # we use static defaults from our JSON schema configuration
    for my $opt (keys %$confdesc) {
        my $value = $confdesc->{$opt}->{default};
        next if !defined($value);
        $defaults{$opt} = $value;
    }

    my $dccfg = PVE::Cluster::cfs_read_file('datacenter.cfg');
    if ($dccfg->{keyboard}) {
        $defaults{keyboard} = $dccfg->{keyboard};
    }

    return \%defaults;
}
2144
# Return a hash { $vmid => { exists => 1 } } for every entry of the
# cluster VM list whose node equals $nodename and whose type is 'qemu'.
sub config_list {
    my $found = {};

    my $vmlist = PVE::Cluster::get_vmlist();
    return $found if !$vmlist || !$vmlist->{ids};

    my $ids = $vmlist->{ids};

    for my $vmid (keys %$ids) {
        my $entry = $ids->{$vmid};

        my $is_local = $entry->{node} && $entry->{node} eq $nodename;
        next if !$is_local;

        my $is_qemu = $entry->{type} && $entry->{type} eq 'qemu';
        next if !$is_qemu;

        $found->{$vmid}->{exists} = 1;
    }

    return $found;
}
2159
64e13401
DM
# Test if a VM uses local resources (to prevent migration).
#
# A config counts as using local resources when it has a 'hostusb' or
# 'hostpci' option (old syntax) or any usbN, hostpciN, serialN or
# parallelN option; usb entries whose value is exactly 'spice' are ignored.
# Returns 1 or 0. Dies when local resources are found unless $noerr is set.
sub check_local_resources {
    my ($conf, $noerr) = @_;

    # old syntax
    my $uses_local = ($conf->{hostusb} || $conf->{hostpci}) ? 1 : 0;

    for my $opt (keys %$conf) {
        next if $opt =~ m/^usb/ && ($conf->{$opt} eq 'spice');
        next if $opt !~ m/^(usb|hostpci|serial|parallel)\d+$/;
        $uses_local = 1;
    }

    if ($uses_local && !$noerr) {
        die "VM uses local resources\n";
    }

    return $uses_local;
}
2178
# Check if the storages used by the VM's drives are available on all nodes
# (used by migrate).
#
# For every drive whose 'file' parses as a storage volume ID,
# PVE::Storage::storage_check_node() is called once without a node
# argument and once for $node.
sub check_storage_availability {
    my ($storecfg, $conf, $node) = @_;

    my $check_drive = sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($sid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        # check if storage is available on both nodes
        my $local_scfg = PVE::Storage::storage_check_node($storecfg, $sid);
        PVE::Storage::storage_check_node($storecfg, $sid, $node);
    };

    foreach_drive($conf, $check_drive);
}
2197
719893a9
DM
# List nodes where all VM images are available (used by has_feature API).
#
# Starts with every cluster node and narrows the set per drive volume:
# a disabled storage empties the set, a storage with a 'nodes' restriction
# keeps only those nodes, and a non-shared storage keeps only the local
# node. Returns a hash reference { $node => 1 }.
sub shared_nodes {
    my ($conf, $storecfg) = @_;

    my $nodelist = PVE::Cluster::get_nodelist();
    my $nodehash = { map { $_ => 1 } @$nodelist };
    my $nodename = PVE::INotify::nodename();

    my $restrict = sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($storeid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        my $scfg = PVE::Storage::storage_config($storecfg, $storeid);

        if ($scfg->{disable}) {
            $nodehash = {};
        } elsif (my $avail = $scfg->{nodes}) {
            my @gone = grep { !$avail->{$_} } keys %$nodehash;
            delete @{$nodehash}{@gone};
        } elsif (!$scfg->{shared}) {
            my @remote = grep { $_ ne $nodename } keys %$nodehash;
            delete @{$nodehash}{@remote};
        }
    };

    foreach_drive($conf, $restrict);

    return $nodehash;
}
2231
1e3baf05
DM
# Die with "VM is locked (<lock>)" if the config carries a true 'lock' value.
sub check_lock {
    my ($conf) = @_;

    if ($conf->{lock}) {
        die "VM is locked ($conf->{lock})\n";
    }
}
2237
# Check that process $pid looks like a kvm/qemu process that was started
# with '-pidfile $pidfile' (or '--pidfile').
#
# Reads /proc/$pid/cmdline. Returns 1 on a match and a false value in all
# other cases (file unreadable or empty, other binary, other pidfile).
sub check_cmdline {
    my ($pidfile, $pid) = @_;

    my $fh = IO::File->new("/proc/$pid/cmdline", "r");
    return undef if !defined($fh);

    my $raw = <$fh>;
    $fh->close;
    return undef if !$raw;

    # arguments are separated by NUL bytes
    my @argv = split(/\0/, $raw);

    my $binary = $argv[0];
    return if !$binary;
    return if $binary !~ m|kvm$| && $binary !~ m|qemu-system-x86_64$|;

    foreach my $idx (0 .. $#argv) {
        my $arg = $argv[$idx];
        next if !$arg;
        next if $arg ne '-pidfile' && $arg ne '--pidfile';

        # only the first pidfile option is considered
        my $value = $argv[$idx + 1];
        return 1 if $value && ($value eq $pidfile);
        return undef;
    }

    return undef;
}
2263
# Return the PID of the running VM $vmid, or undef if it is not running.
#
# Unless $nocheck is set, dies when the config file (looked up via
# config_file($vmid, $node)) does not exist. The PID is read from the
# VM's pidfile and only accepted if check_cmdline() confirms that the
# process was started with that pidfile and the process is still running.
sub check_running {
    my ($vmid, $nocheck, $node) = @_;

    my $filename = config_file($vmid, $node);

    die "unable to find configuration file for VM $vmid - no such machine\n"
        if !$nocheck && ! -f $filename;

    my $pidfile = pidfile_name($vmid);

    my $fd = IO::File->new($pidfile, "r");
    return undef if !$fd;

    my $st = stat($fd);
    my $line = <$fd>;
    close($fd);

    # the timestamp examined here belongs to the pidfile, so that is the
    # file to name in the warning; stat() may fail and return undef
    if ($st && $st->mtime > time()) {
        warn "file '$pidfile' modified in future\n";
    }

    # an empty pidfile yields no line at all
    return undef if !defined($line);

    if ($line =~ m/^(\d+)$/) {
        my $pid = $1;
        if (check_cmdline($pidfile, $pid)) {
            if (my $pinfo = PVE::ProcFSTools::check_process_running($pid)) {
                return $pid;
            }
        }
    }

    return undef;
}
2296
# Return the hash from config_list(), with a 'pid' entry added for every
# VM that has a '<vmid>.pid' file in $var_run_tmpdir and for which
# check_running() reports a PID.
sub vzlist {

    my $vms = config_list();

    my $dir = IO::Dir->new($var_run_tmpdir);
    return $vms if !$dir;

    while (defined(my $entry = $dir->read)) {
        next unless $entry =~ m/^(\d+)\.pid$/;
        my $vmid = $1;

        # ignore pidfiles of VMs that are not in our list
        next unless defined($vms->{$vmid});

        my $pid = check_running($vmid);
        $vms->{$vmid}->{pid} = $pid if $pid;
    }

    return $vms;
}
2314
1e3baf05
DM
# Return the 'size' property of the VM's boot disk, or undef when there
# is no valid, configured, parseable, non-cdrom boot disk with a file.
# $storecfg is accepted but not used here.
sub disksize {
    my ($storecfg, $conf) = @_;

    my $bootdisk = $conf->{bootdisk};
    return undef
        if !$bootdisk || !valid_drivename($bootdisk) || !$conf->{$bootdisk};

    my $drive = parse_drive($bootdisk, $conf->{$bootdisk});
    return undef if !defined($drive) || drive_is_cdrom($drive);

    return undef if !$drive->{file};

    return $drive->{size};
}
2334
2335my $last_proc_pid_stat;
2336
03a33f30
DM
# get VM status information
# This must be fast and should not block ($full == false)
# We only query KVM using QMP if $full == true (this can be slow)
#
# Returns a hash { $vmid => \%status } for all VMs from vzlist(), or only
# for $opt_vmid when given. Each entry combines values from the VM config,
# traffic counters of the VM's tap devices and CPU/memory figures from
# /proc. With $full, running VMs are additionally queried via QMP
# (query-status, query-blockstats, query-balloon).
sub vmstatus {
    my ($opt_vmid, $full) = @_;

    my $res = {};

    my $storecfg = PVE::Storage::config();

    my $list = vzlist();
    my ($uptime) = PVE::ProcFSTools::read_proc_uptime(1);

    my $cpucount = $cpuinfo->{cpus} || 1;

    # pass 1: values taken from the configuration
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);

        my $cfspath = cfs_config_path($vmid);
        my $conf = PVE::Cluster::cfs_read_file($cfspath) || {};

        my $pid = $list->{$vmid}->{pid};

        my $d = {
            pid => $pid,
            # fixme: better status?
            status => $pid ? 'running' : 'stopped',
            disk => 0, # no info available
        };

        my $size = disksize($storecfg, $conf);
        $d->{maxdisk} = defined($size) ? $size : 0;

        my $vcpus = ($conf->{sockets} || 1) * ($conf->{cores} || 1);
        $vcpus = $cpucount if $vcpus > $cpucount;
        $d->{cpus} = $vcpus;

        $d->{name} = $conf->{name} || "VM $vmid";
        $d->{maxmem} = $conf->{memory} ? $conf->{memory}*(1024*1024) : 0;

        if ($conf->{balloon}) {
            $d->{balloon_min} = $conf->{balloon}*(1024*1024);
            $d->{shares} = defined($conf->{shares}) ? $conf->{shares} : 1000;
        }

        # counters start at zero and are filled in by the later passes
        $d->{$_} = 0 for qw(uptime cpu mem netout netin diskread diskwrite);

        $d->{template} = is_template($conf);

        $res->{$vmid} = $d;
    }

    # pass 2: network counters of the tap<vmid>i<n> devices
    my $netdev = PVE::ProcFSTools::read_proc_net_dev();
    foreach my $dev (keys %$netdev) {
        next if $dev !~ m/^tap([1-9]\d*)i/;
        my $vmid = $1;
        my $d = $res->{$vmid};
        next if !$d;

        # the device's 'receive' counter is added to netout and its
        # 'transmit' counter to netin
        $d->{netout} += $netdev->{$dev}->{receive};
        $d->{netin} += $netdev->{$dev}->{transmit};
    }

    my $ctime = gettimeofday;

    # pass 3: uptime, memory and cpu usage from /proc/<pid>/stat
    foreach my $vmid (keys %$list) {

        # work on a copy of the reference so that VMs filtered out in
        # pass 1 do not get an entry in $res
        my $d = $res->{$vmid};
        my $pid = $d->{pid};
        next if !$pid;

        my $pstat = PVE::ProcFSTools::read_proc_pid_stat($pid);
        next if !$pstat; # not running

        my $used = $pstat->{utime} + $pstat->{stime};

        $d->{uptime} = int(($uptime - $pstat->{starttime})/$cpuinfo->{user_hz});

        if ($pstat->{vsize}) {
            $d->{mem} = int(($pstat->{rss}/$pstat->{vsize})*$d->{maxmem});
        }

        my $old = $last_proc_pid_stat->{$pid};
        if (!$old) {
            # first sample for this pid - no cpu usage can be computed yet
            $last_proc_pid_stat->{$pid} = {
                time => $ctime,
                used => $used,
                cpu => 0,
            };
            next;
        }

        my $dtime = ($ctime - $old->{time}) * $cpucount * $cpuinfo->{user_hz};

        if ($dtime <= 1000) {
            # interval too short - reuse the previous value
            $d->{cpu} = $old->{cpu};
            next;
        }

        my $dutime = $used - $old->{used};

        $d->{cpu} = (($dutime/$dtime)* $cpucount) / $d->{cpus};
        $last_proc_pid_stat->{$pid} = {
            time => $ctime,
            used => $used,
            cpu => $d->{cpu},
        };
    }

    return $res if !$full;

    my $qmpclient = PVE::QMPClient->new();

    my $ballooncb = sub {
        my ($vmid, $resp) = @_;

        my $info = $resp->{'return'};
        return if !$info->{max_mem};

        my $d = $res->{$vmid};

        # use memory assigned to VM
        $d->{maxmem} = $info->{max_mem};
        $d->{balloon} = $info->{actual};

        if (defined($info->{total_mem}) && defined($info->{free_mem})) {
            $d->{mem} = $info->{total_mem} - $info->{free_mem};
            $d->{freemem} = $info->{free_mem};
        }
    };

    my $blockstatscb = sub {
        my ($vmid, $resp) = @_;

        my $data = $resp->{'return'} || [];

        # sum up the byte counters of all block devices
        my $rd_total = 0;
        my $wr_total = 0;
        foreach my $blockstat (@$data) {
            $rd_total = $rd_total + $blockstat->{stats}->{rd_bytes};
            $wr_total = $wr_total + $blockstat->{stats}->{wr_bytes};
        }

        $res->{$vmid}->{diskread} = $rd_total;
        $res->{$vmid}->{diskwrite} = $wr_total;
    };

    my $statuscb = sub {
        my ($vmid, $resp) = @_;

        $qmpclient->queue_cmd($vmid, $blockstatscb, 'query-blockstats');
        # this fails if ballon driver is not loaded, so this must be
        # the last commnand (following command are aborted if this fails).
        $qmpclient->queue_cmd($vmid, $ballooncb, 'query-balloon');

        my $status = $resp->{'return'}->{status};
        if (!defined($status)) {
            warn "unable to get VM status\n";
            return;
        }

        $res->{$vmid}->{qmpstatus} = $status;
    };

    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        next if !$res->{$vmid}->{pid}; # not running
        $qmpclient->queue_cmd($vmid, $statuscb, 'query-status');
    }

    $qmpclient->queue_execute(undef, 1);

    # fall back to the plain status where QMP gave no answer
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        my $entry = $res->{$vmid};
        $entry->{qmpstatus} = $entry->{status} if !$entry->{qmpstatus};
    }

    return $res;
}
2523
# Call $func->($drivename, $drive) for every key of $conf that is a valid
# drive name and whose value parse_drive() can parse. The order in which
# drives are visited follows hash order and is therefore unspecified.
sub foreach_drive {
    my ($conf, $func) = @_;

    for my $name (keys %$conf) {
        if (valid_drivename($name)) {
            my $parsed = parse_drive($name, $conf->{$name});
            $func->($name, $parsed) if $parsed;
        }
    }
}
2536
d5769dc2
DM
# Call $func->($volid, $is_cdrom) once for every distinct volume referenced
# by the drives of $conf and of its snapshots, including each snapshot's
# 'vmstate' volume. $is_cdrom is the drive_is_cdrom() result of the drive
# recorded last for that volume, or 0.
sub foreach_volid {
    my ($conf, $func) = @_;

    my $seen = {};

    my $record = sub {
        my ($volid, $is_cdrom) = @_;
        $seen->{$volid} = $is_cdrom || 0 if $volid;
    };

    my $visit_drive = sub {
        my ($ds, $drive) = @_;
        $record->($drive->{file}, drive_is_cdrom($drive));
    };

    foreach_drive($conf, $visit_drive);

    foreach my $snapname (keys %{$conf->{snapshots}}) {
        my $snap = $conf->{snapshots}->{$snapname};
        $record->($snap->{vmstate}, 0);
        foreach_drive($snap, $visit_drive);
    }

    foreach my $volid (keys %$seen) {
        $func->($volid, $seen->{$volid});
    }
}
2568
86b8228b
DM
# Return 0 unless $vga is 'qxl' or 'qxl2'..'qxl4'. Otherwise return the
# trailing digit, or 1 for plain 'qxl'.
sub vga_conf_has_spice {
    my ($vga) = @_;

    if ($vga && $vga =~ m/^qxl([234])?$/) {
        return $1 || 1;
    }

    return 0;
}
2576
1e3baf05 2577sub config_to_command {
952958bc 2578 my ($storecfg, $vmid, $conf, $defaults, $forcemachine) = @_;
1e3baf05
DM
2579
2580 my $cmd = [];
8c559505
DM
2581 my $globalFlags = [];
2582 my $machineFlags = [];
2583 my $rtcFlags = [];
519ed28c 2584 my $cpuFlags = [];
5bdcf937 2585 my $devices = [];
b78ebef7 2586 my $pciaddr = '';
5bdcf937 2587 my $bridges = {};
1e3baf05
DM
2588 my $kvmver = kvm_user_version();
2589 my $vernum = 0; # unknown
a3c52213
DM
2590 if ($kvmver =~ m/^(\d+)\.(\d+)$/) {
2591 $vernum = $1*1000000+$2*1000;
2592 } elsif ($kvmver =~ m/^(\d+)\.(\d+)\.(\d+)$/) {
1e3baf05
DM
2593 $vernum = $1*1000000+$2*1000+$3;
2594 }
2595
a3c52213 2596 die "detected old qemu-kvm binary ($kvmver)\n" if $vernum < 15000;
1e3baf05
DM
2597
2598 my $have_ovz = -f '/proc/vz/vestat';
2599
db656e5f
DM
2600 my $q35 = machine_type_is_q35($conf);
2601
1e3baf05
DM
2602 push @$cmd, '/usr/bin/kvm';
2603
2604 push @$cmd, '-id', $vmid;
2605
2606 my $use_virtio = 0;
2607
c971c4f2
AD
2608 my $qmpsocket = qmp_socket($vmid);
2609 push @$cmd, '-chardev', "socket,id=qmp,path=$qmpsocket,server,nowait";
2610 push @$cmd, '-mon', "chardev=qmp,mode=control";
2611
7b7c6d1b 2612 my $socket = vnc_socket($vmid);
1e3baf05
DM
2613 push @$cmd, '-vnc', "unix:$socket,x509,password";
2614
6b64503e 2615 push @$cmd, '-pidfile' , pidfile_name($vmid);
19672434 2616
1e3baf05
DM
2617 push @$cmd, '-daemonize';
2618
2796e7d5
DM
2619 if ($conf->{smbios1}) {
2620 push @$cmd, '-smbios', "type=1,$conf->{smbios1}";
2621 }
2622
7183bd9a
AD
2623 push @$cmd, '-object', "iothread,id=iothread0" if $conf->{iothread};
2624
db656e5f 2625 if ($q35) {
b467f79a 2626 # the q35 chipset support native usb2, so we enable usb controller
db656e5f 2627 # by default for this machine type
f8e83f05 2628 push @$devices, '-readconfig', '/usr/share/qemu-server/pve-q35.cfg';
db656e5f 2629 } else {
f8e83f05
AD
2630 $pciaddr = print_pci_addr("piix3", $bridges);
2631 push @$devices, '-device', "piix3-usb-uhci,id=uhci$pciaddr.0x2";
24f0d39a 2632
f8e83f05 2633 my $use_usb2 = 0;
db656e5f
DM
2634 for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
2635 next if !$conf->{"usb$i"};
2636 $use_usb2 = 1;
2637 }
2638 # include usb device config
2639 push @$devices, '-readconfig', '/usr/share/qemu-server/pve-usb.cfg' if $use_usb2;
fcc573ab 2640 }
19672434 2641
5acbfe9e 2642 my $vga = $conf->{vga};
2fa3151e 2643
590e698c
DM
2644 my $qxlnum = vga_conf_has_spice($vga);
2645 $vga = 'qxl' if $qxlnum;
2fa3151e 2646
5acbfe9e 2647 if (!$vga) {
264e519f
DM
2648 if ($conf->{ostype} && ($conf->{ostype} eq 'win8' ||
2649 $conf->{ostype} eq 'win7' ||
5acbfe9e
DM
2650 $conf->{ostype} eq 'w2k8')) {
2651 $vga = 'std';
2652 } else {
2653 $vga = 'cirrus';
2654 }
2655 }
2656
1e3baf05 2657 # enable absolute mouse coordinates (needed by vnc)
5acbfe9e
DM
2658 my $tablet;
2659 if (defined($conf->{tablet})) {
2660 $tablet = $conf->{tablet};
2661 } else {
2662 $tablet = $defaults->{tablet};
590e698c 2663 $tablet = 0 if $qxlnum; # disable for spice because it is not needed
ef5e2be2 2664 $tablet = 0 if $vga =~ m/^serial\d+$/; # disable if we use serial terminal (no vga card)
5acbfe9e
DM
2665 }
2666
db656e5f 2667 push @$devices, '-device', print_tabletdevice_full($conf) if $tablet;
b467f79a 2668
1e3baf05 2669 # host pci devices
040b06b7 2670 for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
2e3b7e2a
AD
2671 my $d = parse_hostpci($conf->{"hostpci$i"});
2672 next if !$d;
2673
2674 my $pcie = $d->{pcie};
2675 if($pcie){
2676 die "q35 machine model is not enabled" if !$q35;
2677 $pciaddr = print_pcie_addr("hostpci$i");
2678 }else{
2679 $pciaddr = print_pci_addr("hostpci$i", $bridges);
2680 }
2681
2682 my $rombar = $d->{rombar} && $d->{rombar} eq 'off' ? ",rombar=0" : "";
2683 my $driver = $d->{driver} && $d->{driver} eq 'vfio' ? "vfio-pci" : "pci-assign";
2684 my $xvga = $d->{'x-vga'} && $d->{'x-vga'} eq 'on' ? ",x-vga=on" : "";
137483c0
AD
2685 if ($xvga && $xvga ne '') {
2686 push @$cpuFlags, 'kvm=off';
2687 $vga = 'none';
2688 }
2e3b7e2a 2689 $driver = "vfio-pci" if $xvga ne '';
4543ecf0
AD
2690 my $pcidevices = $d->{pciid};
2691 my $multifunction = 1 if @$pcidevices > 1;
2e3b7e2a 2692
4543ecf0
AD
2693 my $j=0;
2694 foreach my $pcidevice (@$pcidevices) {
2e3b7e2a 2695
4543ecf0
AD
2696 my $id = "hostpci$i";
2697 $id .= ".$j" if $multifunction;
2698 my $addr = $pciaddr;
2699 $addr .= ".$j" if $multifunction;
2700 my $devicestr = "$driver,host=$pcidevice->{id}.$pcidevice->{function},id=$id$addr";
2701
2702 if($j == 0){
2703 $devicestr .= "$rombar$xvga";
2704 $devicestr .= ",multifunction=on" if $multifunction;
2705 }
2706
2707 push @$devices, '-device', $devicestr;
2708 $j++;
2709 }
1e3baf05
DM
2710 }
2711
2712 # usb devices
2713 for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
2714 my $d = parse_usb_device($conf->{"usb$i"});
2715 next if !$d;
2716 if ($d->{vendorid} && $d->{productid}) {
5bdcf937 2717 push @$devices, '-device', "usb-host,vendorid=0x$d->{vendorid},productid=0x$d->{productid}";
1e3baf05 2718 } elsif (defined($d->{hostbus}) && defined($d->{hostport})) {
5bdcf937 2719 push @$devices, '-device', "usb-host,hostbus=$d->{hostbus},hostport=$d->{hostport}";
80401dd8
DM
2720 } elsif ($d->{spice}) {
2721 # usb redir support for spice
2722 push @$devices, '-chardev', "spicevmc,id=usbredirchardev$i,name=usbredir";
2723 push @$devices, '-device', "usb-redir,chardev=usbredirchardev$i,id=usbredirdev$i,bus=ehci.0";
1e3baf05
DM
2724 }
2725 }
2726
1e3baf05 2727 # serial devices
bae179aa 2728 for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
34978be3 2729 if (my $path = $conf->{"serial$i"}) {
9f9d2fb2
DM
2730 if ($path eq 'socket') {
2731 my $socket = "/var/run/qemu-server/${vmid}.serial$i";
2732 push @$devices, '-chardev', "socket,id=serial$i,path=$socket,server,nowait";
2733 push @$devices, '-device', "isa-serial,chardev=serial$i";
2734 } else {
2735 die "no such serial device\n" if ! -c $path;
2736 push @$devices, '-chardev', "tty,id=serial$i,path=$path";
2737 push @$devices, '-device', "isa-serial,chardev=serial$i";
2738 }
34978be3 2739 }
1e3baf05
DM
2740 }
2741
2742 # parallel devices
1989a89c 2743 for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
34978be3 2744 if (my $path = $conf->{"parallel$i"}) {
19672434 2745 die "no such parallel device\n" if ! -c $path;
32e69805 2746 my $devtype = $path =~ m!^/dev/usb/lp! ? 'tty' : 'parport';
4c5dbaf6 2747 push @$devices, '-chardev', "$devtype,id=parallel$i,path=$path";
5bdcf937 2748 push @$devices, '-device', "isa-parallel,chardev=parallel$i";
34978be3 2749 }
1e3baf05
DM
2750 }
2751
2752 my $vmname = $conf->{name} || "vm$vmid";
2753
2754 push @$cmd, '-name', $vmname;
19672434 2755
1e3baf05
DM
2756 my $sockets = 1;
2757 $sockets = $conf->{smp} if $conf->{smp}; # old style - no longer iused
2758 $sockets = $conf->{sockets} if $conf->{sockets};
2759
2760 my $cores = $conf->{cores} || 1;
3bd18e48
AD
2761 my $maxcpus = $conf->{maxcpus} if $conf->{maxcpus};
2762
76267728
WL
2763 my $total_cores = $sockets * $cores;
2764 my $allowed_cores = $cpuinfo->{cpus};
2765
f34ebd52 2766 die "MAX $allowed_cores cores allowed per VM on this node\n"
76267728
WL
2767 if ($allowed_cores < $total_cores);
2768
264e519f 2769 if ($maxcpus) {
3bd18e48 2770 push @$cmd, '-smp', "cpus=$cores,maxcpus=$maxcpus";
264e519f 2771 } else {
3bd18e48
AD
2772 push @$cmd, '-smp', "sockets=$sockets,cores=$cores";
2773 }
1e3baf05 2774
1e3baf05
DM
2775 push @$cmd, '-nodefaults';
2776
32baffb4 2777 my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};
3b408e82 2778
0888fdce
DM
2779 my $bootindex_hash = {};
2780 my $i = 1;
2781 foreach my $o (split(//, $bootorder)) {
2782 $bootindex_hash->{$o} = $i*100;
2783 $i++;
afdb31d5 2784 }
3b408e82
DM
2785
2786 push @$cmd, '-boot', "menu=on";
1e3baf05 2787
6b64503e 2788 push @$cmd, '-no-acpi' if defined($conf->{acpi}) && $conf->{acpi} == 0;
1e3baf05 2789
6b64503e 2790 push @$cmd, '-no-reboot' if defined($conf->{reboot}) && $conf->{reboot} == 0;
1e3baf05 2791
ef5e2be2 2792 push @$cmd, '-vga', $vga if $vga && $vga !~ m/^serial\d+$/; # for kvm 77 and later
1e3baf05
DM
2793
2794 # time drift fix
6b64503e 2795 my $tdf = defined($conf->{tdf}) ? $conf->{tdf} : $defaults->{tdf};
1e3baf05 2796
6b64503e 2797 my $nokvm = defined($conf->{kvm}) && $conf->{kvm} == 0 ? 1 : 0;
8c559505 2798 my $useLocaltime = $conf->{localtime};
1e3baf05
DM
2799
2800 if (my $ost = $conf->{ostype}) {
6b9d84cf 2801 # other, wxp, w2k, w2k3, w2k8, wvista, win7, win8, l24, l26, solaris
1e3baf05
DM
2802
2803 if ($ost =~ m/^w/) { # windows
8c559505 2804 $useLocaltime = 1 if !defined($conf->{localtime});
1e3baf05 2805
8c559505 2806 # use time drift fix when acpi is enabled
6b64503e 2807 if (!(defined($conf->{acpi}) && $conf->{acpi} == 0)) {
8c559505 2808 $tdf = 1 if !defined($conf->{tdf});
1e3baf05
DM
2809 }
2810 }
2811
be190583 2812 if ($ost eq 'win7' || $ost eq 'win8' || $ost eq 'w2k8' ||
a70ebde3 2813 $ost eq 'wvista') {
8c559505 2814 push @$globalFlags, 'kvm-pit.lost_tick_policy=discard';
b7e0c8bf 2815 push @$cmd, '-no-hpet';
462e8d19
AD
2816 #push @$cpuFlags , 'hv_vapic" if !$nokvm; #fixme, my win2008R2 hang at boot with this
2817 push @$cpuFlags , 'hv_spinlocks=0xffff' if !$nokvm;
2818 }
2819
2820 if ($ost eq 'win7' || $ost eq 'win8') {
2821 push @$cpuFlags , 'hv_relaxed' if !$nokvm;
b7e0c8bf 2822 }
1e3baf05
DM
2823 }
2824
8c559505
DM
2825 push @$rtcFlags, 'driftfix=slew' if $tdf;
2826
7f0b5beb 2827 if ($nokvm) {
8c559505 2828 push @$machineFlags, 'accel=tcg';
7f0b5beb
DM
2829 } else {
2830 die "No accelerator found!\n" if !$cpuinfo->{hvm};
2831 }
1e3baf05 2832
952958bc
DM
2833 my $machine_type = $forcemachine || $conf->{machine};
2834 if ($machine_type) {
2835 push @$machineFlags, "type=${machine_type}";
3bafc510
DM
2836 }
2837
8c559505
DM
2838 if ($conf->{startdate}) {
2839 push @$rtcFlags, "base=$conf->{startdate}";
2840 } elsif ($useLocaltime) {
2841 push @$rtcFlags, 'base=localtime';
2842 }
1e3baf05 2843
519ed28c
AD
2844 my $cpu = $nokvm ? "qemu64" : "kvm64";
2845 $cpu = $conf->{cpu} if $conf->{cpu};
2846
4dc339e7
AD
2847 push @$cpuFlags , '+lahf_lm' if $cpu eq 'kvm64';
2848
6b9d84cf
AD
2849 push @$cpuFlags , '+x2apic' if !$nokvm && $conf->{ostype} ne 'solaris';
2850
2851 push @$cpuFlags , '-x2apic' if $conf->{ostype} eq 'solaris';
519ed28c 2852
2e1a5389
AD
2853 push @$cpuFlags, '+sep' if $cpu eq 'kvm64' || $cpu eq 'kvm32';
2854
be190583 2855 $cpu .= "," . join(',', @$cpuFlags) if scalar(@$cpuFlags);
519ed28c 2856
c0efd8cd
DM
2857 # Note: enforce needs kernel 3.10, so we do not use it for now
2858 # push @$cmd, '-cpu', "$cpu,enforce";
2859 push @$cmd, '-cpu', $cpu;
519ed28c 2860
67fb9de6 2861 my $memory = $conf->{memory} || $defaults->{memory};
8a010eae
AD
2862 push @$cmd, '-m', $memory;
2863
67fb9de6 2864 if ($conf->{numa}) {
8a010eae 2865
2ed5d572
AD
2866 my $numa_totalmemory = undef;
2867 for (my $i = 0; $i < $MAX_NUMA; $i++) {
2868 next if !$conf->{"numa$i"};
2869 my $numa = parse_numa($conf->{"numa$i"});
2870 next if !$numa;
67fb9de6
DM
2871 # memory
2872 die "missing numa node$i memory value\n" if !$numa->{memory};
2ed5d572
AD
2873 my $numa_memory = $numa->{memory};
2874 $numa_totalmemory += $numa_memory;
2875 my $numa_object = "memory-backend-ram,id=ram-node$i,size=$numa_memory"."M";
2876
67fb9de6 2877 # cpus
2ed5d572 2878 my $cpus_start = $numa->{cpus}->{start};
67fb9de6 2879 die "missing numa node$i cpus\n" if !defined($cpus_start);
2ed5d572
AD
2880 my $cpus_end = $numa->{cpus}->{end} if defined($numa->{cpus}->{end});
2881 my $cpus = $cpus_start;
2882 if (defined($cpus_end)) {
2883 $cpus .= "-$cpus_end";
67fb9de6 2884 die "numa node$i : cpu range $cpus is incorrect\n" if $cpus_end <= $cpus_start;
2ed5d572 2885 }
8a010eae 2886
67fb9de6 2887 # hostnodes
2ed5d572
AD
2888 my $hostnodes_start = $numa->{hostnodes}->{start};
2889 if (defined($hostnodes_start)) {
2890 my $hostnodes_end = $numa->{hostnodes}->{end} if defined($numa->{hostnodes}->{end});
2891 my $hostnodes = $hostnodes_start;
2892 if (defined($hostnodes_end)) {
2893 $hostnodes .= "-$hostnodes_end";
67fb9de6 2894 die "host node $hostnodes range is incorrect\n" if $hostnodes_end <= $hostnodes_start;
2ed5d572 2895 }
8a010eae 2896
2ed5d572
AD
2897 my $hostnodes_end_range = defined($hostnodes_end) ? $hostnodes_end : $hostnodes_start;
2898 for (my $i = $hostnodes_start; $i <= $hostnodes_end_range; $i++ ) {
67fb9de6 2899 die "host numa node$i don't exist\n" if ! -d "/sys/devices/system/node/node$i/";
2ed5d572 2900 }
8a010eae 2901
67fb9de6 2902 # policy
2ed5d572 2903 my $policy = $numa->{policy};
67fb9de6
DM
2904 die "you need to define a policy for hostnode $hostnodes\n" if !$policy;
2905 $numa_object .= ",host-nodes=$hostnodes,policy=$policy";
2ed5d572
AD
2906 }
2907
2908 push @$cmd, '-object', $numa_object;
8a010eae
AD
2909 push @$cmd, '-numa', "node,nodeid=$i,cpus=$cpus,memdev=ram-node$i";
2910 }
67fb9de6
DM
2911
2912 die "total memory for NUMA nodes must be equal to vm memory\n"
2913 if $numa_totalmemory && $numa_totalmemory != $memory;
2ed5d572
AD
2914
2915 #if no custom tology, we split memory and cores across numa nodes
2916 if(!$numa_totalmemory) {
2917
67fb9de6 2918 my $numa_memory = ($memory / $sockets) . "M";
2ed5d572
AD
2919
2920 for (my $i = 0; $i < $sockets; $i++) {
2921
2922 my $cpustart = ($cores * $i);
2923 my $cpuend = ($cpustart + $cores - 1) if $cores && $cores > 1;
2924 my $cpus = $cpustart;
2925 $cpus .= "-$cpuend" if $cpuend;
2926
2927 push @$cmd, '-object', "memory-backend-ram,size=$numa_memory,id=ram-node$i";
2928 push @$cmd, '-numa', "node,nodeid=$i,cpus=$cpus,memdev=ram-node$i";
2929 }
2930 }
8a010eae
AD
2931 }
2932
1e3baf05
DM
2933 push @$cmd, '-S' if $conf->{freeze};
2934
2935 # set keyboard layout
2936 my $kb = $conf->{keyboard} || $defaults->{keyboard};
2937 push @$cmd, '-k', $kb if $kb;
2938
2939 # enable sound
2940 #my $soundhw = $conf->{soundhw} || $defaults->{soundhw};
2941 #push @$cmd, '-soundhw', 'es1370';
2942 #push @$cmd, '-soundhw', $soundhw if $soundhw;
ab6a046f 2943
bc84dcca 2944 if($conf->{agent}) {
7a6c2150 2945 my $qgasocket = qmp_socket($vmid, 1);
ab6a046f
AD
2946 my $pciaddr = print_pci_addr("qga0", $bridges);
2947 push @$devices, '-chardev', "socket,path=$qgasocket,server,nowait,id=qga0";
2948 push @$devices, '-device', "virtio-serial,id=qga0$pciaddr";
2949 push @$devices, '-device', 'virtserialport,chardev=qga0,name=org.qemu.guest_agent.0';
2950 }
2951
1d794448 2952 my $spice_port;
2fa3151e 2953
590e698c
DM
2954 if ($qxlnum) {
2955 if ($qxlnum > 1) {
2956 if ($conf->{ostype} && $conf->{ostype} =~ m/^w/){
2957 for(my $i = 1; $i < $qxlnum; $i++){
2958 my $pciaddr = print_pci_addr("vga$i", $bridges);
2959 push @$cmd, '-device', "qxl,id=vga$i,ram_size=67108864,vram_size=33554432$pciaddr";
2960 }
2961 } else {
2962 # assume other OS works like Linux
2963 push @$cmd, '-global', 'qxl-vga.ram_size=134217728';
2964 push @$cmd, '-global', 'qxl-vga.vram_size=67108864';
2fa3151e
AD
2965 }
2966 }
2967
1011b570 2968 my $pciaddr = print_pci_addr("spice", $bridges);
95a4b4a9 2969
cd339d1f 2970 $spice_port = PVE::Tools::next_spice_port();
943340a6 2971
d2da6d9b 2972 push @$devices, '-spice', "tls-port=${spice_port},addr=127.0.0.1,tls-ciphers=DES-CBC3-SHA,seamless-migration=on";
1011b570 2973
d2da6d9b
AD
2974 push @$devices, '-device', "virtio-serial,id=spice$pciaddr";
2975 push @$devices, '-chardev', "spicevmc,id=vdagent,name=vdagent";
2976 push @$devices, '-device', "virtserialport,chardev=vdagent,name=com.redhat.spice.0";
1011b570
DM
2977 }
2978
8d9ae0d2
DM
2979 # enable balloon by default, unless explicitly disabled
2980 if (!defined($conf->{balloon}) || $conf->{balloon}) {
2981 $pciaddr = print_pci_addr("balloon0", $bridges);
2982 push @$devices, '-device', "virtio-balloon-pci,id=balloon0$pciaddr";
2983 }
1e3baf05 2984
0ea9541d
DM
2985 if ($conf->{watchdog}) {
2986 my $wdopts = parse_watchdog($conf->{watchdog});
5bdcf937 2987 $pciaddr = print_pci_addr("watchdog", $bridges);
0a40e8ea 2988 my $watchdog = $wdopts->{model} || 'i6300esb';
5bdcf937
AD
2989 push @$devices, '-device', "$watchdog$pciaddr";
2990 push @$devices, '-watchdog-action', $wdopts->{action} if $wdopts->{action};
0ea9541d
DM
2991 }
2992
1e3baf05 2993 my $vollist = [];
941e0c42 2994 my $scsicontroller = {};
26ee04b6 2995 my $ahcicontroller = {};
cdd20088 2996 my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : $defaults->{scsihw};
1e3baf05 2997
5881b913
DM
2998 # Add iscsi initiator name if available
2999 if (my $initiator = get_initiator_name()) {
3000 push @$devices, '-iscsi', "initiator-name=$initiator";
3001 }
3002
1e3baf05
DM
3003 foreach_drive($conf, sub {
3004 my ($ds, $drive) = @_;
3005
ff1a2432 3006 if (PVE::Storage::parse_volume_id($drive->{file}, 1)) {
1e3baf05 3007 push @$vollist, $drive->{file};
ff1a2432 3008 }
afdb31d5 3009
1e3baf05 3010 $use_virtio = 1 if $ds =~ m/^virtio/;
3b408e82
DM
3011
3012 if (drive_is_cdrom ($drive)) {
3013 if ($bootindex_hash->{d}) {
3014 $drive->{bootindex} = $bootindex_hash->{d};
3015 $bootindex_hash->{d} += 1;
3016 }
3017 } else {
3018 if ($bootindex_hash->{c}) {
3019 $drive->{bootindex} = $bootindex_hash->{c} if $conf->{bootdisk} && ($conf->{bootdisk} eq $ds);
3020 $bootindex_hash->{c} += 1;
3021 }
3022 }
3023
941e0c42 3024 if ($drive->{interface} eq 'scsi') {
cdd20088 3025
5b952ff5 3026 my $maxdev = ($scsihw !~ m/^lsi/) ? 256 : 7;
cdd20088 3027 my $controller = int($drive->{index} / $maxdev);
5bdcf937
AD
3028 $pciaddr = print_pci_addr("scsihw$controller", $bridges);
3029 push @$devices, '-device', "$scsihw,id=scsihw$controller$pciaddr" if !$scsicontroller->{$controller};
cdd20088 3030 $scsicontroller->{$controller}=1;
941e0c42 3031 }
3b408e82 3032
26ee04b6
DA
3033 if ($drive->{interface} eq 'sata') {
3034 my $controller = int($drive->{index} / $MAX_SATA_DISKS);
5bdcf937
AD
3035 $pciaddr = print_pci_addr("ahci$controller", $bridges);
3036 push @$devices, '-device', "ahci,id=ahci$controller,multifunction=on$pciaddr" if !$ahcicontroller->{$controller};
26ee04b6
DA
3037 $ahcicontroller->{$controller}=1;
3038 }
46f58b5f 3039
15b21acc
MR
3040 my $drive_cmd = print_drive_full($storecfg, $vmid, $drive);
3041 push @$devices, '-drive',$drive_cmd;
46f58b5f 3042 push @$devices, '-device', print_drivedevice_full($storecfg, $conf, $vmid, $drive, $bridges);
1e3baf05
DM
3043 });
3044
cc4d6182 3045 for (my $i = 0; $i < $MAX_NETS; $i++) {
5f0c4c32 3046 next if !$conf->{"net$i"};
cc4d6182
DA
3047 my $d = parse_net($conf->{"net$i"});
3048 next if !$d;
1e3baf05 3049
cc4d6182 3050 $use_virtio = 1 if $d->{model} eq 'virtio';
1e3baf05 3051
cc4d6182
DA
3052 if ($bootindex_hash->{n}) {
3053 $d->{bootindex} = $bootindex_hash->{n};
3054 $bootindex_hash->{n} += 1;
3055 }
1e3baf05 3056
cc4d6182 3057 my $netdevfull = print_netdev_full($vmid,$conf,$d,"net$i");
5bdcf937
AD
3058 push @$devices, '-netdev', $netdevfull;
3059
3060 my $netdevicefull = print_netdevice_full($vmid,$conf,$d,"net$i",$bridges);
3061 push @$devices, '-device', $netdevicefull;
3062 }
1e3baf05 3063
db656e5f
DM
3064 if (!$q35) {
3065 # add pci bridges
f8e83f05
AD
3066 while (my ($k, $v) = each %$bridges) {
3067 $pciaddr = print_pci_addr("pci.$k");
3068 unshift @$devices, '-device', "pci-bridge,id=pci.$k,chassis_nr=$k$pciaddr" if $k > 0;
3069 }
19672434
DM
3070 }
3071
1e3baf05
DM
3072 # hack: virtio with fairsched is unreliable, so we do not use fairsched
3073 # when the VM uses virtio devices.
19672434
DM
3074 if (!$use_virtio && $have_ovz) {
3075
6b64503e 3076 my $cpuunits = defined($conf->{cpuunits}) ?
1e3baf05
DM
3077 $conf->{cpuunits} : $defaults->{cpuunits};
3078
3079 push @$cmd, '-cpuunits', $cpuunits if $cpuunits;
3080
3081 # fixme: cpulimit is currently ignored
3082 #push @$cmd, '-cpulimit', $conf->{cpulimit} if $conf->{cpulimit};
3083 }
3084
3085 # add custom args
3086 if ($conf->{args}) {
3ada46c9 3087 my $aa = PVE::Tools::split_args($conf->{args});
1e3baf05
DM
3088 push @$cmd, @$aa;
3089 }
3090
5bdcf937 3091 push @$cmd, @$devices;
be190583 3092 push @$cmd, '-rtc', join(',', @$rtcFlags)
8c559505 3093 if scalar(@$rtcFlags);
be190583 3094 push @$cmd, '-machine', join(',', @$machineFlags)
8c559505
DM
3095 if scalar(@$machineFlags);
3096 push @$cmd, '-global', join(',', @$globalFlags)
3097 if scalar(@$globalFlags);
3098
1d794448 3099 return wantarray ? ($cmd, $vollist, $spice_port) : $cmd;
1e3baf05 3100}
19672434 3101
1e3baf05
DM
# Return the path of the VNC unix socket used by VM $vmid.
sub vnc_socket {
    my ($vmid) = @_;

    my $socket_path = $var_run_tmpdir . "/$vmid.vnc";
    return $socket_path;
}
3106
# Ask the running VM (QMP 'query-spice') which port SPICE listens on.
# The TLS port is preferred over the plain port; dies when neither is set.
sub spice_port {
    my ($vmid) = @_;

    my $spice_info = vm_mon_cmd($vmid, 'query-spice');

    my $port = $spice_info->{'tls-port'} || $spice_info->{'port'};
    die "no spice port\n" if !$port;

    return $port;
}
3114
# Return the path of a monitor socket for VM $vmid: the guest agent
# socket ('.qga') when $qga is true, the QMP socket ('.qmp') otherwise.
sub qmp_socket {
    my ($vmid, $qga) = @_;

    my $sockettype = 'qmp';
    $sockettype = 'qga' if $qga;

    return $var_run_tmpdir . "/$vmid.$sockettype";
}
3120
1e3baf05
DM
# Return the path of the pid file of VM $vmid.
sub pidfile_name {
    my ($vmid) = @_;

    my $pidfile = $var_run_tmpdir . "/$vmid.pid";
    return $pidfile;
}
3125
86fdcfb2
DA
# Build a hash reference { device id => 1 } describing what is currently
# present in the running VM, collected from three monitor queries:
#  - 'query-pci':   every PCI device that has a qdev id
#  - 'query-block': every block device named 'drive-<id>' (stored as <id>)
#  - 'query-mice':  key 'tablet' when a 'QEMU HID Tablet' is listed
sub vm_devices_list {
    my ($vmid) = @_;

    my %present;

    my $pci_info = vm_mon_cmd($vmid, 'query-pci');
    for my $bus (@$pci_info) {
        for my $pci_dev (@{$bus->{devices}}) {
            my $qdev_id = $pci_dev->{'qdev_id'};
            $present{$qdev_id} = 1 if $qdev_id;
        }
    }

    my $block_info = vm_mon_cmd($vmid, 'query-block');
    for my $blk (@$block_info) {
        $present{$1} = 1 if $blk->{device} =~ m/^drive-(\S+)/;
    }

    my $mice_info = vm_mon_cmd($vmid, 'query-mice');
    for my $mouse (@$mice_info) {
        next if $mouse->{name} ne 'QEMU HID Tablet';
        $present{tablet} = 1;
        last;
    }

    return \%present;
}
3155
# Hot-plug device $deviceid into the running VM $vmid.
#
# $device is the parsed drive/net description (unused for 'tablet',
# 'scsihwN' and 'pci.N'). Returns 1 on success or when the device is
# already present, undef when the netdev backend could not be added,
# and dies on every other failure (including unsupported device ids).
sub vm_deviceplug {
    my ($storecfg, $conf, $vmid, $deviceid, $device) = @_;

    die "internal error" if !$conf->{hotplug};

    my $is_q35 = machine_type_is_q35($conf);

    # nothing to do when the guest already has this device
    my $plugged = vm_devices_list($vmid);
    return 1 if defined($plugged->{$deviceid});

    # add PCI bridge if we need it for the device
    qemu_add_pci_bridge($storecfg, $conf, $vmid, $deviceid);

    # undo the backend (best effort, failure only warns), then re-throw
    my $rollback = sub {
        my ($undo, $err) = @_;
        eval { $undo->(); };
        warn $@ if $@;
        die $err;
    };

    if ($deviceid eq 'tablet') {

        qemu_deviceadd($vmid, print_tabletdevice_full($conf));

    } elsif ($deviceid =~ m/^(virtio)(\d+)$/) {

        qemu_driveadd($storecfg, $vmid, $device);
        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);

        qemu_deviceadd($vmid, $devicefull);
        eval { qemu_deviceaddverify($vmid, $deviceid); };
        if (my $err = $@) {
            $rollback->(sub { qemu_drivedel($vmid, $deviceid) }, $err);
        }

    } elsif ($deviceid =~ m/^(scsihw)(\d+)$/) {

        my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : "lsi";
        my $pciaddr = print_pci_addr($deviceid);

        qemu_deviceadd($vmid, "$scsihw,id=$deviceid$pciaddr");
        qemu_deviceaddverify($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        # the disk needs its controller first
        qemu_findorcreatescsihw($storecfg, $conf, $vmid, $device);
        qemu_driveadd($storecfg, $vmid, $device);

        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);
        eval { qemu_deviceadd($vmid, $devicefull); };
        if (my $err = $@) {
            $rollback->(sub { qemu_drivedel($vmid, $deviceid) }, $err);
        }

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        return undef if !qemu_netdevadd($vmid, $conf, $device, $deviceid);

        my $netdevicefull = print_netdevice_full($vmid, $conf, $device, $deviceid);
        qemu_deviceadd($vmid, $netdevicefull);
        eval { qemu_deviceaddverify($vmid, $deviceid); };
        if (my $err = $@) {
            $rollback->(sub { qemu_netdevdel($vmid, $deviceid) }, $err);
        }

    } elsif (!$is_q35 && $deviceid =~ m/^(pci\.)(\d+)$/) {

        my $bridgeid = $2;
        my $pciaddr = print_pci_addr($deviceid);

        qemu_deviceadd($vmid, "pci-bridge,id=pci.$bridgeid,chassis_nr=$bridgeid$pciaddr");
        qemu_deviceaddverify($vmid, $deviceid);

    } else {
        die "can't hotplug device '$deviceid'\n";
    }

    return 1;
}
3234
3eec5767 3235# fixme: this should raise exceptions on error!
# Hot-unplug device $deviceid from the running VM $vmid.
#
# Returns 1 on success or when the device is not present (nothing to
# do). Dies when hotplug is disabled for the VM, when the device is the
# boot disk, when the id is of an unsupported kind, or when one of the
# monitor helpers fails.
#
# SCSI controllers are plugged under the id 'scsihwN' (see
# vm_deviceplug), so that id is accepted here; the historic 'lsiN'
# spelling is still recognized for backward compatibility.
sub vm_deviceunplug {
    my ($vmid, $conf, $deviceid) = @_;

    die "internal error" if !$conf->{hotplug};

    my $devices_list = vm_devices_list($vmid);
    return 1 if !defined($devices_list->{$deviceid});

    die "can't unplug bootdisk" if $conf->{bootdisk} && $conf->{bootdisk} eq $deviceid;

    if ($deviceid eq 'tablet') {

        qemu_devicedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(virtio)(\d+)$/) {

        # device_del is asynchronous: wait until the guest released the
        # device before dropping its backing drive
        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);
        qemu_drivedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsihw|lsi)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);
        qemu_drivedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);
        qemu_netdevdel($vmid, $deviceid);

    } else {
        die "can't unplug device '$deviceid'\n";
    }

    return 1;
}
3277
# Send a QMP 'device_add' for the '-device' style string $devicefull
# ("<driver>,key=value,..."). The string is split on '=' and ',' into
# the argument hash, with the leading driver name stored as 'driver'.
sub qemu_deviceadd {
    my ($vmid, $devicefull) = @_;

    my %args = split(/[=,]/, "driver=" . $devicefull);

    return vm_mon_cmd($vmid, "device_add", %args);
}
afdb31d5 3286
# Send a QMP 'device_del' for $deviceid and return the monitor's answer.
sub qemu_devicedel {
    my ($vmid, $deviceid) = @_;

    return scalar(vm_mon_cmd($vmid, "device_del", id => $deviceid));
}
3292
# Attach the drive backend described by $device using the human monitor
# command 'drive_add'. Returns 1 on success, dies with the monitor
# output otherwise.
sub qemu_driveadd {
    my ($storecfg, $vmid, $device) = @_;

    my $drivespec = print_drive_full($storecfg, $vmid, $device);
    my $reply = vm_human_monitor_command($vmid, "drive_add auto $drivespec");

    # If the command succeeds qemu prints: "OK"
    die "adding drive failed: $reply\n" if $reply !~ m/OK/s;

    return 1;
}
afdb31d5 3304
5e5dcb73
DA
# Remove the drive backend 'drive-<deviceid>' using the human monitor
# command 'drive_del'. Returns 1 on success, dies with the monitor
# output otherwise.
sub qemu_drivedel {
    my ($vmid, $deviceid) = @_;

    my $reply = vm_human_monitor_command($vmid, "drive_del drive-$deviceid");
    $reply =~ s/^\s+//;

    # Empty output means success. NB: device not found errors mean the
    # drive was auto-deleted and we ignore the error.
    if ($reply eq "" || $reply =~ m/Device \'.*?\' not found/s) {
        return 1;
    }

    die "deleting drive $deviceid failed : $reply\n";
}
f19d1c47 3318
# Poll the VM's device list until $deviceid shows up. Makes up to six
# checks, sleeping one second after each unsuccessful one. Returns 1 as
# soon as the device is found, dies when it never appears.
sub qemu_deviceaddverify {
    my ($vmid, $deviceid) = @_;

    for my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if defined($present->{$deviceid});
        sleep 1;
    }

    die "error on hotplug device '$deviceid'\n";
}
afdb31d5 3330
5e5dcb73
DA
3331
# Poll the VM's device list until $deviceid is gone. This is needed
# because device_del is asynchronous and its empty return value is not
# a reliable success indicator. Makes up to six checks, sleeping one
# second after each unsuccessful one; dies when the device never
# disappears.
sub qemu_devicedelverify {
    my ($vmid, $deviceid) = @_;

    for my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if !defined($present->{$deviceid});
        sleep 1;
    }

    die "error on hot-unplugging device '$deviceid'\n";
}
3346
# Make sure the SCSI controller serving disk $device exists in the
# running VM, hot-plugging 'scsihwN' when it is missing. The controller
# number is the disk index divided by the number of disks per
# controller (7 for lsi or unset scsihw, 256 otherwise). Always
# returns 1.
sub qemu_findorcreatescsihw {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $hwtype = $conf->{scsihw};
    my $disks_per_controller = 7;
    $disks_per_controller = 256 if $hwtype && ($hwtype !~ m/^lsi/);

    my $controller = int($device->{index} / $disks_per_controller);
    my $controller_id = "scsihw$controller";

    my $present = vm_devices_list($vmid);
    vm_deviceplug($storecfg, $conf, $vmid, $controller_id)
        if !defined($present->{$controller_id});

    return 1;
}
3361
# Hot-plug the PCI bridge that device id $device sits behind, if any.
# print_pci_addr() records the needed bridge in the hash passed to it;
# bridge 0 (or no bridge at all) requires nothing. Always returns 1.
sub qemu_add_pci_bridge {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $needed = {};
    print_pci_addr($device, $needed);

    # keep the last key in hash iteration order
    my $bridgeid;
    for my $id (keys %$needed) {
        $bridgeid = $id;
    }

    return 1 if !defined($bridgeid) || $bridgeid < 1;

    my $bridge = "pci.$bridgeid";
    my $present = vm_devices_list($vmid);

    vm_deviceplug($storecfg, $conf, $vmid, $bridge)
        if !defined($present->{$bridge});

    return 1;
}
3385
2630d2a9
DA
# Create the network backend for $deviceid with a QMP 'netdev_add'.
# The '-netdev' style string is split on '=' and ',' to form the
# argument hash. Returns 1.
sub qemu_netdevadd {
    my ($vmid, $conf, $device, $deviceid) = @_;

    my $netdevfull = print_netdev_full($vmid, $conf, $device, $deviceid);
    my %args = split(/[=,]/, $netdevfull);

    vm_mon_cmd($vmid, "netdev_add", %args);

    return 1;
}
3395
# Remove the network backend $deviceid with a QMP 'netdev_del'.
sub qemu_netdevdel {
    my ($vmid, $deviceid) = @_;

    return vm_mon_cmd($vmid, "netdev_del", id => $deviceid);
}
3401
838776ab
AD
# Raise the number of online cores of a running VM to $cores by sending
# one QMP 'cpu-add' per missing core.
#
# Dies when the VM has more than one socket, when maxcpus is unset or
# smaller than $cores, when $cores is below the configured core count
# (unplug is not supported), or when the number of CPUs reported by the
# VM differs from the configuration.
sub qemu_cpu_hotplug {
    my ($vmid, $conf, $cores) = @_;

    my $sockets = $conf->{sockets} || 1;
    if ($sockets > 1) {
        die "cpu hotplug only works with one socket\n";
    }

    if (!$conf->{maxcpus}) {
        die "maxcpus is not defined\n";
    }

    if ($cores > $conf->{maxcpus}) {
        die "you can't add more cores than maxcpus\n";
    }

    my $configured = $conf->{cores} || 1;
    if ($cores < $configured) {
        die "online cpu unplug is not yet possible\n";
    }

    my $running_cpus = vm_mon_cmd($vmid, "query-cpus");
    if (scalar(@{$running_cpus}) != $configured) {
        die "cores number if running vm is different than configuration\n";
    }

    my $cpu_id = $configured;
    while ($cpu_id < $cores) {
        vm_mon_cmd($vmid, "cpu-add", id => int($cpu_id));
        $cpu_id++;
    }
}
3427
affd2f88
AD
# Apply I/O throttling limits to block device $deviceid of a running VM
# using the QMP command 'block_set_io_throttle'. Does nothing when the
# VM is not running.
#
# Parameters after $deviceid:
#   $bps, $bps_rd, $bps_wr          - total/read/write byte rate limits
#   $iops, $iops_rd, $iops_wr       - total/read/write operation limits
#   $bps_max, $bps_rd_max, $bps_wr_max,
#   $iops_max, $iops_rd_max, $iops_wr_max
#                                   - optional burst limits
#
# The burst limits are optional trailing arguments: callers passing
# only the six base values get exactly the previous behavior. Each
# burst value is forwarded to the monitor only when it is defined, so
# callers that supply them (vmconfig_update_disk does) no longer have
# them silently dropped.
sub qemu_block_set_io_throttle {
    my ($vmid, $deviceid, $bps, $bps_rd, $bps_wr, $iops, $iops_rd, $iops_wr,
        $bps_max, $bps_rd_max, $bps_wr_max, $iops_max, $iops_rd_max, $iops_wr_max) = @_;

    return if !check_running($vmid);

    my @args = (
        device  => $deviceid,
        bps     => int($bps),
        bps_rd  => int($bps_rd),
        bps_wr  => int($bps_wr),
        iops    => int($iops),
        iops_rd => int($iops_rd),
        iops_wr => int($iops_wr),
    );

    my @burst = (
        [ bps_max     => $bps_max ],
        [ bps_rd_max  => $bps_rd_max ],
        [ bps_wr_max  => $bps_wr_max ],
        [ iops_max    => $iops_max ],
        [ iops_rd_max => $iops_rd_max ],
        [ iops_wr_max => $iops_wr_max ],
    );
    foreach my $entry (@burst) {
        my ($name, $limit) = @$entry;
        push @args, $name => int($limit) if defined($limit);
    }

    vm_mon_cmd($vmid, "block_set_io_throttle", @args);
}
3436
f5eb281a 3437# old code, only used to shutdown old VM after update
dab36e1e
DM
# Read from monitor handle $fh until the '(qemu) ' prompt ends a chunk
# or the handle reaches end of file, waiting at most $timeout seconds
# for each chunk. Returns everything read, without the prompt. Dies on
# a read error or when no data arrives within the timeout.
sub __read_avail {
    my ($fh, $timeout) = @_;

    my $select = IO::Select->new();
    $select->add($fh);

    my $output = '';
    my $chunk;
    my @ready;

    while (scalar(@ready = $select->can_read($timeout))) {
        my $nread = $fh->sysread($chunk, 8192);

        die "$!\n" if !defined($nread);    # read error
        last if !$nread;                   # end of file

        if ($chunk =~ /^(.*)\(qemu\) $/s) {
            # prompt seen - the answer is complete
            $output .= $1;
            last;
        }

        $output .= $chunk;
    }

    die "monitor read timeout\n" if !scalar(@ready);

    return $output;
}
3469
f5eb281a 3470# old code, only used to shutdown old VM after update
dab36e1e
DM
# Old code, only used to shutdown old VMs after an update.
#
# Send $cmdstr to the human monitor socket ('<vmid>.mon') of VM $vmid
# and return the monitor's answer with the echoed command line removed.
# Nothing is read back for 'q'/'quit'. Every failure is written to
# syslog and then re-thrown.
sub vm_monitor_command {
    my ($vmid, $cmdstr, $nocheck) = @_;

    my $res;

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);

        my $sname = "${var_run_tmpdir}/$vmid.mon";

        my $sock = IO::Socket::UNIX->new( Peer => $sname ) ||
            die "unable to connect to VM $vmid socket - $!\n";

        # hack: migrate sometime blocks the monitor (when migrate_downtime
        # is set), so those commands get a one hour timeout
        my $is_migrate = ($cmdstr =~ m/^(info\s+migrate|migrate\s)/) ? 1 : 0;

        my $timeout = $is_migrate ? 60*60 : 3;

        # read banner
        my $banner = __read_avail($sock, $timeout);
        die "got unexpected qemu monitor banner\n"
            if $banner !~ m/^QEMU\s+(\S+)\s+monitor\s/;

        my $select = IO::Select->new();
        $select->add($sock);

        my @writable = $select->can_write($timeout);
        die "monitor write error - timeout" if !scalar(@writable);

        my $fullcmd = "$cmdstr\r";

        my $written = $sock->syswrite($fullcmd);
        die "monitor write error - $!"
            if !$written || ($written != length($fullcmd));

        # the monitor goes away on quit, so there is no answer to wait for
        return if ($cmdstr eq 'q') || ($cmdstr eq 'quit');

        if ($is_migrate) {
            $timeout = 60*60; # 1 hour
        } elsif ($cmdstr =~ m/^(eject|change)/) {
            $timeout = 60; # note: cdrom mount command is slow
        } else {
            $timeout = 20;
        }

        $res = __read_avail($sock, $timeout);
        if ($res) {
            my @lines = split("\r?\n", $res);

            # skip echo
            shift @lines if $lines[0] !~ m/^unknown command/;

            $res = join("\n", @lines) . "\n";
        }
    };

    if (my $err = $@) {
        syslog("err", "VM $vmid monitor command failed - $err");
        die $err;
    }

    return $res;
}
3544
c1175c92
AD
# Resize volume $volid to $size through the storage layer and, when the
# VM is running and the storage call returned a true value, tell qemu
# about the new size with a QMP 'block_resize'.
sub qemu_block_resize {
    my ($vmid, $deviceid, $storecfg, $volid, $size) = @_;

    my $is_running = check_running($vmid);

    my $resized = PVE::Storage::volume_resize($storecfg, $volid, $size, $is_running);
    return if !$resized;
    return if !$is_running;

    vm_mon_cmd($vmid, "block_resize", device => $deviceid, size => int($size));
}
3557
1ab0057c
AD
# Create snapshot $snap of volume $volid through the storage layer and,
# when the VM is running and the storage call returned a true value,
# send the monitor command 'snapshot-drive' for the device.
sub qemu_volume_snapshot {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $is_running = check_running($vmid);

    my $storage_ok = PVE::Storage::volume_snapshot($storecfg, $volid, $snap, $is_running);
    return if !$storage_ok;
    return if !$is_running;

    vm_mon_cmd($vmid, "snapshot-drive", device => $deviceid, name => $snap);
}
3570
fc46aff9
AD
# Delete snapshot $snap of volume $volid through the storage layer and,
# when the VM is running and the storage call returned a true value,
# send the monitor command 'delete-drive-snapshot' for the device.
sub qemu_volume_snapshot_delete {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $is_running = check_running($vmid);

    my $storage_ok = PVE::Storage::volume_snapshot_delete($storecfg, $volid, $snap, $is_running);
    return if !$storage_ok;
    return if !$is_running;

    vm_mon_cmd($vmid, "delete-drive-snapshot", device => $deviceid, name => $snap);
}
3582
264e519f
DM
# Configure the migration capabilities of VM $vmid. Every capability the
# running qemu reports as supported is set explicitly: to true when it
# is enabled in the table below, to false otherwise (including
# capabilities not listed in the table).
sub set_migration_caps {
    my ($vmid) = @_;

    my %wanted = (
        "auto-converge" => 1,
        "xbzrle" => 0,
        "x-rdma-pin-all" => 0,
        "zero-blocks" => 0,
    );

    my $supported = vm_mon_cmd_nocheck($vmid, "query-migrate-capabilities");

    my @capabilities = map {
        my $name = $_->{capability};
        +{
            capability => $name,
            state => $wanted{$name} ? JSON::true : JSON::false,
        };
    } @$supported;

    vm_mon_cmd_nocheck($vmid, "migrate-set-capabilities", capabilities => \@capabilities);
}
a89fded1 3606
3a11fadb
DM
3607# hotplug changes in [PENDING]
3608# $selection hash can be used to only apply specified options, for
3609# example: { cores => 1 } (only apply changed 'cores')
3610# $errors ref is used to return error messages
# Try to apply the [PENDING] changes of $conf to the running VM.
#
#  $selection - optional hash; when given, only options with a true
#               entry are considered, e.g. { cores => 1 }
#  $errors    - hash reference filled with "option => message" for
#               every option whose hotplug attempt failed
#
# Options that cannot be hot-plugged are skipped and stay pending.
# After every successful change the config is written and reloaded.
sub vmconfig_hotplug_pending {
    my ($vmid, $conf, $storecfg, $selection, $errors) = @_;

    my $defaults = load_defaults();

    my $add_error = sub {
        my ($opt, $msg) = @_;
        $errors->{$opt} = "hotplug problem - $msg";
    };

    # Commit values which do not have any impact on the running VM first.
    # Note: those options cannot raise errors, so we do not care about
    # $selection and always apply them.
    my %no_impact = map { $_ => 1 } qw(name hotplug onboot shares);

    my $changes = 0;
    foreach my $opt (keys %{$conf->{pending}}) { # add/change
        next if !$no_impact{$opt};
        $conf->{$opt} = $conf->{pending}->{$opt};
        delete $conf->{pending}->{$opt};
        $changes = 1;
    }

    if ($changes) {
        update_config_nolock($vmid, $conf, 1);
        $conf = load_config($vmid); # update/reload
    }

    my $hotplug = defined($conf->{hotplug}) ? $conf->{hotplug} : $defaults->{hotplug};

    # pending deletions
    foreach my $opt (PVE::Tools::split_list($conf->{pending}->{delete})) {
        next if $selection && !$selection->{$opt};

        eval {
            # every deletion handled here needs hotplug to be enabled
            die "skip\n" if !$hotplug;

            if ($opt eq 'tablet') {
                # deleting the option means falling back to the default
                if ($defaults->{tablet}) {
                    vm_deviceplug($storecfg, $conf, $vmid, $opt);
                } else {
                    vm_deviceunplug($vmid, $conf, $opt);
                }
            } elsif ($opt eq 'cores') {
                qemu_cpu_hotplug($vmid, $conf, 1);
            } elsif ($opt =~ m/^net(\d+)$/) {
                vm_deviceunplug($vmid, $conf, $opt);
            } elsif (valid_drivename($opt)) {
                vm_deviceunplug($vmid, $conf, $opt);
                vmconfig_register_unused_drive($storecfg, $vmid, $conf, parse_drive($opt, $conf->{$opt}));
            } else {
                die "skip\n";
            }
        };

        if (my $err = $@) {
            $add_error->($opt, $err) if $err ne "skip\n";
            next;
        }

        # save new config if hotplug was successful
        delete $conf->{$opt};
        vmconfig_undelete_pending_option($conf, $opt);
        update_config_nolock($vmid, $conf, 1);
        $conf = load_config($vmid); # update/reload
    }

    # pending additions/changes
    foreach my $opt (keys %{$conf->{pending}}) {
        next if $selection && !$selection->{$opt};

        my $value = $conf->{pending}->{$opt};

        eval {
            if ($opt eq 'tablet') {
                die "skip\n" if !$hotplug;
                if ($value == 1) {
                    vm_deviceplug($storecfg, $conf, $vmid, $opt);
                } elsif ($value == 0) {
                    vm_deviceunplug($vmid, $conf, $opt);
                }
            } elsif ($opt eq 'cores') {
                die "skip\n" if !$hotplug;
                qemu_cpu_hotplug($vmid, $conf, $value);
            } elsif ($opt eq 'balloon') {
                # allow manual ballooning if shares is set to zero
                die "skip\n" if !(defined($conf->{shares}) && ($conf->{shares} == 0));
                my $balloon = $conf->{pending}->{balloon} || $conf->{memory} || $defaults->{memory};
                vm_mon_cmd($vmid, "balloon", value => $balloon*1024*1024);
            } elsif ($opt =~ m/^net(\d+)$/) {
                # some changes can be done without hotplug
                vmconfig_update_net($storecfg, $conf, $vmid, $opt, $value);
            } elsif (valid_drivename($opt)) {
                # some changes can be done without hotplug
                vmconfig_update_disk($storecfg, $conf, $vmid, $opt, $value, 1);
            } else {
                die "skip\n"; # skip non-hot-pluggable options
            }
        };

        if (my $err = $@) {
            $add_error->($opt, $err) if $err ne "skip\n";
            next;
        }

        # save new config if hotplug was successful
        $conf->{$opt} = $value;
        delete $conf->{pending}->{$opt};
        update_config_nolock($vmid, $conf, 1);
        $conf = load_config($vmid); # update/reload
    }
}
055d554d
DM
3717
# Cold-plug: move all [PENDING] changes of $conf into the active
# configuration. Pending deletions are processed first, then pending
# additions/changes. Drives that get removed or replaced are registered
# as unused. The config is reloaded before and written after each
# option.
sub vmconfig_apply_pending {
    my ($vmid, $conf, $storecfg) = @_;

    # pending deletions
    foreach my $opt (PVE::Tools::split_list($conf->{pending}->{delete})) {
        die "internal error" if $opt =~ m/^unused/;

        $conf = load_config($vmid); # update/reload

        if (defined($conf->{$opt})) {
            # keep the volume of a removed drive around as 'unused'
            vmconfig_register_unused_drive($storecfg, $vmid, $conf, parse_drive($opt, $conf->{$opt}))
                if valid_drivename($opt);
            vmconfig_undelete_pending_option($conf, $opt);
            delete $conf->{$opt};
        } else {
            # option is already gone, just clear the pending entry
            vmconfig_undelete_pending_option($conf, $opt);
        }

        update_config_nolock($vmid, $conf, 1);
    }

    $conf = load_config($vmid); # update/reload

    # pending additions/changes
    foreach my $opt (keys %{$conf->{pending}}) {
        $conf = load_config($vmid); # update/reload

        my $pending_value = $conf->{pending}->{$opt};
        my $unchanged = defined($conf->{$opt}) && ($conf->{$opt} eq $pending_value);

        if (!$unchanged) {
            # a replaced drive keeps its old volume as 'unused'
            vmconfig_register_unused_drive($storecfg, $vmid, $conf, parse_drive($opt, $conf->{$opt}))
                if valid_drivename($opt) && defined($conf->{$opt});
            $conf->{$opt} = $pending_value;
        }

        delete $conf->{pending}->{$opt};
        update_config_nolock($vmid, $conf, 1);
    }
}
3761
3eec5767
DM
# Numeric "not equal" that tolerates undef: two undefined values are
# equal (returns 0), exactly one undefined value is a difference
# (returns 1), otherwise the result of the numeric comparison.
my $safe_num_ne = sub {
    my ($left, $right) = @_;

    my $missing = grep { !defined($_) } ($left, $right);

    return 0 if $missing == 2;
    return 1 if $missing;

    return $left != $right;
};
3771
# String "not equal" that tolerates undef: two undefined values are
# equal (returns 0), exactly one undefined value is a difference
# (returns 1), otherwise the result of the string comparison.
my $safe_string_ne = sub {
    my ($left, $right) = @_;

    if (defined($left) && defined($right)) {
        return $left ne $right;
    }

    # at least one side is undefined here
    return (defined($left) || defined($right)) ? 1 : 0;
};
3781
# Apply the new value $value of network option $opt ('netN') to the
# running VM.
#
# When only rate, bridge, tag or firewall changed, the existing tap
# device is reconfigured in place and 1 is returned. A change of model,
# MAC address or queue count - or a device where old and new setting do
# not both have a bridge - requires unplugging the old device and
# plugging a new one. That path, like plugging a brand new device, dies
# with "skip\n" when hotplug is disabled.
sub vmconfig_update_net {
    my ($storecfg, $conf, $vmid, $opt, $value) = @_;

    my $newnet = parse_net($value);

    if ($conf->{$opt}) {
        my $oldnet = parse_net($conf->{$opt});

        my $needs_replug =
            $safe_string_ne->($oldnet->{model}, $newnet->{model}) ||
            $safe_string_ne->($oldnet->{macaddr}, $newnet->{macaddr}) ||
            $safe_num_ne->($oldnet->{queues}, $newnet->{queues}) ||
            !($newnet->{bridge} && $oldnet->{bridge}); # bridge/nat mode change

        if (!$needs_replug) {
            # online change of the existing tap device

            die "internal error" if $opt !~ m/net(\d+)/;
            my $iface = "tap${vmid}i$1";

            if ($safe_num_ne->($oldnet->{rate}, $newnet->{rate})) {
                PVE::Network::tap_rate_limit($iface, $newnet->{rate});
            }

            my $replug_tap =
                $safe_string_ne->($oldnet->{bridge}, $newnet->{bridge}) ||
                $safe_num_ne->($oldnet->{tag}, $newnet->{tag}) ||
                $safe_num_ne->($oldnet->{firewall}, $newnet->{firewall});

            if ($replug_tap) {
                PVE::Network::tap_unplug($iface);
                PVE::Network::tap_plug($iface, $newnet->{bridge}, $newnet->{tag}, $newnet->{firewall});
            }

            return 1;
        }

        # for non online change, we try to hot-unplug
        die "skip\n" if !$conf->{hotplug};
        vm_deviceunplug($vmid, $conf, $opt);
    }

    die "skip\n" if !$conf->{hotplug};

    return vm_deviceplug($storecfg, $conf, $vmid, $opt, $newnet);
}
3824
a05cff86
DM
# Apply the new value $value of drive option $opt to the running VM.
#
#  - the media type (disk/cdrom) of an existing drive cannot change
#  - existing disk, different volume: unplug the old disk, register it
#    as unused, then hot-plug the new one (needs hotplug)
#  - existing disk, same volume: only throttle settings are updated
#    online and 1 is returned; discard/cache changes die with "skip\n"
#  - cdrom: eject and, unless the new file is 'none', load the new image
#  - new disk: hot-plug it (needs hotplug)
#
# $force is accepted but currently not used.
sub vmconfig_update_disk {
    my ($storecfg, $conf, $vmid, $opt, $value, $force) = @_;

    # fixme: do we need force?

    my $drive = parse_drive($opt, $value);

    my $old_drive = $conf->{$opt} ? parse_drive($opt, $conf->{$opt}) : undef;

    if ($old_drive) {
        my $media = $drive->{media} || 'disk';
        my $oldmedia = $old_drive->{media} || 'disk';
        die "unable to change media type\n" if $media ne $oldmedia;

        if (!drive_is_cdrom($old_drive)) {

            if ($drive->{file} ne $old_drive->{file}) {

                die "skip\n" if !$conf->{hotplug};

                # unplug and register as unused
                vm_deviceunplug($vmid, $conf, $opt);
                vmconfig_register_unused_drive($storecfg, $vmid, $conf, $old_drive);

            } else {
                # update existing disk

                # skip non hotpluggable value
                die "skip\n"
                    if $safe_num_ne->($drive->{discard}, $old_drive->{discard}) ||
                       $safe_string_ne->($drive->{cache}, $old_drive->{cache});

                # apply throttle when any of the limits changed
                my @throttle_keys = qw(
                    mbps mbps_rd mbps_wr
                    iops iops_rd iops_wr
                    mbps_max mbps_rd_max mbps_wr_max
                    iops_max iops_rd_max iops_wr_max
                );

                my $throttle_changed = 0;
                foreach my $key (@throttle_keys) {
                    next if !$safe_num_ne->($drive->{$key}, $old_drive->{$key});
                    $throttle_changed = 1;
                    last;
                }

                if ($throttle_changed) {
                    # mbps values are configured in MB/s, qemu wants bytes/s
                    my $bytes = sub { return ($drive->{$_[0]} || 0)*1024*1024; };
                    my $count = sub { return $drive->{$_[0]} || 0; };

                    qemu_block_set_io_throttle($vmid, "drive-$opt",
                        $bytes->('mbps'),
                        $bytes->('mbps_rd'),
                        $bytes->('mbps_wr'),
                        $count->('iops'),
                        $count->('iops_rd'),
                        $count->('iops_wr'),
                        $bytes->('mbps_max'),
                        $bytes->('mbps_rd_max'),
                        $bytes->('mbps_wr_max'),
                        $count->('iops_max'),
                        $count->('iops_rd_max'),
                        $count->('iops_wr_max'));
                }

                return 1;
            }
        }
    }

    if (drive_is_cdrom($drive)) { # cdrom

        if ($drive->{file} eq 'none') {
            vm_mon_cmd($vmid, "eject", force => JSON::true, device => "drive-$opt");
        } else {
            my $path = get_iso_path($storecfg, $vmid, $drive->{file});
            # force eject if locked
            vm_mon_cmd($vmid, "eject", force => JSON::true, device => "drive-$opt");
            vm_mon_cmd($vmid, "change", device => "drive-$opt", target => "$path") if $path;
        }

    } else {
        die "skip\n" if !$conf->{hotplug};
        # hotplug new disks
        vm_deviceplug($storecfg, $conf, $vmid, $opt, $drive);
    }
}
3911
# Start VM $vmid while holding the config lock.
#
# $statefile    - 'tcp' to wait for an incoming migration, any other true
#                 value is passed to the command line via -loadstate
# $skiplock     - do not call check_lock()
# $migratedfrom - source node of a migration (forwarded to load_config and
#                 check_running, exported as PVE_MIGRATED_FROM)
# $paused       - start with '-S' (only used when no $statefile is given)
# $forcemachine - forwarded to config_to_command()
# $spice_ticket - spice password set after start on incoming migrations
#
# Dies if the VM is a template, locked, already running, or if the start
# command fails.
sub vm_start {
    my ($storecfg, $vmid, $statefile, $skiplock, $migratedfrom, $paused, $forcemachine, $spice_ticket) = @_;

    lock_config($vmid, sub {
        my $conf = load_config($vmid, $migratedfrom);

        die "you can't start a vm if it's a template\n" if is_template($conf);

        check_lock($conf) if !$skiplock;

        die "VM $vmid already running\n" if check_running($vmid, undef, $migratedfrom);

        # pending changes are applied on a fresh start only
        if (!$statefile && scalar(keys %{$conf->{pending}})) {
            vmconfig_apply_pending($vmid, $conf, $storecfg);
            $conf = load_config($vmid); # update/reload
        }

        my $defaults = load_defaults();

        # set environment variable useful inside network script
        $ENV{PVE_MIGRATED_FROM} = $migratedfrom if $migratedfrom;

        my ($cmd, $vollist, $spice_port) = config_to_command($storecfg, $vmid, $conf, $defaults, $forcemachine);

        my $incoming_tcp = $statefile && $statefile eq 'tcp';
        my $migrate_uri;

        if ($incoming_tcp) {
            my $localip = "localhost";
            my $datacenterconf = PVE::Cluster::cfs_read_file('datacenter.cfg');
            if ($datacenterconf->{migration_unsecure}) {
                my $nodename = PVE::INotify::nodename();
                $localip = PVE::Cluster::remote_node_ip($nodename, 1);
            }
            my $migrate_port = PVE::Tools::next_migrate_port();
            $migrate_uri = "tcp:${localip}:${migrate_port}";
            push @$cmd, '-incoming', $migrate_uri, '-S';
        } elsif ($statefile) {
            push @$cmd, '-loadstate', $statefile;
        } elsif ($paused) {
            push @$cmd, '-S';
        }

        # host pci devices
        foreach my $i (0 .. $MAX_HOSTPCI_DEVICES - 1) {
            my $d = parse_hostpci($conf->{"hostpci$i"});
            next if !$d;

            my $use_vfio = $d->{driver} && $d->{driver} eq "vfio";

            foreach my $pcidevice (@{$d->{pciid}}) {
                my $pciid = $pcidevice->{id}.".".$pcidevice->{function};

                my $info = pci_device_info("0000:$pciid");
                die "IOMMU not present\n" if !check_iommu_support();
                die "no pci device info for device '$pciid'\n" if !$info;

                if ($use_vfio) {
                    die "can't unbind/bind pci group to vfio '$pciid'\n" if !pci_dev_group_bind_to_vfio($pciid);
                } else {
                    die "can't unbind/bind to stub pci device '$pciid'\n" if !pci_dev_bind_to_stub($info);
                }

                die "can't reset pci device '$pciid'\n" if $info->{has_fl_reset} and !pci_dev_reset($info);
            }
        }

        PVE::Storage::activate_volumes($storecfg, $vollist);

        # no timeout when a state file / incoming migration is involved
        eval {
            run_command($cmd, timeout => $statefile ? undef : 30, umask => 0077);
        };
        my $err = $@;
        die "start failed: $err" if $err;

        print "migration listens on $migrate_uri\n" if $migrate_uri;

        if ($statefile && !$incoming_tcp) {
            eval { vm_mon_cmd_nocheck($vmid, "cont"); };
            warn $@ if $@;
        }

        if ($migratedfrom) {

            eval { set_migration_caps($vmid); };
            warn $@ if $@;

            if ($spice_port) {
                print "spice listens on port $spice_port\n";
                if ($spice_ticket) {
                    vm_mon_cmd_nocheck($vmid, "set_password", protocol => 'spice', password => $spice_ticket);
                    vm_mon_cmd_nocheck($vmid, "expire_password", protocol => 'spice', time => "+30");
                }
            }

        } else {

            # balloon is considered enabled when unset or set to a true value
            if (!$statefile && (!defined($conf->{balloon}) || $conf->{balloon})) {
                vm_mon_cmd_nocheck($vmid, "balloon", value => $conf->{balloon}*1024*1024)
                    if $conf->{balloon};
                vm_mon_cmd_nocheck($vmid, 'qom-set',
                    path => "machine/peripheral/balloon0",
                    property => "guest-stats-polling-interval",
                    value => 2);
            }
        }
    });
}
4021
0eedc444
AD
# Run QMP command $execute with the named arguments %params on VM $vmid.
# Thin wrapper around vm_qmp_command() without the $nocheck flag.
sub vm_mon_cmd {
    my ($vmid, $execute, %params) = @_;

    return vm_qmp_command($vmid, { execute => $execute, arguments => \%params });
}
4028
# Same as vm_mon_cmd(), but passes a true $nocheck flag to vm_qmp_command().
sub vm_mon_cmd_nocheck {
    my ($vmid, $execute, %params) = @_;

    return vm_qmp_command($vmid, { execute => $execute, arguments => \%params }, 1);
}
4035
# Send the QMP command $cmd ({ execute => ..., arguments => {...} }) to the
# VM and return the result.
#
# A 'timeout' entry inside $cmd->{arguments} is removed from the hash (the
# caller's hash is modified) and handed to the QMP client as the timeout.
# $nocheck is forwarded to check_running().
#
# If the QMP socket does not exist but an old-style monitor socket does,
# only commands without arguments are forwarded to vm_monitor_command().
# Errors are logged to syslog and re-thrown.
sub vm_qmp_command {
    my ($vmid, $cmd, $nocheck) = @_;

    my $res;

    my $timeout;
    if ($cmd->{arguments} && $cmd->{arguments}->{timeout}) {
        $timeout = delete $cmd->{arguments}->{timeout};
    }

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);
        my $sname = qmp_socket($vmid);
        if (-e $sname) { # test if VM is reasonably new and supports qmp/qga
            my $qmpclient = PVE::QMPClient->new();

            $res = $qmpclient->cmd($vmid, $cmd, $timeout);
        } elsif (-e "${var_run_tmpdir}/$vmid.mon") {
            # 'arguments' is optional (e.g. { execute => "quit" }), so guard
            # the dereference - %{undef} is fatal under 'use strict'
            die "can't execute complex command on old monitor - stop/start your vm to fix the problem\n"
                if $cmd->{arguments} && scalar(%{$cmd->{arguments}});
            vm_monitor_command($vmid, $cmd->{execute}, $nocheck);
        } else {
            die "unable to open monitor socket\n";
        }
    };
    if (my $err = $@) {
        syslog("err", "VM $vmid qmp command failed - $err");
        die $err;
    }

    return $res;
}
4069
9df5cbcc
DM
# Execute the human monitor (HMP) command line $cmdline on VM $vmid by
# wrapping it into the QMP 'human-monitor-command' and return the result
# of vm_qmp_command().
sub vm_human_monitor_command {
    my ($vmid, $cmdline) = @_;

    my $cmd = {
        execute => 'human-monitor-command',
        arguments => { 'command-line' => $cmdline },
    };

    return vm_qmp_command($vmid, $cmd);
}
4082
1e3baf05
DM
# Return the command line that would be used to start VM $vmid as a single
# space separated string (arguments are not shell quoted).
sub vm_commandline {
    my ($storecfg, $vmid) = @_;

    my $conf = load_config($vmid);
    my $defaults = load_defaults();

    # NOTE(review): config_to_command() is called in scalar context here,
    # while vm_start() unpacks a list from it - presumably it is context
    # sensitive; confirm before changing the calling context.
    my $cmd = scalar(config_to_command($storecfg, $vmid, $conf, $defaults));

    return join(' ', @$cmd);
}
4094
# Send 'system_reset' to VM $vmid while holding the config lock.
# The config 'lock' setting is honoured unless $skiplock is set.
sub vm_reset {
    my ($vmid, $skiplock) = @_;

    my $reset_locked = sub {
        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        vm_mon_cmd($vmid, "system_reset");
    };

    lock_config($vmid, $reset_locked);
}
4107
# Return an array reference with all volume IDs referenced by $conf (as
# reported by foreach_volid). Absolute paths and values that do not parse
# as a storage volume ID are left out.
sub get_vm_volumes {
    my ($conf) = @_;

    my @volids;

    foreach_volid($conf, sub {
        my ($volid, $is_cdrom) = @_;

        # absolute paths are not managed by the storage layer
        return if $volid =~ m|^/|;

        my ($sid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        push @volids, $volid;
    });

    return \@volids;
}
4125
# Clean up after a VM has stopped: remove the fairsched node, deactivate
# the VM's volumes (unless $keepActive is set) and remove the per-VM
# files below /var/run/qemu-server. Errors are only reported as warnings.
sub vm_stop_cleanup {
    my ($storecfg, $vmid, $conf, $keepActive) = @_;

    eval {
        fairsched_rmnod($vmid); # try to destroy group

        if (!$keepActive) {
            PVE::Storage::deactivate_volumes($storecfg, get_vm_volumes($conf));
        }

        unlink map { "/var/run/qemu-server/${vmid}.$_" } qw(mon qmp pid vnc qga);
    };
    warn $@ if $@; # avoid errors - just warn
}
4143
e6c3b671 4144# Note: use $nocheck to skip the test whether the VM configuration file exists.
254575e9
DM
4145# We need that when migrating VMs to other nodes (files already moved)
4146# Note: we set $keepActive in vzdump stop mode - volumes need to stay active
# Stop (or shut down) VM $vmid.
#
# $skiplock     - do not call check_lock()
# $nocheck      - forwarded to check_running(); the config is not loaded
#                 and no cleanup is done when set
# $timeout      - seconds to wait for the VM to exit (default: the 'down'
#                 value of the startup option on shutdown, else 60)
# $shutdown     - request a guest shutdown instead of sending 'quit'
# $force        - escalate to SIGTERM/SIGKILL on failure (defaults to 1
#                 when not shutting down)
# $keepActive   - forwarded to vm_stop_cleanup()
# $migratedfrom - the VM is terminated with SIGTERM and cleaned up without
#                 taking the config lock
sub vm_stop {
    my ($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive, $migratedfrom) = @_;

    $force = 1 if !defined($force) && !$shutdown;

    if ($migratedfrom) {
        my $pid = check_running($vmid, $nocheck, $migratedfrom);
        kill 15, $pid if $pid;
        my $conf = load_config($vmid, $migratedfrom);
        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive);
        return;
    }

    lock_config($vmid, sub {

        my $pid = check_running($vmid, $nocheck);
        return if !$pid;

        my $conf;
        if (!$nocheck) {
            $conf = load_config($vmid);
            check_lock($conf) if !$skiplock;
            if (!defined($timeout) && $shutdown && $conf->{startup}) {
                my $opts = parse_startup($conf->{startup});
                $timeout = $opts->{down} if $opts->{down};
            }
        }

        $timeout = 60 if !defined($timeout);

        # poll once per second; true if the VM exited within $limit seconds
        my $wait_for_exit = sub {
            my ($limit) = @_;

            my $elapsed = 0;
            while (($elapsed < $limit) && check_running($vmid, $nocheck)) {
                $elapsed++;
                sleep 1;
            }
            return $elapsed < $limit;
        };

        my $qmp_cmd;
        if (!$shutdown) {
            $qmp_cmd = "quit";
        } elsif (!$nocheck && $conf->{agent}) {
            $qmp_cmd = "guest-shutdown";
        } else {
            $qmp_cmd = "system_powerdown";
        }

        eval { vm_qmp_command($vmid, { execute => $qmp_cmd }, $nocheck); };
        my $err = $@;

        if ($err) {
            die "VM quit/powerdown failed\n" if !$force;
            warn "VM quit/powerdown failed - terminating now with SIGTERM\n";
            kill 15, $pid;
        } elsif ($wait_for_exit->($timeout)) {
            vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
            return;
        } else {
            die "VM quit/powerdown failed - got timeout\n" if !$force;
            warn "VM still running - terminating now with SIGTERM\n";
            kill 15, $pid;
        }

        # wait again
        if (!$wait_for_exit->(10)) {
            warn "VM still running - terminating now with SIGKILL\n";
            kill 9, $pid;
            sleep 1;
        }

        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
    });
}
4235
# Pause VM $vmid (QMP 'stop') while holding the config lock.
# The config 'lock' setting is ignored if $skiplock is set or if the lock
# is 'backup'.
sub vm_suspend {
    my ($vmid, $skiplock) = @_;

    my $suspend_locked = sub {
        my $conf = load_config($vmid);

        my $backup_lock = $conf->{lock} && $conf->{lock} eq 'backup';
        check_lock($conf) if !$skiplock && !$backup_lock;

        vm_mon_cmd($vmid, "stop");
    };

    lock_config($vmid, $suspend_locked);
}
4248
# Resume VM $vmid (QMP 'cont') while holding the config lock.
# The config 'lock' setting is ignored if $skiplock is set or if the lock
# is 'backup'.
sub vm_resume {
    my ($vmid, $skiplock) = @_;

    my $resume_locked = sub {
        my $conf = load_config($vmid);

        my $backup_lock = $conf->{lock} && $conf->{lock} eq 'backup';
        check_lock($conf) if !$skiplock && !$backup_lock;

        vm_mon_cmd($vmid, "cont");
    };

    lock_config($vmid, $resume_locked);
}
4261
5fdbe4f0
DM
# Send key $key to VM $vmid while holding the config lock.
# NOTE(review): $skiplock is accepted but not used, and the loaded config
# is not inspected - presumably load_config() is only called to verify
# that the VM exists; confirm.
sub vm_sendkey {
    my ($vmid, $skiplock, $key) = @_;

    my $sendkey_locked = sub {
        my $conf = load_config($vmid);

        # there is no qmp command, so we use the human monitor command
        vm_human_monitor_command($vmid, "sendkey $key");
    };

    lock_config($vmid, $sendkey_locked);
}
4273
# Destroy VM $vmid while holding the config lock. Dies if the VM is
# locked (unless $skiplock is set) or still running.
sub vm_destroy {
    my ($storecfg, $vmid, $skiplock) = @_;

    lock_config($vmid, sub {

        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        die "VM $vmid is running - destroy failed\n" if check_running($vmid);

        fairsched_rmnod($vmid); # try to destroy group
        destroy_vm($storecfg, $vmid);
    });
}
4291
1e3baf05
DM
4292# pci helpers
4293
# Write $buf to $filename (the file is truncated/created).
#
# Returns a true value on success, undef if the file cannot be opened and
# a false value if writing fails. The result of close() is checked as
# well: output is buffered, so the actual write - and any error returned
# by it, e.g. from a sysfs attribute - may only happen when the handle is
# closed.
sub file_write {
    my ($filename, $buf) = @_;

    my $fh = IO::File->new($filename, "w");
    return undef if !$fh;

    my $res = print $fh $buf;

    # close flushes the buffer; a failed flush means the data was not written
    $res = undef if !$fh->close();

    return $res;
}
4306
# Read basic information about PCI device $name (full address in the form
# 'dddd:bb:ss.f', lower case hex) from sysfs.
#
# Returns a hash reference with the keys name, vendor, product (both
# without the leading '0x'), domain, bus, slot, func, irq and
# has_fl_reset (true if the device has a sysfs 'reset' file), or undef if
# the name is malformed or a required sysfs value is missing/unexpected.
sub pci_device_info {
    my ($name) = @_;

    return undef if $name !~ m/^([a-f0-9]{4}):([a-f0-9]{2}):([a-f0-9]{2})\.([a-f0-9])$/;
    my ($domain, $bus, $slot, $func) = ($1, $2, $3, $4);

    my $sysdir = "$pcisysfs/devices/$name";

    my $irq = file_read_firstline("$sysdir/irq");
    return undef unless defined($irq) && $irq =~ m/^\d+$/;

    # vendor/device IDs must carry a '0x' prefix, which is stripped here
    my $vendor = file_read_firstline("$sysdir/vendor");
    return undef unless defined($vendor) && $vendor =~ s/^0x//;

    my $product = file_read_firstline("$sysdir/device");
    return undef unless defined($product) && $product =~ s/^0x//;

    return {
        name => $name,
        vendor => $vendor,
        product => $product,
        domain => $domain,
        bus => $bus,
        slot => $slot,
        func => $func,
        irq => $irq,
        has_fl_reset => -f "$sysdir/reset" || 0,
    };
}
4338
# Reset PCI device $dev (hash as returned by pci_device_info) by writing
# "1" to its sysfs 'reset' file. Returns the result of file_write().
sub pci_dev_reset {
    my ($dev) = @_;

    return file_write("$pcisysfs/devices/$dev->{name}/reset", "1");
}
4348
# Bind PCI device $dev (hash as returned by pci_device_info) to the
# pci-stub driver. Returns true if the device is bound afterwards, a false
# value or undef otherwise.
sub pci_dev_bind_to_stub {
    my ($dev) = @_;

    my $name = $dev->{name};

    my $stubdir = "$pcisysfs/drivers/pci-stub";
    my $bound = "$stubdir/$name";

    # already bound
    return 1 if -d $bound;

    # register the vendor/product ID with the stub driver
    return undef if !file_write("$stubdir/new_id", "$dev->{vendor} $dev->{product}");

    # detach from the current driver; a failure only counts if the unbind
    # file exists at all
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    # bind explicitly unless the device showed up already
    return undef if !-d $bound && !file_write("$stubdir/bind", $name);

    return -d $bound;
}
4372
000fc0a2
SP
# Bind PCI device $dev (hash as returned by pci_device_info) to the
# vfio-pci driver, trying to load the module first if its sysfs directory
# is missing. Dies if the driver directory still does not exist. Returns
# true if the device is bound afterwards, a false value or undef otherwise.
sub pci_dev_bind_to_vfio {
    my ($dev) = @_;

    my $name = $dev->{name};

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null") if !-d $vfio_basedir;
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    my $bound = "$vfio_basedir/$name";

    # already bound
    return 1 if -d $bound;

    # register the vendor/product ID with vfio-pci
    return undef if !file_write("$vfio_basedir/new_id", "$dev->{vendor} $dev->{product}");

    # detach from the current driver; a failure only counts if the unbind
    # file exists at all
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    # bind explicitly unless the device showed up already
    return undef if !-d $bound && !file_write("$vfio_basedir/bind", $name);

    return -d $bound;
}
4403
# Bind every device in the IOMMU group of PCI device $pciid (address
# without the '0000:' domain prefix) to vfio-pci.
#
# Returns 1 on success. Dies if the vfio-pci driver directory is missing,
# the IOMMU group cannot be read, a group member has an unexpected name,
# no device info is available for it, or binding fails.
sub pci_dev_group_bind_to_vfio {
    my ($pciid) = @_;

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    if (!-d $vfio_basedir) {
        system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null");
    }
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    # get IOMMU group devices
    opendir(my $D, "$pcisysfs/devices/0000:$pciid/iommu_group/devices/") || die "Cannot open iommu_group: $!\n";
    my @devs = grep /^0000:/, readdir($D);
    closedir($D);

    foreach my $groupdev (@devs) {
        $groupdev =~ m/^([:\.\da-f]+)$/ or die "PCI ID $groupdev not valid!\n";
        my $info = pci_device_info($1);
        # without this check an undef $info would be handed to
        # pci_dev_bind_to_vfio(), which would then write empty IDs to sysfs
        die "no pci device info for device '$groupdev'\n" if !$info;
        pci_dev_bind_to_vfio($info) || die "Cannot bind $groupdev to vfio\n";
    }

    return 1;
}
4427
# Return the ",bus=pci.N,addr=0xNN" suffix for the device with ID $id, or
# an empty string if the ID has no fixed PCI slot. If $bridges (a hash
# reference) is given, the bus number used is recorded in it.
sub print_pci_addr {
    my ($id, $bridges) = @_;

    # device id => [ bus, slot ]
    my %slot_of = (
        piix3 => [0, 1],
        # slot 2: first videocard
        balloon0 => [0, 3],
        watchdog => [0, 4],
        scsihw0 => [0, 5],
        scsihw1 => [0, 6],
        ahci0 => [0, 7],
        qga0 => [0, 8],
        spice => [0, 9],
        # slots 10-15: virtio0 - virtio5 (see below)
        hostpci0 => [0, 16],
        hostpci1 => [0, 17],
        # slots 18-23: net0 - net5 (see below)
        vga1 => [0, 24],
        vga2 => [0, 25],
        vga3 => [0, 26],
        hostpci2 => [0, 27],
        hostpci3 => [0, 28],
        # slot 29: usb-host (pve-usb.cfg)
        'pci.1' => [0, 30],
        'pci.2' => [0, 31],
    );

    # the first six virtio disks and network cards live on bus 0
    foreach my $n (0 .. 5) {
        $slot_of{"virtio$n"} = [0, 10 + $n];
        $slot_of{"net$n"} = [0, 18 + $n];
    }

    # net6 - net31 use slots 1-26 on bus 1
    foreach my $n (6 .. 31) {
        $slot_of{"net$n"} = [1, $n - 5];
    }

    # virtio6 - virtio15 use slots 1-10 on bus 2
    foreach my $n (6 .. 15) {
        $slot_of{"virtio$n"} = [2, $n - 5];
    }

    my $slot = $slot_of{$id};
    return '' if !$slot;

    my ($bus, $addr) = @$slot;
    $bridges->{$bus} = 1 if $bridges;

    return sprintf(",bus=pci.%s,addr=0x%x", $bus, $addr);
}
4511
2e3b7e2a
AD
# Return the ",bus=ich9-pcie-port-N,addr=0x0" suffix for the PCIe device
# with ID $id (hostpci0 - hostpci3), or an empty string for other IDs.
sub print_pcie_addr {
    my ($id) = @_;

    # hostpciN is attached to root port N+1, always at address 0
    my %port_of = map { ("hostpci$_", "ich9-pcie-port-" . ($_ + 1)) } 0 .. 3;

    my $bus = $port_of{$id};
    return '' if !defined($bus);

    return sprintf(",bus=%s,addr=0x%x", $bus, 0);
}
4531
3e16d5fc
DM
4532# vzdump restore implementation
4533
# Return the name of the first member of tar archive $archive.
# Dies if the file does not exist, tar cannot be started or the listing
# is empty.
sub tar_archive_read_firstfile {
    my $archive = shift;

    die "ERROR: file '$archive' does not exist\n" if ! -f $archive;

    # try to detect archive type first
    # list-form pipe open: no shell is involved, so quotes or other shell
    # meta characters in the file name can neither break nor inject commands
    my $pid = open(my $fh, '-|', 'tar', 'tf', $archive) ||
        die "unable to open file '$archive'\n";
    my $firstfile = <$fh>;
    # only the first line is needed - stop tar instead of reading it all
    kill 15, $pid;
    close $fh;

    die "ERROR: archive contaions no data\n" if !$firstfile;
    chomp $firstfile;

    return $firstfile;
}
4551
ed221350
DM
# Remove the temporary volumes recorded in $statfile after a failed tar
# restore. Every line is expected to end in 'vzdump:<name>:<volid>';
# absolute paths are unlinked, everything else is freed with
# PVE::Storage::vdisk_free(). Progress and errors are printed to STDERR; a
# failure to remove one volume does not stop the cleanup. Nothing happens
# if $statfile cannot be opened.
sub tar_restore_cleanup {
    my ($storecfg, $statfile) = @_;

    print STDERR "starting cleanup\n";

    if (my $fd = IO::File->new($statfile, "r")) {
        while (defined(my $line = <$fd>)) {
            if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                my $volid = $2;
                eval {
                    if ($volid =~ m|^/|) {
                        # parenthesized call + low precedence 'or': with
                        # 'unlink $volid || die' the die could never trigger
                        unlink($volid) or die "unlink failed - $!\n";
                    } else {
                        PVE::Storage::vdisk_free($storecfg, $volid);
                    }
                    print STDERR "temporary volume '$volid' sucessfuly removed\n";
                };
                print STDERR "unable to cleanup '$volid' - $@" if $@;
            } else {
                print STDERR "unable to parse line in statfile - $line";
            }
        }
        $fd->close();
    }
}
4577
# Restore VM $vmid from backup file $archive.
#
# The archive format ('tar' or 'vma') is taken from $opts->{format} if
# set, otherwise guessed from the file name (default 'vma'); the
# compression method is always derived from the file name. The work is
# done by restore_tar_archive() or restore_vma_archive(), whose result is
# returned.
sub restore_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    my $format = $opts->{format};
    my $comp;

    if ($archive =~ m/\.tgz$/ || $archive =~ m/\.tar\.gz$/) {
        $format = 'tar' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.tar$/) {
        $format = 'tar' if !$format;
    } elsif ($archive =~ m/\.tar\.lzo$/) {
        # dots are escaped like in the other patterns, so only a real
        # '.tar.lzo' suffix matches
        $format = 'tar' if !$format;
        $comp = 'lzop';
    } elsif ($archive =~ m/\.vma$/) {
        $format = 'vma' if !$format;
    } elsif ($archive =~ m/\.vma\.gz$/) {
        $format = 'vma' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.vma\.lzo$/) {
        $format = 'vma' if !$format;
        $comp = 'lzop';
    } else {
        $format = 'vma' if !$format; # default
    }

    # try to detect archive format
    if ($format eq 'tar') {
        return restore_tar_archive($archive, $vmid, $user, $opts);
    } else {
        return restore_vma_archive($archive, $vmid, $user, $opts, $comp);
    }
}
4611
# Rewrite one line of a backed up VM config for the restored VM and print
# the result to $outfd.
#
# - '#qmdump#', '#vzdump#', 'lock:', 'unusedN:', 'parent:' and 'template:'
#   lines are dropped
# - old 'vlanN:' lines are converted to 'netN:' lines, numbered with
#   $cookie->{netcount}
# - with $unique set, an existing MAC address of a 'netN:' line is
#   replaced by a random one
# - drive lines containing 'backup=no' are commented out; drives listed in
#   $map get the mapped volume as new file and lose their 'format'
# - everything else is copied unchanged
sub restore_update_config_line {
    my ($outfd, $cookie, $vmid, $map, $line, $unique) = @_;

    # settings which must not be restored (a restored VM is never a template)
    return if $line =~ m/^(?:\#qmdump\#|\#vzdump\#|lock:|unused\d+:|parent:|template:)/;

    if ($line =~ m/^(vlan(\d+)):\s*(\S+)\s*$/) {
        # try to convert old 1.X settings
        my ($ind, $ethcfg) = ($2, $3);
        foreach my $devconfig (PVE::Tools::split_list($ethcfg)) {
            my ($model, $macaddr) = split(/\=/, $devconfig);
            $macaddr = PVE::Tools::random_ether_addr() if !$macaddr || $unique;
            my $netstr = print_net({
                model => $model,
                bridge => "vmbr$ind",
                macaddr => $macaddr,
            });

            print $outfd "net$cookie->{netcount}: $netstr\n";
            $cookie->{netcount}++;
        }
        return;
    }

    if ($unique && $line =~ m/^(net\d+):\s*(\S+)\s*$/) {
        my ($id, $netstr) = ($1, $2);
        my $net = parse_net($netstr);
        $net->{macaddr} = PVE::Tools::random_ether_addr() if $net->{macaddr};
        $netstr = print_net($net);
        print $outfd "$id: $netstr\n";
        return;
    }

    if ($line =~ m/^((ide|scsi|virtio|sata)\d+):\s*(\S+)\s*$/) {
        my ($virtdev, $value) = ($1, $3);

        if ($line =~ m/backup=no/) {
            print $outfd "#$line";
        } elsif ($virtdev && $map->{$virtdev}) {
            my $di = parse_drive($virtdev, $value);
            delete $di->{format}; # format can change on restore
            $di->{file} = $map->{$virtdev};
            $value = print_drive($vmid, $di);
            print $outfd "$virtdev: $value\n";
        } else {
            print $outfd $line;
        }
        return;
    }

    print $outfd $line;
}
4662
# List the volumes of VM $vmid on all storages of $cfg.
# Returns a hash reference mapping volume ID => volume info as returned by
# PVE::Storage::vdisk_list(), extended by the volume's 'path'. Entries
# without a volid or with a false size are skipped.
sub scan_volids {
    my ($cfg, $vmid) = @_;

    my $info = PVE::Storage::vdisk_list($cfg, undef, $vmid);

    my %volid_hash;
    foreach my $item (map { @{$info->{$_}} } keys %$info) {
        next unless $item->{volid} && $item->{size};
        $item->{path} = PVE::Storage::path($cfg, $item->{volid});
        $volid_hash{$item->{volid}} = $item;
    }

    return \%volid_hash;
}
4679
a8e2f942
DM
# Collect the file system paths of all non-cdrom drives in $conf.
# Returns a hash reference path => number of references.
#
# $skip_drive     - drive name ignored in the current config (it is still
#                   considered inside snapshots)
# $scan_snapshots - also scan the configs below $conf->{snapshots}
sub get_used_paths {
    my ($vmid, $storecfg, $conf, $scan_snapshots, $skip_drive) = @_;

    my $used_path = {};

    my $scan_config = sub {
        my ($cref, $snapname) = @_;

        foreach my $key (keys %$cref) {
            next if !valid_drivename($key);
            next if $skip_drive && $key eq $skip_drive;

            my $drive = parse_drive($key, $cref->{$key});
            next if !$drive || !$drive->{file} || drive_is_cdrom($drive);

            my $file = $drive->{file};
            if ($file =~ m!^/!) {
                # absolute path - used as is
                $used_path->{$file}++;
                next;
            }

            # volume ID - resolve it, skipping unknown storages
            my ($storeid, $volname) = PVE::Storage::parse_volume_id($file, 1);
            next if !$storeid;
            my $scfg = PVE::Storage::storage_config($storecfg, $storeid, 1);
            next if !$scfg;

            my $path = PVE::Storage::path($storecfg, $file, $snapname);
            $used_path->{$path}++;
        }
    };

    $scan_config->($conf);

    # the skipped drive only applies to the current config
    undef $skip_drive;

    if ($scan_snapshots) {
        foreach my $snapname (keys %{$conf->{snapshots}}) {
            $scan_config->($conf->{snapshots}->{$snapname}, $snapname);
        }
    }

    return $used_path;
}
4720
91bd6c90
DM
# Synchronize the drive entries of $conf with the volumes in $volid_hash
# (volume ID => info hash with 'size' and 'path', see scan_volids):
#
# - the 'size' of every non-cdrom drive is updated
# - 'unusedN' entries whose volume is used by a drive are removed
# - volumes not referenced at all are added as unused (VM state volumes
#   are ignored)
#
# $conf is modified in place. Returns a true value if anything changed.
sub update_disksize {
    my ($vmid, $conf, $volid_hash) = @_;

    my $changes;

    my $used = {};

    # Note: it is allowed to define multiple storages with same path (alias), so
    # we need to check both 'volid' and real 'path' (two different volid can point
    # to the same path).

    my $usedpath = {};

    # update size info
    foreach my $opt (keys %$conf) {
        if (valid_drivename($opt)) {
            my $drive = parse_drive($opt, $conf->{$opt});
            my $volid = $drive->{file};
            next if !$volid;

            $used->{$volid} = 1;
            if ($volid_hash->{$volid} &&
                (my $path = $volid_hash->{$volid}->{path})) {
                $usedpath->{$path} = 1;
            }

            next if drive_is_cdrom($drive);
            next if !$volid_hash->{$volid};

            $drive->{size} = $volid_hash->{$volid}->{size};
            my $new = print_drive($vmid, $drive);
            if ($new ne $conf->{$opt}) {
                $changes = 1;
                $conf->{$opt} = $new;
            }
        }
    }

    # remove 'unusedX' entry if volume is used
    foreach my $opt (keys %$conf) {
        next if $opt !~ m/^unused\d+$/;
        my $volid = $conf->{$opt};
        # no 'my $x = ... if COND' here: that construct has undefined
        # behaviour and may keep the value of a previous iteration
        my $info = $volid_hash->{$volid};
        my $path = $info ? $info->{path} : undef;
        if ($used->{$volid} || ($path && $usedpath->{$path})) {
            $changes = 1;
            delete $conf->{$opt};
        }
    }

    # register volumes which are not referenced anywhere as unused
    foreach my $volid (sort keys %$volid_hash) {
        next if $volid =~ m/vm-$vmid-state-/;
        next if $used->{$volid};
        my $path = $volid_hash->{$volid}->{path};
        next if !$path; # just to be sure
        next if $usedpath->{$path};
        $changes = 1;
        add_unused_volume($conf, $volid);
        $usedpath->{$path} = 1; # avoid to add more than once (aliases)
    }

    return $changes;
}
4783
# Rescan the storages and update disk sizes / unused volumes in the config
# of VM $vmid, or of all VMs returned by config_list() if $vmid is undef.
# Each config is updated under the config lock unless $nolock is set.
sub rescan {
    my ($vmid, $nolock) = @_;

    my $cfg = PVE::Cluster::cfs_read_file("storage.cfg");

    my $volid_hash = scan_volids($cfg, $vmid);

    my $updatefn = sub {
        my ($vmid) = @_;

        my $conf = load_config($vmid);

        check_lock($conf);

        # only consider volumes owned by this VM
        my $vm_volids = {};
        foreach my $volid (keys %$volid_hash) {
            my $info = $volid_hash->{$volid};
            next if !($info->{vmid} && $info->{vmid} == $vmid);
            $vm_volids->{$volid} = $info;
        }

        my $changes = update_disksize($vmid, $conf, $vm_volids);

        update_config_nolock($vmid, $conf, 1) if $changes;
    };

    my @vmids;
    if (defined($vmid)) {
        @vmids = ($vmid);
    } else {
        my $vmlist = config_list();
        @vmids = keys %$vmlist;
    }

    foreach my $id (@vmids) {
        if ($nolock) {
            $updatefn->($id);
        } else {
            lock_config($id, $updatefn, $id);
        }
    }
}
4826
# Restore a VM from a VMA backup archive.
#
# $archive - path of the archive, or '-' to read it from STDIN
# $vmid    - ID of the VM to restore
# $user    - restoring user; everybody except 'root@pam' must hold
#            'Datastore.AllocateSpace' on each target storage
# $opts    - hash ref; the keys read here are 'storage' and 'unique'
# $comp    - optional compression method, 'gzip' or 'lzop'
#
# The archive is unpacked by an external "vma extract" command. Its output
# is parsed to learn which devices the archive contains; once the embedded
# config has been extracted, the target volumes are allocated and the
# device-to-path mapping is sent to the command through a fifo.
#
# Dies on failure, after removing the temporary files and freeing the
# volumes allocated so far.
sub restore_vma_archive {
    my ($archive, $vmid, $user, $opts, $comp) = @_;

    my $input = $archive eq '-' ? "<&STDIN" : undef;

    # $readfrom is interpolated into a shell command line below, so a real
    # file name has to be quoted ('-' selects STDIN and is passed as is)
    my $readfrom = $archive eq '-' ? '-' : PVE::Tools::shellquote($archive);

    my $uncomp = '';
    if ($comp) {
        $readfrom = '-';
        my $qarchive = PVE::Tools::shellquote($archive);
        if ($comp eq 'gzip') {
            $uncomp = "zcat $qarchive|";
        } elsif ($comp eq 'lzop') {
            $uncomp = "lzop -d -c $qarchive|";
        } else {
            die "unknown compression method '$comp'\n";
        }
    }

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    rmtree $tmpdir;

    # disable interrupts (always do cleanups)
    # Each handler is localized on its own: a single leading 'local' would
    # only cover $SIG{INT} and leave the others installed for good.
    local $SIG{INT} =
        local $SIG{TERM} =
        local $SIG{QUIT} =
        local $SIG{HUP} = sub {
            warn "got interrupt - ignored\n";
        };

    my $mapfifo = "/var/tmp/vzdumptmp$$.fifo";
    POSIX::mkfifo($mapfifo, 0600);
    my $fifofh;

    # passed to run_command as 'afterfork' callback
    my $openfifo = sub {
        open($fifofh, '>', $mapfifo) || die $!;
    };

    my $cmd = "${uncomp}vma extract -v -r $mapfifo $readfrom $tmpdir";

    my $oldtimeout;
    my $timeout = 5;

    # devname => { size, dev_id, ... }, filled while parsing the command output
    my $devinfo = {};

    my $rpcenv = PVE::RPCEnvironment::get();

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # Note: $oldconf is undef if VM does not exists
    my $oldconf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid));

    # Reads the extracted config, allocates the target volumes, sends the
    # device map through the fifo and writes the new config to $tmpfn.
    my $print_devmap = sub {
        my $virtdev_hash = {};

        my $cfgfn = "$tmpdir/qemu-server.conf";

        # we can read the config - that is already extracted
        my $fh = IO::File->new($cfgfn, "r") ||
            die "unable to read qemu-server.conf - $!\n";

        while (defined(my $line = <$fh>)) {
            if ($line =~ m/^\#qmdump\#map:(\S+):(\S+):(\S*):(\S*):$/) {
                my ($virtdev, $devname, $storeid, $format) = ($1, $2, $3, $4);
                die "archive does not contain data for drive '$virtdev'\n"
                    if !$devinfo->{$devname};
                if (defined($opts->{storage})) {
                    $storeid = $opts->{storage} || 'local';
                } elsif (!$storeid) {
                    $storeid = 'local';
                }
                $format = 'raw' if !$format;
                $devinfo->{$devname}->{devname} = $devname;
                $devinfo->{$devname}->{virtdev} = $virtdev;
                $devinfo->{$devname}->{format} = $format;
                $devinfo->{$devname}->{storeid} = $storeid;

                # check permission on storage
                if ($user ne 'root@pam') {
                    $rpcenv->check($user, "/storage/$storeid", ['Datastore.AllocateSpace']);
                }

                $virtdev_hash->{$virtdev} = $devinfo->{$devname};
            }
        }

        foreach my $devname (keys %$devinfo) {
            die "found no device mapping information for device '$devname'\n"
                if !$devinfo->{$devname}->{virtdev};
        }

        my $cfg = cfs_read_file('storage.cfg');

        # create empty/temp config
        if ($oldconf) {
            PVE::Tools::file_set_contents($conffile, "memory: 128\n");
            foreach_drive($oldconf, sub {
                my ($ds, $drive) = @_;

                return if drive_is_cdrom($drive);

                my $volid = $drive->{file};

                return if !$volid || $volid =~ m|^/|;

                my ($path, $owner) = PVE::Storage::path($cfg, $volid);
                return if !$path || !$owner || ($owner != $vmid);

                # Note: only delete disk we want to restore
                # other volumes will become unused
                if ($virtdev_hash->{$ds}) {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
            });
        }

        my $map = {};
        foreach my $virtdev (sort keys %$virtdev_hash) {
            my $d = $virtdev_hash->{$virtdev};
            # round the size reported by vma up to a multiple of 1024
            my $alloc_size = int(($d->{size} + 1024 - 1)/1024);
            my $scfg = PVE::Storage::storage_config($cfg, $d->{storeid});

            # test if requested format is supported
            my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($cfg, $d->{storeid});
            my $supported = grep { $_ eq $d->{format} } @$validFormats;
            $d->{format} = $defFormat if !$supported;

            my $volid = PVE::Storage::vdisk_alloc($cfg, $d->{storeid}, $vmid,
                                                  $d->{format}, undef, $alloc_size);
            print STDERR "new volume ID is '$volid'\n";
            # remembered so the volume can be freed again if the restore fails
            $d->{volid} = $volid;
            my $path = PVE::Storage::path($cfg, $volid);

            my $write_zeros = 1;
            # fixme: what other storages types initialize volumes with zero?
            if ($scfg->{type} eq 'dir' || $scfg->{type} eq 'nfs' || $scfg->{type} eq 'glusterfs' ||
                $scfg->{type} eq 'sheepdog' || $scfg->{type} eq 'rbd') {
                $write_zeros = 0;
            }

            print $fifofh "${write_zeros}:$d->{devname}=$path\n";

            print "map '$d->{devname}' to '$path' (write zeros = ${write_zeros})\n";
            $map->{$virtdev} = $volid;
        }

        # second pass over the extracted config: write the new VM config
        $fh->seek(0, 0) || die "seek failed - $!\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined(my $line = <$fh>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $fh->close();
        $outfd->close();
    };

    eval {
        # enable interrupts
        local $SIG{INT} =
            local $SIG{TERM} =
            local $SIG{QUIT} =
            local $SIG{HUP} =
            local $SIG{PIPE} = sub {
                die "interrupted by signal\n";
            };
        local $SIG{ALRM} = sub { die "got timeout\n"; };

        $oldtimeout = alarm($timeout);

        my $parser = sub {
            my $line = shift;

            print "$line\n";

            if ($line =~ m/^DEV:\sdev_id=(\d+)\ssize:\s(\d+)\sdevname:\s(\S+)$/) {
                my ($dev_id, $size, $devname) = ($1, $2, $3);
                $devinfo->{$devname} = { size => $size, dev_id => $dev_id };
            } elsif ($line =~ m/^CTIME: /) {
                # we correctly received the vma config, so we can disable
                # the timeout now for disk allocation (set to 10 minutes, so
                # that we always timeout if something goes wrong)
                alarm(600);
                &$print_devmap();
                print $fifofh "done\n";
                my $tmp = $oldtimeout || 0;
                $oldtimeout = undef;
                alarm($tmp);
                close($fifofh);
            }
        };

        print "restore vma archive: $cmd\n";
        run_command($cmd, input => $input, outfunc => $parser, afterfork => $openfifo);
    };
    my $err = $@;

    alarm($oldtimeout) if $oldtimeout;

    unlink $mapfifo;

    if ($err) {
        rmtree $tmpdir;
        unlink $tmpfn;

        # free every volume that was allocated before the failure
        my $cfg = cfs_read_file('storage.cfg');
        foreach my $devname (keys %$devinfo) {
            my $volid = $devinfo->{$devname}->{volid};
            next if !$volid;
            eval {
                if ($volid =~ m|^/|) {
                    # parentheses are required: without them '||' binds to
                    # $volid and a failed unlink goes unnoticed
                    unlink($volid) || die "unlink failed\n";
                } else {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
                print STDERR "temporary volume '$volid' sucessfuly removed\n";
            };
            print STDERR "unable to cleanup '$volid' - $@" if $@;
        }
        die $err;
    }

    rmtree $tmpdir;

    rename($tmpfn, $conffile) ||
        die "unable to commit configuration file '$conffile'\n";

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
5058
# Restore a VM from a tar based vzdump archive.
#
# $archive - path of the archive, or '-' to read it from STDIN
# $vmid    - ID of the VM to restore
# $user    - restoring user, exported to the extractor as VZDUMP_USER
# $opts    - hash ref; the keys read here are 'storage', 'pool',
#            'prealloc', 'info' and 'unique'
#
# The archive members are piped by tar into /usr/lib/qemu-server/qmextract.
# Afterwards the volume mapping is read from "qmrestore.stat" in the
# temporary directory and the extracted config is rewritten into the VM
# config. With $opts->{info} set, processing stops after the extraction and
# no config is written.
#
# Dies on failure after calling tar_restore_cleanup().
sub restore_tar_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    if ($archive ne '-') {
        my $firstfile = tar_archive_read_firstfile($archive);
        die "ERROR: file '$archive' dos not lock like a QemuServer vzdump backup\n"
            if $firstfile ne 'qemu-server.conf';
    }

    my $storecfg = cfs_read_file('storage.cfg');

    # destroy existing data - keep empty config
    my $vmcfgfn = config_file($vmid);
    destroy_vm($storecfg, $vmid, 1) if -f $vmcfgfn;

    my $tocmd = "/usr/lib/qemu-server/qmextract";

    $tocmd .= " --storage " . PVE::Tools::shellquote($opts->{storage}) if $opts->{storage};
    $tocmd .= " --pool " . PVE::Tools::shellquote($opts->{pool}) if $opts->{pool};
    $tocmd .= ' --prealloc' if $opts->{prealloc};
    $tocmd .= ' --info' if $opts->{info};

    # tar option "xf" does not autodetect compression when read from STDIN,
    # so we pipe to zcat
    my $cmd = "zcat -f|tar xf " . PVE::Tools::shellquote($archive) . " " .
        PVE::Tools::shellquote("--to-command=$tocmd");

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    mkpath $tmpdir;

    local $ENV{VZDUMP_TMPDIR} = $tmpdir;
    local $ENV{VZDUMP_VMID} = $vmid;
    local $ENV{VZDUMP_USER} = $user;

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # disable interrupts (always do cleanups)
    # Each handler is localized on its own: a single leading 'local' would
    # only cover $SIG{INT} and leave the others installed for good.
    local $SIG{INT} =
        local $SIG{TERM} =
        local $SIG{QUIT} =
        local $SIG{HUP} = sub {
            print STDERR "got interrupt - ignored\n";
        };

    eval {
        # enable interrupts
        local $SIG{INT} =
            local $SIG{TERM} =
            local $SIG{QUIT} =
            local $SIG{HUP} =
            local $SIG{PIPE} = sub {
                die "interrupted by signal\n";
            };

        if ($archive eq '-') {
            print "extracting archive from STDIN\n";
            run_command($cmd, input => "<&STDIN");
        } else {
            print "extracting archive '$archive'\n";
            run_command($cmd);
        }

        return if $opts->{info};

        # read new mapping
        my $map = {};
        my $statfile = "$tmpdir/qmrestore.stat";
        if (my $fd = IO::File->new($statfile, "r")) {
            while (defined (my $line = <$fd>)) {
                if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                    $map->{$1} = $2 if $1;
                } else {
                    print STDERR "unable to parse line in statfile - $line\n";
                }
            }
            $fd->close();
        }

        my $confsrc = "$tmpdir/qemu-server.conf";

        my $srcfd = IO::File->new($confsrc, "r") ||
            die "unable to open file '$confsrc'\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined (my $line = <$srcfd>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $srcfd->close();
        $outfd->close();
    };
    my $err = $@;

    if ($err) {

        unlink $tmpfn;

        tar_restore_cleanup($storecfg, "$tmpdir/qmrestore.stat") if !$opts->{info};

        die $err;
    }

    rmtree $tmpdir;

    # In info mode the eval block above returns before $tmpfn is written,
    # so there is nothing to commit. The parentheses around the rename
    # arguments are required: without them '||' binds to $conffile and a
    # failed rename is never reported.
    if (!$opts->{info}) {
        rename($tmpfn, $conffile) ||
            die "unable to commit configuration file '$conffile'\n";
    }

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
5168
0d18dcfc
DM
5169
5170# Internal snapshots
5171
5172# NOTE: Snapshot create/delete involves several non-atomic
5173# actions, and can take a long time.
5174# So we try to avoid locking the file and use 'lock' variable
5175# inside the config file instead.
5176
ef59d1ca
DM
# Copy all settings from $source into $dest, leaving out the entries that
# are bookkeeping rather than VM settings: snapshot metadata, the lock, the
# digest, the description and the list of unused volumes.
my $snapshot_copy_config = sub {
    my ($source, $dest) = @_;

    my %skip = map { $_ => 1 }
        qw(snapshots snapstate snaptime vmstate lock digest description);

    foreach my $key (keys %$source) {
        next if $skip{$key} || $key =~ m/^unused\d+$/;

        $dest->{$key} = $source->{$key};
    }
};
5193
# Build the configuration that results from applying snapshot $snap to the
# current configuration $conf. The snapshot list, the description and the
# unused volume entries are taken from $conf, everything else comes from
# the snapshot. Returns the new config hash; $conf itself is not changed.
my $snapshot_apply_config = sub {
    my ($conf, $snap) = @_;

    # entries that survive from the current config
    my @kept = grep { $_ eq 'description' || m/^unused\d+$/ } keys %$conf;

    my $result = { snapshots => $conf->{snapshots} };
    @{$result}{@kept} = @{$conf}{@kept};

    $snapshot_copy_config->($snap, $result);

    return $result;
};
5212
18bfb361
DM
# Call $func once for every storage ID that is referenced by a non-cdrom
# drive in $conf. The IDs are visited in sorted order, each one only once.
sub foreach_writable_storage {
    my ($conf, $func) = @_;

    my %storages;

    foreach my $key (keys %$conf) {
        next if !valid_drivename($key);

        my $drive = parse_drive($key, $conf->{$key});
        next if !$drive || drive_is_cdrom($drive);

        # second argument set: volume IDs that cannot be parsed are skipped
        my ($sid) = PVE::Storage::parse_volume_id($drive->{file}, 1);
        $storages{$sid} = $sid if $sid;
    }

    foreach my $sid (sort keys %storages) {
        $func->($sid);
    }
}
5235
# Allocate the volume that will hold the saved VM state of snapshot
# $snapname and return its volume ID.
#
# The target storage is chosen among the storages already used by the VM's
# drives: shared storages are searched first, the remaining ones only if no
# shared storage was found. Within a pass a storage with a 'path' setting
# (file based) wins over the others. 'local' is used as last resort.
my $alloc_vmstate_volid = sub {
    my ($storecfg, $vmid, $conf, $snapname) = @_;

    my $target;

    # first pass: shared storages, second pass: all the others
    foreach my $want_shared (1, 0) {
        last if $target;

        foreach_writable_storage($conf, sub {
            my ($sid) = @_;
            my $scfg = PVE::Storage::storage_config($storecfg, $sid);
            return if ($scfg->{shared} xor $want_shared);

            $target = $sid if !$target || $scfg->{path}; # prefer file based storage
        });
    }

    $target ||= 'local';

    # fixed allowance for the driver state, added on top of the memory size
    my $driver_state_size = 500;
    # we abort live save after $conf->{memory}, so we need at max twice that space
    my $size = $conf->{memory}*2 + $driver_state_size;

    my $target_cfg = PVE::Storage::storage_config($storecfg, $target);
    my $name = "vm-$vmid-state-$snapname";
    $name .= ".raw" if $target_cfg->{path}; # add filename extension for file base storage

    return PVE::Storage::vdisk_alloc($storecfg, $target, $vmid, 'raw', $name, $size*1024);
};
5276
# First step of taking a snapshot: under the config lock, set the
# 'snapshot' lock in the VM config and add a new snapshot section in state
# "prepare" that holds a copy of the current settings.
#
# $save_vmstate - when true and the VM is running, a volume for the VM
#                 state is allocated and recorded in the snapshot
# $comment      - optional description stored with the snapshot
#
# Returns the new snapshot section. Dies if the VM is a template, is
# locked, already has a snapshot of that name or does not support
# snapshots.
my $snapshot_prepare = sub {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap;

    lock_config($vmid, sub {
        my $conf = load_config($vmid);

        if (is_template($conf)) {
            die "you can't take a snapshot if it's a template\n";
        }

        check_lock($conf);

        $conf->{lock} = 'snapshot';

        if (defined($conf->{snapshots}->{$snapname})) {
            die "snapshot name '$snapname' already used\n";
        }

        my $storecfg = PVE::Storage::config();
        if (!has_feature('snapshot', $conf, $storecfg)) {
            die "snapshot feature is not available";
        }

        $snap = $conf->{snapshots}->{$snapname} = {};

        if ($save_vmstate && check_running($vmid)) {
            $snap->{vmstate} = $alloc_vmstate_volid->($storecfg, $vmid, $conf, $snapname);
        }

        $snapshot_copy_config->($conf, $snap);

        $snap->{snapstate} = "prepare";
        $snap->{snaptime} = time();
        $snap->{description} = $comment if $comment;

        # always overwrite machine if we save vmstate. This makes sure we
        # can restore it later using correct machine type
        if ($snap->{vmstate}) {
            $snap->{machine} = get_current_qemu_machine($vmid);
        }

        update_config_nolock($vmid, $conf, 1);
    });

    return $snap;
};
5322
# Final step of taking a snapshot: under the config lock, verify that the
# VM still carries the 'snapshot' lock and that the snapshot is in state
# "prepare", then clear both and record the snapshot as parent of the
# current configuration.
my $snapshot_commit = sub {
    my ($vmid, $snapname) = @_;

    lock_config($vmid, sub {
        my $conf = load_config($vmid);

        die "missing snapshot lock\n"
            if !$conf->{lock} || $conf->{lock} ne 'snapshot';

        # remembered before the config gets rebuilt from the snapshot
        my $machine_was_set = defined($conf->{machine});

        my $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        die "wrong snapshot state\n"
            if !$snap->{snapstate} || $snap->{snapstate} ne "prepare";

        delete $snap->{snapstate};
        delete $conf->{lock};

        my $committed = $snapshot_apply_config->($conf, $snap);

        # do not introduce a 'machine' entry the config did not have before
        delete $committed->{machine} if !$machine_was_set;

        $committed->{parent} = $snapname;

        update_config_nolock($vmid, $committed, 1);
    });
};
5356
22c377f0
DM
# Roll a VM back to snapshot $snapname.
#
# The same update closure runs twice under the config lock:
#  - first with $prepare set: validate, stop the VM and set the 'rollback'
#    lock;
#  - then, after all drive volumes were rolled back, with $prepare cleared:
#    drop the lock, replace the current settings with those of the snapshot
#    and, if the snapshot has a saved VM state, start the VM from it.
sub snapshot_rollback {
    my ($vmid, $snapname) = @_;

    my $snap;
    my $prepare = 1;

    my $storecfg = PVE::Storage::config();

    my $update = sub {
        my $conf = load_config($vmid);

        die "you can't rollback if vm is a template\n" if is_template($conf);

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        die "unable to rollback to incomplete snapshot (snapstate = $snap->{snapstate})\n"
            if $snap->{snapstate};

        if ($prepare) {
            check_lock($conf);
            vm_stop($storecfg, $vmid, undef, undef, 5, undef, undef);
        }

        die "unable to rollback vm $vmid: vm is running\n"
            if check_running($vmid);

        my $forcemachine;

        if ($prepare) {
            $conf->{lock} = 'rollback';
        } else {
            die "got wrong lock\n"
                if !$conf->{lock} || $conf->{lock} ne 'rollback';
            delete $conf->{lock};

            my $machine_was_set = defined($conf->{machine});

            # copy snapshot config to current config
            $conf = $snapshot_apply_config->($conf, $snap);
            $conf->{parent} = $snapname;

            # Note: old code did not store 'machine', so we try to be smart
            # and guess the snapshot was generated with kvm 1.4 (pc-i440fx-1.4).
            $forcemachine = $conf->{machine} || 'pc-i440fx-1.4';
            # we remove the 'machine' configuration if not explicitly specified
            # in the original config.
            delete $conf->{machine} if $snap->{vmstate} && !$machine_was_set;
        }

        update_config_nolock($vmid, $conf, 1);

        if (!$prepare && $snap->{vmstate}) {
            my $statefile = PVE::Storage::path($storecfg, $snap->{vmstate});
            vm_start($storecfg, $vmid, $statefile, undef, undef, undef, $forcemachine);
        }
    };

    lock_config($vmid, $update);

    # roll back the volume of every non-cdrom drive of the snapshot
    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        PVE::Storage::volume_snapshot_rollback($storecfg, $drive->{file}, $snapname);
    });

    $prepare = 0;
    lock_config($vmid, $update);
}
5435
9dcf4909
DM
# Poll "query-savevm" once per second until the reported status is
# 'completed'. Dies if no status is reported or if the status is anything
# other than 'active' or 'completed'.
my $savevm_wait = sub {
    my ($vmid) = @_;

    while (1) {
        my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");
        my $status = $stat->{status};

        die "savevm not active\n" if !$status;
        last if $status eq 'completed';
        die "query-savevm returned status '$stat->{status}'\n"
            if $status ne 'active';

        sleep(1);
    }
};
5453
# Create snapshot $snapname of VM $vmid.
#
# $save_vmstate - also save the VM state (only has an effect while the VM
#                 is running)
# $comment      - optional description stored with the snapshot
#
# Steps: prepare the config, optionally freeze the guest file systems
# (running VM with 'agent' configured and no VM state saved), snapshot
# every non-cdrom drive, then commit the config. If snapshotting fails,
# the snapshots taken so far are removed again and the error is re-thrown.
sub snapshot_create {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap = $snapshot_prepare->($vmid, $snapname, $save_vmstate, $comment);

    my $config = load_config($vmid);

    my $running = check_running($vmid);

    my $freezefs = $running && $config->{agent};
    $freezefs = 0 if $snap->{vmstate}; # not needed if we save RAM

    # drives that already got their snapshot, needed for cleanup on error
    my $done = {};

    if ($freezefs) {
        eval { vm_mon_cmd($vmid, "guest-fsfreeze-freeze"); };
        warn "guest-fsfreeze-freeze problems - $@" if $@;
    }

    eval {
        # create internal snapshots of all drives

        my $storecfg = PVE::Storage::config();

        if ($running && $snap->{vmstate}) {
            my $path = PVE::Storage::path($storecfg, $snap->{vmstate});
            vm_mon_cmd($vmid, "savevm-start", statefile => $path);
            $savevm_wait->($vmid);
        } elsif ($running) {
            vm_mon_cmd($vmid, "savevm-start");
        }

        foreach_drive($snap, sub {
            my ($ds, $drive) = @_;

            return if drive_is_cdrom($drive);

            qemu_volume_snapshot($vmid, "drive-$ds", $storecfg, $drive->{file}, $snapname);
            $done->{$ds} = 1;
        });
    };
    my $err = $@;

    if ($running) {
        eval { vm_mon_cmd($vmid, "savevm-end") };
        warn $@ if $@;

        if ($freezefs) {
            eval { vm_mon_cmd($vmid, "guest-fsfreeze-thaw"); };
            warn "guest-fsfreeze-thaw problems - $@" if $@;
        }

        # savevm-end is async, we need to wait
        while (1) {
            my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");
            last if !$stat->{bytes};

            print "savevm not yet finished\n";
            sleep(1);
        }
    }

    if ($err) {
        warn "snapshot create failed: starting cleanup\n";
        eval { snapshot_delete($vmid, $snapname, 0, $done); };
        warn $@ if $@;
        die $err;
    }

    $snapshot_commit->($vmid, $snapname);
}
5535
3ee28e38 5536# Note: $drivehash is only set when called from snapshot_create.
# Delete snapshot $snapname of VM $vmid.
#
# $force     - when true, errors while removing the VM state volume or a
#              drive snapshot are only warned about, and the config is not
#              saved after each single removal
# $drivehash - hash ref of drive names; when given, only the snapshots of
#              those drives are removed, the lock/template checks are
#              skipped and the config lock entry is cleared at the end
#
# The config is updated in several locked steps: mark the snapshot as being
# deleted, remove the VM state and the drive snapshots (saving after each
# one unless $force), and finally drop the snapshot section, fix up parent
# references and record the freed volumes as unused.
sub snapshot_delete {
    my ($vmid, $snapname, $force, $drivehash) = @_;

    my $prepare = 1;

    my $snap;
    my $unused = [];

    # let a section that has the deleted snapshot as parent point to
    # $new_parent instead (or to nothing if there is none)
    my $relink = sub {
        my ($section, $new_parent) = @_;

        return if !($section->{parent} && $section->{parent} eq $snapname);

        if ($new_parent) {
            $section->{parent} = $new_parent;
        } else {
            delete $section->{parent};
        }
    };

    # removal errors are fatal unless $force is set
    my $check_error = sub {
        my ($err) = @_;

        return if !$err;
        die $err if !$force;
        warn $err;
    };

    my $update = sub {
        my ($remove_drive) = @_;

        my $conf = load_config($vmid);

        if (!$drivehash) {
            check_lock($conf);
            die "you can't delete a snapshot if vm is a template\n"
                if is_template($conf);
        }

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        # remove parent refs
        if (!$prepare) {
            $relink->($conf, $snap->{parent});
            foreach my $other (grep { $_ ne $snapname } keys %{$conf->{snapshots}}) {
                $relink->($conf->{snapshots}->{$other}, $snap->{parent});
            }
        }

        if ($remove_drive) {
            my $is_drive = $remove_drive ne 'vmstate';

            my $volid;
            if ($is_drive) {
                my $drive = parse_drive($remove_drive, $snap->{$remove_drive});
                $volid = $drive->{file};
            }

            delete $snap->{$remove_drive};
            add_unused_volume($conf, $volid) if $is_drive;
        }

        if ($prepare) {
            $snap->{snapstate} = 'delete';
        } else {
            delete $conf->{snapshots}->{$snapname};
            delete $conf->{lock} if $drivehash;
            add_unused_volume($conf, $_) foreach @$unused;
        }

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $update);

    # now remove vmstate file

    my $storecfg = PVE::Storage::config();

    if ($snap->{vmstate}) {
        eval { PVE::Storage::vdisk_free($storecfg, $snap->{vmstate}); };
        $check_error->($@);

        # save changes (remove vmstate from snapshot)
        lock_config($vmid, $update, 'vmstate') if !$force;
    }

    # now remove all internal snapshots
    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};

        if (!$drivehash || $drivehash->{$ds}) {
            eval { qemu_volume_snapshot_delete($vmid, "drive-$ds", $storecfg, $volid, $snapname); };
            $check_error->($@);
        }

        # save changes (remove drive from snapshot)
        lock_config($vmid, $update, $ds) if !$force;
        push @$unused, $volid;
    });

    # now cleanup config
    $prepare = 0;
    lock_config($vmid, $update);
}
5647
# Return 1 if every non-cdrom drive of $conf supports $feature according to
# PVE::Storage::volume_has_feature(), 0 otherwise. $snapname and $running
# are passed through to that check. All drives are examined, also after
# the first one without the feature was found.
sub has_feature {
    my ($feature, $conf, $storecfg, $snapname, $running) = @_;

    my $missing;

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        if (!PVE::Storage::volume_has_feature($storecfg, $feature, $drive->{file}, $snapname, $running)) {
            $missing = 1;
        }
    });

    return 0 if $missing;
    return 1;
}
04a69bb4
AD
5662
# Convert the drive volumes of a VM into base volumes.
#
# $disk - optional drive name; when given, only that drive is converted
#
# Cdrom drives and volumes without the 'template' storage feature are left
# alone. The config is written after every converted drive.
sub template_create {
    my ($vmid, $conf, $disk) = @_;

    my $storecfg = PVE::Storage::config();

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive) || ($disk && $ds ne $disk);

        my $volid = $drive->{file};
        return if !PVE::Storage::volume_has_feature($storecfg, 'template', $volid);

        $drive->{file} = PVE::Storage::vdisk_create_base($storecfg, $volid);
        $conf->{$ds} = print_drive($vmid, $drive);
        update_config_nolock($vmid, $conf, 1);
    });
}
5683
624361b3
AD
# Return 1 if the 'template' setting of $conf is defined and numerically
# equal to 1. Otherwise the result is Perl's standard false value (the
# empty string), not 0.
sub is_template {
    my ($conf) = @_;

    my $flag = $conf->{template};

    return (defined($flag) && $flag == 1) ? 1 : !1;
}
5689
5133de42
AD
# Copy volume $src_volid to the already existing volume $dst_volid with
# "qemu-img convert".
#
# $size     - size used to turn the percentage printed by qemu-img into
#             the byte counts of the progress messages
# $snapname - optional snapshot to read from
#
# Nothing is done unless both volume IDs can be parsed into a storage ID.
# Dies with "copy failed: ..." if the command fails.
sub qemu_img_convert {
    my ($src_volid, $dst_volid, $size, $snapname) = @_;

    my $storecfg = PVE::Storage::config();
    my ($src_storeid, $src_volname) = PVE::Storage::parse_volume_id($src_volid, 1);
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid, 1);

    if ($src_storeid && $dst_storeid) {
        my $src_format = qemu_img_format(
            PVE::Storage::storage_config($storecfg, $src_storeid), $src_volname);
        my $dst_format = qemu_img_format(
            PVE::Storage::storage_config($storecfg, $dst_storeid), $dst_volname);

        my $src_path = PVE::Storage::path($storecfg, $src_volid, $snapname);
        my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

        # the snapshot is only selected with '-s' for qcow2 sources
        my @snapshot_opt = ($snapname && $src_format eq "qcow2") ? ('-s', $snapname) : ();

        my @cmd = (
            '/usr/bin/qemu-img', 'convert', '-t', 'writeback', '-p', '-n',
            @snapshot_opt,
            '-f', $src_format, '-O', $dst_format, $src_path, $dst_path,
        );

        # turn the "(NN.NN/100%)" progress output into a status line
        my $progress = sub {
            my ($line) = @_;

            return if $line !~ m/\((\S+)\/100\%\)/;

            my $percent = $1;
            my $transferred = int($size * $percent / 100);
            my $remaining = $size - $transferred;

            print "transferred: $transferred bytes remaining: $remaining bytes total: $size bytes progression: $percent %\n";
        };

        eval { run_command(\@cmd, timeout => undef, outfunc => $progress); };
        my $err = $@;
        die "copy failed: $err" if $err;
    }
}
5729
# Return the image format name for volume $volname on a storage with
# configuration $scfg:
#  - the file extension (raw, qcow2, qed or vmdk) if the storage has a
#    'path' setting and the volume name ends in one of them,
#  - "host_device" for storages of type 'iscsi',
#  - "raw" in all other cases.
sub qemu_img_format {
    my ($scfg, $volname) = @_;

    return $1 if $scfg->{path} && $volname =~ m/\.(raw|qcow2|qed|vmdk)$/;

    return $scfg->{type} eq 'iscsi' ? "host_device" : "raw";
}
5741
# Mirror drive $drive of the running VM $vmid onto the existing volume
# $dst_volid using the "drive-mirror" monitor command, and wait until the
# job has caught up.
#
# $vmiddst - VM the new volume belongs to. If it equals $vmid the VM is
#            switched over to the new volume ("block-job-complete"),
#            otherwise the job is cancelled once source and target are in
#            sync.
#
# Dies with "mirroring error: ..." if the job fails; the job is cancelled
# first in that case.
sub qemu_drive_mirror {
    my ($vmid, $drive, $dst_volid, $vmiddst) = @_;

    my $device = "drive-$drive";

    my $rounds = 0;      # polls during which the job was fully caught up
    my $maxwait = 120;   # suspend the VM once $rounds exceeds this
    my $frozen;

    my $storecfg = PVE::Storage::config();
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid);

    # the result is not used below
    my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

    my ($format) = $dst_volname =~ m/\.(raw|qcow2)$/;

    my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

    my %mirror_args = (
        timeout => 10,
        device => $device,
        mode => "existing",
        sync => "full",
        target => $dst_path,
    );
    $mirror_args{format} = $format if $format;

    #fixme : sometime drive-mirror timeout, but works fine after.
    # (I have see the problem with big volume > 200GB), so we need to eval
    eval { vm_mon_cmd($vmid, "drive-mirror", %mirror_args); };
    # ignore errors here

    eval {
        while (1) {
            my ($job) = @{ vm_mon_cmd($vmid, "query-block-jobs") };
            die "mirroring job seem to have die. Maybe do you have bad sectors?" if !$job;
            die "error job is not mirroring" if $job->{type} ne "mirror";

            my $busy = $job->{busy};

            if (my $total = $job->{len}) {
                my $transferred = $job->{offset} || 0;
                my $remaining = $total - $transferred;
                my $percent = sprintf "%.2f", ($transferred * 100 / $total);

                print "transferred: $transferred bytes remaining: $remaining bytes total: $total bytes progression: $percent % busy: $busy\n";
            }

            if ($job->{len} == $job->{offset}) {
                if ($busy eq 'false') {

                    last if $vmiddst != $vmid;

                    # try to switch the disk if source and destination are on the same guest
                    eval { vm_mon_cmd($vmid, "block-job-complete", device => $device) };
                    last if !$@;
                    die $@ if $@ !~ m/cannot be completed/;
                }

                if ($rounds > $maxwait) {
                    # if too much writes to disk occurs at the end of migration
                    # the disk needs to be freezed to be able to complete the migration
                    vm_suspend($vmid, 1);
                    $frozen = 1;
                }
                $rounds++;
            }

            sleep 1;
        }

        vm_resume($vmid, 1) if $frozen;
    };
    my $err = $@;

    # cancel the job and wait until it is gone from the job list
    my $cancel_job = sub {
        vm_mon_cmd($vmid, "block-job-cancel", device => $device);
        while (1) {
            my ($job) = @{ vm_mon_cmd($vmid, "query-block-jobs") };
            last if !$job;
            sleep 1;
        }
    };

    if ($err) {
        eval { $cancel_job->(); };
        die "mirroring error: $err";
    }

    if ($vmiddst != $vmid) {
        # if we clone a disk for a new target vm, we don't switch the disk
        $cancel_job->(); # so we call block-job-cancel
    }
}
5835
# Clone the volume of drive $drivename for VM $newvmid.
#
# $full       - false: create a linked clone (optionally of $snapname);
#               true: allocate a new volume and copy the data, with
#               qemu_img_convert if the VM is not running or a snapshot is
#               cloned, with qemu_drive_mirror otherwise
# $storage    - optional target storage for a full clone (default: the
#               storage of the source volume)
# $format     - optional target format for a full clone; falls back to the
#               drive's format and then to the storage default, and is
#               replaced by the storage default if not supported
# $newvollist - array ref, the new volume ID is appended to it
#
# Returns $drive itself (the hash passed in is modified): 'file' and
# 'size' describe the new volume and 'format' is reset to undef.
sub clone_disk {
    my ($storecfg, $vmid, $running, $drivename, $drive, $snapname,
        $newvmid, $storage, $format, $full, $newvollist) = @_;

    my $newvolid;

    if ($full) {
        my ($storeid) = PVE::Storage::parse_volume_id($drive->{file});
        $storeid = $storage if $storage;

        my ($default_format, $valid_formats) = PVE::Storage::storage_default_format($storecfg, $storeid);
        $format ||= $drive->{format} || $default_format;

        # test if requested format is supported - else use default
        my $supported = grep { $_ eq $format } @$valid_formats;
        $format = $default_format if !$supported;

        my ($src_size) = PVE::Storage::volume_size_info($storecfg, $drive->{file}, 3);

        print "create full clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_alloc($storecfg, $storeid, $newvmid, $format, undef, ($src_size/1024));
        push @$newvollist, $newvolid;

        if ($running && !$snapname) {
            qemu_drive_mirror($vmid, $drivename, $newvolid, $newvmid);
        } else {
            qemu_img_convert($drive->{file}, $newvolid, $src_size, $snapname);
        }
    } else {
        print "create linked clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_clone($storecfg, $drive->{file}, $newvmid, $snapname);
        push @$newvollist, $newvolid;
    }

    my ($new_size) = PVE::Storage::volume_size_info($storecfg, $newvolid, 3);

    $drive->{format} = undef;
    $drive->{file} = $newvolid;
    $drive->{size} = $new_size;

    return $drive;
}
5881
ff556cf2
DM
5882# this only works if VM is running
# Ask the VM (via the 'query-machines' QMP command) for its machine types
# and return the name of the one flagged 'is-current'. If there is none,
# the one flagged 'is-default' is returned, and 'pc' as last resort.
sub get_current_qemu_machine {
    my ($vmid) = @_;

    my $machines = vm_qmp_command($vmid, { execute => 'query-machines', arguments => {} });

    my %found;
    foreach my $entry (@$machines) {
        foreach my $kind (qw(default current)) {
            $found{$kind} = $entry->{name} if $entry->{"is-$kind"};
        }
    }

    # fallback to the default machine if current is not supported by qemu
    return $found{current} || $found{default} || 'pc';
}
5898
4543ecf0
AD
# List the entries below "$pcisysfs/devices" whose name has the form
# "dddd:bb:ss.f". Returns a hash ref that maps each "bb:ss" id to an array
# ref of { id => "bb:ss", function => "f" } records.
sub lspci {

    my %by_id;

    my $entry_re = '[a-f0-9]{4}:([a-f0-9]{2}:[a-f0-9]{2})\.([0-9])';

    dir_glob_foreach("$pcisysfs/devices", $entry_re, sub {
        my (undef, $id, $function) = @_;
        push @{ $by_id{$id} }, { id => $id, function => $function };
    });

    return \%by_id;
}
5911
1e3baf05 59121;