]> git.proxmox.com Git - qemu-server.git/blame - PVE/QemuServer.pm
bump version to 3.3-19
[qemu-server.git] / PVE / QemuServer.pm
CommitLineData
1e3baf05
DM
1package PVE::QemuServer;
2
3use strict;
990fc5e2 4use warnings;
1e3baf05
DM
5use POSIX;
6use IO::Handle;
7use IO::Select;
8use IO::File;
9use IO::Dir;
10use IO::Socket::UNIX;
11use File::Basename;
12use File::Path;
13use File::stat;
14use Getopt::Long;
fc1ddcdc 15use Digest::SHA;
1e3baf05
DM
16use Fcntl ':flock';
17use Cwd 'abs_path';
18use IPC::Open3;
c971c4f2 19use JSON;
1e3baf05
DM
20use Fcntl;
21use PVE::SafeSyslog;
22use Storable qw(dclone);
23use PVE::Exception qw(raise raise_param_exc);
24use PVE::Storage;
4543ecf0 25use PVE::Tools qw(run_command lock_file lock_file_full file_read_firstline dir_glob_foreach);
b7ba6b79 26use PVE::JSONSchema qw(get_standard_option);
1e3baf05
DM
27use PVE::Cluster qw(cfs_register_file cfs_read_file cfs_write_file cfs_lock_file);
28use PVE::INotify;
29use PVE::ProcFSTools;
26f11676 30use PVE::QMPClient;
91bd6c90 31use PVE::RPCEnvironment;
6b64503e 32use Time::HiRes qw(gettimeofday);
1e3baf05 33
7f0b5beb 34my $cpuinfo = PVE::ProcFSTools::read_cpuinfo();
1e3baf05 35
# Note about locking: we use flock on the config file to protect
# against concurrent actions.
# Additionally, we have a 'lock' setting in the config file. This
# can be set to 'migrate', 'backup', 'snapshot' or 'rollback'. Most actions are not
# allowed when such a lock is set. But you can ignore this kind of
# lock with the --skiplock flag.
42
# Register the parser/writer pair used for files below '/qemu-server/'.
cfs_register_file(
    '/qemu-server/',
    \&parse_vm_config,
    \&write_vm_config,
);

# Standard option: boolean flag to ignore the 'lock' setting.
PVE::JSONSchema::register_standard_option('skiplock', {
    type => 'boolean',
    optional => 1,
    description => "Ignore locks - only root is allowed to use this option.",
});

# Standard option: location used by commands that save/restore state.
PVE::JSONSchema::register_standard_option('pve-qm-stateuri', {
    type => 'string',
    maxLength => 128,
    optional => 1,
    description => "Some command save/restore state from this location.",
});

# Standard option: snapshot name (note: not optional).
PVE::JSONSchema::register_standard_option('pve-snapshot-name', {
    type => 'string', format => 'pve-configid',
    maxLength => 40,
    description => "The name of the snapshot.",
});
65
1e3baf05
DM
66#no warnings 'redefine';
67
# Define the fairsched_*/setluid/setublimit syscall numbers and the
# KVM_GET_API_VERSION ioctl request as constant subs. Every definition is
# guarded by 'unless defined', so values that are already present (for
# example from a loaded .ph file) are never overridden.
unless(defined(&_VZSYSCALLS_H_)) {
    eval 'sub _VZSYSCALLS_H_ () {1;}' unless defined(&_VZSYSCALLS_H_);
    require 'sys/syscall.ph';
    if(defined(&__x86_64__)) {
        eval 'sub __NR_fairsched_vcpus () {499;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_fairsched_mknod () {504;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {505;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {506;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {507;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {508;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_setluid () {501;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {502;}' unless defined(&__NR_setublimit);
    }
    elsif(defined( &__i386__) ) {
        eval 'sub __NR_fairsched_mknod () {500;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {501;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {502;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {503;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {504;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_fairsched_vcpus () {505;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_setluid () {511;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {512;}' unless defined(&__NR_setublimit);
    } else {
        die("no fairsched syscall for this arch");
    }
    require 'asm/ioctl.ph';
    # ioctl type 0xAE, request number 0 (written out in full instead of the
    # incomplete literal '0x')
    eval 'sub KVM_GET_API_VERSION () { &_IO(0xAE, 0x00);}' unless defined(&KVM_GET_API_VERSION);
}
96
# Invoke the fairsched_mknod syscall. All three arguments are truncated to
# integers before the call; the raw syscall() result is returned.
sub fairsched_mknod {
    my ($parent, $weight, $desired) = @_;

    my @int_args = (int($parent), int($weight), int($desired));

    return syscall(&__NR_fairsched_mknod, @int_args);
}
102
# Invoke the fairsched_rmnod syscall for the given id (truncated to an
# integer) and return the raw syscall() result.
sub fairsched_rmnod {
    my ($id) = @_;

    my $node_id = int($id);

    return syscall(&__NR_fairsched_rmnod, $node_id);
}
108
# Invoke the fairsched_mvpr syscall with a pid and a new id (both truncated
# to integers) and return the raw syscall() result.
sub fairsched_mvpr {
    my ($pid, $newid) = @_;

    my @int_args = (int($pid), int($newid));

    return syscall(&__NR_fairsched_mvpr, @int_args);
}
114
# Invoke the fairsched_vcpus syscall with an id and a vcpu count (both
# truncated to integers) and return the raw syscall() result.
sub fairsched_vcpus {
    my ($id, $vcpus) = @_;

    my @int_args = (int($id), int($vcpus));

    return syscall(&__NR_fairsched_vcpus, @int_args);
}
120
# Invoke the fairsched_rate syscall with an id, an operation code (one of
# the FAIRSCHED_*_RATE constants) and a rate. All arguments are truncated to
# integers; the raw syscall() result is returned.
sub fairsched_rate {
    my ($id, $op, $rate) = @_;

    my @int_args = (int($id), int($op), int($rate));

    return syscall(&__NR_fairsched_rate, @int_args);
}
126
# Operation codes passed as second argument to fairsched_rate().
use constant {
    FAIRSCHED_SET_RATE => 0,
    FAIRSCHED_DROP_RATE => 1,
    FAIRSCHED_GET_RATE => 2,
};

# Apply a CPU limit given in per cent to the fairsched node $id.
# The limit is rescaled to 1/1024 units; a resulting rate of 0 drops the
# rate limit instead of setting it. Returns the result of fairsched_rate().
sub fairsched_cpulimit {
    my ($id, $limit) = @_;

    my $rate = int($limit * 1024 / 100);

    if ($rate) {
        return fairsched_rate($id, FAIRSCHED_SET_RATE, $rate);
    }

    return fairsched_rate($id, FAIRSCHED_DROP_RATE, $rate);
}
139
# Per-node paths used by this module.
my $nodename = PVE::INotify::nodename();
my $confdir = "/etc/pve/nodes/$nodename/qemu-server";
my $var_run_tmpdir = "/var/run/qemu-server";
my $lock_dir = "/var/lock/qemu-server";
my $pcisysfs = "/sys/bus/pci";

# Create the directories at load time; the mkdir results are not checked.
foreach my $dir ("/etc/pve/nodes/$nodename", $confdir, $var_run_tmpdir, $lock_dir) {
    mkdir $dir;
}
153
# Schema of the VM configuration options, keyed by option name. Each value
# is a JSON-schema style property description (type, limits, default and
# help text). Indexed options (netN, ideN, ...) are added to this hash
# further down in the file.
my $confdesc = {
    iothread => {
        optional => 1,
        type => 'boolean',
        description => "Enable iothread dataplane.",
        default => 0,
    },
    onboot => {
        optional => 1,
        type => 'boolean',
        description => "Specifies whether a VM will be started during system bootup.",
        default => 0,
    },
    autostart => {
        optional => 1,
        type => 'boolean',
        description => "Automatic restart after crash (currently ignored).",
        default => 0,
    },
    hotplug => {
        optional => 1,
        type => 'string', format => 'pve-hotplug-features',
        description => "Selectively enable hotplug features. This is a comma separated list of hotplug features: 'network', 'disk', 'cpu', 'memory' and 'usb'. Use '0' to disable hotplug completely. Value '1' is an alias for the default 'network,disk,usb'.",
        default => 'network,disk,usb',
    },
    reboot => {
        optional => 1,
        type => 'boolean',
        description => "Allow reboot. If set to '0' the VM exit on reboot.",
        default => 1,
    },
    lock => {
        optional => 1,
        type => 'string',
        description => "Lock/unlock the VM.",
        enum => [qw(migrate backup snapshot rollback)],
    },
    cpulimit => {
        optional => 1,
        type => 'integer',
        description => "Limit of CPU usage in per cent. Note if the computer has 2 CPUs, it has total of 200% CPU time. Value '0' indicates no CPU limit.\n\nNOTE: This option is currently ignored.",
        minimum => 0,
        default => 0,
    },
    cpuunits => {
        optional => 1,
        type => 'integer',
        description => "CPU weight for a VM. Argument is used in the kernel fair scheduler. The larger the number is, the more CPU time this VM gets. Number is relative to weights of all the other running VMs.\n\nNOTE: You can disable fair-scheduler configuration by setting this to 0.",
        minimum => 0,
        maximum => 500000,
        default => 1000,
    },
    memory => {
        optional => 1,
        type => 'integer',
        description => "Amount of RAM for the VM in MB. This is the maximum available memory when you use the balloon device.",
        minimum => 16,
        default => 512,
    },
    balloon => {
        optional => 1,
        type => 'integer',
        description => "Amount of target RAM for the VM in MB. Using zero disables the balloon driver.",
        minimum => 0,
    },
    shares => {
        optional => 1,
        type => 'integer',
        description => "Amount of memory shares for auto-ballooning. The larger the number is, the more memory this VM gets. Number is relative to weights of all other running VMs. Using zero disables auto-ballooning",
        minimum => 0,
        maximum => 50000,
        default => 1000,
    },
    keyboard => {
        optional => 1,
        type => 'string',
        description => "Keyboard layout for vnc server. Default is read from the datacenter configuration file.",
        enum => PVE::Tools::kvmkeymaplist(),
        default => 'en-us',
    },
    name => {
        optional => 1,
        type => 'string', format => 'dns-name',
        description => "Set a name for the VM. Only used on the configuration web interface.",
    },
    scsihw => {
        optional => 1,
        type => 'string',
        description => "scsi controller model",
        enum => [qw(lsi lsi53c810 virtio-scsi-pci megasas pvscsi)],
        default => 'lsi',
    },
    description => {
        optional => 1,
        type => 'string',
        description => "Description for the VM. Only used on the configuration web interface. This is saved as comment inside the configuration file.",
    },
    ostype => {
        optional => 1,
        type => 'string',
        enum => [qw(other wxp w2k w2k3 w2k8 wvista win7 win8 l24 l26 solaris)],
        description => <<EODESC,
Used to enable special optimization/features for specific
operating systems:

other => unspecified OS
wxp => Microsoft Windows XP
w2k => Microsoft Windows 2000
w2k3 => Microsoft Windows 2003
w2k8 => Microsoft Windows 2008
wvista => Microsoft Windows Vista
win7 => Microsoft Windows 7
win8 => Microsoft Windows 8/2012
l24 => Linux 2.4 Kernel
l26 => Linux 2.6/3.X Kernel
solaris => solaris/opensolaris/openindiana kernel

other|l24|l26|solaris ... no special behaviour
wxp|w2k|w2k3|w2k8|wvista|win7|win8 ... use --localtime switch
EODESC
    },
    boot => {
        optional => 1,
        type => 'string',
        description => "Boot on floppy (a), hard disk (c), CD-ROM (d), or network (n).",
        pattern => '[acdn]{1,4}',
        default => 'cdn',
    },
    bootdisk => {
        optional => 1,
        type => 'string', format => 'pve-qm-bootdisk',
        description => "Enable booting from specified disk.",
        pattern => '(ide|sata|scsi|virtio)\d+',
    },
    smp => {
        optional => 1,
        type => 'integer',
        description => "The number of CPUs. Please use option -sockets instead.",
        minimum => 1,
        default => 1,
    },
    sockets => {
        optional => 1,
        type => 'integer',
        description => "The number of CPU sockets.",
        minimum => 1,
        default => 1,
    },
    cores => {
        optional => 1,
        type => 'integer',
        description => "The number of cores per socket.",
        minimum => 1,
        default => 1,
    },
    numa => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable Numa.",
        default => 0,
    },
    vcpus => {
        optional => 1,
        type => 'integer',
        description => "Number of hotplugged vcpus.",
        minimum => 1,
        default => 0,
    },
    acpi => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable ACPI.",
        default => 1,
    },
    agent => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable Qemu GuestAgent.",
        default => 0,
    },
    kvm => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable KVM hardware virtualization.",
        default => 1,
    },
    tdf => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable time drift fix.",
        default => 0,
    },
    localtime => {
        optional => 1,
        type => 'boolean',
        description => "Set the real time clock to local time. This is enabled by default if ostype indicates a Microsoft OS.",
    },
    freeze => {
        optional => 1,
        type => 'boolean',
        description => "Freeze CPU at startup (use 'c' monitor command to start execution).",
    },
    vga => {
        optional => 1,
        type => 'string',
        description => "Select VGA type. If you want to use high resolution modes (>= 1280x1024x16) then you should use option 'std' or 'vmware'. Default is 'std' for win8/win7/w2k8, and 'cirrus' for other OS types. Option 'qxl' enables the SPICE display server. You can also run without any graphic card using a serial device as terminal.",
        enum => [qw(std cirrus vmware qxl serial0 serial1 serial2 serial3 qxl2 qxl3 qxl4)],
    },
    watchdog => {
        optional => 1,
        type => 'string', format => 'pve-qm-watchdog',
        typetext => '[[model=]i6300esb|ib700] [,[action=]reset|shutdown|poweroff|pause|debug|none]',
        description => "Create a virtual hardware watchdog device. Once enabled (by a guest action), the watchdog must be periodically polled by an agent inside the guest or else the guest will be restarted (or execute the action specified)",
    },
    startdate => {
        optional => 1,
        type => 'string',
        typetext => "(now | YYYY-MM-DD | YYYY-MM-DDTHH:MM:SS)",
        description => "Set the initial date of the real time clock. Valid format for date are: 'now' or '2006-06-17T16:01:21' or '2006-06-17'.",
        pattern => '(now|\d{4}-\d{1,2}-\d{1,2}(T\d{1,2}:\d{1,2}:\d{1,2})?)',
        default => 'now',
    },
    startup => {
        optional => 1,
        type => 'string', format => 'pve-qm-startup',
        typetext => '[[order=]\d+] [,up=\d+] [,down=\d+] ',
        description => "Startup and shutdown behavior. Order is a non-negative number defining the general startup order. Shutdown is done with reverse ordering. Additionally you can set the 'up' or 'down' delay in seconds, which specifies a delay to wait before the next VM is started or stopped.",
    },
    template => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable Template.",
        default => 0,
    },
    args => {
        optional => 1,
        type => 'string',
        description => <<EODESCR,
Note: this option is for experts only. It allows you to pass arbitrary arguments to kvm, for example:

args: -no-reboot -no-hpet
EODESCR
    },
    tablet => {
        optional => 1,
        type => 'boolean',
        default => 1,
        description => "Enable/disable the usb tablet device. This device is usually needed to allow absolute mouse positioning with VNC. Else the mouse runs out of sync with normal VNC clients. If you're running lots of console-only guests on one host, you may consider disabling this to save some context switches. This is turned off by default if you use spice (vga=qxl).",
    },
    migrate_speed => {
        optional => 1,
        type => 'integer',
        description => "Set maximum speed (in MB/s) for migrations. Value 0 is no limit.",
        minimum => 0,
        default => 0,
    },
    migrate_downtime => {
        optional => 1,
        type => 'number',
        description => "Set maximum tolerated downtime (in seconds) for migrations.",
        minimum => 0,
        default => 0.1,
    },
    cdrom => {
        optional => 1,
        type => 'string', format => 'pve-qm-drive',
        typetext => 'volume',
        description => "This is an alias for option -ide2",
    },
    cpu => {
        optional => 1,
        description => "Emulated CPU type.",
        type => 'string',
        enum => [ qw(486 athlon pentium pentium2 pentium3 coreduo core2duo kvm32 kvm64 qemu32 qemu64 phenom Conroe Penryn Nehalem Westmere SandyBridge Haswell Broadwell Opteron_G1 Opteron_G2 Opteron_G3 Opteron_G4 Opteron_G5 host) ],
        default => 'kvm64',
    },
    parent => get_standard_option('pve-snapshot-name', {
        optional => 1,
        description => "Parent snapshot name. This is used internally, and should not be modified.",
    }),
    snaptime => {
        optional => 1,
        description => "Timestamp for snapshots.",
        type => 'integer',
        minimum => 0,
    },
    vmstate => {
        optional => 1,
        type => 'string', format => 'pve-volume-id',
        description => "Reference to a volume which stores the VM state. This is used internally for snapshots.",
    },
    machine => {
        description => "Specify the Qemu machine type.",
        type => 'string',
        pattern => '(pc|pc(-i440fx)?-\d+\.\d+|q35|pc-q35-\d+\.\d+)',
        maxLength => 40,
        optional => 1,
    },
    smbios1 => {
        description => "Specify SMBIOS type 1 fields.",
        type => 'string', format => 'pve-qm-smbios1',
        typetext => "[manufacturer=str][,product=str][,version=str][,serial=str] [,uuid=uuid][,sku=str][,family=str]",
        maxLength => 256,
        optional => 1,
    },
};
460
461# what about other qemu settings ?
462#cpu => 'string',
463#machine => 'string',
464#fda => 'file',
465#fdb => 'file',
466#mtdblock => 'file',
467#sd => 'file',
468#pflash => 'file',
469#snapshot => 'bool',
470#bootp => 'file',
471##tftp => 'dir',
472##smb => 'dir',
473#kernel => 'file',
474#append => 'string',
475#initrd => 'file',
476##soundhw => 'string',
477
# Publish every configuration option as standard option 'pve-qm-<name>'.
foreach my $opt (keys %$confdesc) {
    PVE::JSONSchema::register_standard_option("pve-qm-$opt", $confdesc->{$opt});
}
481
# Upper bounds for the indexed configuration options; valid indices run
# from 0 to (limit - 1).
my $MAX_IDE_DISKS = 4;          # ide0 .. ide3
my $MAX_SCSI_DISKS = 14;        # scsi0 .. scsi13
my $MAX_VIRTIO_DISKS = 16;      # virtio0 .. virtio15
my $MAX_SATA_DISKS = 6;         # sata0 .. sata5
my $MAX_USB_DEVICES = 5;        # usb0 .. usb4
my $MAX_NETS = 32;              # net0 .. net31
my $MAX_UNUSED_DISKS = 8;       # unused0 .. unused7
my $MAX_HOSTPCI_DEVICES = 4;    # hostpci0 .. hostpci3
my $MAX_SERIAL_PORTS = 4;       # serial0 .. serial3
my $MAX_PARALLEL_PORTS = 3;     # parallel0 .. parallel2
my $MAX_NUMA = 8;               # numa0 .. numa7

# Memory related constants (NOTE(review): units are not visible in this
# part of the file - presumably MB, confirm at the place of use).
my $MAX_MEM = 4194304;
my $STATICMEM = 1024;
2ed5d572
AD
495
# Schema shared by all numaN options (N = 0 .. $MAX_NUMA - 1).
my $numadesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-numanode',
    # fixed: the 'cpus' placeholder was missing its closing '>'
    typetext => "cpus=<id[-id]>,memory=<mb>[[,hostnodes=<id[-id]>] [,policy=<preferred|bind|interleave>]]",
    description => "numa topology",
};
PVE::JSONSchema::register_standard_option("pve-qm-numanode", $numadesc);

foreach my $i (0 .. $MAX_NUMA - 1) {
    $confdesc->{"numa$i"} = $numadesc;
}
1e3baf05
DM
507
# NIC models accepted as MODEL in a netN option.
my $nic_model_list = ['rtl8139', 'ne2k_pci', 'e1000', 'pcnet', 'virtio',
                      'ne2k_isa', 'i82551', 'i82557b', 'i82559er', 'vmxnet3',
                      'e1000-82540em', 'e1000-82544gc', 'e1000-82545em'];
# Space separated, sorted model list for use in the help text below.
my $nic_model_list_txt = join(' ', sort @$nic_model_list);

# Schema shared by all netN options (N = 0 .. $MAX_NETS - 1).
my $netdesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-net',
    # fixed: 'link_down' was missing its opening bracket
    typetext => "MODEL=XX:XX:XX:XX:XX:XX [,bridge=<dev>][,queues=<nbqueues>][,rate=<mbps>] [,tag=<vlanid>][,firewall=0|1][,link_down=0|1]",
    description => <<EODESCR,
Specify network devices.

MODEL is one of: $nic_model_list_txt

XX:XX:XX:XX:XX:XX should be an unique MAC address. This is
automatically generated if not specified.

The bridge parameter can be used to automatically add the interface to a bridge device. The Proxmox VE standard bridge is called 'vmbr0'.

Option 'rate' is used to limit traffic bandwidth from and to this interface. It is specified as floating point number, unit is 'Megabytes per second'.

If you specify no bridge, we create a kvm 'user' (NATed) network device, which provides DHCP and DNS services. The following addresses are used:

10.0.2.2 Gateway
10.0.2.3 DNS Server
10.0.2.4 SMB Server

The DHCP server assign addresses to the guest starting from 10.0.2.15.

EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-net", $netdesc);

foreach my $i (0 .. $MAX_NETS - 1) {
    $confdesc->{"net$i"} = $netdesc;
}
544
# Set of valid drive option names ("ide0", "scsi3", ...); filled by the
# per-bus registration loops.
my $drivename_hash;

# Option syntax shared by all drive buses. Fixed: a stray ',]' after the
# volume part made the bracket nesting invalid.
my $drive_typetext_common = '[volume=]volume [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]';

# Schema for ideN options.
my $idedesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext_common,
    description => "Use volume as IDE hard disk or CD-ROM (n is 0 to " .($MAX_IDE_DISKS -1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-ide", $idedesc);

# Schema for scsiN options.
my $scsidesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext_common,
    description => "Use volume as SCSI hard disk or CD-ROM (n is 0 to " . ($MAX_SCSI_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-scsi", $scsidesc);

# Schema for sataN options.
my $satadesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext_common,
    description => "Use volume as SATA hard disk or CD-ROM (n is 0 to " . ($MAX_SATA_DISKS - 1). ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-sata", $satadesc);

# Schema for virtioN options.
my $virtiodesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext_common,
    description => "Use volume as VIRTIO hard disk (n is 0 to " . ($MAX_VIRTIO_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-virtio", $virtiodesc);
578
# Schema shared by all usbN options. The help text fixes two typos
# ("hexadeciaml", "a usb redirection devices").
my $usbdesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-usb-device',
    typetext => 'host=HOSTUSBDEVICE|spice',
    description => <<EODESCR,
Configure an USB device (n is 0 to 4). This can be used to
pass-through usb devices to the guest. HOSTUSBDEVICE syntax is:

'bus-port(.port)*' (decimal numbers) or
'vendor_id:product_id' (hexadecimal numbers)

You can use the 'lsusb -t' command to list existing usb devices.

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

The value 'spice' can be used to add a usb redirection device for spice.

EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-usb", $usbdesc);
599
040b06b7
DA
# Schema shared by all hostpciN options. The help text fixes the typo
# "You can us the".
my $hostpcidesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-hostpci',
    typetext => "[host=]HOSTPCIDEVICE [,driver=kvm|vfio] [,rombar=on|off] [,pcie=0|1] [,x-vga=on|off]",
    description => <<EODESCR,
Map host pci devices. HOSTPCIDEVICE syntax is:

'bus:dev.func' (hexadecimal numbers)

You can use the 'lspci' command to list existing pci devices.

The 'rombar' option determines whether or not the device's ROM will be visible in the guest's memory map (default is 'on').

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-hostpci", $hostpcidesc);
619
bae179aa
DA
# Schema shared by all serialN options: either a host device below /dev/
# or the keyword 'socket'.
my $serialdesc = {
    type => 'string',
    pattern => '(/dev/.+|socket)',
    optional => 1,
    description => <<EODESCR,
Create a serial device inside the VM (n is 0 to 3), and pass through a host serial device (i.e. /dev/ttyS0), or create a unix socket on the host side (use 'qm terminal' to open a terminal connection).

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};
bae179aa 632
1989a89c
DA
# Schema shared by all parallelN options: a host parallel port device.
my $paralleldesc = {
    optional => 1,
    type => 'string',
    # The alternation is grouped (like the other patterns in this file) so
    # that anchors added around the pattern apply to both branches.
    pattern => '(/dev/parport\d+|/dev/usb/lp\d+)',
    description => <<EODESCR,
Map host parallel devices (n is 0 to 2).

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};
1989a89c
DA
645
# Add the indexed pass-through options (parallelN, serialN, hostpciN) to
# the configuration schema.
foreach my $i (0 .. $MAX_PARALLEL_PORTS - 1) {
    $confdesc->{"parallel$i"} = $paralleldesc;
}

foreach my $i (0 .. $MAX_SERIAL_PORTS - 1) {
    $confdesc->{"serial$i"} = $serialdesc;
}

foreach my $i (0 .. $MAX_HOSTPCI_DEVICES - 1) {
    $confdesc->{"hostpci$i"} = $hostpcidesc;
}

# Add the drive options; each one is also recorded as valid drive name.
foreach my $i (0 .. $MAX_IDE_DISKS - 1) {
    my $name = "ide$i";
    $drivename_hash->{$name} = 1;
    $confdesc->{$name} = $idedesc;
}

foreach my $i (0 .. $MAX_SATA_DISKS - 1) {
    my $name = "sata$i";
    $drivename_hash->{$name} = 1;
    $confdesc->{$name} = $satadesc;
}

foreach my $i (0 .. $MAX_SCSI_DISKS - 1) {
    my $name = "scsi$i";
    $drivename_hash->{$name} = 1;
    $confdesc->{$name} = $scsidesc;
}

foreach my $i (0 .. $MAX_VIRTIO_DISKS - 1) {
    my $name = "virtio$i";
    $drivename_hash->{$name} = 1;
    $confdesc->{$name} = $virtiodesc;
}

# USB devices are not drives, so they are not added to $drivename_hash.
foreach my $i (0 .. $MAX_USB_DEVICES - 1) {
    $confdesc->{"usb$i"} = $usbdesc;
}
681
# Schema shared by all unusedN options (N = 0 .. $MAX_UNUSED_DISKS - 1).
my $unuseddesc = {
    type => 'string', format => 'pve-volume-id',
    optional => 1,
    description => "Reference to unused volumes.",
};

foreach my $i (0 .. $MAX_UNUSED_DISKS - 1) {
    $confdesc->{"unused$i"} = $unuseddesc;
}
691
# Cached result of kvm_version(); 0 means "not determined yet".
my $kvm_api_version = 0;

# Return the value reported by the KVM_GET_API_VERSION ioctl on /dev/kvm.
# Returns 0 if /dev/kvm cannot be opened or the ioctl yields a false value.
# A true result is cached for subsequent calls.
sub kvm_version {

    if (!$kvm_api_version) {
        my $fh = IO::File->new("</dev/kvm");
        return 0 if !$fh;

        my $version = $fh->ioctl(KVM_GET_API_VERSION(), 0);
        $kvm_api_version = $version if $version;

        $fh->close();
    }

    return $kvm_api_version;
}
709
# Cached result of kvm_user_version().
my $kvm_user_version;

# Return the version string printed in the first line of 'kvm -help'
# (for example "2.1" or "2.1.3"), or 'unknown' if that line does not match.
# The result is cached, so the command runs at most once per process.
sub kvm_user_version {

    if (!$kvm_user_version) {
        my $help = `kvm -help 2>/dev/null`;

        my $matched = $help =~ m/^QEMU( PC)? emulator version (\d+\.\d+(\.\d+)?)[,\s]/;

        $kvm_user_version = $matched ? $2 : 'unknown';
    }

    return $kvm_user_version;
}
727
# True if /dev/vhost-net exists as a character device (checked once at load time).
my $kernel_has_vhost_net = (-c '/dev/vhost-net');
729
# Return the list of all possible drive names, grouped by bus in the order
# ide, scsi, virtio, sata. Intended to be called in list context.
sub disknames {
    # order is important - used to autoselect boot disk
    my @bus_limits = (
        [ ide => $MAX_IDE_DISKS ],
        [ scsi => $MAX_SCSI_DISKS ],
        [ virtio => $MAX_VIRTIO_DISKS ],
        [ sata => $MAX_SATA_DISKS ],
    );

    my @names;
    foreach my $entry (@bus_limits) {
        my ($bus, $count) = @$entry;
        push @names, map { "$bus$_" } (0 .. ($count - 1));
    }

    return @names;
}
737
# Return true if $dev is a registered drive name (a key of $drivename_hash).
sub valid_drivename {
    my ($dev) = @_;

    my $entry = $drivename_hash->{$dev};

    return defined($entry);
}
743
# Return true if $key is a known configuration option (a key of $confdesc).
sub option_exists {
    my ($key) = @_;

    my $schema = $confdesc->{$key};

    return defined($schema);
}
1e3baf05
DM
748
# Return the array reference holding the supported NIC model names.
# Note: this is the module's own list, not a copy.
sub nic_models {
    my $models = $nic_model_list;
    return $models;
}
752
# Return a hash reference mapping each 'ostype' value to a short,
# human readable label.
sub os_list_description {

    return {
        other => 'Other',
        wxp => 'Windows XP',
        w2k => 'Windows 2000',
        w2k3 => 'Windows 2003',       # fixed: stray comma after '=>'
        w2k8 => 'Windows 2008',
        wvista => 'Windows Vista',
        win7 => 'Windows 7',
        win8 => 'Windows 8/2012',
        l24 => 'Linux 2.4',
        l26 => 'Linux 2.6',
        # 'solaris' is a valid ostype value, so it needs a label too
        solaris => 'Solaris',
    };
}
768
1e3baf05
DM
# Cached result of get_cdrom_path().
my $cdrom_path;

# Return the first of /dev/cdrom, /dev/cdrom1, /dev/cdrom2 that exists as
# a symbolic link. A hit is cached for later calls. Returns undef when none
# of the links exists (previously the result of the last file test leaked
# out as return value).
sub get_cdrom_path {

    return $cdrom_path if $cdrom_path;

    foreach my $candidate ("/dev/cdrom", "/dev/cdrom1", "/dev/cdrom2") {
        return $cdrom_path = $candidate if -l $candidate;
    }

    return undef;
}
779
# Resolve a cdrom setting to a path:
#   'cdrom'          - result of get_cdrom_path()
#   'none'           - empty string
#   absolute path    - returned unchanged
#   anything else    - treated as volume ID and resolved via PVE::Storage::path()
# $vmid is accepted but not used here.
sub get_iso_path {
    my ($storecfg, $vmid, $cdrom) = @_;

    return get_cdrom_path() if $cdrom eq 'cdrom';

    return '' if $cdrom eq 'none';

    return $cdrom if $cdrom =~ m|^/|;

    return PVE::Storage::path($storecfg, $cdrom);
}
793
# Try to convert old style file names to volume IDs.
#
# 'none', 'cdrom', paths below /dev/ and values that already look like
# 'storage:volume' are returned unchanged. Any other value containing a
# slash cannot be converted and yields undef. A plain file name becomes
# "local:iso/<file>" for cdrom media and "local:<vmid>/<file>" otherwise.
sub filename_to_volume_id {
    my ($vmid, $file, $media) = @_;

    my $keep_as_is = $file eq 'none'
        || $file eq 'cdrom'
        || $file =~ m|^/dev/.+|
        || $file =~ m/^([^:]+):(.+)$/;

    return $file if $keep_as_is;

    return undef if $file =~ m|/|;

    my $is_cdrom = $media && $media eq 'cdrom';

    return $is_cdrom ? "local:iso/$file" : "local:$vmid/$file";
}
812
# Check that the storage content type $vtype fits the drive media type:
# 'disk' expects 'images', 'cdrom' expects 'iso'. Nothing is checked when
# $media is not set. Dies with "internal error" for any other media value
# and raises a parameter exception for option $opt on a mismatch.
sub verify_media_type {
    my ($opt, $vtype, $media) = @_;

    return if !$media;

    my %expected_for = (
        disk => 'images',
        cdrom => 'iso',
    );

    my $etype = $expected_for{$media};
    die "internal error" if !defined($etype);

    if ($vtype ne $etype) {
        raise_param_exc({ $opt => "unexpected media type ($vtype != $etype)" });
    }

    return;
}
831
# Normalize the 'file' and 'media' entries of a parsed drive hash in place.
#
# A file value that is neither 'cdrom'/'none', a /dev/ path, a
# 'storage:volume' value nor a plain number is treated as filesystem path
# and converted to a volume ID; a parameter exception for option $opt is
# raised if no storage matches. Media defaults to 'cdrom' for iso volumes
# and for the special values 'cdrom' and 'none'.
sub cleanup_drive_path {
    my ($opt, $storecfg, $drive) = @_;

    # try to convert filesystem paths to volume IDs

    my $already_normalized = $drive->{file} =~ m/^(cdrom|none)$/
        || $drive->{file} =~ m|^/dev/.+|
        || $drive->{file} =~ m/^([^:]+):(.+)$/
        || $drive->{file} =~ m/^\d+$/;

    if (!$already_normalized) {
        my ($vtype, $volid) = PVE::Storage::path_to_volume_id($storecfg, $drive->{file});
        if (!$vtype) {
            raise_param_exc({ $opt => "unable to associate path '$drive->{file}' to any storage"});
        }
        if (!$drive->{media} && $vtype eq 'iso') {
            $drive->{media} = 'cdrom';
        }
        verify_media_type($opt, $vtype, $drive->{media});
        $drive->{file} = $volid;
    }

    $drive->{media} = 'cdrom' if !$drive->{media} && $drive->{file} =~ m/^(cdrom|none)$/;
}
850
# Write a new configuration file for VM $vmid from the $settings hash.
# No locking is done here. Dies if the file already exists.
#
# Missing 'name' and 'memory' settings are filled in ("vm<vmid>" and the
# default memory size); note that this modifies the caller's hash. Keys
# that are not known configuration options are skipped.
sub create_conf_nolock {
    my ($vmid, $settings) = @_;

    my $filename = config_file($vmid);

    die "configuration file '$filename' already exists\n" if -f $filename;

    my $defaults = load_defaults();

    $settings->{name} = "vm$vmid" if !$settings->{name};
    $settings->{memory} = $defaults->{memory} if !$settings->{memory};

    my $data = '';
    # sorted, so that the generated file is deterministic
    foreach my $opt (sort keys %$settings) {
        next if !$confdesc->{$opt};

        my $value = $settings->{$opt};
        # Skip only unset or empty values. An explicit 0 is meaningful
        # (e.g. balloon=0, cpuunits=0, acpi=0) and must be written, else
        # the option silently falls back to its default.
        next if !defined($value) || $value eq '';

        $data .= "$opt: $value\n";
    }

    PVE::Tools::file_set_contents($filename, $data);
}
875
b3c2bdd1
DM
# Parse the value of the 'hotplug' option into a hash reference whose keys
# are the enabled features (network, disk, cpu, memory, usb).
# '0' yields an empty hash and '1' stands for the option's default list.
# Unknown feature names are skipped with a warning.
sub parse_hotplug_features {
    my ($data) = @_;

    my $res = {};

    if ($data ne '0') {
        my $list = $data eq '1' ? $confdesc->{hotplug}->{default} : $data;

        foreach my $feature (PVE::Tools::split_list($list)) {
            if ($feature !~ m/^(network|disk|cpu|memory|usb)$/) {
                warn "ignoring unknown hotplug feature '$feature'\n";
                next;
            }
            $res->{$feature} = 1;
        }
    }

    return $res;
}
894
895PVE::JSONSchema::register_format('pve-hotplug-features', \&pve_verify_hotplug_features);
# Format checker for 'pve-hotplug-features'.
# Returns $value when parse_hotplug_features() yields a true value; otherwise
# returns undef if $noerr is set, or dies.
# NOTE(review): parse_hotplug_features() in this file always returns a hash
# reference, so the failure path looks unreachable - confirm intent.
sub pve_verify_hotplug_features {
    my ($value, $noerr) = @_;

    if (parse_hotplug_features($value)) {
        return $value;
    }

    die "unable to parse hotplug option\n" if !$noerr;

    return undef;
}
905
f36ed4f4
DM
# Convert a size string (digits, optional fraction, optional K/M/G suffix
# with 1024-based multipliers) into an integer. Returns undef when the
# string does not have that form.
my $parse_size = sub {
    my ($value) = @_;

    return undef unless $value =~ m/^(\d+(\.\d+)?)([KMG])?$/;
    my ($number, $suffix) = ($1, $3);

    my %factor_for = (
        K => 1024,
        M => 1024 * 1024,
        G => 1024 * 1024 * 1024,
    );
    $number = $number * $factor_for{$suffix} if $suffix;

    # fractional results are truncated
    return int($number);
};
922
# Render an integer size with the largest of the suffixes K, M, G
# (1024-based) that divides it without remainder; values not divisible by
# 1024 are returned without suffix.
my $format_size = sub {
    my ($size) = @_;

    my $amount = int($size);
    my $suffix = '';

    foreach my $next_suffix (qw(K M G)) {
        my $scaled = int($amount / 1024);
        # stop as soon as the next larger unit would lose precision
        last if $scaled * 1024 != $amount;
        ($amount, $suffix) = ($scaled, $next_suffix);
    }

    return "$amount$suffix";
};
939
1e3baf05
DM
940# ideX = [volume=]volume-id[,media=d][,cyls=c,heads=h,secs=s[,trans=t]]
941# [,snapshot=on|off][,cache=on|off][,format=f][,backup=yes|no]
036e0e2b 942# [,rerror=ignore|report|stop][,werror=enospc|ignore|report|stop]
8d87f8aa 943# [,aio=native|threads][,discard=ignore|on]
1e3baf05
DM
944
# Parse a drive property string into a hash.
#
# $key  - option name such as 'ide0' (non-digits followed by an index), or
#         undef when the string is only being validated
# $data - comma separated "key=value" list; one bare value (without '=') is
#         accepted as the file/volume
#
# Returns the hash (interface, index, file, plus any given options) or undef
# on any syntax or consistency error. bps/bps_rd/bps_wr are converted to the
# corresponding mbps* key, 'size' is converted to an integer by $parse_size.
sub parse_drive {
    my ($key, $data) = @_;

    my $res = {};

    # $key may be undefined - used to verify JSON parameters
    if (!defined($key)) {
        $res->{interface} = 'unknown'; # should not harm when used to verify parameters
        $res->{index} = 0;
    } elsif ($key =~ m/^([^\d]+)(\d+)$/) {
        $res->{interface} = $1;
        $res->{index} = $2;
    } else {
        return undef;
    }

    foreach my $p (split (/,/, $data)) {
        next if $p =~ m/^\s*$/;

        if ($p =~ m/^(file|volume|cyls|heads|secs|trans|media|snapshot|cache|format|rerror|werror|backup|aio|bps|mbps|mbps_max|bps_rd|mbps_rd|mbps_rd_max|bps_wr|mbps_wr|mbps_wr_max|iops|iops_max|iops_rd|iops_rd_max|iops_wr|iops_wr_max|size|discard)=(.+)$/) {
            my ($k, $v) = ($1, $2);

            $k = 'file' if $k eq 'volume';

            if ($k eq 'bps' || $k eq 'bps_rd' || $k eq 'bps_wr') {
                # byte rates must be plain integers; the pattern is anchored at
                # both ends so trailing garbage never reaches the division
                return undef if !$v || $v !~ m/^\d+$/;
                $k = "m$k";
                $v = sprintf("%.3f", $v / (1024*1024));
            }

            # checked after the bps -> mbps rename, so 'bps=..' cannot
            # silently overwrite an earlier 'mbps=..'
            return undef if defined $res->{$k};

            $res->{$k} = $v;
        } else {
            # a single bare value is taken as the file name
            if (!$res->{file} && $p !~ m/=/) {
                $res->{file} = $p;
            } else {
                return undef;
            }
        }
    }

    return undef if !$res->{file};

    # a known image extension on the file name determines the format
    if ($res->{file} =~ m/\.(raw|cow|qcow|qcow2|vmdk|cloop)$/) {
        $res->{format} = $1;
    }

    # allowed values per option; options with a false value are not checked
    my $integer = qr/^\d+$/;
    my $decimal = qr/^\d+(\.\d+)?$/;
    my %valid_value = (
        cache => qr/^(off|none|writethrough|writeback|unsafe|directsync)$/,
        snapshot => qr/^(on|off)$/,
        cyls => $integer,
        heads => $integer,
        secs => $integer,
        media => qr/^(disk|cdrom)$/,
        trans => qr/^(none|lba|auto)$/,
        format => qr/^(raw|cow|qcow|qcow2|vmdk|cloop)$/,
        rerror => qr/^(ignore|report|stop)$/,
        werror => qr/^(enospc|ignore|report|stop)$/,
        backup => qr/^(yes|no)$/,
        aio => qr/^(native|threads)$/,
        discard => qr/^(ignore|on)$/,
        mbps => $decimal,
        mbps_max => $decimal,
        mbps_rd => $decimal,
        mbps_rd_max => $decimal,
        mbps_wr => $decimal,
        mbps_wr_max => $decimal,
        iops => $integer,
        iops_max => $integer,
        iops_rd => $integer,
        iops_rd_max => $integer,
        iops_wr => $integer,
        iops_wr_max => $integer,
    );
    foreach my $opt (keys %valid_value) {
        return undef if $res->{$opt} && $res->{$opt} !~ $valid_value{$opt};
    }

    # a total limit excludes the separate read/write limits
    return undef if $res->{mbps_rd} && $res->{mbps};
    return undef if $res->{mbps_wr} && $res->{mbps};
    return undef if $res->{iops_rd} && $res->{iops};
    return undef if $res->{iops_wr} && $res->{iops};

    if ($res->{size}) {
        return undef if !defined($res->{size} = &$parse_size($res->{size}));
    }

    if ($res->{media} && ($res->{media} eq 'cdrom')) {
        return undef if $res->{snapshot} || $res->{trans} || $res->{format};
        return undef if $res->{heads} || $res->{secs} || $res->{cyls};
        return undef if $res->{interface} eq 'virtio';
    }

    # rerror does not work with scsi drives
    if ($res->{rerror}) {
        return undef if $res->{interface} eq 'scsi';
    }

    return $res;
}
1046
74edd76b 1047my @qemu_drive_options = qw(heads secs cyls trans media format cache snapshot rerror werror aio discard iops iops_rd iops_wr iops_max iops_rd_max iops_wr_max);
1e3baf05
DM
1048
# Serialize a drive hash back into its property string:
# "<file>[,<option>=<value>...][,size=<formatted size>]".
# Only options with a true value are emitted.
sub print_drive {
    my ($vmid, $drive) = @_;

    my @throttle_opts = qw(mbps mbps_rd mbps_wr mbps_max mbps_rd_max mbps_wr_max);

    my $text = "$drive->{file}";
    for my $name (@qemu_drive_options, @throttle_opts, 'backup') {
        my $val = $drive->{$name};
        $text .= ",$name=$val" if $val;
    }

    $text .= ",size=" . &$format_size($drive->{size}) if $drive->{size};

    return $text;
}
1063
28ef82d3
DM
# Query a device through the SG ioctl interface and return a hash with
# vendor, product, revision, removable and type.
#
# $fh    - open file handle of the device
# $noerr - when true, return undef on any failure instead of dying
#
# The request sent is the 6-byte command built below (opcode 0x12,
# allocation length 36); the 36-byte reply is decoded at the end.
sub scsi_inquiry {
    my($fh, $noerr) = @_;

    my $SG_IO = 0x2285;
    my $SG_GET_VERSION_NUM = 0x2282;

    my $versionbuf = "\x00" x 8;
    my $ret = ioctl($fh, $SG_GET_VERSION_NUM, $versionbuf);
    if (!$ret) {
        die "scsi ioctl SG_GET_VERSION_NUM failed - $!\n" if !$noerr;
        return undef;
    }
    my $version = unpack("I", $versionbuf);
    if ($version < 30000) {
        die "scsi generic interface too old\n" if !$noerr;
        return undef;
    }

    my $buf = "\x00" x 36;
    my $sensebuf = "\x00" x 8;
    my $cmd = pack("C x3 C x1", 0x12, 36);

    # see /usr/include/scsi/sg.h
    my $sg_io_hdr_t = "i i C C s I P P P I I i P C C C C S S i I I";

    # header fields in template order: interface id 'S', direction -3
    # (presumably SG_DXFER_FROM_DEV - confirm against sg.h), command and
    # sense buffer lengths, iovec count 0, data length and pointer, command
    # and sense pointers, and 6000 as timeout
    my $packet = pack($sg_io_hdr_t, ord('S'), -3, length($cmd),
                      length($sensebuf), 0, length($buf), $buf,
                      $cmd, $sensebuf, 6000);

    $ret = ioctl($fh, $SG_IO, $packet);
    if (!$ret) {
        die "scsi ioctl SG_IO failed - $!\n" if !$noerr;
        return undef;
    }

    # fields 17 and 18 of the template are the two 'S' (unsigned short)
    # entries - host and driver status per sg.h; any non-zero value is an error
    my @res = unpack($sg_io_hdr_t, $packet);
    if ($res[17] || $res[18]) {
        die "scsi ioctl SG_IO status error - $!\n" if !$noerr;
        return undef;
    }

    my $res = {};
    (my $byte0, my $byte1, $res->{vendor},
     $res->{product}, $res->{revision}) = unpack("C C x6 A8 A16 A4", $buf);

    # bit 7 of the second byte flags removable media, the low five bits of
    # the first byte hold the device type
    $res->{removable} = $byte1 & 128 ? 1 : 0;
    $res->{type} = $byte0 & 31;

    return $res;
}
1114
# Open $path read/write and run scsi_inquiry() on it without raising errors.
# Returns the inquiry hash, or undef when the path cannot be opened or the
# inquiry fails.
sub path_is_scsi {
    my ($path) = @_;

    # the mode is passed as a separate argument so the path is used verbatim
    # and never parsed for mode characters or surrounding whitespace
    my $fh = IO::File->new($path, '+<') || return undef;
    my $res = scsi_inquiry($fh, 1);
    close($fh);

    return $res;
}
1124
db656e5f
DM
# Return 1 when the configured machine type contains 'q35', else 0.
sub machine_type_is_q35 {
    my ($conf) = @_;

    my $machine = $conf->{machine};
    return 0 if !$machine;

    return ($machine =~ m/q35/) ? 1 : 0;
}
1130
# Build the device string of the USB tablet; the bus depends on whether the
# machine type is q35.
sub print_tabletdevice_full {
    my ($conf) = @_;

    # we use uhci for old VMs because tablet driver was buggy in older qemu
    my $usbbus = machine_type_is_q35($conf) ? 'ehci' : 'uhci';

    return sprintf("usb-tablet,id=tablet,bus=%s.0,port=1", $usbbus);
}
1141
# Build the device string for one drive, depending on its interface
# (virtio, scsi, ide or sata). Dies for 'usb' and unknown interfaces.
# A ",bootindex=N" suffix is appended when the drive has a boot index.
sub print_drivedevice_full {
    my ($storecfg, $conf, $vmid, $drive, $bridges) = @_;

    my $iface = $drive->{interface};
    my $index = $drive->{index};
    my $id = "$iface$index";

    # every variant ends with the same drive reference and device id
    my $ref = "drive=drive-$id,id=$id";

    my $device = '';

    if ($iface eq 'virtio') {
        my $pciaddr = print_pci_addr($id, $bridges);
        $device = "virtio-blk-pci,$ref$pciaddr";
        $device .= ",iothread=iothread0" if $conf->{iothread};
    } elsif ($iface eq 'scsi') {
        # an lsi controller (also used when scsihw is unset) takes 7 units,
        # any other controller type 256
        my $is_lsi = !$conf->{scsihw} || ($conf->{scsihw} =~ m/^lsi/);
        my $maxdev = $is_lsi ? 7 : 256;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;

        my $devicetype = 'hd';
        if (drive_is_cdrom($drive)) {
            $devicetype = 'cd';
        } else {
            my $path = ($drive->{file} =~ m|^/|)
                ? $drive->{file}
                : PVE::Storage::path($storecfg, $drive->{file});

            if ($path =~ m/^iscsi\:\/\//) {
                $devicetype = 'generic';
            } elsif (my $info = path_is_scsi($path)) {
                if ($info->{type} == 0) {
                    $devicetype = 'block';
                } elsif ($info->{type} == 1) { # tape
                    $devicetype = 'generic';
                }
            }
        }

        if ($is_lsi) {
            $device = "scsi-$devicetype,bus=scsihw$controller.0,scsi-id=$unit,$ref";
        } else {
            $device = "scsi-$devicetype,bus=scsihw$controller.0,channel=0,scsi-id=0,lun=$index,$ref";
        }
    } elsif ($iface eq 'ide') {
        my $maxdev = 2;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;
        my $devicetype = ($drive->{media} && $drive->{media} eq 'cdrom') ? "cd" : "hd";

        $device = "ide-$devicetype,bus=ide.$controller,unit=$unit,$ref";
    } elsif ($iface eq 'sata') {
        my $controller = int($index / $MAX_SATA_DISKS);
        my $unit = $index % $MAX_SATA_DISKS;
        $device = "ide-drive,bus=ahci$controller.$unit,$ref";
    } elsif ($iface eq 'usb') {
        die "implement me";
        # -device ide-drive,bus=ide.1,unit=0,drive=drive-ide0-1-0,id=ide0-1-0
    } else {
        die "unsupported interface type";
    }

    $device .= ",bootindex=$drive->{bootindex}" if $drive->{bootindex};

    return $device;
}
1208
# Read the first InitiatorName entry from /etc/iscsi/initiatorname.iscsi.
# Returns undef when the file cannot be opened or has no such entry.
sub get_initiator_name {
    my $fh = IO::File->new('/etc/iscsi/initiatorname.iscsi');
    return undef if !$fh;

    my $initiator;
    while (defined(my $line = <$fh>)) {
        if ($line =~ m/^\s*InitiatorName\s*=\s*([\.\-:\w]+)/) {
            $initiator = $1;
            last;
        }
    }
    $fh->close();

    return $initiator;
}
1222
1e3baf05
DM
# Build the "[file=<path>,]if=none,id=drive-<iface><index>,<options>"
# string for one drive.
sub print_drive_full {
    my ($storecfg, $vmid, $drive) = @_;

    my @settings;

    foreach my $name (@qemu_drive_options) {
        next if $name eq 'bootindex';
        push @settings, "$name=$drive->{$name}" if $drive->{$name};
    }

    # the mbps* values are stored in MB/s and emitted as bytes per second
    foreach my $name (qw(bps bps_rd bps_wr)) {
        my $mbytes = $drive->{"m$name"};
        push @settings, "$name=" . int($mbytes*1024*1024) if $mbytes;
    }

    # use linux-aio by default (qemu default is threads)
    push @settings, "aio=native" if !$drive->{aio};

    my $is_cdrom = drive_is_cdrom($drive);
    my $volid = $drive->{file};

    my $path;
    if ($is_cdrom) {
        $path = get_iso_path($storecfg, $vmid, $volid);
    } elsif ($volid =~ m|^/|) {
        $path = $volid;
    } else {
        $path = PVE::Storage::path($storecfg, $volid);
    }

    # the cache default and zero detection apply to non-cdrom drives only
    if (!$is_cdrom) {
        push @settings, "cache=none" if !$drive->{cache};
        push @settings, "detect-zeroes=" . ($drive->{discard} ? "unmap" : "on");
    }

    my $opts = join('', map { ",$_" } @settings);
    my $pathinfo = $path ? "file=$path," : '';

    return "${pathinfo}if=none,id=drive-$drive->{interface}$drive->{index}$opts";
}
1261
# Build the device string for one network card.
#
# $net     - parsed network hash (model, macaddr, queues, bootindex)
# $netid   - device id, also used to look up the PCI address
# $bridges - passed through to print_pci_addr()
# $vmid and $conf are accepted for interface compatibility but not used.
sub print_netdevice_full {
    my ($vmid, $conf, $net, $netid, $bridges) = @_;

    # the 'virtio' model is spelled 'virtio-net-pci' as device name
    my $device = $net->{model};
    if ($net->{model} eq 'virtio') {
        $device = 'virtio-net-pci';
    }

    my $pciaddr = print_pci_addr("$netid", $bridges);
    my $tmpstr = "$device,mac=$net->{macaddr},netdev=$netid$pciaddr,id=$netid";
    if ($net->{queues} && $net->{queues} > 1 && $net->{model} eq 'virtio') {
        # Consider we have N queues, the number of vectors needed is 2*N + 2
        # (plus one config interrupt and control vq)
        my $vectors = $net->{queues} * 2 + 2;
        $tmpstr .= ",vectors=$vectors,mq=on";
    }
    $tmpstr .= ",bootindex=$net->{bootindex}" if $net->{bootindex};

    return $tmpstr;
}
1282
# Build the netdev string for one network card: a tap device when the card
# is attached to a bridge, user mode networking otherwise.
#
# Dies when $netid is not of the form 'net<N>', when N is not below
# $MAX_NETS, or when the resulting interface name is too long.
sub print_netdev_full {
    my ($vmid, $conf, $net, $netid) = @_;

    # reject malformed ids up front instead of building an interface name
    # without index
    die "got strange net id '$netid'\n" if $netid !~ m/^net(\d+)$/;
    my $i = int($1);

    die "got strange net id '$i'\n" if $i >= ${MAX_NETS};

    my $ifname = "tap${vmid}i$i";

    # kvm uses TUNSETIFF ioctl, and that limits ifname length
    die "interface name '$ifname' is too long (max 15 character)\n"
        if length($ifname) >= 16;

    my $vhostparam = '';
    $vhostparam = ',vhost=on' if $kernel_has_vhost_net && $net->{model} eq 'virtio';

    my $vmname = $conf->{name} || "vm$vmid";

    my $netdev = "";

    if ($net->{bridge}) {
        $netdev = "type=tap,id=$netid,ifname=${ifname},script=/var/lib/qemu-server/pve-bridge,downscript=/var/lib/qemu-server/pve-bridgedown$vhostparam";
    } else {
        $netdev = "type=user,id=$netid,hostname=$vmname";
    }

    # multiple queues are only passed on for virtio cards
    $netdev .= ",queues=$net->{queues}" if ($net->{queues} && $net->{model} eq 'virtio');

    return $netdev;
}
1e3baf05
DM
1316
# True when $drive is set and its media is 'cdrom'; otherwise returns the
# first false value met ($drive itself, its media, or the failed comparison).
sub drive_is_cdrom {
    my ($drive) = @_;

    return $drive if !$drive;

    my $media = $drive->{media};
    return $media if !$media;

    return ($media eq 'cdrom');
}
1323
2ed5d572
AD
# Parse a numa property string ("memory=..,policy=..,cpus=a[-b],
# hostnodes=a[-b]") into a hash. cpus and hostnodes become
# { start => a, end => b } with end undef for a single value.
# Returns undef on any unknown or malformed entry.
sub parse_numa {
    my ($data) = @_;

    my $numa = {};

    for my $entry (split(/,/, $data)) {
        if (my ($memory) = $entry =~ m/^memory=(\S+)$/) {
            $numa->{memory} = $memory;
        } elsif (my ($policy) = $entry =~ m/^policy=(preferred|bind|interleave)$/) {
            $numa->{policy} = $policy;
        } elsif (my ($cpu_first, undef, $cpu_last) = $entry =~ m/^cpus=(\d+)(-(\d+))?$/) {
            $numa->{cpus}->{start} = $cpu_first;
            $numa->{cpus}->{end} = $cpu_last;
        } elsif (my ($node_first, undef, $node_last) = $entry =~ m/^hostnodes=(\d+)(-(\d+))?$/) {
            $numa->{hostnodes}->{start} = $node_first;
            $numa->{hostnodes}->{end} = $node_last;
        } else {
            return undef;
        }
    }

    return $numa;
}
1348
040b06b7
DA
# Parse a hostpci property string into a hash (pciid, driver, rombar,
# x-vga, pcie). Returns undef for an empty value or when no PCI id was
# given. Unknown settings are reported with a warning and skipped.
sub parse_hostpci {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};
    my $found;

    foreach my $kv (split(/,/, $value)) {
        if ($kv =~ m/^(host=)?([a-f0-9]{2}:[a-f0-9]{2})(\.([a-f0-9]))?$/) {
            my ($id, $function) = ($2, $4);
            $found = 1;

            if (defined($function)) {
                # explicit function: add exactly this device
                push @{$res->{pciid}}, { id => $id , function => $function};
            } else {
                # no function given: take whatever lspci() lists for the id
                my $pcidevices = lspci($id);
                $res->{pciid} = $pcidevices->{$id};
            }
        } elsif ($kv =~ m/^driver=(kvm|vfio)$/) {
            $res->{driver} = $1;
        } elsif ($kv =~ m/^rombar=(on|off)$/) {
            $res->{rombar} = $1;
        } elsif ($kv =~ m/^x-vga=(on|off)$/) {
            $res->{'x-vga'} = $1;
        } elsif ($kv =~ m/^pcie=(\d+)$/) {
            $res->{pcie} = 1 if $1 == 1;
        } else {
            warn "unknown hostpci setting '$kv'\n";
        }
    }

    return undef if !$found;

    return $res;
}
1387
1e3baf05
DM
1388# netX: e1000=XX:XX:XX:XX:XX:XX,bridge=vmbr0,rate=<mbps>
# Parse a network property string into a hash (model, macaddr, bridge,
# queues, rate, tag, firewall, link_down). A model without MAC address gets
# one from PVE::Tools::random_ether_addr(). Returns undef on any unknown
# entry or when no model was given.
sub parse_net {
    my ($data) = @_;

    # value patterns of the plain "key=value" settings
    my %value_re_for = (
        bridge => qr/\S+/,
        queues => qr/\d+/,
        rate => qr/\d+(?:\.\d+)?/,
        tag => qr/\d+/,
        firewall => qr/[01]/,
        link_down => qr/[01]/,
    );

    my $res = {};

    ENTRY: foreach my $kvp (split(/,/, $data)) {

        if ($kvp =~ m/^(ne2k_pci|e1000|e1000-82540em|e1000-82544gc|e1000-82545em|rtl8139|pcnet|virtio|ne2k_isa|i82551|i82557b|i82559er|vmxnet3)(=([0-9a-f]{2}(:[0-9a-f]{2}){5}))?$/i) {
            my ($model, $mac) = ($1, $3);
            $res->{model} = lc($model);
            $res->{macaddr} = defined($mac) ? uc($mac) : PVE::Tools::random_ether_addr();
            next ENTRY;
        }

        foreach my $name (keys %value_re_for) {
            my $value_re = $value_re_for{$name};
            if ($kvp =~ m/^$name=($value_re)$/) {
                $res->{$name} = $1;
                next ENTRY;
            }
        }

        # neither a model nor a known setting
        return undef;
    }

    return undef if !$res->{model};

    return $res;
}
1423
# Serialize a network hash back into its property string:
# "<model>[=<mac>][,bridge=..][,rate=..][,tag=..][,firewall=1]
# [,link_down=1][,queues=..]". Only true values are emitted.
sub print_net {
    my $net = shift;

    my $head = "$net->{model}";
    $head .= "=$net->{macaddr}" if $net->{macaddr};

    my @fields = ($head);
    foreach my $name (qw(bridge rate tag)) {
        push @fields, "$name=$net->{$name}" if $net->{$name};
    }
    # the two flags are always written as 1
    push @fields, "firewall=1" if $net->{firewall};
    push @fields, "link_down=1" if $net->{link_down};
    push @fields, "queues=$net->{queues}" if $net->{queues};

    return join(',', @fields);
}
1438
# Re-serialize every parsable 'net<N>' entry of $settings in place, so the
# stored string carries whatever MAC address parse_net() returned.
sub add_random_macs {
    my ($settings) = @_;

    for my $opt (keys %$settings) {
        next unless $opt =~ m/^net(\d+)$/;

        if (my $net = parse_net($settings->{$opt})) {
            $settings->{$opt} = print_net($net);
        }
    }
}
1449
# Record $volid under the lowest free 'unused<N>' key of $config.
# Returns the key used, or nothing when the volume is already listed.
# Dies when all $MAX_UNUSED_DISKS slots are taken.
sub add_unused_volume {
    my ($config, $volid) = @_;

    my $key;
    # scan from the highest index down, so $key ends up as the lowest free
    # slot and every slot is checked for a duplicate
    foreach my $ind (reverse(0 .. $MAX_UNUSED_DISKS - 1)) {
        my $test = "unused$ind";
        if (my $vid = $config->{$test}) {
            return if $vid eq $volid; # do not add duplicates
        } else {
            $key = $test;
        }
    }

    die "Too many unused volumes - please delete them first.\n" if !$key;

    $config->{$key} = $volid;

    return $key;
}
1469
055d554d
DM
# Return 1 when the storage layer reports $vmid as owner of $volid.
# Absolute paths and lookup errors yield undef.
sub vm_is_volid_owner {
    my ($storecfg, $vmid, $volid) = @_;

    # absolute paths are never looked up
    return undef if $volid =~ m|^/|;

    my ($path, $owner);
    # lookup errors are ignored here
    eval { ($path, $owner) = PVE::Storage::path($storecfg, $volid); };

    return 1 if $owner && ($owner == $vmid);

    return undef;
}
1483
# Mark option $key for deletion: drop any pending value for it and add it
# to the comma separated pending 'delete' list (without duplicates).
sub vmconfig_delete_pending_option {
    my ($conf, $key) = @_;

    delete $conf->{pending}->{$key};
    my $pending_delete_hash = { $key => 1 };
    foreach my $opt (PVE::Tools::split_list($conf->{pending}->{delete})) {
        $pending_delete_hash->{$opt} = 1;
    }
    # sorted, so the stored list does not depend on hash ordering
    $conf->{pending}->{delete} = join(',', sort keys %$pending_delete_hash);
}
1494
# Remove option $key from the pending 'delete' list; the list entry itself
# is removed once it becomes empty.
sub vmconfig_undelete_pending_option {
    my ($conf, $key) = @_;

    my $pending_delete_hash = {};
    foreach my $opt (PVE::Tools::split_list($conf->{pending}->{delete})) {
        $pending_delete_hash->{$opt} = 1;
    }
    delete $pending_delete_hash->{$key};

    # sorted, so the stored list does not depend on hash ordering
    my @keylist = sort keys %$pending_delete_hash;
    if (scalar(@keylist)) {
        $conf->{pending}->{delete} = join(',', @keylist);
    } else {
        delete $conf->{pending}->{delete};
    }
}
1511
# Add the volume of a non-cdrom drive to the unused list of $conf, but only
# when vm_is_volid_owner() reports $vmid as its owner.
sub vmconfig_register_unused_drive {
    my ($storecfg, $vmid, $conf, $drive) = @_;

    if (!drive_is_cdrom($drive)) {
        my $volid = $drive->{file};
        if (vm_is_volid_owner($storecfg, $vmid, $volid)) {
            # add_unused_volume() takes only the config and the volume id
            add_unused_volume($conf, $volid);
        }
    }
}
1522
c750e90a
DM
# Drop pending entries that would not change anything: pending values equal
# to the current value, and pending deletes of options that are not set.
# Returns 1 when something was removed, undef otherwise.
sub vmconfig_cleanup_pending {
    my ($conf) = @_;

    # remove pending changes when nothing changed
    my $changes;
    foreach my $opt (keys %{$conf->{pending}}) {
        if (defined($conf->{$opt}) && ($conf->{pending}->{$opt} eq $conf->{$opt})) {
            $changes = 1;
            delete $conf->{pending}->{$opt};
        }
    }

    # remove delete if option is not set
    my $pending_delete_hash = {};
    foreach my $opt (PVE::Tools::split_list($conf->{pending}->{delete})) {
        if (defined($conf->{$opt})) {
            $pending_delete_hash->{$opt} = 1;
        } else {
            $changes = 1;
        }
    }

    # sorted, so the stored list does not depend on hash ordering
    my @keylist = sort keys %$pending_delete_hash;
    if (scalar(@keylist)) {
        $conf->{pending}->{delete} = join(',', @keylist);
    } else {
        delete $conf->{pending}->{delete};
    }

    return $changes;
}
1554
2796e7d5
DM
# Allowed smbios (type 1) keys, each with the pattern its value must match
# in full.
my $valid_smbios1_options = {
    manufacturer => '\S+',
    product => '\S+',
    version => '\S+',
    serial => '\S+',
    uuid => '[a-fA-F0-9]{8}(?:-[a-fA-F0-9]{4}){3}-[a-fA-F0-9]{12}',
    sku => '\S+',
    family => '\S+',
};

# smbios: [manufacturer=str][,product=str][,version=str][,serial=str][,uuid=uuid][,sku=str][,family=str]
#
# Parse the property string into a hash of the keys listed above.
# Returns undef on an unknown key or a value not matching its pattern.
sub parse_smbios1 {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        return undef if $kvp !~ m/^(\S+)=(.+)$/;
        # split at the first '=' only, so a value may itself contain '='
        # without being silently truncated
        my ($k, $v) = split(/=/, $kvp, 2);
        return undef if !defined($k) || !defined($v);
        return undef if !$valid_smbios1_options->{$k};
        return undef if $v !~ m/^$valid_smbios1_options->{$k}$/;
        $res->{$k} = $v;
    }

    return $res;
}
1582
cd11416f
DM
# Serialize a smbios1 hash as comma separated "key=value" pairs; undefined
# values and keys missing from $valid_smbios1_options are left out.
sub print_smbios1 {
    my ($smbios1) = @_;

    my @pairs =
        map { "$_=$smbios1->{$_}" }
        grep { defined($smbios1->{$_}) && $valid_smbios1_options->{$_} }
        keys %$smbios1;

    return join(',', @pairs);
}
1595
2796e7d5
DM
1596PVE::JSONSchema::register_format('pve-qm-smbios1', \&verify_smbios1);
# Format checker: returns $value when parse_smbios1() accepts it; otherwise
# returns undef if $noerr is set, or dies.
sub verify_smbios1 {
    my ($value, $noerr) = @_;

    my $parsed = parse_smbios1($value);
    return $value if $parsed;

    die "unable to parse smbios (type 1) options\n" if !$noerr;

    return undef;
}
1606
1e3baf05
DM
1607PVE::JSONSchema::register_format('pve-qm-bootdisk', \&verify_bootdisk);
# Format checker: returns $value when valid_drivename() accepts it;
# otherwise returns undef if $noerr is set, or dies.
sub verify_bootdisk {
    my ($value, $noerr) = @_;

    if (valid_drivename($value)) {
        return $value;
    }

    die "invalid boot disk '$value'\n" if !$noerr;

    return undef;
}
1617
2ed5d572
AD
1618PVE::JSONSchema::register_format('pve-qm-numanode', \&verify_numa);
# Format checker: returns $value when parse_numa() accepts it; otherwise
# returns undef if $noerr is set, or dies.
sub verify_numa {
    my ($value, $noerr) = @_;

    my $parsed = parse_numa($value);
    return $value if $parsed;

    die "unable to parse numa options\n" if !$noerr;

    return undef;
}
1628
1e3baf05
DM
1629PVE::JSONSchema::register_format('pve-qm-net', \&verify_net);
# Format checker: returns $value when parse_net() accepts it; otherwise
# returns undef if $noerr is set, or dies.
sub verify_net {
    my ($value, $noerr) = @_;

    my $parsed = parse_net($value);
    return $value if $parsed;

    die "unable to parse network options\n" if !$noerr;

    return undef;
}
1639
1640PVE::JSONSchema::register_format('pve-qm-drive', \&verify_drive);
# Format checker: returns $value when parse_drive() accepts it (called
# without an option name); otherwise returns undef if $noerr is set, or dies.
sub verify_drive {
    my ($value, $noerr) = @_;

    my $parsed = parse_drive(undef, $value);
    return $value if $parsed;

    die "unable to parse drive options\n" if !$noerr;

    return undef;
}
1650
1651PVE::JSONSchema::register_format('pve-qm-hostpci', \&verify_hostpci);
# Format checker: returns $value when parse_hostpci() accepts it; otherwise
# returns undef if $noerr is set, or dies.
sub verify_hostpci {
    my ($value, $noerr) = @_;

    my $parsed = parse_hostpci($value);
    return $value if $parsed;

    die "unable to parse pci id\n" if !$noerr;

    return undef;
}
1661
0ea9541d
DM
1662PVE::JSONSchema::register_format('pve-qm-watchdog', \&verify_watchdog);
# Format checker: returns $value when parse_watchdog() accepts it; otherwise
# returns undef if $noerr is set, or dies.
sub verify_watchdog {
    my ($value, $noerr) = @_;

    my $parsed = parse_watchdog($value);
    return $value if $parsed;

    die "unable to parse watchdog options\n" if !$noerr;

    return undef;
}
1672
# Parse a watchdog property string ("[model=]<model>[,[action=]<action>]")
# into a hash with the keys model and action. Returns undef for an empty
# value or an unknown entry.
sub parse_watchdog {
    my ($value) = @_;

    return undef if !$value;

    my $watchdog = {};

    for my $part (split(/,/, $value)) {
        next if $part =~ m/^\s*$/;

        if (my (undef, $model) = $part =~ m/^(model=)?(i6300esb|ib700)$/) {
            $watchdog->{model} = $model;
        } elsif (my (undef, $action) = $part =~ m/^(action=)?(reset|shutdown|poweroff|pause|debug|none)$/) {
            $watchdog->{action} = $action;
        } else {
            return undef;
        }
    }

    return $watchdog;
}
1694
59411c4e
DM
1695PVE::JSONSchema::register_format('pve-qm-startup', \&verify_startup);
# Format checker: returns $value when parse_startup() accepts it; otherwise
# returns undef if $noerr is set, or dies.
sub verify_startup {
    my ($value, $noerr) = @_;

    my $parsed = parse_startup($value);
    return $value if $parsed;

    die "unable to parse startup options\n" if !$noerr;

    return undef;
}
1705
# Parse a startup property string ("[order=]N[,up=N][,down=N]") into a hash
# with the keys order, up and down. Returns undef for an empty value or an
# unknown entry.
sub parse_startup {
    my ($value) = @_;

    return undef if !$value;

    my $startup = {};

    for my $part (split(/,/, $value)) {
        next if $part =~ m/^\s*$/;

        if (my (undef, $order) = $part =~ m/^(order=)?(\d+)$/) {
            $startup->{order} = $order;
        } elsif (my ($up) = $part =~ m/^up=(\d+)$/) {
            $startup->{up} = $up;
        } elsif (my ($down) = $part =~ m/^down=(\d+)$/) {
            $startup->{down} = $down;
        } else {
            return undef;
        }
    }

    return $startup;
}
1729
1e3baf05
DM
# Parse a usb property string into a hash. Accepted entries:
#   host=[0x]VVVV:[0x]PPPP  -> vendorid, productid
#   host=<bus>-<port[.port...]> -> hostbus, hostport
#   spice                   -> spice
# Returns undef for an empty value, an unknown entry, or when no entry was
# found at all.
sub parse_usb_device {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};
    my $found;

    foreach my $v (split(/,/, $value)) {
        if ($v =~ m/^host=(0x)?([0-9A-Fa-f]{4}):(0x)?([0-9A-Fa-f]{4})$/) {
            @$res{qw(vendorid productid)} = ($2, $4);
        } elsif ($v =~ m/^host=(\d+)\-(\d+(\.\d+)*)$/) {
            @$res{qw(hostbus hostport)} = ($1, $2);
        } elsif ($v =~ m/^spice$/) {
            $res->{spice} = 1;
        } else {
            return undef;
        }
        # reached only after one of the accepted forms matched
        $found = 1;
    }

    return undef if !$found;

    return $res;
}
19672434 1759
1e3baf05
DM
1760PVE::JSONSchema::register_format('pve-qm-usb-device', \&verify_usb_device);
# Format checker: returns $value when parse_usb_device() accepts it;
# otherwise returns undef if $noerr is set, or dies.
sub verify_usb_device {
    my ($value, $noerr) = @_;

    my $parsed = parse_usb_device($value);
    return $value if $parsed;

    die "unable to parse usb device\n" if !$noerr;

    return undef;
}
1770
1e3baf05
DM
1771# add JSON properties for create and set function
# Copy every entry of $confdesc except 'parent', 'snaptime' and 'vmstate'
# into the given property hash and return that hash.
sub json_config_properties {
    my $prop = shift;

    my %skipped = map { $_ => 1 } qw(parent snaptime vmstate);

    for my $opt (grep { !$skipped{$_} } keys %$confdesc) {
        $prop->{$opt} = $confdesc->{$opt};
    }

    return $prop;
}
1782
# Check $value against the type that $confdesc declares for $key and return
# the normalized value (1/0 for booleans, int() for integers, the string
# with one pair of surrounding double quotes removed for plain strings).
# Dies on unknown keys, undefined values, embedded line breaks and type
# mismatches.
sub check_type {
    my ($key, $value) = @_;

    die "unknown setting '$key'\n" if !$confdesc->{$key};

    my $type = $confdesc->{$key}->{type};

    die "got undefined value\n" if !defined($value);

    die "property contains a line feed\n" if $value =~ m/[\n\r]/;

    if ($type eq 'boolean') {
        return 1 if ($value eq '1') || ($value =~ m/^(on|yes|true)$/i);
        return 0 if ($value eq '0') || ($value =~ m/^(off|no|false)$/i);
        die "type check ('boolean') failed - got '$value'\n";
    }

    if ($type eq 'integer') {
        return int($1) if $value =~ m/^(\d+)$/;
        die "type check ('integer') failed - got '$value'\n";
    }

    if ($type eq 'number') {
        return $value if $value =~ m/^(\d+)(\.\d+)?$/;
        die "type check ('number') failed - got '$value'\n";
    }

    if ($type eq 'string') {
        my $fmt = $confdesc->{$key}->{format};

        if (!$fmt) {
            $value =~ s/^\"(.*)\"$/$1/;
            return $value;
        }

        if ($fmt eq 'pve-qm-drive') {
            # special case - we need to pass $key to parse_drive()
            my $drive = parse_drive($key, $value);
            return $value if $drive;
            die "unable to parse drive options\n";
        }

        PVE::JSONSchema::check_format($fmt, $value);
        return $value;
    }

    die "internal error"
}
1825
191435c6
DM
# Run $code (with @param) under the lock file of $vmid, via lock_file()
# with the given $timeout. Re-raises any error left in $@ and returns the
# result of lock_file().
sub lock_config_full {
    my ($vmid, $timeout, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);

    my $result = lock_file($lockfile, $timeout, $code, @param);
    if ($@) {
        die $@;
    }

    return $result;
}
1837
4e4f83fe
DM
# Like lock_config_full(), but goes through lock_file_full() and passes the
# $shared flag on to it.
sub lock_config_mode {
    my ($vmid, $timeout, $shared, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);

    my $result = lock_file_full($lockfile, $timeout, $shared, $code, @param);
    if ($@) {
        die $@;
    }

    return $result;
}
1849
191435c6
DM
# Run $code under the configuration lock of $vmid, with a timeout of 10.
sub lock_config {
    my ($vmid, $code, @param) = @_;

    my $timeout = 10;

    return lock_config_full($vmid, $timeout, $code, @param);
}
1855
# Return the path "nodes/<node>/qemu-server/<vmid>.conf"; $nodename is used
# when no $node is given.
sub cfs_config_path {
    my ($vmid, $node) = @_;

    $node ||= $nodename;

    return "nodes/$node/qemu-server/$vmid.conf";
}
1862
040b06b7
DA
# Placeholder that always reports IOMMU support (returns 1).
sub check_iommu_support {
    #fixme : need to check IOMMU support
    #http://www.linux-kvm.org/page/How_to_assign_devices_with_VT-d_in_KVM

    return 1;
}
1871
# Return the configuration file path of $vmid: "/etc/pve/" followed by the
# result of cfs_config_path().
sub config_file {
    my ($vmid, $node) = @_;

    return "/etc/pve/" . cfs_config_path($vmid, $node);
}
1878
# Return the lock file path of $vmid below $lock_dir.
sub config_file_lock {
    my ($vmid) = @_;

    return join('/', $lock_dir, "lock-$vmid.conf");
}
1884
# Set access and modification time of the configuration file of $vmid to
# the current time.
sub touch_config {
    my ($vmid) = @_;

    my $path = config_file($vmid);

    return utime(undef, undef, $path);
}
1891
# Destroy the VM $vmid: free all volumes owned by it, then remove the
# configuration file (or replace it with a minimal one when
# $keep_empty_config is set), and finally free any volume the storage layer
# still lists for this VM.
sub destroy_vm {
    my ($storecfg, $vmid, $keep_empty_config) = @_;

    my $conffile = config_file($vmid);

    my $conf = load_config($vmid);

    check_lock($conf);

    # only remove disks owned by this VM
    my $free_owned_volume = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};

        # nothing to free for empty entries and absolute paths
        return if !$volid || $volid =~ m|^/|;

        my ($path, $owner) = PVE::Storage::path($storecfg, $volid);
        return unless $path && $owner && ($owner == $vmid);

        PVE::Storage::vdisk_free($storecfg, $volid);
    };
    foreach_drive($conf, $free_owned_volume);

    if (!$keep_empty_config) {
        unlink $conffile;
    } else {
        PVE::Tools::file_set_contents($conffile, "memory: 128\n");
    }

    # also remove unused disk
    eval {
        my $dl = PVE::Storage::vdisk_list($storecfg, undef, $vmid);

        # errors while freeing are only reported, never raised
        eval {
            PVE::Storage::foreach_volid($dl, sub {
                my ($volid, $sid, $volname, $d) = @_;
                PVE::Storage::vdisk_free($storecfg, $volid);
            });
        };
        warn $@ if $@;

    };
    warn $@ if $@;
}
1938
# Read and return the parsed configuration of VM $vmid (optionally on
# another $node) via the cluster file system.
#
# Dies with "no such VM" if no configuration could be read.
sub load_config {
    my ($vmid, $node) = @_;

    my $cfspath = cfs_config_path($vmid, $node);
    my $conf = PVE::Cluster::cfs_read_file($cfspath);

    if (!defined($conf)) {
        die "no such VM ('$vmid')\n";
    }

    return $conf;
}
1e3baf05
DM
1950
# Parse the raw text of a VM configuration file.
#
# $filename - path of the file; must end in "/qemu-server/<vmid>.conf"
# $raw      - file content, or undef if the file does not exist
#
# Returns undef when $raw is undef, otherwise a hash reference holding
# the top-level settings plus:
#   digest    - SHA1 hex digest of $raw
#   pending   - settings from the [PENDING] section
#   snapshots - one hash per [snapshot-name] section
#
# Lines starting with '#' (and 'description:' lines) are collected into
# the 'description' of the section they appear in. Values that cannot
# be parsed only produce a warning and are skipped. Dies if $filename
# does not look like a VM config file name.
sub parse_vm_config {
    my ($filename, $raw) = @_;

    return undef if !defined($raw);

    my $res = {
        digest => Digest::SHA::sha1_hex($raw),
        snapshots => {},
        pending => {},
    };

    $filename =~ m|/qemu-server/(\d+)\.conf$|
        || die "got strange filename '$filename'";

    my $vmid = $1;

    # $conf always points at the section currently being filled
    my $conf = $res;
    my $descr = '';
    my $section = '';

    my @lines = split(/\n/, $raw);
    foreach my $line (@lines) {
        next if $line =~ m/^\s*$/;

        # section headers: flush the description collected so far into
        # the previous section, then switch to the new one
        if ($line =~ m/^\[PENDING\]\s*$/i) {
            $section = 'pending';
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{$section} = {};
            next;

        } elsif ($line =~ m/^\[([a-z][a-z0-9_\-]+)\]\s*$/i) {
            $section = $1;
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{snapshots}->{$section} = {};
            next;
        }

        if ($line =~ m/^\#(.*)\s*$/) {
            $descr .= PVE::Tools::decode_text($1) . "\n";
            next;
        }

        if ($line =~ m/^(description):\s*(.*\S)\s*$/) {
            $descr .= PVE::Tools::decode_text($2);
        } elsif ($line =~ m/^snapstate:\s*(prepare|delete)\s*$/) {
            # anchored at line start like every other key, so that e.g.
            # an 'args:' value ending in "snapstate: delete" is not
            # mistaken for a snapstate setting
            $conf->{snapstate} = $1;
        } elsif ($line =~ m/^(args):\s*(.*\S)\s*$/) {
            # 'args' is free text and may contain spaces
            my $key = $1;
            my $value = $2;
            $conf->{$key} = $value;
        } elsif ($line =~ m/^delete:\s*(.*\S)\s*$/) {
            my $value = $1;
            if ($section eq 'pending') {
                $conf->{delete} = $value; # we parse this later
            } else {
                warn "vm $vmid - propertry 'delete' is only allowed in [PENDING]\n";
            }
        } elsif ($line =~ m/^([a-z][a-z_]*\d*):\s*(\S+)\s*$/) {
            my $key = $1;
            my $value = $2;
            eval { $value = check_type($key, $value); };
            if ($@) {
                warn "vm $vmid - unable to parse value of '$key' - $@";
            } else {
                my $fmt = $confdesc->{$key}->{format};
                if ($fmt && $fmt eq 'pve-qm-drive') {
                    # normalize the drive's file name to a volume id
                    my $v = parse_drive($key, $value);
                    if (my $volid = filename_to_volume_id($vmid, $v->{file}, $v->{media})) {
                        $v->{file} = $volid;
                        $value = print_drive($vmid, $v);
                    } else {
                        warn "vm $vmid - unable to parse value of '$key'\n";
                        next;
                    }
                }

                # 'cdrom' is stored under the key 'ide2'
                if ($key eq 'cdrom') {
                    $conf->{ide2} = $value;
                } else {
                    $conf->{$key} = $value;
                }
            }
        }
    }

    # flush the description of the last section
    $conf->{description} = $descr if $descr;

    delete $res->{snapstate}; # just to be sure

    return $res;
}
2044
1858638f
DM
# Serialize a VM configuration hash into the text written to the
# config file.
#
# $filename - target file name (not used by this function)
# $conf     - configuration hash; it is normalized in place
#
# Returns the raw file content: top-level settings first, then the
# [PENDING] section (if not empty), then one section per snapshot.
# Dies if a value fails check_type(), if 'cdrom' and 'ide2' are both
# set, or if 'delete' is used outside of the pending section.
sub write_vm_config {
    my ($filename, $conf) = @_;

    delete $conf->{snapstate}; # just to be sure

    # 'cdrom' is stored under the key 'ide2'
    if ($conf->{cdrom}) {
        die "option ide2 conflicts with cdrom\n" if $conf->{ide2};
        $conf->{ide2} = delete $conf->{cdrom};
    }

    # we do not use 'smp' any longer
    if ($conf->{sockets}) {
        delete $conf->{smp};
    } elsif ($conf->{smp}) {
        delete $conf->{cores};
        $conf->{sockets} = delete $conf->{smp};
    }

    # volume ids referenced by drives of the current config or [PENDING]
    my $used_volids = {};

    # keys that are not plain settings and must not be type checked
    my %is_meta_key = map { $_ => 1 }
        qw(digest description snapshots snapstate pending);

    # validate all values of one section (in place) and record used volumes
    my $cleanup_config = sub {
        my ($cref, $pending, $snapname) = @_;

        foreach my $key (keys %$cref) {
            next if $is_meta_key{$key};

            if ($key eq 'delete') {
                die "propertry 'delete' is only allowed in [PENDING]\n"
                    if !$pending;
                # fixme: check syntax?
                next;
            }

            my $value = $cref->{$key};
            eval { $value = check_type($key, $value); };
            die "unable to parse value of '$key' - $@" if $@;

            $cref->{$key} = $value;

            # volumes used only by snapshots are not recorded
            next if $snapname || !valid_drivename($key);

            my $drive = parse_drive($key, $value);
            $used_volids->{$drive->{file}} = 1 if $drive && $drive->{file};
        }
    };

    $cleanup_config->($conf);

    $cleanup_config->($conf->{pending}, 1);

    foreach my $snapname (keys %{$conf->{snapshots}}) {
        die "internal error" if $snapname eq 'pending';
        $cleanup_config->($conf->{snapshots}->{$snapname}, undef, $snapname);
    }

    # remove 'unusedX' settings if we re-add a volume
    foreach my $key (keys %$conf) {
        my $value = $conf->{$key};
        delete $conf->{$key}
            if $key =~ m/^unused/ && $used_volids->{$value};
    }

    my %not_written = map { $_ => 1 }
        qw(digest description pending snapshots);

    # render one section as text
    my $generate_raw_config = sub {
        my ($section) = @_;

        my $text = '';

        # add description as comment to top of file
        my $descr = $section->{description} || '';
        foreach my $cl (split(/\n/, $descr)) {
            $text .= '#' . PVE::Tools::encode_text($cl) . "\n";
        }

        foreach my $key (sort keys %$section) {
            next if $not_written{$key};
            $text .= "$key: $section->{$key}\n";
        }

        return $text;
    };

    my $raw = $generate_raw_config->($conf);

    if (scalar(keys %{$conf->{pending}})) {
        $raw .= "\n[PENDING]\n";
        $raw .= $generate_raw_config->($conf->{pending});
    }

    foreach my $snapname (sort keys %{$conf->{snapshots}}) {
        $raw .= "\n[$snapname]\n";
        $raw .= $generate_raw_config->($conf->{snapshots}->{$snapname});
    }

    return $raw;
}
1e3baf05 2141
1858638f
DM
# Write $conf as the new configuration of VM $vmid without taking the
# config file lock.
#
# Unless $skiplock is true, dies when $conf carries a 'lock' setting.
sub update_config_nolock {
    my ($vmid, $conf, $skiplock) = @_;

    check_lock($conf) unless $skiplock;

    my $cfspath = cfs_config_path($vmid);

    PVE::Cluster::cfs_write_file($cfspath, $conf);
}
1e3baf05 2151
1858638f
DM
# Write $conf as the new configuration of VM $vmid while holding the
# config file lock.
#
# $skiplock is handed on to update_config_nolock().
#
# The work is passed to lock_config() as a closure. The former
# '&update_config_nolock' (no backslash, no parentheses) did not pass a
# code reference: it called the function right away, before the lock
# was taken, and handed its return value to lock_config().
sub update_config {
    my ($vmid, $conf, $skiplock) = @_;

    lock_config($vmid, sub {
        update_config_nolock($vmid, $conf, $skiplock);
    });
}
2157
# Return a hash of default settings.
#
# The defaults are the static 'default' values from our JSON schema
# configuration ($confdesc); 'keyboard' is overridden by the value from
# datacenter.cfg when one is set there.
sub load_defaults {
    my $res = {};

    foreach my $key (keys %$confdesc) {
        my $default = $confdesc->{$key}->{default};
        $res->{$key} = $default if defined($default);
    }

    my $dccfg = PVE::Cluster::cfs_read_file('datacenter.cfg');
    if (my $keyboard = $dccfg->{keyboard}) {
        $res->{keyboard} = $keyboard;
    }

    return $res;
}
2174
# Return a hash { $vmid => { exists => 1 } } with one entry per VM of
# type 'qemu' that the cluster VM list assigns to the local node.
sub config_list {
    my $res = {};

    my $vmlist = PVE::Cluster::get_vmlist();
    return $res if !$vmlist || !$vmlist->{ids};

    my $ids = $vmlist->{ids};

    foreach my $vmid (keys %$ids) {
        my $d = $ids->{$vmid};

        my $is_local = $d->{node} && $d->{node} eq $nodename;
        next unless $is_local;

        my $is_qemu = $d->{type} && $d->{type} eq 'qemu';
        next unless $is_qemu;

        $res->{$vmid}->{exists} = 1;
    }

    return $res;
}
2189
64e13401
DM
2190# test if VM uses local resources (to prevent migration)
# Test whether a VM configuration uses resources local to this host.
#
# $conf  - VM configuration hash
# $noerr - when true, only return the result instead of dying
#
# Returns 1 if a local resource is configured, else 0. Local resources
# are 'hostusb'/'hostpci' (old syntax) and any usbN, hostpciN, serialN
# or parallelN entry, except usb entries set to 'spice'.
# Dies with "VM uses local resources" if one is found and !$noerr.
sub check_local_resources {
    my ($conf, $noerr) = @_;

    # old syntax
    my $loc_res = ($conf->{hostusb} || $conf->{hostpci}) ? 1 : 0;

    foreach my $k (keys %$conf) {
        next if $k =~ m/^usb/ && ($conf->{$k} eq 'spice');

        if ($k =~ m/^(usb|hostpci|serial|parallel)\d+$/) {
            $loc_res = 1;
        }
    }

    if ($loc_res && !$noerr) {
        die "VM uses local resources\n";
    }

    return $loc_res;
}
2208
719893a9 2209# check if used storages are available on both the local and the target node (used by migrate)
47152e2e
DM
# Run PVE::Storage::storage_check_node() for every storage referenced
# by a drive of $conf, once without a node argument and once for $node.
# Drives whose file is not a storage volume id are skipped.
#
# NOTE(review): presumably storage_check_node() dies when the storage
# is not usable on the node - confirm in PVE::Storage.
sub check_storage_availability {
    my ($storecfg, $conf, $node) = @_;

    my $check_drive = sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($sid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        # check if storage is available on both nodes
        PVE::Storage::storage_check_node($storecfg, $sid);
        PVE::Storage::storage_check_node($storecfg, $sid, $node);
    };

    foreach_drive($conf, $check_drive);
}
2227
719893a9
DM
2228# list nodes where all VM images are available (used by has_feature API)
# Return a hash { $node => 1 } of the cluster nodes on which all
# storages used by the drives of $conf are available.
#
# Starting from all cluster nodes, each drive's storage narrows the set:
#   - a disabled storage removes every node
#   - a storage with a 'nodes' restriction keeps only those nodes
#   - a non-shared storage keeps only the local node
sub shared_nodes {
    my ($conf, $storecfg) = @_;

    my $nodelist = PVE::Cluster::get_nodelist();
    my $nodehash = { map { $_ => 1 } @$nodelist };
    my $nodename = PVE::INotify::nodename();

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($storeid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        my $scfg = PVE::Storage::storage_config($storecfg, $storeid);

        if ($scfg->{disable}) {
            $nodehash = {};
        } elsif (my $avail = $scfg->{nodes}) {
            delete @{$nodehash}{ grep { !$avail->{$_} } keys %$nodehash };
        } elsif (!$scfg->{shared}) {
            delete @{$nodehash}{ grep { $_ ne $nodename } keys %$nodehash };
        }
    });

    return $nodehash;
}
2261
1e3baf05
DM
# Die with "VM is locked (<lock>)" if the configuration hash $conf has
# a true 'lock' setting; otherwise do nothing.
sub check_lock {
    my ($conf) = @_;

    if (my $lock = $conf->{lock}) {
        die "VM is locked ($lock)\n";
    }
}
2267
# Check that process $pid is a kvm/qemu process that was started with
# "-pidfile $pidfile" (or "--pidfile $pidfile").
#
# Reads /proc/$pid/cmdline. Returns 1 on a match and a false value
# otherwise (also when the process does not exist).
sub check_cmdline {
    my ($pidfile, $pid) = @_;

    my $fh = IO::File->new("/proc/$pid/cmdline", "r");
    return undef if !defined($fh);

    my $line = <$fh>;
    $fh->close;
    return undef if !$line;

    # arguments are separated by NUL bytes
    my @param = split(/\0/, $line);

    my $cmd = $param[0];
    return if !$cmd;
    return if $cmd !~ m/(?:kvm|qemu-system-x86_64)$/;

    foreach my $idx (0 .. $#param) {
        my $arg = $param[$idx];
        next if !$arg;
        next if ($arg ne '-pidfile') && ($arg ne '--pidfile');

        # only the first pidfile option is considered
        my $value = $param[$idx + 1];
        return 1 if $value && ($value eq $pidfile);
        return undef;
    }

    return undef;
}
2293
# Check whether VM $vmid is running.
#
# $vmid    - VM id
# $nocheck - when true, do not insist that the config file exists
# $node    - optional node used to locate the config file
#
# Returns the pid of the VM process, or undef if the VM is not running.
# The pid is read from the VM's pid file and only trusted if the
# process command line refers to that pid file (see check_cmdline) and
# the process is still alive.
#
# Dies if the configuration file does not exist and !$nocheck.
sub check_running {
    my ($vmid, $nocheck, $node) = @_;

    my $filename = config_file($vmid, $node);

    die "unable to find configuration file for VM $vmid - no such machine\n"
        if !$nocheck && ! -f $filename;

    my $pidfile = pidfile_name($vmid);

    # explicit read mode instead of a mode prefix inside the file name
    my $fd = IO::File->new($pidfile, 'r');
    return undef if !$fd;

    my $st = stat($fd);
    my $line = <$fd>;
    close($fd);

    # it is the pid file that was stat'ed, so name it in the warning;
    # a failed stat must not abort the check
    if ($st && $st->mtime > time()) {
        warn "file '$pidfile' modified in future\n";
    }

    # an empty pid file yields no line at all
    return undef if !defined($line) || $line !~ m/^(\d+)$/;
    my $pid = $1;

    return undef if !check_cmdline($pidfile, $pid);
    return undef if !PVE::ProcFSTools::check_process_running($pid);

    return $pid;
}
2326
# Return the hash from config_list() where every VM that is currently
# running additionally has its 'pid' set.
#
# Candidates are taken from the "<vmid>.pid" files in $var_run_tmpdir;
# if that directory cannot be opened the plain list is returned.
sub vzlist {
    my $vzlist = config_list();

    my $dh = IO::Dir->new($var_run_tmpdir);
    return $vzlist if !$dh;

    while (defined(my $entry = $dh->read)) {
        next unless $entry =~ m/^(\d+)\.pid$/;
        my $vmid = $1;

        # ignore pid files of VMs which are not in our list
        next unless defined($vzlist->{$vmid});

        my $pid = check_running($vmid);
        $vzlist->{$vmid}->{pid} = $pid if $pid;
    }

    return $vzlist;
}
2344
1e3baf05
DM
# Return the 'size' property of the boot disk of a VM configuration.
#
# $storecfg - storage configuration (not used by this function)
# $conf     - VM configuration hash
#
# Returns undef if no valid, configured boot disk exists, if it cannot
# be parsed, if it is a cdrom, or if it has no file.
sub disksize {
    my ($storecfg, $conf) = @_;

    my $bootdisk = $conf->{bootdisk};
    return undef
        if !$bootdisk || !valid_drivename($bootdisk) || !$conf->{$bootdisk};

    my $drive = parse_drive($bootdisk, $conf->{$bootdisk});
    return undef if !defined($drive) || drive_is_cdrom($drive);

    return undef if !$drive->{file};

    return $drive->{size};
}
2364
2365my $last_proc_pid_stat;
2366
03a33f30
DM
2367# get VM status information
2368# This must be fast and should not block ($full == false)
2369# We only query KVM using QMP if $full == true (this can be slow)
# Get status information for the VMs of this node.
#
# $opt_vmid - optional; restrict the result to this VM
# $full     - when true, additionally query the running VMs using QMP
#             (this can be slow); without it the call must be fast and
#             should not block
#
# Returns a hash { $vmid => { pid, status, disk, maxdisk, cpus, name,
# maxmem, uptime, cpu, mem, netin, netout, diskread, diskwrite,
# template, ... } }. CPU usage is computed from the difference to the
# sample kept in $last_proc_pid_stat by the previous call.
sub vmstatus {
    my ($opt_vmid, $full) = @_;

    my $res = {};

    my $storecfg = PVE::Storage::config();

    my $list = vzlist();
    my ($uptime) = PVE::ProcFSTools::read_proc_uptime(1);

    my $cpucount = $cpuinfo->{cpus} || 1;

    # pass 1: static values taken from the configuration
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);

        my $cfspath = cfs_config_path($vmid);
        my $conf = PVE::Cluster::cfs_read_file($cfspath) || {};

        my $pid = $list->{$vmid}->{pid};
        my $size = disksize($storecfg, $conf);

        # never report more cpus than the host has
        my $cpus = ($conf->{sockets} || 1) * ($conf->{cores} || 1);
        $cpus = $cpucount if $cpus > $cpucount;

        my $d = {
            pid => $pid,
            # fixme: better status?
            status => $pid ? 'running' : 'stopped',
            disk => 0, # no info available
            maxdisk => defined($size) ? $size : 0,
            cpus => $cpus,
            name => $conf->{name} || "VM $vmid",
            maxmem => $conf->{memory} ? $conf->{memory}*(1024*1024) : 0,
            uptime => 0,
            cpu => 0,
            mem => 0,
            netout => 0,
            netin => 0,
            diskread => 0,
            diskwrite => 0,
        };

        if ($conf->{balloon}) {
            $d->{balloon_min} = $conf->{balloon}*(1024*1024);
            $d->{shares} = defined($conf->{shares}) ? $conf->{shares} : 1000;
        }

        $d->{template} = is_template($conf);

        $res->{$vmid} = $d;
    }

    # pass 2: network counters of the VM's tap devices
    my $netdev = PVE::ProcFSTools::read_proc_net_dev();
    foreach my $dev (keys %$netdev) {
        next if $dev !~ m/^tap([1-9]\d*)i/;
        my $d = $res->{$1};
        next if !$d;

        # NOTE(review): receive/transmit are crossed here, presumably
        # because the tap counters are seen from the host side - confirm
        $d->{netout} += $netdev->{$dev}->{receive};
        $d->{netin} += $netdev->{$dev}->{transmit};
    }

    my $ctime = gettimeofday();

    # pass 3: uptime, memory and cpu usage from /proc/<pid>/stat
    foreach my $vmid (keys %$list) {

        my $d = $res->{$vmid};
        my $pid = $d->{pid};
        next if !$pid;

        my $pstat = PVE::ProcFSTools::read_proc_pid_stat($pid);
        next if !$pstat; # not running

        my $used = $pstat->{utime} + $pstat->{stime};

        $d->{uptime} = int(($uptime - $pstat->{starttime})/$cpuinfo->{user_hz});

        if ($pstat->{vsize}) {
            $d->{mem} = int(($pstat->{rss}/$pstat->{vsize})*$d->{maxmem});
        }

        my $old = $last_proc_pid_stat->{$pid};
        if (!$old) {
            # first sample for this pid: nothing to compare with yet
            $last_proc_pid_stat->{$pid} = {
                time => $ctime,
                used => $used,
                cpu => 0,
            };
            next;
        }

        my $dtime = ($ctime - $old->{time}) * $cpucount * $cpuinfo->{user_hz};

        if ($dtime <= 1000) {
            # interval too short, reuse the previous value
            $d->{cpu} = $old->{cpu};
            next;
        }

        my $dutime = $used - $old->{used};

        $d->{cpu} = (($dutime/$dtime)* $cpucount) / $d->{cpus};
        $last_proc_pid_stat->{$pid} = {
            time => $ctime,
            used => $used,
            cpu => $d->{cpu},
        };
    }

    return $res if !$full;

    my $qmpclient = PVE::QMPClient->new();

    my $ballooncb = sub {
        my ($vmid, $resp) = @_;

        my $info = $resp->{'return'};
        return if !$info->{max_mem};

        my $d = $res->{$vmid};

        # use memory assigned to VM
        $d->{maxmem} = $info->{max_mem};
        $d->{balloon} = $info->{actual};

        if (defined($info->{total_mem}) && defined($info->{free_mem})) {
            $d->{mem} = $info->{total_mem} - $info->{free_mem};
            $d->{freemem} = $info->{free_mem};
        }
    };

    my $blockstatscb = sub {
        my ($vmid, $resp) = @_;

        my $data = $resp->{'return'} || [];

        my $totalrdbytes = 0;
        my $totalwrbytes = 0;
        foreach my $blockstat (@$data) {
            $totalrdbytes += $blockstat->{stats}->{rd_bytes};
            $totalwrbytes += $blockstat->{stats}->{wr_bytes};
        }

        $res->{$vmid}->{diskread} = $totalrdbytes;
        $res->{$vmid}->{diskwrite} = $totalwrbytes;
    };

    my $statuscb = sub {
        my ($vmid, $resp) = @_;

        $qmpclient->queue_cmd($vmid, $blockstatscb, 'query-blockstats');
        # this fails if balloon driver is not loaded, so this must be
        # the last command (following commands are aborted if this fails).
        $qmpclient->queue_cmd($vmid, $ballooncb, 'query-balloon');

        my $status = $resp->{'return'}->{status};
        if (!defined($status)) {
            warn "unable to get VM status\n";
            return;
        }

        $res->{$vmid}->{qmpstatus} = $status;
    };

    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        next if !$res->{$vmid}->{pid}; # not running
        $qmpclient->queue_cmd($vmid, $statuscb, 'query-status');
    }

    $qmpclient->queue_execute(undef, 1);

    # fall back to the plain status when QMP gave no answer
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        my $d = $res->{$vmid};
        $d->{qmpstatus} = $d->{status} if !$d->{qmpstatus};
    }

    return $res;
}
2553
e059fb4d
AD
# Call $func for every memory dimm needed to grow from the base size of
# 1024 up to $memory.
#
# Dimms are handed out in up to 8 groups of 32; the dimm size starts at
# 512 and doubles with every group. Dimms are spread round-robin over
# $sockets numa nodes. $func is called as
#   $func->($conf, $vmid, $name, $dimm_size, $numanode, $current_size, $memory)
# where $current_size already includes the dimm being reported.
#
# Returns nothing if $memory equals the base size, otherwise the total
# size reached as soon as it is >= $memory.
sub foreach_dimm {
    my ($conf, $vmid, $memory, $sockets, $func) = @_;

    my $dimm_id = 0;
    my $current_size = 1024;
    my $dimm_size = 512;

    return if $current_size == $memory;

    foreach my $group (0 .. 7) {
        foreach my $slot (0 .. 31) {
            my $name = 'dimm' . $dimm_id++;
            my $numanode = $slot % $sockets;

            $current_size += $dimm_size;

            $func->($conf, $vmid, $name, $dimm_size, $numanode, $current_size, $memory);

            return $current_size if $current_size >= $memory;
        }
        $dimm_size *= 2;
    }
}
2574
1e3baf05
DM
# Call $func->($ds, $drive) for every drive of the configuration $conf.
#
# $ds is the config key (a valid drive name) and $drive the result of
# parse_drive(); entries that fail to parse are skipped.
sub foreach_drive {
    my ($conf, $func) = @_;

    for my $ds (keys %$conf) {
        next unless valid_drivename($ds);

        my $drive = parse_drive($ds, $conf->{$ds}) or next;

        $func->($ds, $drive);
    }
}
2587
d5769dc2
DM
# Call $func->($volid, $is_cdrom) once for every volume referenced by
# the configuration $conf: the drives of the current config, the drives
# of every snapshot, and each snapshot's 'vmstate' volume.
#
# A volume referenced more than once is reported only once; the cdrom
# flag reported is the one recorded last.
sub foreach_volid {
    my ($conf, $func) = @_;

    my $volhash = {};

    my $test_volid = sub {
        my ($volid, $is_cdrom) = @_;

        $volhash->{$volid} = $is_cdrom || 0 if $volid;
    };

    my $test_drive = sub {
        my ($ds, $drive) = @_;
        $test_volid->($drive->{file}, drive_is_cdrom($drive));
    };

    foreach_drive($conf, $test_drive);

    foreach my $snapname (keys %{$conf->{snapshots}}) {
        my $snap = $conf->{snapshots}->{$snapname};
        $test_volid->($snap->{vmstate}, 0);
        foreach_drive($snap, $test_drive);
    }

    foreach my $volid (keys %$volhash) {
        $func->($volid, $volhash->{$volid});
    }
}
2619
86b8228b
DM
# Test whether the 'vga' setting selects a qxl (spice) display.
#
# Returns 0 if $vga is not 'qxl', 'qxl2', 'qxl3' or 'qxl4'; otherwise
# the digit following 'qxl', or 1 for plain 'qxl'.
sub vga_conf_has_spice {
    my ($vga) = @_;

    if ($vga && $vga =~ m/^qxl([234])?$/) {
        return $1 || 1;
    }

    return 0;
}
2627
1e3baf05 2628sub config_to_command {
952958bc 2629 my ($storecfg, $vmid, $conf, $defaults, $forcemachine) = @_;
1e3baf05
DM
2630
2631 my $cmd = [];
8c559505
DM
2632 my $globalFlags = [];
2633 my $machineFlags = [];
2634 my $rtcFlags = [];
519ed28c 2635 my $cpuFlags = [];
5bdcf937 2636 my $devices = [];
b78ebef7 2637 my $pciaddr = '';
5bdcf937 2638 my $bridges = {};
1e3baf05
DM
2639 my $kvmver = kvm_user_version();
2640 my $vernum = 0; # unknown
a3c52213
DM
2641 if ($kvmver =~ m/^(\d+)\.(\d+)$/) {
2642 $vernum = $1*1000000+$2*1000;
2643 } elsif ($kvmver =~ m/^(\d+)\.(\d+)\.(\d+)$/) {
1e3baf05
DM
2644 $vernum = $1*1000000+$2*1000+$3;
2645 }
2646
a3c52213 2647 die "detected old qemu-kvm binary ($kvmver)\n" if $vernum < 15000;
1e3baf05
DM
2648
2649 my $have_ovz = -f '/proc/vz/vestat';
2650
db656e5f 2651 my $q35 = machine_type_is_q35($conf);
4d3f29ed 2652 my $hotplug_features = parse_hotplug_features(defined($conf->{hotplug}) ? $conf->{hotplug} : '1');
db656e5f 2653
1e3baf05
DM
2654 push @$cmd, '/usr/bin/kvm';
2655
2656 push @$cmd, '-id', $vmid;
2657
2658 my $use_virtio = 0;
2659
c971c4f2
AD
2660 my $qmpsocket = qmp_socket($vmid);
2661 push @$cmd, '-chardev', "socket,id=qmp,path=$qmpsocket,server,nowait";
2662 push @$cmd, '-mon', "chardev=qmp,mode=control";
2663
7b7c6d1b 2664 my $socket = vnc_socket($vmid);
1e3baf05
DM
2665 push @$cmd, '-vnc', "unix:$socket,x509,password";
2666
6b64503e 2667 push @$cmd, '-pidfile' , pidfile_name($vmid);
19672434 2668
1e3baf05
DM
2669 push @$cmd, '-daemonize';
2670
2796e7d5
DM
2671 if ($conf->{smbios1}) {
2672 push @$cmd, '-smbios', "type=1,$conf->{smbios1}";
2673 }
2674
7183bd9a
AD
2675 push @$cmd, '-object', "iothread,id=iothread0" if $conf->{iothread};
2676
db656e5f 2677 if ($q35) {
b467f79a 2678 # the q35 chipset support native usb2, so we enable usb controller
db656e5f 2679 # by default for this machine type
f8e83f05 2680 push @$devices, '-readconfig', '/usr/share/qemu-server/pve-q35.cfg';
db656e5f 2681 } else {
f8e83f05
AD
2682 $pciaddr = print_pci_addr("piix3", $bridges);
2683 push @$devices, '-device', "piix3-usb-uhci,id=uhci$pciaddr.0x2";
24f0d39a 2684
f8e83f05 2685 my $use_usb2 = 0;
db656e5f
DM
2686 for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
2687 next if !$conf->{"usb$i"};
2688 $use_usb2 = 1;
2689 }
2690 # include usb device config
2691 push @$devices, '-readconfig', '/usr/share/qemu-server/pve-usb.cfg' if $use_usb2;
fcc573ab 2692 }
19672434 2693
5acbfe9e 2694 my $vga = $conf->{vga};
2fa3151e 2695
590e698c
DM
2696 my $qxlnum = vga_conf_has_spice($vga);
2697 $vga = 'qxl' if $qxlnum;
2fa3151e 2698
5acbfe9e 2699 if (!$vga) {
264e519f
DM
2700 if ($conf->{ostype} && ($conf->{ostype} eq 'win8' ||
2701 $conf->{ostype} eq 'win7' ||
5acbfe9e
DM
2702 $conf->{ostype} eq 'w2k8')) {
2703 $vga = 'std';
2704 } else {
2705 $vga = 'cirrus';
2706 }
2707 }
2708
1e3baf05 2709 # enable absolute mouse coordinates (needed by vnc)
5acbfe9e
DM
2710 my $tablet;
2711 if (defined($conf->{tablet})) {
2712 $tablet = $conf->{tablet};
2713 } else {
2714 $tablet = $defaults->{tablet};
590e698c 2715 $tablet = 0 if $qxlnum; # disable for spice because it is not needed
ef5e2be2 2716 $tablet = 0 if $vga =~ m/^serial\d+$/; # disable if we use serial terminal (no vga card)
5acbfe9e
DM
2717 }
2718
db656e5f 2719 push @$devices, '-device', print_tabletdevice_full($conf) if $tablet;
b467f79a 2720
1e3baf05 2721 # host pci devices
040b06b7 2722 for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
2e3b7e2a
AD
2723 my $d = parse_hostpci($conf->{"hostpci$i"});
2724 next if !$d;
2725
2726 my $pcie = $d->{pcie};
2727 if($pcie){
2728 die "q35 machine model is not enabled" if !$q35;
2729 $pciaddr = print_pcie_addr("hostpci$i");
2730 }else{
2731 $pciaddr = print_pci_addr("hostpci$i", $bridges);
2732 }
2733
2734 my $rombar = $d->{rombar} && $d->{rombar} eq 'off' ? ",rombar=0" : "";
2735 my $driver = $d->{driver} && $d->{driver} eq 'vfio' ? "vfio-pci" : "pci-assign";
2736 my $xvga = $d->{'x-vga'} && $d->{'x-vga'} eq 'on' ? ",x-vga=on" : "";
137483c0
AD
2737 if ($xvga && $xvga ne '') {
2738 push @$cpuFlags, 'kvm=off';
2739 $vga = 'none';
2740 }
2e3b7e2a 2741 $driver = "vfio-pci" if $xvga ne '';
4543ecf0
AD
2742 my $pcidevices = $d->{pciid};
2743 my $multifunction = 1 if @$pcidevices > 1;
2e3b7e2a 2744
4543ecf0
AD
2745 my $j=0;
2746 foreach my $pcidevice (@$pcidevices) {
2e3b7e2a 2747
4543ecf0
AD
2748 my $id = "hostpci$i";
2749 $id .= ".$j" if $multifunction;
2750 my $addr = $pciaddr;
2751 $addr .= ".$j" if $multifunction;
2752 my $devicestr = "$driver,host=$pcidevice->{id}.$pcidevice->{function},id=$id$addr";
2753
2754 if($j == 0){
2755 $devicestr .= "$rombar$xvga";
2756 $devicestr .= ",multifunction=on" if $multifunction;
2757 }
2758
2759 push @$devices, '-device', $devicestr;
2760 $j++;
2761 }
1e3baf05
DM
2762 }
2763
2764 # usb devices
2765 for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
2766 my $d = parse_usb_device($conf->{"usb$i"});
2767 next if !$d;
2768 if ($d->{vendorid} && $d->{productid}) {
5bdcf937 2769 push @$devices, '-device', "usb-host,vendorid=0x$d->{vendorid},productid=0x$d->{productid}";
1e3baf05 2770 } elsif (defined($d->{hostbus}) && defined($d->{hostport})) {
5bdcf937 2771 push @$devices, '-device', "usb-host,hostbus=$d->{hostbus},hostport=$d->{hostport}";
80401dd8
DM
2772 } elsif ($d->{spice}) {
2773 # usb redir support for spice
2774 push @$devices, '-chardev', "spicevmc,id=usbredirchardev$i,name=usbredir";
2775 push @$devices, '-device', "usb-redir,chardev=usbredirchardev$i,id=usbredirdev$i,bus=ehci.0";
1e3baf05
DM
2776 }
2777 }
2778
1e3baf05 2779 # serial devices
bae179aa 2780 for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
34978be3 2781 if (my $path = $conf->{"serial$i"}) {
9f9d2fb2
DM
2782 if ($path eq 'socket') {
2783 my $socket = "/var/run/qemu-server/${vmid}.serial$i";
2784 push @$devices, '-chardev', "socket,id=serial$i,path=$socket,server,nowait";
2785 push @$devices, '-device', "isa-serial,chardev=serial$i";
2786 } else {
2787 die "no such serial device\n" if ! -c $path;
2788 push @$devices, '-chardev', "tty,id=serial$i,path=$path";
2789 push @$devices, '-device', "isa-serial,chardev=serial$i";
2790 }
34978be3 2791 }
1e3baf05
DM
2792 }
2793
2794 # parallel devices
1989a89c 2795 for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
34978be3 2796 if (my $path = $conf->{"parallel$i"}) {
19672434 2797 die "no such parallel device\n" if ! -c $path;
32e69805 2798 my $devtype = $path =~ m!^/dev/usb/lp! ? 'tty' : 'parport';
4c5dbaf6 2799 push @$devices, '-chardev', "$devtype,id=parallel$i,path=$path";
5bdcf937 2800 push @$devices, '-device', "isa-parallel,chardev=parallel$i";
34978be3 2801 }
1e3baf05
DM
2802 }
2803
2804 my $vmname = $conf->{name} || "vm$vmid";
2805
2806 push @$cmd, '-name', $vmname;
19672434 2807
1e3baf05
DM
2808 my $sockets = 1;
2809 $sockets = $conf->{smp} if $conf->{smp}; # old style - no longer iused
2810 $sockets = $conf->{sockets} if $conf->{sockets};
2811
2812 my $cores = $conf->{cores} || 1;
3bd18e48 2813
de9d1e55 2814 my $maxcpus = $sockets * $cores;
76267728 2815
de9d1e55 2816 my $vcpus = $conf->{vcpus} ? $conf->{vcpus} : $maxcpus;
76267728 2817
de9d1e55
AD
2818 my $allowed_vcpus = $cpuinfo->{cpus};
2819
2820 die "MAX $maxcpus vcpus allowed per VM on this node\n"
2821 if ($allowed_vcpus < $maxcpus);
2822
2823 push @$cmd, '-smp', "$vcpus,sockets=$sockets,cores=$cores,maxcpus=$maxcpus";
1e3baf05 2824
1e3baf05
DM
2825 push @$cmd, '-nodefaults';
2826
32baffb4 2827 my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};
3b408e82 2828
0888fdce
DM
2829 my $bootindex_hash = {};
2830 my $i = 1;
2831 foreach my $o (split(//, $bootorder)) {
2832 $bootindex_hash->{$o} = $i*100;
2833 $i++;
afdb31d5 2834 }
3b408e82 2835
cf71f776 2836 push @$cmd, '-boot', "menu=on,strict=on,reboot-timeout=1000";
1e3baf05 2837
6b64503e 2838 push @$cmd, '-no-acpi' if defined($conf->{acpi}) && $conf->{acpi} == 0;
1e3baf05 2839
6b64503e 2840 push @$cmd, '-no-reboot' if defined($conf->{reboot}) && $conf->{reboot} == 0;
1e3baf05 2841
ef5e2be2 2842 push @$cmd, '-vga', $vga if $vga && $vga !~ m/^serial\d+$/; # for kvm 77 and later
1e3baf05
DM
2843
2844 # time drift fix
6b64503e 2845 my $tdf = defined($conf->{tdf}) ? $conf->{tdf} : $defaults->{tdf};
1e3baf05 2846
6b64503e 2847 my $nokvm = defined($conf->{kvm}) && $conf->{kvm} == 0 ? 1 : 0;
8c559505 2848 my $useLocaltime = $conf->{localtime};
1e3baf05
DM
2849
2850 if (my $ost = $conf->{ostype}) {
6b9d84cf 2851 # other, wxp, w2k, w2k3, w2k8, wvista, win7, win8, l24, l26, solaris
1e3baf05
DM
2852
2853 if ($ost =~ m/^w/) { # windows
8c559505 2854 $useLocaltime = 1 if !defined($conf->{localtime});
1e3baf05 2855
8c559505 2856 # use time drift fix when acpi is enabled
6b64503e 2857 if (!(defined($conf->{acpi}) && $conf->{acpi} == 0)) {
8c559505 2858 $tdf = 1 if !defined($conf->{tdf});
1e3baf05
DM
2859 }
2860 }
2861
be190583 2862 if ($ost eq 'win7' || $ost eq 'win8' || $ost eq 'w2k8' ||
a70ebde3 2863 $ost eq 'wvista') {
8c559505 2864 push @$globalFlags, 'kvm-pit.lost_tick_policy=discard';
b7e0c8bf 2865 push @$cmd, '-no-hpet';
462e8d19
AD
2866 #push @$cpuFlags , 'hv_vapic" if !$nokvm; #fixme, my win2008R2 hang at boot with this
2867 push @$cpuFlags , 'hv_spinlocks=0xffff' if !$nokvm;
2868 }
2869
2870 if ($ost eq 'win7' || $ost eq 'win8') {
2871 push @$cpuFlags , 'hv_relaxed' if !$nokvm;
b7e0c8bf 2872 }
1e3baf05
DM
2873 }
2874
8c559505
DM
2875 push @$rtcFlags, 'driftfix=slew' if $tdf;
2876
7f0b5beb 2877 if ($nokvm) {
8c559505 2878 push @$machineFlags, 'accel=tcg';
7f0b5beb
DM
2879 } else {
2880 die "No accelerator found!\n" if !$cpuinfo->{hvm};
2881 }
1e3baf05 2882
952958bc
DM
2883 my $machine_type = $forcemachine || $conf->{machine};
2884 if ($machine_type) {
2885 push @$machineFlags, "type=${machine_type}";
3bafc510
DM
2886 }
2887
8c559505
DM
2888 if ($conf->{startdate}) {
2889 push @$rtcFlags, "base=$conf->{startdate}";
2890 } elsif ($useLocaltime) {
2891 push @$rtcFlags, 'base=localtime';
2892 }
1e3baf05 2893
519ed28c
AD
2894 my $cpu = $nokvm ? "qemu64" : "kvm64";
2895 $cpu = $conf->{cpu} if $conf->{cpu};
2896
4dc339e7
AD
2897 push @$cpuFlags , '+lahf_lm' if $cpu eq 'kvm64';
2898
6b9d84cf
AD
2899 push @$cpuFlags , '+x2apic' if !$nokvm && $conf->{ostype} ne 'solaris';
2900
2901 push @$cpuFlags , '-x2apic' if $conf->{ostype} eq 'solaris';
519ed28c 2902
2e1a5389
AD
2903 push @$cpuFlags, '+sep' if $cpu eq 'kvm64' || $cpu eq 'kvm32';
2904
be190583 2905 $cpu .= "," . join(',', @$cpuFlags) if scalar(@$cpuFlags);
519ed28c 2906
c0efd8cd
DM
2907 # Note: enforce needs kernel 3.10, so we do not use it for now
2908 # push @$cmd, '-cpu', "$cpu,enforce";
2909 push @$cmd, '-cpu', $cpu;
519ed28c 2910
4d3f29ed
AD
2911 my $memory = $conf->{memory} || $defaults->{memory};
2912 my $static_memory = 0;
2913 my $dimm_memory = 0;
2914
2915 if ($hotplug_features->{memory}) {
996635e5
DM
2916 die "Numa need to be enabled for memory hotplug\n" if !$conf->{numa};
2917 die "Total memory is bigger than ${MAX_MEM}MB\n" if $memory > $MAX_MEM;
4d3f29ed 2918 $static_memory = $STATICMEM;
996635e5 2919 die "minimum memory must be ${static_memory}MB\n" if($memory < $static_memory);
4d3f29ed 2920 $dimm_memory = $memory - $static_memory;
996635e5 2921 push @$cmd, '-m', "size=${static_memory},slots=255,maxmem=${MAX_MEM}M";
4d3f29ed
AD
2922
2923 } else {
2924
2925 $static_memory = $memory;
2926 push @$cmd, '-m', $static_memory;
2927 }
8a010eae 2928
67fb9de6 2929 if ($conf->{numa}) {
8a010eae 2930
2ed5d572
AD
2931 my $numa_totalmemory = undef;
2932 for (my $i = 0; $i < $MAX_NUMA; $i++) {
2933 next if !$conf->{"numa$i"};
2934 my $numa = parse_numa($conf->{"numa$i"});
2935 next if !$numa;
67fb9de6
DM
2936 # memory
2937 die "missing numa node$i memory value\n" if !$numa->{memory};
2ed5d572
AD
2938 my $numa_memory = $numa->{memory};
2939 $numa_totalmemory += $numa_memory;
996635e5 2940 my $numa_object = "memory-backend-ram,id=ram-node$i,size=${numa_memory}M";
2ed5d572 2941
67fb9de6 2942 # cpus
2ed5d572 2943 my $cpus_start = $numa->{cpus}->{start};
67fb9de6 2944 die "missing numa node$i cpus\n" if !defined($cpus_start);
2ed5d572
AD
2945 my $cpus_end = $numa->{cpus}->{end} if defined($numa->{cpus}->{end});
2946 my $cpus = $cpus_start;
2947 if (defined($cpus_end)) {
2948 $cpus .= "-$cpus_end";
67fb9de6 2949 die "numa node$i : cpu range $cpus is incorrect\n" if $cpus_end <= $cpus_start;
2ed5d572 2950 }
8a010eae 2951
67fb9de6 2952 # hostnodes
2ed5d572
AD
2953 my $hostnodes_start = $numa->{hostnodes}->{start};
2954 if (defined($hostnodes_start)) {
2955 my $hostnodes_end = $numa->{hostnodes}->{end} if defined($numa->{hostnodes}->{end});
2956 my $hostnodes = $hostnodes_start;
2957 if (defined($hostnodes_end)) {
2958 $hostnodes .= "-$hostnodes_end";
67fb9de6 2959 die "host node $hostnodes range is incorrect\n" if $hostnodes_end <= $hostnodes_start;
2ed5d572 2960 }
8a010eae 2961
2ed5d572
AD
2962 my $hostnodes_end_range = defined($hostnodes_end) ? $hostnodes_end : $hostnodes_start;
2963 for (my $i = $hostnodes_start; $i <= $hostnodes_end_range; $i++ ) {
67fb9de6 2964 die "host numa node$i don't exist\n" if ! -d "/sys/devices/system/node/node$i/";
2ed5d572 2965 }
8a010eae 2966
67fb9de6 2967 # policy
2ed5d572 2968 my $policy = $numa->{policy};
67fb9de6
DM
2969 die "you need to define a policy for hostnode $hostnodes\n" if !$policy;
2970 $numa_object .= ",host-nodes=$hostnodes,policy=$policy";
2ed5d572
AD
2971 }
2972
2973 push @$cmd, '-object', $numa_object;
8a010eae
AD
2974 push @$cmd, '-numa', "node,nodeid=$i,cpus=$cpus,memdev=ram-node$i";
2975 }
67fb9de6 2976
4d3f29ed
AD
2977 die "total memory for NUMA nodes must be equal to vm static memory\n"
2978 if $numa_totalmemory && $numa_totalmemory != $static_memory;
2ed5d572
AD
2979
2980 #if no custom tology, we split memory and cores across numa nodes
2981 if(!$numa_totalmemory) {
2982
4d3f29ed 2983 my $numa_memory = ($static_memory / $sockets) . "M";
2ed5d572
AD
2984
2985 for (my $i = 0; $i < $sockets; $i++) {
2986
2987 my $cpustart = ($cores * $i);
2988 my $cpuend = ($cpustart + $cores - 1) if $cores && $cores > 1;
2989 my $cpus = $cpustart;
2990 $cpus .= "-$cpuend" if $cpuend;
2991
2992 push @$cmd, '-object', "memory-backend-ram,size=$numa_memory,id=ram-node$i";
2993 push @$cmd, '-numa', "node,nodeid=$i,cpus=$cpus,memdev=ram-node$i";
2994 }
2995 }
8a010eae
AD
2996 }
2997
4d3f29ed 2998 if ($hotplug_features->{memory}) {
e059fb4d
AD
2999 foreach_dimm($conf, $vmid, $memory, $sockets, sub {
3000 my ($conf, $vmid, $name, $dimm_size, $numanode, $current_size, $memory) = @_;
996635e5 3001 push @$cmd, "-object" , "memory-backend-ram,id=mem-$name,size=${dimm_size}M";
e059fb4d
AD
3002 push @$cmd, "-device", "pc-dimm,id=$name,memdev=mem-$name,node=$numanode";
3003
3004 #if dimm_memory is not aligned to dimm map
3005 if($current_size > $memory) {
3006 $conf->{memory} = $current_size;
3007 update_config_nolock($vmid, $conf, 1);
3008 }
3009 });
4d3f29ed
AD
3010 }
3011
1e3baf05
DM
3012 push @$cmd, '-S' if $conf->{freeze};
3013
3014 # set keyboard layout
3015 my $kb = $conf->{keyboard} || $defaults->{keyboard};
3016 push @$cmd, '-k', $kb if $kb;
3017
3018 # enable sound
3019 #my $soundhw = $conf->{soundhw} || $defaults->{soundhw};
3020 #push @$cmd, '-soundhw', 'es1370';
3021 #push @$cmd, '-soundhw', $soundhw if $soundhw;
ab6a046f 3022
bc84dcca 3023 if($conf->{agent}) {
7a6c2150 3024 my $qgasocket = qmp_socket($vmid, 1);
ab6a046f
AD
3025 my $pciaddr = print_pci_addr("qga0", $bridges);
3026 push @$devices, '-chardev', "socket,path=$qgasocket,server,nowait,id=qga0";
3027 push @$devices, '-device', "virtio-serial,id=qga0$pciaddr";
3028 push @$devices, '-device', 'virtserialport,chardev=qga0,name=org.qemu.guest_agent.0';
3029 }
3030
1d794448 3031 my $spice_port;
2fa3151e 3032
590e698c
DM
3033 if ($qxlnum) {
3034 if ($qxlnum > 1) {
3035 if ($conf->{ostype} && $conf->{ostype} =~ m/^w/){
3036 for(my $i = 1; $i < $qxlnum; $i++){
3037 my $pciaddr = print_pci_addr("vga$i", $bridges);
3038 push @$cmd, '-device', "qxl,id=vga$i,ram_size=67108864,vram_size=33554432$pciaddr";
3039 }
3040 } else {
3041 # assume other OS works like Linux
3042 push @$cmd, '-global', 'qxl-vga.ram_size=134217728';
3043 push @$cmd, '-global', 'qxl-vga.vram_size=67108864';
2fa3151e
AD
3044 }
3045 }
3046
1011b570 3047 my $pciaddr = print_pci_addr("spice", $bridges);
95a4b4a9 3048
cd339d1f 3049 $spice_port = PVE::Tools::next_spice_port();
943340a6 3050
d2da6d9b 3051 push @$devices, '-spice', "tls-port=${spice_port},addr=127.0.0.1,tls-ciphers=DES-CBC3-SHA,seamless-migration=on";
1011b570 3052
d2da6d9b
AD
3053 push @$devices, '-device', "virtio-serial,id=spice$pciaddr";
3054 push @$devices, '-chardev', "spicevmc,id=vdagent,name=vdagent";
3055 push @$devices, '-device', "virtserialport,chardev=vdagent,name=com.redhat.spice.0";
1011b570
DM
3056 }
3057
8d9ae0d2
DM
3058 # enable balloon by default, unless explicitly disabled
3059 if (!defined($conf->{balloon}) || $conf->{balloon}) {
3060 $pciaddr = print_pci_addr("balloon0", $bridges);
3061 push @$devices, '-device', "virtio-balloon-pci,id=balloon0$pciaddr";
3062 }
1e3baf05 3063
0ea9541d
DM
3064 if ($conf->{watchdog}) {
3065 my $wdopts = parse_watchdog($conf->{watchdog});
5bdcf937 3066 $pciaddr = print_pci_addr("watchdog", $bridges);
0a40e8ea 3067 my $watchdog = $wdopts->{model} || 'i6300esb';
5bdcf937
AD
3068 push @$devices, '-device', "$watchdog$pciaddr";
3069 push @$devices, '-watchdog-action', $wdopts->{action} if $wdopts->{action};
0ea9541d
DM
3070 }
3071
1e3baf05 3072 my $vollist = [];
941e0c42 3073 my $scsicontroller = {};
26ee04b6 3074 my $ahcicontroller = {};
cdd20088 3075 my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : $defaults->{scsihw};
1e3baf05 3076
5881b913
DM
3077 # Add iscsi initiator name if available
3078 if (my $initiator = get_initiator_name()) {
3079 push @$devices, '-iscsi', "initiator-name=$initiator";
3080 }
3081
1e3baf05
DM
3082 foreach_drive($conf, sub {
3083 my ($ds, $drive) = @_;
3084
ff1a2432 3085 if (PVE::Storage::parse_volume_id($drive->{file}, 1)) {
1e3baf05 3086 push @$vollist, $drive->{file};
ff1a2432 3087 }
afdb31d5 3088
1e3baf05 3089 $use_virtio = 1 if $ds =~ m/^virtio/;
3b408e82
DM
3090
3091 if (drive_is_cdrom ($drive)) {
3092 if ($bootindex_hash->{d}) {
3093 $drive->{bootindex} = $bootindex_hash->{d};
3094 $bootindex_hash->{d} += 1;
3095 }
3096 } else {
3097 if ($bootindex_hash->{c}) {
3098 $drive->{bootindex} = $bootindex_hash->{c} if $conf->{bootdisk} && ($conf->{bootdisk} eq $ds);
3099 $bootindex_hash->{c} += 1;
3100 }
3101 }
3102
941e0c42 3103 if ($drive->{interface} eq 'scsi') {
cdd20088 3104
5b952ff5 3105 my $maxdev = ($scsihw !~ m/^lsi/) ? 256 : 7;
cdd20088 3106 my $controller = int($drive->{index} / $maxdev);
5bdcf937
AD
3107 $pciaddr = print_pci_addr("scsihw$controller", $bridges);
3108 push @$devices, '-device', "$scsihw,id=scsihw$controller$pciaddr" if !$scsicontroller->{$controller};
cdd20088 3109 $scsicontroller->{$controller}=1;
941e0c42 3110 }
3b408e82 3111
26ee04b6
DA
3112 if ($drive->{interface} eq 'sata') {
3113 my $controller = int($drive->{index} / $MAX_SATA_DISKS);
5bdcf937
AD
3114 $pciaddr = print_pci_addr("ahci$controller", $bridges);
3115 push @$devices, '-device', "ahci,id=ahci$controller,multifunction=on$pciaddr" if !$ahcicontroller->{$controller};
26ee04b6
DA
3116 $ahcicontroller->{$controller}=1;
3117 }
46f58b5f 3118
15b21acc
MR
3119 my $drive_cmd = print_drive_full($storecfg, $vmid, $drive);
3120 push @$devices, '-drive',$drive_cmd;
46f58b5f 3121 push @$devices, '-device', print_drivedevice_full($storecfg, $conf, $vmid, $drive, $bridges);
1e3baf05
DM
3122 });
3123
cc4d6182 3124 for (my $i = 0; $i < $MAX_NETS; $i++) {
5f0c4c32 3125 next if !$conf->{"net$i"};
cc4d6182
DA
3126 my $d = parse_net($conf->{"net$i"});
3127 next if !$d;
1e3baf05 3128
cc4d6182 3129 $use_virtio = 1 if $d->{model} eq 'virtio';
1e3baf05 3130
cc4d6182
DA
3131 if ($bootindex_hash->{n}) {
3132 $d->{bootindex} = $bootindex_hash->{n};
3133 $bootindex_hash->{n} += 1;
3134 }
1e3baf05 3135
cc4d6182 3136 my $netdevfull = print_netdev_full($vmid,$conf,$d,"net$i");
5bdcf937
AD
3137 push @$devices, '-netdev', $netdevfull;
3138
3139 my $netdevicefull = print_netdevice_full($vmid,$conf,$d,"net$i",$bridges);
3140 push @$devices, '-device', $netdevicefull;
3141 }
1e3baf05 3142
db656e5f
DM
3143 if (!$q35) {
3144 # add pci bridges
f8e83f05
AD
3145 while (my ($k, $v) = each %$bridges) {
3146 $pciaddr = print_pci_addr("pci.$k");
3147 unshift @$devices, '-device', "pci-bridge,id=pci.$k,chassis_nr=$k$pciaddr" if $k > 0;
3148 }
19672434
DM
3149 }
3150
1e3baf05
DM
3151 # hack: virtio with fairsched is unreliable, so we do not use fairsched
3152 # when the VM uses virtio devices.
19672434
DM
3153 if (!$use_virtio && $have_ovz) {
3154
6b64503e 3155 my $cpuunits = defined($conf->{cpuunits}) ?
1e3baf05
DM
3156 $conf->{cpuunits} : $defaults->{cpuunits};
3157
3158 push @$cmd, '-cpuunits', $cpuunits if $cpuunits;
3159
3160 # fixme: cpulimit is currently ignored
3161 #push @$cmd, '-cpulimit', $conf->{cpulimit} if $conf->{cpulimit};
3162 }
3163
3164 # add custom args
3165 if ($conf->{args}) {
3ada46c9 3166 my $aa = PVE::Tools::split_args($conf->{args});
1e3baf05
DM
3167 push @$cmd, @$aa;
3168 }
3169
5bdcf937 3170 push @$cmd, @$devices;
be190583 3171 push @$cmd, '-rtc', join(',', @$rtcFlags)
8c559505 3172 if scalar(@$rtcFlags);
be190583 3173 push @$cmd, '-machine', join(',', @$machineFlags)
8c559505
DM
3174 if scalar(@$machineFlags);
3175 push @$cmd, '-global', join(',', @$globalFlags)
3176 if scalar(@$globalFlags);
3177
1d794448 3178 return wantarray ? ($cmd, $vollist, $spice_port) : $cmd;
1e3baf05 3179}
19672434 3180
1e3baf05
DM
# Build the path of the per-VM ".vnc" file below $var_run_tmpdir
# (presumably the VNC unix socket of the VM - confirm against the caller).
sub vnc_socket {
    my ($vmid) = @_;

    return join('/', $var_run_tmpdir, "$vmid.vnc");
}
3185
# Query the monitor ('query-spice') of VM $vmid and return its spice port.
# The 'tls-port' entry wins over the plain 'port' entry; dies with
# "no spice port\n" when neither of them holds a true value.
sub spice_port {
    my ($vmid) = @_;

    my $info = vm_mon_cmd($vmid, 'query-spice');

    foreach my $key ('tls-port', 'port') {
        return $info->{$key} if $info->{$key};
    }

    die "no spice port\n";
}
3193
# Return the monitor socket path of VM $vmid below $var_run_tmpdir.
# A true $qga selects the ".qga" socket, otherwise the ".qmp" socket is used.
sub qmp_socket {
    my ($vmid, $qga) = @_;

    my $suffix = 'qmp';
    $suffix = 'qga' if $qga;

    return "${var_run_tmpdir}/$vmid.$suffix";
}
3199
1e3baf05
DM
# Return the path of the ".pid" file of VM $vmid below $var_run_tmpdir.
sub pidfile_name {
    my ($vmid) = @_;

    return sprintf("%s/%s.pid", $var_run_tmpdir, $vmid);
}
3204
86fdcfb2
DA
# Collect the ids of the devices currently present in the running VM $vmid.
#
# Returns a hash reference keyed by device id, filled from three monitor
# queries:
#  - 'query-pci':   every PCI device with a 'qdev_id'. A PCI bridge starts
#                   at 1 and is incremented once for each device behind it
#                   that has a 'qdev_id'; those devices are recorded too.
#  - 'query-block': every block device named "drive-<id>" is stored as <id>.
#  - 'query-mice':  key 'tablet' is set when a 'QEMU HID Tablet' is listed.
sub vm_devices_list {
    my ($vmid) = @_;

    my $pci_info = vm_mon_cmd($vmid, 'query-pci');
    my $found = {};

    for my $bus (@$pci_info) {
        for my $dev (@{$bus->{devices}}) {
            next if !$dev->{'qdev_id'};

            $found->{$dev->{'qdev_id'}} = 1;
            next if !$dev->{'pci_bridge'};

            # count the identifiable devices sitting behind this bridge
            for my $child (@{$dev->{'pci_bridge'}->{devices}}) {
                next if !$child->{'qdev_id'};
                $found->{$child->{'qdev_id'}} = 1;
                $found->{$dev->{'qdev_id'}}++;
            }
        }
    }

    my $block_info = vm_mon_cmd($vmid, 'query-block');
    for my $blk (@$block_info) {
        $found->{$1} = 1 if $blk->{device} =~ m/^drive-(\S+)/;
    }

    my $mice_info = vm_mon_cmd($vmid, 'query-mice');
    for my $mouse (@$mice_info) {
        next if $mouse->{name} ne 'QEMU HID Tablet';
        $found->{tablet} = 1;
        last;
    }

    return $found;
}
3243
# Hot-plug the device called $deviceid into the running VM $vmid.
#
# Returns 1 immediately when vm_devices_list() already reports $deviceid.
# Otherwise qemu_add_pci_bridge() is called first and the device is added
# according to the pattern of its id:
#   tablet   - tablet device
#   virtioN  - drive plus device; the drive is removed again if the device
#              does not show up
#   scsihwN  - SCSI controller (type from $conf->{scsihw}, default "lsi")
#   scsiN    - controller (if missing), drive and device; the drive is
#              removed again if adding the device fails
#   netN     - netdev plus device; the netdev is removed again if the device
#              does not show up
#   pci.N    - PCI bridge (only when the machine type is not q35)
# Any other id dies with "can't hotplug device '<id>'\n".
# $device is the parsed drive/net definition used by the drive and net cases.
sub vm_deviceplug {
    my ($storecfg, $conf, $vmid, $deviceid, $device) = @_;

    my $q35 = machine_type_is_q35($conf);

    my $plugged = vm_devices_list($vmid);
    return 1 if defined($plugged->{$deviceid});

    qemu_add_pci_bridge($storecfg, $conf, $vmid, $deviceid); # add PCI bridge if we need it for the device

    # run $cleanup (failures are only warned about) and re-throw $err
    my $undo_and_die = sub {
        my ($err, $cleanup) = @_;
        eval { $cleanup->(); };
        warn $@ if $@;
        die $err;
    };

    if ($deviceid eq 'tablet') {
        qemu_deviceadd($vmid, print_tabletdevice_full($conf));
        return 1;
    }

    if ($deviceid =~ m/^(virtio)(\d+)$/) {
        qemu_driveadd($storecfg, $vmid, $device);
        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);

        qemu_deviceadd($vmid, $devicefull);
        eval { qemu_deviceaddverify($vmid, $deviceid); };
        $undo_and_die->($@, sub { qemu_drivedel($vmid, $deviceid); }) if $@;
        return 1;
    }

    if ($deviceid =~ m/^(scsihw)(\d+)$/) {
        my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : "lsi";
        my $pciaddr = print_pci_addr($deviceid);

        qemu_deviceadd($vmid, "$scsihw,id=$deviceid$pciaddr");
        qemu_deviceaddverify($vmid, $deviceid);
        return 1;
    }

    if ($deviceid =~ m/^(scsi)(\d+)$/) {
        qemu_findorcreatescsihw($storecfg,$conf, $vmid, $device);
        qemu_driveadd($storecfg, $vmid, $device);

        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);
        eval { qemu_deviceadd($vmid, $devicefull); };
        $undo_and_die->($@, sub { qemu_drivedel($vmid, $deviceid); }) if $@;
        return 1;
    }

    if ($deviceid =~ m/^(net)(\d+)$/) {
        return undef if !qemu_netdevadd($vmid, $conf, $device, $deviceid);

        my $netdevicefull = print_netdevice_full($vmid, $conf, $device, $deviceid);
        qemu_deviceadd($vmid, $netdevicefull);
        eval { qemu_deviceaddverify($vmid, $deviceid); };
        $undo_and_die->($@, sub { qemu_netdevdel($vmid, $deviceid); }) if $@;
        return 1;
    }

    if (!$q35 && $deviceid =~ m/^(pci\.)(\d+)$/) {
        my $bridgeid = $2;
        my $pciaddr = print_pci_addr($deviceid);

        qemu_deviceadd($vmid, "pci-bridge,id=pci.$bridgeid,chassis_nr=$bridgeid$pciaddr");
        qemu_deviceaddverify($vmid, $deviceid);
        return 1;
    }

    die "can't hotplug device '$deviceid'\n";
}
3320
# Hot-unplug the device called $deviceid from the running VM $vmid.
#
# Returns 1 immediately when vm_devices_list() does not report $deviceid.
# Dies when $deviceid is the configured boot disk ($conf->{bootdisk}) or when
# the id matches none of the supported patterns:
#   tablet          - device only
#   virtioN         - device (verified), then the drive
#   scsihwN / lsiN  - SCSI controller device
#   scsiN           - device, then the drive
#   netN            - device (verified), then the netdev
# Returns 1 on success.
#
# fixme: this should raise exceptions on error!
sub vm_deviceunplug {
    my ($vmid, $conf, $deviceid) = @_;

    my $devices_list = vm_devices_list($vmid);
    return 1 if !defined($devices_list->{$deviceid});

    die "can't unplug bootdisk" if $conf->{bootdisk} && $conf->{bootdisk} eq $deviceid;

    if ($deviceid eq 'tablet') {

        qemu_devicedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(virtio)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);
        qemu_drivedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(lsi|scsihw)(\d+)$/) {

        # SCSI controllers are created with the id "scsihw<N>" (see
        # vm_deviceplug and qemu_findorcreatescsihw); the historic "lsi<N>"
        # spelling is still accepted for compatibility.
        qemu_devicedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);
        qemu_drivedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);
        qemu_netdevdel($vmid, $deviceid);

    } else {
        die "can't unplug device '$deviceid'\n";
    }

    return 1;
}
3361
# Send a 'device_add' monitor command to VM $vmid.
# $devicefull is a "<driver>,key=value,..." string; it is prefixed with
# "driver=" and split on '=' and ',' into the command arguments.
# Returns whatever vm_mon_cmd() returns.
sub qemu_deviceadd {
    my ($vmid, $devicefull) = @_;

    my %args = split(/[=,]/, "driver=$devicefull");

    vm_mon_cmd($vmid, "device_add" , %args);
}
afdb31d5 3370
# Send a 'device_del' monitor command for $deviceid to VM $vmid and return
# the (scalar) result of vm_mon_cmd().
sub qemu_devicedel {
    my ($vmid, $deviceid) = @_;

    return scalar(vm_mon_cmd($vmid, "device_del", id => $deviceid));
}
3376
4d3f29ed
AD
# Send an 'object-add' monitor command to VM $vmid, creating object
# $objectid of QOM type $qomtype. Always returns 1.
sub qemu_objectadd {
    my ($vmid, $objectid, $qomtype) = @_;

    my @args = (id => $objectid, "qom-type" => $qomtype);
    vm_mon_cmd($vmid, "object-add", @args);

    return 1;
}
3384
# Send an 'object-del' monitor command for $objectid to VM $vmid.
# Always returns 1.
sub qemu_objectdel {
    my ($vmid, $objectid) = @_;

    my @args = (id => $objectid);
    vm_mon_cmd($vmid, "object-del", @args);

    return 1;
}
3392
# Add the drive described by $device to VM $vmid via the human monitor
# command 'drive_add auto "<drive>"'.
# Returns 1 when the reply contains "OK", otherwise dies with the reply.
sub qemu_driveadd {
    my ($storecfg, $vmid, $device) = @_;

    my $drive_spec = print_drive_full($storecfg, $vmid, $device);
    my $reply = vm_human_monitor_command($vmid, qq{drive_add auto "$drive_spec"});

    # If the command succeeds qemu prints: "OK"
    die "adding drive failed: $reply\n" if $reply !~ m/OK/s;

    return 1;
}
afdb31d5 3404
5e5dcb73
DA
# Remove drive "drive-$deviceid" from VM $vmid via the human monitor command
# 'drive_del'. Returns 1 when the reply is empty (after stripping leading
# whitespace) or reports that the device was not found; dies otherwise.
sub qemu_drivedel {
    my ($vmid, $deviceid) = @_;

    my $reply = vm_human_monitor_command($vmid, "drive_del drive-$deviceid");
    $reply =~ s/^\s+//;

    # NB: device not found errors mean the drive was auto-deleted and we ignore the error
    my $gone = $reply eq "" || $reply =~ m/Device \'.*?\' not found/s;

    die "deleting drive $deviceid failed : $reply\n" if !$gone;

    return 1;
}
f19d1c47 3418
# Wait until $deviceid shows up in vm_devices_list() of VM $vmid.
# Checks up to six times, sleeping one second after every unsuccessful check.
# Returns 1 once the device is listed, dies if it never appears.
sub qemu_deviceaddverify {
    my ($vmid, $deviceid) = @_;

    foreach my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if defined($present->{$deviceid});
        sleep 1;
    }

    die "error on hotplug device '$deviceid'\n";
}
afdb31d5 3430
5e5dcb73
DA
3431
# Wait until $deviceid has disappeared from vm_devices_list() of VM $vmid.
# Checks up to six times, sleeping one second after every unsuccessful check.
# Returns 1 once the device is gone, dies if it is still listed afterwards.
sub qemu_devicedelverify {
    my ($vmid, $deviceid) = @_;

    # need to verify that the device is correctly removed as device_del
    # is async and empty return is not reliable
    foreach my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if !defined($present->{$deviceid});
        sleep 1;
    }

    die "error on hot-unplugging device '$deviceid'\n";
}
3446
# Make sure the SCSI controller that serves drive $device exists in VM $vmid.
# The controller index is int($device->{index} / $maxdev), where $maxdev is
# 256 when $conf->{scsihw} is set and does not start with "lsi", else 7.
# A missing "scsihw<N>" controller is hot-plugged. Always returns 1.
sub qemu_findorcreatescsihw {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $hwtype = $conf->{scsihw};
    my $maxdev = 7;
    $maxdev = 256 if $hwtype && ($hwtype !~ m/^lsi/);

    my $controller = int($device->{index} / $maxdev);
    my $scsihwid = "scsihw$controller";

    my $present = vm_devices_list($vmid);
    vm_deviceplug($storecfg, $conf, $vmid, $scsihwid)
        if !defined($present->{$scsihwid});

    return 1;
}
3461
# Hot-plug the PCI bridge needed by $device, if any.
# print_pci_addr() fills a fresh $bridges hash for $device; the last key
# of that hash (in hash iteration order) is taken as the bridge id. Nothing
# is done when there is no such id or it is lower than 1. Otherwise bridge
# "pci.<id>" is plugged unless vm_devices_list() already reports it.
# Always returns 1.
sub qemu_add_pci_bridge {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $bridges = {};
    print_pci_addr($device, $bridges);

    my $bridgeid = (keys %$bridges)[-1];
    return 1 if !defined($bridgeid) || $bridgeid < 1;

    my $bridge = "pci.$bridgeid";
    my $present = vm_devices_list($vmid);

    vm_deviceplug($storecfg, $conf, $vmid, $bridge)
        if !defined($present->{$bridge});

    return 1;
}
3485
25088687
DM
# Send a 'set_link' monitor command for network device $device of VM $vmid.
# A true $up is sent as JSON true, anything else as JSON false.
# Returns whatever vm_mon_cmd() returns.
sub qemu_set_link_status {
    my ($vmid, $device, $up) = @_;

    my $state = $up ? JSON::true : JSON::false;

    vm_mon_cmd($vmid, "set_link", name => $device, up => $state);
}
3492
2630d2a9
DA
# Send a 'netdev_add' monitor command to VM $vmid. The arguments are taken
# from the string built by print_netdev_full(), split on '=' and ','.
# Always returns 1.
sub qemu_netdevadd {
    my ($vmid, $conf, $device, $deviceid) = @_;

    my $netdev_spec = print_netdev_full($vmid, $conf, $device, $deviceid);
    my %args = split(/[=,]/, $netdev_spec);

    vm_mon_cmd($vmid, "netdev_add", %args);

    return 1;
}
3502
# Send a 'netdev_del' monitor command for $deviceid to VM $vmid.
# Returns whatever vm_mon_cmd() returns.
sub qemu_netdevdel {
    my ($vmid, $deviceid) = @_;

    my @args = (id => $deviceid);

    vm_mon_cmd($vmid, "netdev_del", @args);
}
3508
# Hot-plug virtual CPUs into the running VM $vmid until $vcpus are online.
#
# The maximum is sockets * cores, taken from $conf ('sockets', falling back
# to the old style 'smp' setting, then 1; 'cores' defaults to 1). A false
# $vcpus means "all of them". Dies when more than the maximum is requested,
# when fewer vcpus than currently configured are requested (unplug is not
# supported), or when the number of CPUs reported by 'query-cpus' differs
# from the configured number. Missing CPUs are added one by one ('cpu-add').
sub qemu_cpu_hotplug {
    my ($vmid, $conf, $vcpus) = @_;

    # 'smp' is the old style setting - no longer used
    my $sockets = $conf->{sockets} || $conf->{smp} || 1;
    my $cores = $conf->{cores} || 1;
    my $maxcpus = $sockets * $cores;

    $vcpus ||= $maxcpus;

    if ($vcpus > $maxcpus) {
        die "you can't add more vcpus than maxcpus\n";
    }

    my $currentvcpus = $conf->{vcpus} || $maxcpus;
    if ($vcpus < $currentvcpus) {
        die "online cpu unplug is not yet possible\n";
    }

    my $running_cpus = vm_mon_cmd($vmid, "query-cpus");
    if (scalar(@{$running_cpus}) != $currentvcpus) {
        die "vcpus in running vm is different than configuration\n";
    }

    my $next_cpu = $currentvcpus;
    while ($next_cpu < $vcpus) {
        vm_mon_cmd($vmid, "cpu-add", id => int($next_cpu));
        $next_cpu++;
    }
}
3535
4d3f29ed
AD
# Hot-plug memory into VM $vmid until it has $value MB.
#
# Parameters:
#   $vmid     - VM id
#   $conf     - VM configuration; $conf->{memory} is updated and written back
#               (update_config_nolock) after every successfully plugged dimm
#   $defaults - default settings, used when 'memory' is not configured or
#               $value is false
#   $opt      - option name (not used here)
#   $value    - requested total memory in MB
#
# Returns $value unchanged when the VM is not running or already has that
# amount of memory. Dies when $value is below the static memory ($STATICMEM),
# below the current memory (unplug is not supported) or above $MAX_MEM.
# When dimms are plugged, the result of foreach_dimm() is returned.
sub qemu_memory_hotplug {
    my ($vmid, $conf, $defaults, $opt, $value) = @_;

    return $value if !check_running($vmid);

    my $memory = $conf->{memory} || $defaults->{memory};
    $value = $defaults->{memory} if !$value;
    return $value if $value == $memory;

    my $static_memory = $STATICMEM;

    die "memory can't be lower than $static_memory MB" if $value < $static_memory;
    die "memory unplug is not yet available" if $value < $memory;
    # the limit applies to the requested size, not to the current one
    die "you cannot add more memory than $MAX_MEM MB!\n" if $value > $MAX_MEM;

    my $sockets = 1;
    $sockets = $conf->{sockets} if $conf->{sockets};

    foreach_dimm($conf, $vmid, $value, $sockets, sub {
        my ($conf, $vmid, $name, $dimm_size, $numanode, $current_size, $memory) = @_;

        # this dimm is already covered by the configured memory
        return if $current_size <= $conf->{memory};

        eval { vm_mon_cmd($vmid, "object-add", 'qom-type' => "memory-backend-ram", id => "mem-$name", props => { size => int($dimm_size*1024*1024) } ) };
        if (my $err = $@) {
            # best effort cleanup of the memory backend, then re-throw
            eval { qemu_objectdel($vmid, "mem-$name"); };
            die $err;
        }

        eval { vm_mon_cmd($vmid, "device_add", driver => "pc-dimm", id => "$name", memdev => "mem-$name", node => $numanode) };
        if (my $err = $@) {
            # the backend is useless without its dimm device - remove it again
            eval { qemu_objectdel($vmid, "mem-$name"); };
            die $err;
        }

        # update conf after each successful module hotplug
        $conf->{memory} = $current_size;
        update_config_nolock($vmid, $conf, 1);
    });
}
3577
affd2f88
AD
# Send a 'block_set_io_throttle' monitor command for $deviceid to VM $vmid.
# Does nothing (plain return) when the VM is not running. All six limits
# (bps, bps_rd, bps_wr, iops, iops_rd, iops_wr) are sent as integers.
sub qemu_block_set_io_throttle {
    my ($vmid, $deviceid, $bps, $bps_rd, $bps_wr, $iops, $iops_rd, $iops_wr) = @_;

    return if !check_running($vmid) ;

    my @limits = (
        bps     => $bps,
        bps_rd  => $bps_rd,
        bps_wr  => $bps_wr,
        iops    => $iops,
        iops_rd => $iops_rd,
        iops_wr => $iops_wr,
    );

    my @params = (device => $deviceid);
    while (my ($name, $limit) = splice(@limits, 0, 2)) {
        push @params, $name => int($limit);
    }

    vm_mon_cmd($vmid, "block_set_io_throttle", @params);
}
3586
# old code, only used to shutdown old VM after update
#
# Read from the monitor handle $fh until the "(qemu) " prompt shows up at
# the end of the collected data or the handle reaches EOF.
#
# $timeout is passed to IO::Select::can_read() for every wait.
# Returns the collected data without the trailing prompt. Dies with
# "monitor read timeout\n" when nothing becomes readable in time, and with
# the system error text when reading fails.
sub __read_avail {
    my ($fh, $timeout) = @_;

    my $sel = IO::Select->new();
    $sel->add($fh);

    my $res = '';
    my $buf;

    my @ready;
    while (scalar (@ready = $sel->can_read($timeout))) {
        my $count = $fh->sysread($buf, 8192);
        die "$!\n" if !defined($count);
        last if !$count; # EOF

        $res .= $buf;

        # match against everything read so far, so a prompt that arrives
        # split over two reads is still recognized
        if ($res =~ /^(.*)\(qemu\) $/s) {
            $res = $1;
            last;
        }
    }

    die "monitor read timeout\n" if !scalar(@ready);

    return $res;
}
3619
# old code, only used to shutdown old VM after update
#
# Send the human monitor command $cmdstr to VM $vmid over its ".mon" unix
# socket and return the reply text (echo line removed, lines joined with
# "\n" and terminated by "\n"). For 'q'/'quit' no reply is read and undef is
# returned. $nocheck is passed on to check_running().
# Any failure is logged via syslog and then re-thrown.
sub vm_monitor_command {
    my ($vmid, $cmdstr, $nocheck) = @_;

    my $res;

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);

        my $sname = "${var_run_tmpdir}/$vmid.mon";

        my $sock = IO::Socket::UNIX->new( Peer => $sname ) ||
            die "unable to connect to VM $vmid socket - $!\n";

        # hack: migrate sometime blocks the monitor (when migrate_downtime
        # is set)
        my $is_migrate = ($cmdstr =~ m/^(info\s+migrate|migrate\s)/) ? 1 : 0;

        my $timeout = $is_migrate ? 60*60 : 3; # 1 hour for migrate commands

        # read banner;
        my $banner = __read_avail($sock, $timeout);
        die "got unexpected qemu monitor banner\n"
            if $banner !~ m/^QEMU\s+(\S+)\s+monitor\s/;

        my $sel = IO::Select->new();
        $sel->add($sock);

        my @writable = $sel->can_write($timeout);
        die "monitor write error - timeout" if !scalar(@writable);

        my $fullcmd = "$cmdstr\r";

        # syslog('info', "VM $vmid monitor command: $cmdstr");

        my $written = $sock->syswrite($fullcmd);
        die "monitor write error - $!"
            if !$written || ($written != length($fullcmd));

        # the VM goes away, there is no reply to wait for
        return if ($cmdstr eq 'q') || ($cmdstr eq 'quit');

        if ($is_migrate) {
            $timeout = 60*60; # 1 hour
        } elsif ($cmdstr =~ m/^(eject|change)/) {
            $timeout = 60; # note: cdrom mount command is slow
        } else {
            $timeout = 20;
        }

        $res = __read_avail($sock, $timeout);
        if ($res) {
            my @lines = split("\r?\n", $res);

            shift @lines if $lines[0] !~ m/^unknown command/; # skip echo

            $res = join("\n", @lines) . "\n";
        }
    };

    if (my $err = $@) {
        syslog("err", "VM $vmid monitor command failed - $err");
        die $err;
    }

    return $res;
}
3694
c1175c92
AD
# Resize volume $volid to $size through PVE::Storage::volume_resize() and,
# when the VM is running, tell qemu about it ('block_resize' on $deviceid).
# Returns early (plain return) when the storage call returns false or the
# VM is not running.
sub qemu_block_resize {
    my ($vmid, $deviceid, $storecfg, $volid, $size) = @_;

    my $running = check_running($vmid);

    my $resized = PVE::Storage::volume_resize($storecfg, $volid, $size, $running);
    return if !$resized || !$running;

    vm_mon_cmd($vmid, "block_resize", device => $deviceid, size => int($size));
}
3707
1ab0057c
AD
# Create snapshot $snap of volume $volid through
# PVE::Storage::volume_snapshot() and, when the VM is running, send the
# 'snapshot-drive' monitor command for $deviceid.
# Returns early (plain return) when the storage call returns false or the
# VM is not running.
sub qemu_volume_snapshot {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $running = check_running($vmid);

    my $done = PVE::Storage::volume_snapshot($storecfg, $volid, $snap, $running);
    return if !$done || !$running;

    vm_mon_cmd($vmid, "snapshot-drive", device => $deviceid, name => $snap);
}
3720
fc46aff9
AD
# Delete snapshot $snap of volume $volid through
# PVE::Storage::volume_snapshot_delete() and, when the VM is running, send
# the 'delete-drive-snapshot' monitor command for $deviceid.
# Returns early (plain return) when the storage call returns false or the
# VM is not running.
sub qemu_volume_snapshot_delete {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $running = check_running($vmid);

    my $done = PVE::Storage::volume_snapshot_delete($storecfg, $volid, $snap, $running);
    return if !$done || !$running;

    vm_mon_cmd($vmid, "delete-drive-snapshot", device => $deviceid, name => $snap);
}
3732
264e519f
DM
# Set the migration capabilities of VM $vmid.
# Every capability reported by 'query-migrate-capabilities' is sent back via
# 'migrate-set-capabilities': switched on when it has a true entry in the
# table below, switched off otherwise (including capabilities not listed).
sub set_migration_caps {
    my ($vmid) = @_;

    my %wanted = (
        "auto-converge" => 1,
        "xbzrle" => 0,
        "x-rdma-pin-all" => 0,
        "zero-blocks" => 0,
    );

    my $settings = [];

    my $supported = vm_mon_cmd_nocheck($vmid, "query-migrate-capabilities");

    foreach my $entry (@$supported) {
        my $cap = $entry->{capability};
        my $state = $wanted{$cap} ? JSON::true : JSON::false;
        push @$settings, { capability => $cap, state => $state };
    }

    vm_mon_cmd_nocheck($vmid, "migrate-set-capabilities", capabilities => $settings);
}
a89fded1 3756
81d95ae1
DM
# Options whose pending value is copied straight into the configuration by
# the hotplug code (see the uses of $fast_plug_option).
my $fast_plug_option = { map { $_ => 1 } qw(name onboot shares startup) };
3763
3a11fadb
DM
3764# hotplug changes in [PENDING]
3765# $selection hash can be used to only apply specified options, for
3766# example: { cores => 1 } (only apply changed 'cores')
3767# $errors ref is used to return error messages
c427973b 3768sub vmconfig_hotplug_pending {
3a11fadb 3769 my ($vmid, $conf, $storecfg, $selection, $errors) = @_;
c427973b 3770
8e90138a 3771 my $defaults = load_defaults();
c427973b
DM
3772
3773 # commit values which do not have any impact on running VM first
3a11fadb
DM
3774 # Note: those option cannot raise errors, we we do not care about
3775 # $selection and always apply them.
3776
3777 my $add_error = sub {
3778 my ($opt, $msg) = @_;
3779 $errors->{$opt} = "hotplug problem - $msg";
3780 };
c427973b
DM
3781
3782 my $changes = 0;
3783 foreach my $opt (keys %{$conf->{pending}}) { # add/change
81d95ae1 3784 if ($fast_plug_option->{$opt}) {
c427973b
DM
3785 $conf->{$opt} = $conf->{pending}->{$opt};
3786 delete $conf->{pending}->{$opt};
3787 $changes = 1;
3788 }
3789 }
3790
3791 if ($changes) {
3792 update_config_nolock($vmid, $conf, 1);
3793 $conf = load_config($vmid); # update/reload
3794 }
3795
b3c2bdd1 3796 my $hotplug_features = parse_hotplug_features(defined($conf->{hotplug}) ? $conf->{hotplug} : '1');
c427973b 3797
3d7389fe
DM
3798 my @delete = PVE::Tools::split_list($conf->{pending}->{delete});
3799 foreach my $opt (@delete) {
3a11fadb 3800 next if $selection && !$selection->{$opt};
3a11fadb 3801 eval {
51a6f637
AD
3802 if ($opt eq 'hotplug') {
3803 die "skip\n" if ($conf->{hotplug} =~ /memory/);
3804 } elsif ($opt eq 'tablet') {
b3c2bdd1 3805 die "skip\n" if !$hotplug_features->{usb};
3a11fadb
DM
3806 if ($defaults->{tablet}) {
3807 vm_deviceplug($storecfg, $conf, $vmid, $opt);
3808 } else {
3809 vm_deviceunplug($vmid, $conf, $opt);
3810 }
8edc9c08 3811 } elsif ($opt eq 'vcpus') {
b3c2bdd1 3812 die "skip\n" if !$hotplug_features->{cpu};
8edc9c08 3813 qemu_cpu_hotplug($vmid, $conf, undef);
9c2f7069 3814 } elsif ($opt eq 'balloon') {
81d95ae1
DM
3815 # enable balloon device is not hotpluggable
3816 die "skip\n" if !defined($conf->{balloon}) || $conf->{balloon};
3817 } elsif ($fast_plug_option->{$opt}) {
3818 # do nothing
3eec5767 3819 } elsif ($opt =~ m/^net(\d+)$/) {
b3c2bdd1 3820 die "skip\n" if !$hotplug_features->{network};
3eec5767 3821 vm_deviceunplug($vmid, $conf, $opt);
a05cff86 3822 } elsif (valid_drivename($opt)) {
b3c2bdd1 3823 die "skip\n" if !$hotplug_features->{disk} || $opt =~ m/(ide|sata)(\d+)/;
19120f99
AD
3824 vm_deviceunplug($vmid, $conf, $opt);
3825 vmconfig_register_unused_drive($storecfg, $vmid, $conf, parse_drive($opt, $conf->{$opt}));
4d3f29ed
AD
3826 } elsif ($opt =~ m/^memory$/) {
3827 die "skip\n" if !$hotplug_features->{memory};
3828 qemu_memory_hotplug($vmid, $conf, $defaults, $opt);
3d7389fe 3829 } else {
e56beeda 3830 die "skip\n";
3d7389fe 3831 }
3a11fadb
DM
3832 };
3833 if (my $err = $@) {
e56beeda
DM
3834 &$add_error($opt, $err) if $err ne "skip\n";
3835 } else {
3a11fadb
DM
3836 # save new config if hotplug was successful
3837 delete $conf->{$opt};
3838 vmconfig_undelete_pending_option($conf, $opt);
3839 update_config_nolock($vmid, $conf, 1);
3840 $conf = load_config($vmid); # update/reload
3d7389fe 3841 }
3d7389fe
DM
3842 }
3843
3844 foreach my $opt (keys %{$conf->{pending}}) {
3a11fadb 3845 next if $selection && !$selection->{$opt};
3d7389fe 3846 my $value = $conf->{pending}->{$opt};
3a11fadb 3847 eval {
51a6f637
AD
3848 if ($opt eq 'hotplug') {
3849 die "skip\n" if ($value =~ /memory/) || ($value !~ /memory/ && $conf->{hotplug} =~ /memory/);
3850 } elsif ($opt eq 'tablet') {
b3c2bdd1 3851 die "skip\n" if !$hotplug_features->{usb};
3a11fadb
DM
3852 if ($value == 1) {
3853 vm_deviceplug($storecfg, $conf, $vmid, $opt);
3854 } elsif ($value == 0) {
3855 vm_deviceunplug($vmid, $conf, $opt);
3856 }
8edc9c08 3857 } elsif ($opt eq 'vcpus') {
b3c2bdd1 3858 die "skip\n" if !$hotplug_features->{cpu};
3a11fadb
DM
3859 qemu_cpu_hotplug($vmid, $conf, $value);
3860 } elsif ($opt eq 'balloon') {
81d95ae1 3861 # enable/disable balloning device is not hotpluggable
8fe689e7
DM
3862 my $old_balloon_enabled = !!(!defined($conf->{balloon}) || $conf->{balloon});
3863 my $new_balloon_enabled = !!(!defined($conf->{pending}->{balloon}) || $conf->{pending}->{balloon});
81d95ae1
DM
3864 die "skip\n" if $old_balloon_enabled != $new_balloon_enabled;
3865
3a11fadb 3866 # allow manual ballooning if shares is set to zero
9c2f7069
AD
3867 if (!(defined($conf->{shares}) && ($conf->{shares} == 0))) {
3868 my $balloon = $conf->{pending}->{balloon} || $conf->{memory} || $defaults->{memory};
3869 vm_mon_cmd($vmid, "balloon", value => $balloon*1024*1024);
3870 }
3eec5767
DM
3871 } elsif ($opt =~ m/^net(\d+)$/) {
3872 # some changes can be done without hotplug
b3c2bdd1
DM
3873 vmconfig_update_net($storecfg, $conf, $hotplug_features->{network},
3874 $vmid, $opt, $value);
a05cff86
DM
3875 } elsif (valid_drivename($opt)) {
3876 # some changes can be done without hotplug
b3c2bdd1
DM
3877 vmconfig_update_disk($storecfg, $conf, $hotplug_features->{disk},
3878 $vmid, $opt, $value, 1);
4d3f29ed
AD
3879 } elsif ($opt =~ m/^memory$/) { #dimms
3880 die "skip\n" if !$hotplug_features->{memory};
3881 $value = qemu_memory_hotplug($vmid, $conf, $defaults, $opt, $value);
3a11fadb 3882 } else {
e56beeda 3883 die "skip\n"; # skip non-hot-pluggable options
3d7389fe 3884 }
3a11fadb
DM
3885 };
3886 if (my $err = $@) {
e56beeda
DM
3887 &$add_error($opt, $err) if $err ne "skip\n";
3888 } else {
3a11fadb
DM
3889 # save new config if hotplug was successful
3890 $conf->{$opt} = $value;
3891 delete $conf->{pending}->{$opt};
3892 update_config_nolock($vmid, $conf, 1);
3893 $conf = load_config($vmid); # update/reload
3d7389fe 3894 }
3d7389fe 3895 }
c427973b 3896}
055d554d
DM
3897
# Apply all pending configuration changes of a VM ("cold plug").
#
# Works in two passes: first every option listed in pending->delete is
# removed from the active configuration, then every remaining pending value
# is copied into the active configuration. The configuration is re-read
# before, and written back after, each individual option.
#
# Dies with "internal error" if an 'unused*' entry is queued for deletion.
sub vmconfig_apply_pending {
    my ($vmid, $conf, $storecfg) = @_;

    # cold plug

    # pass 1: delete
    for my $opt (PVE::Tools::split_list($conf->{pending}->{delete})) {
        die "internal error" if $opt =~ m/^unused/;

        $conf = load_config($vmid); # update/reload

        my $is_set = defined($conf->{$opt});

        # a drive that gets removed is registered as unused volume first
        if ($is_set && valid_drivename($opt)) {
            vmconfig_register_unused_drive($storecfg, $vmid, $conf, parse_drive($opt, $conf->{$opt}));
        }

        vmconfig_undelete_pending_option($conf, $opt);
        delete $conf->{$opt} if $is_set;
        update_config_nolock($vmid, $conf, 1);
    }

    $conf = load_config($vmid); # update/reload

    # pass 2: add/change
    for my $opt (keys %{$conf->{pending}}) {
        $conf = load_config($vmid); # update/reload

        my $current = $conf->{$opt};
        my $wanted = $conf->{pending}->{$opt};

        # nothing to do for the active config if the value did not change
        unless (defined($current) && ($current eq $wanted)) {
            # the previously attached volume of a replaced drive becomes 'unused'
            if (valid_drivename($opt) && defined($current)) {
                vmconfig_register_unused_drive($storecfg, $vmid, $conf, parse_drive($opt, $current));
            }
            $conf->{$opt} = $wanted;
        }

        delete $conf->{pending}->{$opt};
        update_config_nolock($vmid, $conf, 1);
    }
}
3941
3eec5767
DM
# Numeric "not equal" that tolerates undef: two undefined values are
# considered equal, an undefined value never equals a defined one.
my $safe_num_ne = sub {
    my ($left, $right) = @_;

    my $have_left = defined($left);
    my $have_right = defined($right);

    return 0 if !$have_left && !$have_right;
    return 1 if !$have_left || !$have_right;

    return $left != $right;
};
3951
# String "not equal" that tolerates undef: two undefined values are
# considered equal, an undefined value never equals a defined one.
my $safe_string_ne = sub {
    my ($left, $right) = @_;

    my $have_left = defined($left);
    my $have_right = defined($right);

    return 0 if !$have_left && !$have_right;
    return 1 if !$have_left || !$have_right;

    return $left ne $right;
};
3961
# Apply a new network device setting ($value) for option $opt to a VM.
#
# If only rate, bridge, tag, firewall or link state differ from the current
# setting, the change is applied to the existing tap device and 1 is
# returned. Otherwise the device is unplugged (if one is configured) and
# plugged again with the new settings, which requires $hotplug to be true.
#
# Dies with "skip\n" when the change needs hotplug but $hotplug is false.
sub vmconfig_update_net {
    my ($storecfg, $conf, $hotplug, $vmid, $opt, $value) = @_;

    my $newnet = parse_net($value);

    if ($conf->{$opt}) {
        my $oldnet = parse_net($conf->{$opt});

        # these differences cannot be applied to the existing device
        my $needs_replug =
            $safe_string_ne->($oldnet->{model}, $newnet->{model}) ||
            $safe_string_ne->($oldnet->{macaddr}, $newnet->{macaddr}) ||
            $safe_num_ne->($oldnet->{queues}, $newnet->{queues}) ||
            !($newnet->{bridge} && $oldnet->{bridge}); # bridge/nat mode change

        if (!$needs_replug) {
            die "internal error" if $opt !~ m/net(\d+)/;
            my $iface = "tap${vmid}i$1";

            PVE::Network::tap_rate_limit($iface, $newnet->{rate})
                if $safe_num_ne->($oldnet->{rate}, $newnet->{rate});

            my $replug_tap =
                $safe_string_ne->($oldnet->{bridge}, $newnet->{bridge}) ||
                $safe_num_ne->($oldnet->{tag}, $newnet->{tag}) ||
                $safe_num_ne->($oldnet->{firewall}, $newnet->{firewall});

            if ($replug_tap) {
                PVE::Network::tap_unplug($iface);
                PVE::Network::tap_plug($iface, $newnet->{bridge}, $newnet->{tag}, $newnet->{firewall});
            }

            qemu_set_link_status($vmid, $opt, !$newnet->{link_down})
                if $safe_string_ne->($oldnet->{link_down}, $newnet->{link_down});

            return 1;
        }

        # for non online change, we try to hot-unplug
        die "skip\n" if !$hotplug;
        vm_deviceunplug($vmid, $conf, $opt);
    }

    die "skip\n" if !$hotplug;

    vm_deviceplug($storecfg, $conf, $vmid, $opt, $newnet);
}
4008
# Apply a new drive setting ($value) for option $opt to a VM.
#
# - CD-ROM drives: the medium is ejected and, unless the new file is 'none',
#   the new medium is loaded. Returns 1.
# - Disks with an unchanged file: changed throttle limits are applied to the
#   existing drive; a changed discard or cache setting dies with "skip\n".
#   Returns 1.
# - Disks with a changed file: the old disk is unplugged and registered as
#   unused, then the new disk is plugged.
# - No usable existing drive: the new disk is plugged.
#
# Plugging dies with "skip\n" if $hotplug is false or $opt is an ide/sata
# drive. Changing the media type dies with an error.
sub vmconfig_update_disk {
    my ($storecfg, $conf, $hotplug, $vmid, $opt, $value, $force) = @_;

    # fixme: do we need force?

    my $drive = parse_drive($opt, $value);

    my $old_drive = $conf->{$opt} ? parse_drive($opt, $conf->{$opt}) : undef;

    if ($old_drive) {
        my $media = $drive->{media} || 'disk';
        my $oldmedia = $old_drive->{media} || 'disk';
        die "unable to change media type\n" if $media ne $oldmedia;

        if (drive_is_cdrom($old_drive)) {
            my $path;
            $path = get_iso_path($storecfg, $vmid, $drive->{file}) if $drive->{file} ne 'none';

            # force eject if locked
            vm_mon_cmd($vmid, "eject", force => JSON::true, device => "drive-$opt");
            vm_mon_cmd($vmid, "change", device => "drive-$opt", target => "$path") if $path;

            return 1;
        }

        if ($drive->{file} eq $old_drive->{file}) {
            # update existing disk

            # skip non hotpluggable value
            die "skip\n"
                if $safe_num_ne->($drive->{discard}, $old_drive->{discard}) ||
                   $safe_string_ne->($drive->{cache}, $old_drive->{cache});

            # listed in the argument order of qemu_block_set_io_throttle
            my @throttle_opts = qw(
                mbps mbps_rd mbps_wr
                iops iops_rd iops_wr
                mbps_max mbps_rd_max mbps_wr_max
                iops_max iops_rd_max iops_wr_max
            );

            my $throttle_changed = 0;
            foreach my $key (@throttle_opts) {
                next if !$safe_num_ne->($drive->{$key}, $old_drive->{$key});
                $throttle_changed = 1;
                last;
            }

            # apply throttle
            if ($throttle_changed) {
                my @limits;
                foreach my $key (@throttle_opts) {
                    my $limit = $drive->{$key} || 0;
                    # mbps* values are multiplied by 1024*1024
                    $limit = $limit*1024*1024 if $key =~ m/^mbps/;
                    push @limits, $limit;
                }
                qemu_block_set_io_throttle($vmid, "drive-$opt", @limits);
            }

            return 1;
        }

        die "skip\n" if !$hotplug;

        # unplug and register as unused
        vm_deviceunplug($vmid, $conf, $opt);
        vmconfig_register_unused_drive($storecfg, $vmid, $conf, $old_drive);
    }

    die "skip\n" if !$hotplug || $opt =~ m/(ide|sata)(\d+)/;

    # hotplug new disks
    vm_deviceplug($storecfg, $conf, $vmid, $opt, $drive);
}
4095
# Start VM $vmid while holding its config lock.
#
# Parameters:
#   $storecfg     - storage configuration, passed on to the helpers used here
#   $vmid         - id of the VM
#   $statefile    - 'tcp' to wait for an incoming migration, or a state file
#                   that is loaded on start; false for a normal start
#   $skiplock     - do not check the 'lock' setting of the config
#   $migratedfrom - source node of an incoming migration (if any)
#   $paused       - start the VM paused (-S) on a normal start
#   $forcemachine - passed on to config_to_command()
#   $spice_ticket - SPICE password to set after an incoming migration
#
# Dies if the VM is a template, is locked, is already running, if a
# configured host PCI device cannot be prepared, or if the start fails.
sub vm_start {
    my ($storecfg, $vmid, $statefile, $skiplock, $migratedfrom, $paused, $forcemachine, $spice_ticket) = @_;

    lock_config($vmid, sub {
        my $conf = load_config($vmid, $migratedfrom);

        die "you can't start a vm if it's a template\n" if is_template($conf);

        check_lock($conf) unless $skiplock;

        die "VM $vmid already running\n" if check_running($vmid, undef, $migratedfrom);

        # pending changes are only applied when no state gets restored
        if (!$statefile && scalar(keys %{$conf->{pending}})) {
            vmconfig_apply_pending($vmid, $conf, $storecfg);
            $conf = load_config($vmid); # update/reload
        }

        my $defaults = load_defaults();

        # set environment variable useful inside network script
        $ENV{PVE_MIGRATED_FROM} = $migratedfrom if $migratedfrom;

        my ($cmd, $vollist, $spice_port) = config_to_command($storecfg, $vmid, $conf, $defaults, $forcemachine);

        my $migrate_port = 0;
        my $migrate_uri;

        if ($statefile && $statefile eq 'tcp') {
            # incoming migration: listen on a tcp port and start paused
            my $localip = "localhost";
            my $datacenterconf = PVE::Cluster::cfs_read_file('datacenter.cfg');
            if ($datacenterconf->{migration_unsecure}) {
                my $nodename = PVE::INotify::nodename();
                $localip = PVE::Cluster::remote_node_ip($nodename, 1);
            }
            $migrate_port = PVE::Tools::next_migrate_port();
            $migrate_uri = "tcp:${localip}:${migrate_port}";
            push @$cmd, '-incoming', $migrate_uri;
            push @$cmd, '-S';
        } elsif ($statefile) {
            push @$cmd, '-loadstate', $statefile;
        } elsif ($paused) {
            push @$cmd, '-S';
        }

        # host pci devices
        foreach my $i (0 .. $MAX_HOSTPCI_DEVICES - 1) {
            my $d = parse_hostpci($conf->{"hostpci$i"});
            next if !$d;

            my $use_vfio = $d->{driver} && $d->{driver} eq "vfio";

            foreach my $pcidevice (@{$d->{pciid}}) {
                my $pciid = $pcidevice->{id}.".".$pcidevice->{function};

                my $info = pci_device_info("0000:$pciid");
                die "IOMMU not present\n" if !check_iommu_support();
                die "no pci device info for device '$pciid'\n" if !$info;

                if ($use_vfio) {
                    die "can't unbind/bind pci group to vfio '$pciid'\n" if !pci_dev_group_bind_to_vfio($pciid);
                } else {
                    die "can't unbind/bind to stub pci device '$pciid'\n" if !pci_dev_bind_to_stub($info);
                }

                die "can't reset pci device '$pciid'\n" if $info->{has_fl_reset} and !pci_dev_reset($info);
            }
        }

        PVE::Storage::activate_volumes($storecfg, $vollist);

        # no timeout when a state file/migration is involved
        eval {
            run_command($cmd, timeout => $statefile ? undef : 30, umask => 0077);
        };
        my $err = $@;
        die "start failed: $err" if $err;

        print "migration listens on $migrate_uri\n" if $migrate_uri;

        # a VM started from a state file needs an explicit 'cont'
        if ($statefile && $statefile ne 'tcp') {
            eval { vm_mon_cmd_nocheck($vmid, "cont"); };
            warn $@ if $@;
        }

        if ($migratedfrom) {

            eval { set_migration_caps($vmid); };
            warn $@ if $@;

            if ($spice_port) {
                print "spice listens on port $spice_port\n";
                if ($spice_ticket) {
                    vm_mon_cmd_nocheck($vmid, "set_password", protocol => 'spice', password => $spice_ticket);
                    vm_mon_cmd_nocheck($vmid, "expire_password", protocol => 'spice', time => "+30");
                }
            }

        } else {

            # ballooning is considered enabled when unset or non-zero
            if (!$statefile && (!defined($conf->{balloon}) || $conf->{balloon})) {
                vm_mon_cmd_nocheck($vmid, "balloon", value => $conf->{balloon}*1024*1024)
                    if $conf->{balloon};
                vm_mon_cmd_nocheck($vmid, 'qom-set',
                                   path => "machine/peripheral/balloon0",
                                   property => "guest-stats-polling-interval",
                                   value => 2);
            }

            # disconnect all interfaces configured with link_down
            foreach my $opt (keys %$conf) {
                next if $opt !~ m/^net\d+$/;
                my $nicconf = parse_net($conf->{$opt});
                qemu_set_link_status($vmid, $opt, 0) if $nicconf->{link_down};
            }
        }
    });
}
4211
0eedc444
AD
# Run monitor command $execute with the named arguments %params on VM $vmid.
# Returns whatever vm_qmp_command() returns.
sub vm_mon_cmd {
    my ($vmid, $execute, %params) = @_;

    return vm_qmp_command($vmid, {
        execute => $execute,
        arguments => \%params,
    });
}
4218
# Same as vm_mon_cmd(), but passes a true $nocheck flag to vm_qmp_command().
sub vm_mon_cmd_nocheck {
    my ($vmid, $execute, %params) = @_;

    return vm_qmp_command($vmid, {
        execute => $execute,
        arguments => \%params,
    }, 1);
}
4225
# Send the command $cmd ({ execute => ..., arguments => { ... } }) to the
# monitor of VM $vmid and return the result.
#
# An 'arguments->{timeout}' entry is not sent to the VM; it is removed from
# $cmd (the caller's hash is modified) and used as timeout for the QMP call.
#
# If the QMP socket does not exist but an old style monitor socket does, only
# commands without arguments can be executed; no result is returned then.
#
# Errors are written to syslog and re-thrown.
sub vm_qmp_command {
    my ($vmid, $cmd, $nocheck) = @_;

    my $res;

    my $timeout;
    if ($cmd->{arguments} && $cmd->{arguments}->{timeout}) {
        $timeout = delete $cmd->{arguments}->{timeout};
    }

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);
        my $sname = qmp_socket($vmid);
        if (-e $sname) { # test if VM is reasonably new and supports qmp/qga
            my $qmpclient = PVE::QMPClient->new();

            $res = $qmpclient->cmd($vmid, $cmd, $timeout);
        } elsif (-e "${var_run_tmpdir}/$vmid.mon") {
            # 'arguments' is optional (e.g. { execute => "quit" }), so do not
            # dereference it unconditionally - that dies under 'use strict'
            my $arguments = $cmd->{arguments} || {};
            die "can't execute complex command on old monitor - stop/start your vm to fix the problem\n"
                if scalar(%$arguments);
            vm_monitor_command($vmid, $cmd->{execute}, $nocheck);
        } else {
            die "unable to open monitor socket\n";
        }
    };
    if (my $err = $@) {
        syslog("err", "VM $vmid qmp command failed - $err");
        die $err;
    }

    return $res;
}
4259
9df5cbcc
DM
# Execute the human monitor command line $cmdline on VM $vmid by wrapping it
# into the QMP command 'human-monitor-command'.
sub vm_human_monitor_command {
    my ($vmid, $cmdline) = @_;

    return vm_qmp_command($vmid, {
        execute => 'human-monitor-command',
        arguments => { 'command-line' => $cmdline },
    });
}
4272
1e3baf05
DM
# Return the command line built by config_to_command() for VM $vmid as a
# single string, with the arguments joined by spaces.
sub vm_commandline {
    my ($storecfg, $vmid) = @_;

    my $conf = load_config($vmid);
    my $defaults = load_defaults();

    my $cmd = config_to_command($storecfg, $vmid, $conf, $defaults);

    return join(' ', @{$cmd});
}
4284
# Reset VM $vmid (monitor command 'system_reset') while holding the config
# lock. The 'lock' setting of the config is checked unless $skiplock is set.
sub vm_reset {
    my ($vmid, $skiplock) = @_;

    my $reset = sub {
        my $conf = load_config($vmid);

        check_lock($conf) unless $skiplock;

        vm_mon_cmd($vmid, "system_reset");
    };

    lock_config($vmid, $reset);
}
4297
# Return an array reference with the volume ids used by configuration $conf.
# Absolute paths and ids without a storage part are left out.
sub get_vm_volumes {
    my ($conf) = @_;

    my @volids;

    foreach_volid($conf, sub {
        my ($volid, $is_cdrom) = @_;

        # absolute paths are not storage volumes
        return if $volid =~ m|^/|;

        my ($sid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        push @volids, $volid;
    });

    return \@volids;
}
4315
# Clean up after VM $vmid has stopped: remove the fairsched node, deactivate
# the volumes (unless $keepActive), remove the runtime files below
# /var/run/qemu-server and, if $apply_pending_changes is set, apply pending
# configuration changes. Errors are reported as warnings only.
sub vm_stop_cleanup {
    my ($storecfg, $vmid, $conf, $keepActive, $apply_pending_changes) = @_;

    eval {
        fairsched_rmnod($vmid); # try to destroy group

        unless ($keepActive) {
            my $vollist = get_vm_volumes($conf);
            PVE::Storage::deactivate_volumes($storecfg, $vollist);
        }

        my @runtime_exts = qw(mon qmp pid vnc qga);
        foreach my $ext (@runtime_exts) {
            unlink "/var/run/qemu-server/${vmid}.$ext";
        }

        vmconfig_apply_pending($vmid, $conf, $storecfg) if $apply_pending_changes;
    };
    warn $@ if $@; # avoid errors - just warn
}
4335
# Stop or shut down VM $vmid.
#
# Note: use $nocheck to skip tests if VM configuration file exists.
# We need that when migrating VMs to other nodes (files already moved)
# Note: we set $keepActive in vzdump stop mode - volumes need to stay active
#
# With $shutdown the guest is asked to power down (through the agent command
# if 'agent' is configured), otherwise the 'quit' command is sent. If that
# fails or the VM is still running after $timeout seconds, the process gets
# SIGTERM when $force is set (default when not shutting down), else the call
# dies. After another 10 seconds the process gets SIGKILL.
#
# With $migratedfrom the process is terminated with SIGTERM and cleaned up
# without taking the config lock.
sub vm_stop {
    my ($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive, $migratedfrom) = @_;

    $force = 1 if !defined($force) && !$shutdown;

    if ($migratedfrom) {
        my $pid = check_running($vmid, $nocheck, $migratedfrom);
        kill 15, $pid if $pid;
        my $conf = load_config($vmid, $migratedfrom);
        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive, 0);
        return;
    }

    lock_config($vmid, sub {

        my $pid = check_running($vmid, $nocheck);
        return if !$pid;

        my $conf;
        if (!$nocheck) {
            $conf = load_config($vmid);
            check_lock($conf) unless $skiplock;
            # the 'down' value of the startup option is the shutdown timeout
            if (!defined($timeout) && $shutdown && $conf->{startup}) {
                my $opts = parse_startup($conf->{startup});
                $timeout = $opts->{down} if $opts->{down};
            }
        }

        $timeout = 60 if !defined($timeout);

        # poll once per second; true if the VM is still running after $limit tries
        my $still_running_after = sub {
            my ($limit) = @_;

            my $elapsed = 0;
            while (($elapsed < $limit) && check_running($vmid, $nocheck)) {
                $elapsed++;
                sleep 1;
            }
            return $elapsed >= $limit;
        };

        eval {
            my $execute = "quit";
            if ($shutdown) {
                $execute = (defined($conf) && $conf->{agent}) ? "guest-shutdown" : "system_powerdown";
            }
            vm_qmp_command($vmid, { execute => $execute }, $nocheck);
        };
        my $err = $@;

        if ($err) {
            die "VM quit/powerdown failed\n" if !$force;
            warn "VM quit/powerdown failed - terminating now with SIGTERM\n";
            kill 15, $pid;
        } elsif ($still_running_after->($timeout)) {
            die "VM quit/powerdown failed - got timeout\n" if !$force;
            warn "VM still running - terminating now with SIGTERM\n";
            kill 15, $pid;
        } else {
            vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive, 1) if $conf;
            return;
        }

        # wait again
        $timeout = 10;

        if ($still_running_after->($timeout)) {
            warn "VM still running - terminating now with SIGKILL\n";
            kill 9, $pid;
            sleep 1;
        }

        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive, 1) if $conf;
    });
}
4427
# Pause VM $vmid (monitor command 'stop') while holding the config lock.
# The lock check is skipped if $skiplock is set or the VM is locked for
# 'backup'.
sub vm_suspend {
    my ($vmid, $skiplock) = @_;

    my $suspend = sub {
        my $conf = load_config($vmid);

        my $backup_locked = $conf->{lock} && $conf->{lock} eq 'backup';
        check_lock($conf) unless $skiplock || $backup_locked;

        vm_mon_cmd($vmid, "stop");
    };

    lock_config($vmid, $suspend);
}
4440
# Resume VM $vmid (monitor command 'cont') while holding the config lock.
# The lock check is skipped if $skiplock is set or the VM is locked for
# 'backup'.
sub vm_resume {
    my ($vmid, $skiplock) = @_;

    my $resume = sub {
        my $conf = load_config($vmid);

        my $backup_locked = $conf->{lock} && $conf->{lock} eq 'backup';
        check_lock($conf) unless $skiplock || $backup_locked;

        vm_mon_cmd($vmid, "cont");
    };

    lock_config($vmid, $resume);
}
4453
5fdbe4f0
DM
# Send key $key to VM $vmid while holding the config lock.
# $skiplock is accepted but not used here.
sub vm_sendkey {
    my ($vmid, $skiplock, $key) = @_;

    my $send = sub {
        # the loaded config is not used any further
        my $conf = load_config($vmid);

        # there is no qmp command, so we use the human monitor command
        vm_human_monitor_command($vmid, "sendkey $key");
    };

    lock_config($vmid, $send);
}
4465
# Destroy VM $vmid while holding the config lock.
# Dies if the VM is locked (unless $skiplock is set) or still running.
sub vm_destroy {
    my ($storecfg, $vmid, $skiplock) = @_;

    my $destroy = sub {
        my $conf = load_config($vmid);

        check_lock($conf) unless $skiplock;

        die "VM $vmid is running - destroy failed\n" if check_running($vmid);

        fairsched_rmnod($vmid); # try to destroy group
        destroy_vm($storecfg, $vmid);
    };

    lock_config($vmid, $destroy);
}
4483
1e3baf05
DM
4484# pci helpers
4485
# Write $buf to file $filename (opened in mode "w").
# Returns undef if the file cannot be opened, else the result of print.
sub file_write {
    my ($filename, $buf) = @_;

    my $fh = IO::File->new($filename, "w") or return undef;

    my $written = print {$fh} $buf;
    $fh->close();

    return $written;
}
4498
# Collect information about the PCI device $name ("dddd:bb:ss.f", lower case
# hex) from the files below $pcisysfs/devices/$name.
#
# Returns a hash reference with the keys name, vendor, product (both without
# the leading "0x"), domain, bus, slot, func, irq and has_fl_reset (1 if a
# 'reset' file exists for the device, else 0). Returns undef if the name is
# malformed or the irq, vendor or device file has no usable content.
sub pci_device_info {
    my ($name) = @_;

    return undef if $name !~ m/^([a-f0-9]{4}):([a-f0-9]{2}):([a-f0-9]{2})\.([a-f0-9])$/;
    my ($domain, $bus, $slot, $func) = ($1, $2, $3, $4);

    my $devdir = "$pcisysfs/devices/$name";

    my $irq = file_read_firstline("$devdir/irq");
    return undef unless defined($irq) && $irq =~ m/^\d+$/;

    # the substitution strips the "0x" prefix and fails if there is none
    my $vendor = file_read_firstline("$devdir/vendor");
    return undef unless defined($vendor) && $vendor =~ s/^0x//;

    my $product = file_read_firstline("$devdir/device");
    return undef unless defined($product) && $product =~ s/^0x//;

    return {
        name => $name,
        vendor => $vendor,
        product => $product,
        domain => $domain,
        bus => $bus,
        slot => $slot,
        func => $func,
        irq => $irq,
        has_fl_reset => (-f "$devdir/reset") || 0,
    };
}
4530
# Write "1" to the 'reset' file of PCI device $dev (a hash as returned by
# pci_device_info()). Returns the result of file_write().
sub pci_dev_reset {
    my ($dev) = @_;

    my $name = $dev->{name};

    return file_write("$pcisysfs/devices/$name/reset", "1");
}
4540
# Bind PCI device $dev (a hash as returned by pci_device_info()) to the
# pci-stub driver.
#
# Returns 1 if the device is already listed below the driver directory,
# undef if one of the required sysfs writes fails, else whether the device
# shows up below the driver directory afterwards.
sub pci_dev_bind_to_stub {
    my ($dev) = @_;

    my $name = $dev->{name};

    my $stubdir = "$pcisysfs/drivers/pci-stub";
    my $testdir = "$stubdir/$name";

    return 1 if -d $testdir;

    # register the vendor/product id with the driver
    file_write("$stubdir/new_id", "$dev->{vendor} $dev->{product}") or return undef;

    # a failed unbind only counts if there is a driver to unbind from
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    if (! -d $testdir) {
        file_write("$stubdir/bind", $name) or return undef;
    }

    return -d $testdir;
}
4564
000fc0a2
SP
# Bind PCI device $dev (a hash as returned by pci_device_info()) to the
# vfio-pci driver; tries to load the module if its sysfs directory is
# missing.
#
# Dies if the driver directory does not exist after the modprobe attempt.
# Returns 1 if the device is already listed below the driver directory,
# undef if one of the required sysfs writes fails, else whether the device
# shows up below the driver directory afterwards.
sub pci_dev_bind_to_vfio {
    my ($dev) = @_;

    my $name = $dev->{name};

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null") unless -d $vfio_basedir;
    die "Cannot find vfio-pci module!\n" unless -d $vfio_basedir;

    my $testdir = "$vfio_basedir/$name";
    return 1 if -d $testdir;

    # register the vendor/product id with the driver
    file_write("$vfio_basedir/new_id", "$dev->{vendor} $dev->{product}") or return undef;

    # a failed unbind only counts if there is a driver to unbind from
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    if (! -d $testdir) {
        file_write("$vfio_basedir/bind", $name) or return undef;
    }

    return -d $testdir;
}
4595
# Bind every device in the IOMMU group of PCI device $pciid ("bb:ss.f",
# domain 0000 is assumed) to the vfio-pci driver; tries to load the module
# if its sysfs directory is missing.
#
# Group members that have a 'pci_bus' entry are skipped.
#
# Returns 1 on success. Dies if the vfio-pci driver is not available, the
# IOMMU group cannot be read, a member has an invalid id, no device
# information is available for a member, or a member cannot be bound.
sub pci_dev_group_bind_to_vfio {
    my ($pciid) = @_;

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    if (!-d $vfio_basedir) {
        system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null");
    }
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    # get IOMMU group devices
    opendir(my $D, "$pcisysfs/devices/0000:$pciid/iommu_group/devices/") || die "Cannot open iommu_group: $!\n";
    my @devs = grep /^0000:/, readdir($D);
    closedir($D);

    foreach my $group_dev (@devs) {
        $group_dev =~ m/^([:\.\da-f]+)$/ or die "PCI ID $group_dev not valid!\n";
        # keep the validated capture in a variable of its own instead of
        # relying on $1 further down
        my $devname = $1;

        # pci bridges, switches or root ports are not supported
        # they have a pci_bus subdirectory so skip them
        next if (-e "$pcisysfs/devices/$devname/pci_bus");

        # without this check an undefined $info makes pci_dev_bind_to_vfio()
        # test the driver directory itself and report success without binding
        my $info = pci_device_info($devname);
        die "no pci device info for device '$devname'\n" if !$info;

        pci_dev_bind_to_vfio($info) || die "Cannot bind $devname to vfio\n";
    }

    return 1;
}
4624
# Return the ",bus=pci.<bus>,addr=<hex addr>" device option suffix for the
# fixed PCI slot assigned to device $id, or '' if $id has no assigned slot.
# If $bridges (a hash reference) is given, the used bus number is recorded
# in it as key with value 1.
sub print_pci_addr {
    my ($id, $bridges) = @_;

    my $devices = {
        # bus 0
        piix3 => { bus => 0, addr => 1 },
        #addr2 : first videocard
        balloon0 => { bus => 0, addr => 3 },
        watchdog => { bus => 0, addr => 4 },
        scsihw0 => { bus => 0, addr => 5 },
        scsihw1 => { bus => 0, addr => 6 },
        ahci0 => { bus => 0, addr => 7 },
        qga0 => { bus => 0, addr => 8 },
        spice => { bus => 0, addr => 9 },
        virtio0 => { bus => 0, addr => 10 },
        virtio1 => { bus => 0, addr => 11 },
        virtio2 => { bus => 0, addr => 12 },
        virtio3 => { bus => 0, addr => 13 },
        virtio4 => { bus => 0, addr => 14 },
        virtio5 => { bus => 0, addr => 15 },
        hostpci0 => { bus => 0, addr => 16 },
        hostpci1 => { bus => 0, addr => 17 },
        net0 => { bus => 0, addr => 18 },
        net1 => { bus => 0, addr => 19 },
        net2 => { bus => 0, addr => 20 },
        net3 => { bus => 0, addr => 21 },
        net4 => { bus => 0, addr => 22 },
        net5 => { bus => 0, addr => 23 },
        vga1 => { bus => 0, addr => 24 },
        vga2 => { bus => 0, addr => 25 },
        vga3 => { bus => 0, addr => 26 },
        hostpci2 => { bus => 0, addr => 27 },
        hostpci3 => { bus => 0, addr => 28 },
        #addr29 : usb-host (pve-usb.cfg)
        'pci.1' => { bus => 0, addr => 30 },
        'pci.2' => { bus => 0, addr => 31 },
        # bus 1: net6 .. net31 use addr 1 .. 26
        (map { ("net$_" => { bus => 1, addr => $_ - 5 }) } 6 .. 31),
        # bus 2: virtio6 .. virtio15 use addr 1 .. 10
        (map { ("virtio$_" => { bus => 2, addr => $_ - 5 }) } 6 .. 15),
    };

    my $slot = $devices->{$id};
    return '' if !$slot || !defined($slot->{bus}) || !defined($slot->{addr});

    my $bus = $slot->{bus};
    $bridges->{$bus} = 1 if $bridges;

    return sprintf(",bus=pci.%s,addr=0x%x", $bus, $slot->{addr});
}
4708
2e3b7e2a
AD
# Return the ",bus=<pcie port>,addr=<hex addr>" device option suffix for the
# fixed PCIe port assigned to device $id (hostpci0 .. hostpci3), or '' if
# $id has no assigned port.
sub print_pcie_addr {
    my ($id) = @_;

    my $devices = {
        hostpci0 => { bus => "ich9-pcie-port-1", addr => 0 },
        hostpci1 => { bus => "ich9-pcie-port-2", addr => 0 },
        hostpci2 => { bus => "ich9-pcie-port-3", addr => 0 },
        hostpci3 => { bus => "ich9-pcie-port-4", addr => 0 },
    };

    my $port = $devices->{$id};
    return '' if !$port || !defined($port->{bus}) || !defined($port->{addr});

    return sprintf(",bus=%s,addr=0x%x", $port->{bus}, $port->{addr});
}
4728
3e16d5fc
DM
# vzdump restore implementation
4730
# Return the name of the first member of tar archive $archive.
#
# Runs 'tar tf' on the archive, reads the first line of its output and then
# terminates the tar process. Dies if the archive does not exist, tar cannot
# be started, or no member name could be read.
sub tar_archive_read_firstfile {
    my $archive = shift;

    die "ERROR: file '$archive' does not exist\n" if ! -f $archive;

    # try to detect archive type first
    # list form of the pipe open: the archive name is passed to tar as is,
    # without a shell, so quotes or other special characters cannot break
    # (or extend) the command
    my $pid = open(my $tar_fh, '-|', 'tar', 'tf', $archive) ||
        die "unable to open file '$archive'\n";
    my $firstfile = <$tar_fh>;
    # only the first line is needed - do not wait for the full listing
    kill 15, $pid;
    close $tar_fh;

    die "ERROR: archive contaions no data\n" if !$firstfile;
    chomp $firstfile;

    return $firstfile;
}
4748
ed221350
DM
# Remove the temporary volumes recorded in $statfile.
#
# Every line is expected to end in "vzdump:<name>:<volid>". Volume ids that
# start with '/' are removed with unlink, all others are freed with
# PVE::Storage::vdisk_free(). Progress and errors are printed to STDERR; a
# failure for one volume does not stop the cleanup of the remaining ones.
# Nothing but the start message is printed if $statfile cannot be opened.
sub tar_restore_cleanup {
    my ($storecfg, $statfile) = @_;

    print STDERR "starting cleanup\n";

    if (my $fd = IO::File->new($statfile, "r")) {
        while (defined(my $line = <$fd>)) {
            if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                my $volid = $2;
                eval {
                    if ($volid =~ m|^/|) {
                        # 'or' (not '||') so the check applies to the result
                        # of unlink and not to its argument
                        unlink($volid) or die "unlink failed - $!\n";
                    } else {
                        PVE::Storage::vdisk_free($storecfg, $volid);
                    }
                    print STDERR "temporary volume '$volid' sucessfuly removed\n";
                };
                print STDERR "unable to cleanup '$volid' - $@" if $@;
            } else {
                print STDERR "unable to parse line in statfile - $line";
            }
        }
        $fd->close();
    }
}
4774
# Restore VM $vmid from backup archive $archive.
#
# The archive format ('tar' or 'vma') is taken from $opts->{format} if set,
# else derived from the file name; unknown names default to 'vma'. The
# compression ('gzip' or 'lzop') is always derived from the file name.
# Dispatches to restore_tar_archive() or restore_vma_archive() and returns
# their result.
sub restore_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    my $format = $opts->{format};
    my $comp;

    # try to detect archive format
    if ($archive =~ m/\.tgz$/ || $archive =~ m/\.tar\.gz$/) {
        $format = 'tar' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.tar$/) {
        $format = 'tar' if !$format;
    } elsif ($archive =~ m/\.tar\.lzo$/) { # dots escaped: match the literal suffix only
        $format = 'tar' if !$format;
        $comp = 'lzop';
    } elsif ($archive =~ m/\.vma$/) {
        $format = 'vma' if !$format;
    } elsif ($archive =~ m/\.vma\.gz$/) {
        $format = 'vma' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.vma\.lzo$/) {
        $format = 'vma' if !$format;
        $comp = 'lzop';
    } else {
        $format = 'vma' if !$format; # default
    }

    if ($format eq 'tar') {
        return restore_tar_archive($archive, $vmid, $user, $opts);
    } else {
        return restore_vma_archive($archive, $vmid, $user, $opts, $comp);
    }
}
4808
# Translate one line of an archived VM config and write the result to $outfd.
#
#  - backup bookkeeping lines (#qmdump#, #vzdump#) and the lock, unusedN,
#    parent and template settings are dropped
#  - old 'vlanN' lines are converted to 'netN' entries, numbered with
#    $cookie->{netcount} (which is incremented for each generated entry)
#  - with $unique set, 'netN' lines that carry a MAC address get a new
#    random one
#  - drive lines containing 'backup=no' are written commented out; drives
#    listed in $map are rewritten to point to the mapped volume
#  - everything else is copied unchanged
sub restore_update_config_line {
    my ($outfd, $cookie, $vmid, $map, $line, $unique) = @_;

    # the last pattern drops 'template': a restored VM is never a template
    foreach my $dropped (qr/^\#qmdump\#/, qr/^\#vzdump\#/, qr/^lock:/,
                         qr/^unused\d+:/, qr/^parent:/, qr/^template:/) {
        return if $line =~ $dropped;
    }

    if (($line =~ m/^(vlan(\d+)):\s*(\S+)\s*$/)) {
        # try to convert old 1.X settings
        my ($bridge_index, $ethcfg) = ($2, $3);
        foreach my $devconfig (PVE::Tools::split_list($ethcfg)) {
            my ($model, $macaddr) = split(/\=/, $devconfig);
            if (!$macaddr || $unique) {
                $macaddr = PVE::Tools::random_ether_addr();
            }
            my $netstr = print_net({
                model => $model,
                bridge => "vmbr$bridge_index",
                macaddr => $macaddr,
            });

            my $netindex = $cookie->{netcount}++;
            print $outfd "net${netindex}: $netstr\n";
        }
    } elsif (($line =~ m/^(net\d+):\s*(\S+)\s*$/) && $unique) {
        my ($netid, $net) = ($1, parse_net($2));
        if ($net->{macaddr}) {
            $net->{macaddr} = PVE::Tools::random_ether_addr();
        }
        my $netstr = print_net($net);
        print $outfd "$netid: $netstr\n";
    } elsif ($line =~ m/^((ide|scsi|virtio|sata)\d+):\s*(\S+)\s*$/) {
        my ($virtdev, $value) = ($1, $3);
        if ($line =~ m/backup=no/) {
            print $outfd "#$line";
        } elsif ($virtdev && $map->{$virtdev}) {
            my $di = parse_drive($virtdev, $value);
            delete $di->{format}; # format can change on restore
            $di->{file} = $map->{$virtdev};
            my $newvalue = print_drive($vmid, $di);
            print $outfd "$virtdev: $newvalue\n";
        } else {
            print $outfd $line;
        }
    } else {
        print $outfd $line;
    }
}
4859
# Build a hash (volid => volume info) from PVE::Storage::vdisk_list() for
# $vmid. Entries without a volid or with a false size are skipped; every
# kept entry additionally gets its 'path' as returned by
# PVE::Storage::path().
sub scan_volids {
    my ($cfg, $vmid) = @_;

    my $info = PVE::Storage::vdisk_list($cfg, undef, $vmid);

    my $volid_hash = {};
    foreach my $storeid (keys %$info) {
        my $volumes = $info->{$storeid};
        foreach my $item (@$volumes) {
            my $volid = $item->{volid};
            next if !$volid || !$item->{size};

            $item->{path} = PVE::Storage::path($cfg, $volid);
            $volid_hash->{$volid} = $item;
        }
    }

    return $volid_hash;
}
4876
a8e2f942
DM
# Count the file system paths referenced by the drives of $conf.
#
# Returns a hash reference (path => number of references). CD-ROM drives
# and drives without a file are ignored. Absolute file names are counted
# as they are; volume IDs are resolved with PVE::Storage::path() and are
# skipped when the volume ID cannot be parsed or its storage is not
# configured. $skip_drive, if set, names a drive of the current config to
# leave out; it is not applied to snapshots. With $scan_snapshots the
# drives of all snapshots in $conf->{snapshots} are counted as well.
sub get_used_paths {
    my ($vmid, $storecfg, $conf, $scan_snapshots, $skip_drive) = @_;

    my $used_path = {};

    my $collect = sub {
        my ($cref, $snapname, $ignored_drive) = @_;

        foreach my $key (keys %$cref) {
            next if !valid_drivename($key);
            next if $ignored_drive && $key eq $ignored_drive;

            my $drive = parse_drive($key, $cref->{$key});
            next if !$drive || !$drive->{file} || drive_is_cdrom($drive);

            my $file = $drive->{file};
            if ($file =~ m!^/!) {
                $used_path->{$file}++;
                next;
            }

            my ($storeid) = PVE::Storage::parse_volume_id($file, 1);
            next if !$storeid;
            next if !PVE::Storage::storage_config($storecfg, $storeid, 1);

            my $path = PVE::Storage::path($storecfg, $file, $snapname);
            $used_path->{$path}++;
        }
    };

    # only the current config honours $skip_drive
    $collect->($conf, undef, $skip_drive);

    if ($scan_snapshots) {
        foreach my $snapname (keys %{$conf->{snapshots}}) {
            $collect->($conf->{snapshots}->{$snapname}, $snapname, undef);
        }
    }

    return $used_path;
}
4917
91bd6c90
DM
# Synchronize the drive entries of $conf with the volumes in $volid_hash.
#
# $volid_hash maps volume IDs to info hashes (with 'size' and 'path', as
# built by scan_volids()). The function
#  - updates the size of every non CD-ROM drive whose volume is listed,
#  - removes 'unusedN' entries whose volume (or an alias with the same
#    path) is used by a drive,
#  - adds every remaining listed volume, except vmstate volumes
#    ("vm-$vmid-state-"), as unused volume.
# $conf is modified in place. Returns 1 if anything changed, undef otherwise.
sub update_disksize {
    my ($vmid, $conf, $volid_hash) = @_;

    my $changes;

    my $used = {};

    # Note: it is allowed to define multiple storages with same path (alias), so
    # we need to check both 'volid' and real 'path' (two different volid can point
    # to the same path).

    my $usedpath = {};

    # update size info
    foreach my $opt (keys %$conf) {
        if (valid_drivename($opt)) {
            my $drive = parse_drive($opt, $conf->{$opt});
            next if !$drive;
            my $volid = $drive->{file};
            next if !$volid;

            $used->{$volid} = 1;
            if ($volid_hash->{$volid} &&
                (my $path = $volid_hash->{$volid}->{path})) {
                $usedpath->{$path} = 1;
            }

            next if drive_is_cdrom($drive);
            next if !$volid_hash->{$volid};

            $drive->{size} = $volid_hash->{$volid}->{size};
            my $new = print_drive($vmid, $drive);
            if ($new ne $conf->{$opt}) {
                $changes = 1;
                $conf->{$opt} = $new;
            }
        }
    }

    # remove 'unusedX' entry if volume is used
    foreach my $opt (keys %$conf) {
        next if $opt !~ m/^unused\d+$/;
        my $volid = $conf->{$opt};
        # declared separately: 'my $x = ... if COND' has undefined behaviour
        # when COND is false (see perlsyn)
        my $path;
        $path = $volid_hash->{$volid}->{path} if $volid_hash->{$volid};
        if ($used->{$volid} || ($path && $usedpath->{$path})) {
            $changes = 1;
            delete $conf->{$opt};
        }
    }

    foreach my $volid (sort keys %$volid_hash) {
        next if $volid =~ m/vm-$vmid-state-/;
        next if $used->{$volid};
        my $path = $volid_hash->{$volid}->{path};
        next if !$path; # just to be sure
        next if $usedpath->{$path};
        $changes = 1;
        add_unused_volume($conf, $volid);
        $usedpath->{$path} = 1; # avoid to add more than once (aliases)
    }

    return $changes;
}
4980
# Rescan the storages and bring the VM configuration(s) up to date.
#
# With a defined $vmid only that VM is processed, otherwise every VM
# returned by config_list(). For each VM the config is loaded, checked
# with check_lock(), passed to update_disksize() together with the scanned
# volumes owned by that VM, and written back if something changed. Unless
# $nolock is set, each update runs under lock_config().
sub rescan {
    my ($vmid, $nolock) = @_;

    my $cfg = PVE::Cluster::cfs_read_file("storage.cfg");

    my $volid_hash = scan_volids($cfg, $vmid);

    my $update_vm = sub {
        my ($vmid) = @_;

        my $conf = load_config($vmid);

        check_lock($conf);

        # restrict the scan result to volumes owned by this VM
        my %owned = map { $_ => $volid_hash->{$_} }
            grep {
                my $owner = $volid_hash->{$_}->{vmid};
                $owner && $owner == $vmid;
            } keys %$volid_hash;

        my $changes = update_disksize($vmid, $conf, \%owned);

        update_config_nolock($vmid, $conf, 1) if $changes;
    };

    my @vmids;
    if (defined($vmid)) {
        @vmids = ($vmid);
    } else {
        my $vmlist = config_list();
        @vmids = keys %$vmlist;
    }

    foreach my $id (@vmids) {
        if ($nolock) {
            $update_vm->($id);
        } else {
            lock_config($id, $update_vm, $id);
        }
    }
}
5023
# Restore VM $vmid from a VMA archive ($archive may be '-' for STDIN).
#
# $comp selects the decompressor ('gzip', 'lzop' or false for none). The
# archive is extracted with "vma extract"; as soon as vma has reported all
# devices and the archived config is available, the target volumes are
# allocated and the device map is sent to vma through a fifo. On success
# the translated config replaces the VM config file and rescan() is run.
# On failure the temporary directory, the temporary config and all volumes
# allocated so far are removed and the original error is re-thrown.
#
# Options read from $opts: storage, pool (unused here), unique.
sub restore_vma_archive {
    my ($archive, $vmid, $user, $opts, $comp) = @_;

    my $input = $archive eq '-' ? "<&STDIN" : undef;

    # $cmd below is a shell command line, so the archive name has to be
    # quoted wherever it is interpolated - also in the uncompressed case
    my $qarchive = PVE::Tools::shellquote($archive);
    my $readfrom = $qarchive;

    my $uncomp = '';
    if ($comp) {
        $readfrom = '-';
        if ($comp eq 'gzip') {
            $uncomp = "zcat $qarchive|";
        } elsif ($comp eq 'lzop') {
            $uncomp = "lzop -d -c $qarchive|";
        } else {
            die "unknown compression method '$comp'\n";
        }
    }

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    rmtree $tmpdir;

    # disable interrupts (always do cleanups)
    # Note: a hash slice is used so that all handlers are localized; with a
    # chained 'local $SIG{INT} = $SIG{TERM} = ...' only INT would be.
    my $ignore_signal = sub {
        warn "got interrupt - ignored\n";
    };
    local @SIG{qw(INT TERM QUIT HUP)} = ($ignore_signal) x 4;

    my $mapfifo = "/var/tmp/vzdumptmp$$.fifo";
    POSIX::mkfifo($mapfifo, 0600);
    my $fifofh;

    my $openfifo = sub {
        open($fifofh, '>', $mapfifo) || die $!;
    };

    my $cmd = "${uncomp}vma extract -v -r $mapfifo $readfrom $tmpdir";

    my $oldtimeout;
    my $timeout = 5;

    my $devinfo = {};

    my $rpcenv = PVE::RPCEnvironment::get();

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # Note: $oldconf is undef if VM does not exists
    my $oldconf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid));

    # Allocate the target volumes, send the device map to vma and write the
    # translated config to $tmpfn. Called once vma has listed all devices.
    my $print_devmap = sub {
        my $virtdev_hash = {};

        my $cfgfn = "$tmpdir/qemu-server.conf";

        # we can read the config - that is already extracted
        my $fh = IO::File->new($cfgfn, "r") ||
            die "unable to read qemu-server.conf - $!\n";

        while (defined(my $line = <$fh>)) {
            if ($line =~ m/^\#qmdump\#map:(\S+):(\S+):(\S*):(\S*):$/) {
                my ($virtdev, $devname, $storeid, $format) = ($1, $2, $3, $4);
                die "archive does not contain data for drive '$virtdev'\n"
                    if !$devinfo->{$devname};
                if (defined($opts->{storage})) {
                    $storeid = $opts->{storage} || 'local';
                } elsif (!$storeid) {
                    $storeid = 'local';
                }
                $format = 'raw' if !$format;
                $devinfo->{$devname}->{devname} = $devname;
                $devinfo->{$devname}->{virtdev} = $virtdev;
                $devinfo->{$devname}->{format} = $format;
                $devinfo->{$devname}->{storeid} = $storeid;

                # check permission on storage
                if ($user ne 'root@pam') {
                    $rpcenv->check($user, "/storage/$storeid", ['Datastore.AllocateSpace']);
                }

                $virtdev_hash->{$virtdev} = $devinfo->{$devname};
            }
        }

        foreach my $devname (keys %$devinfo) {
            die "found no device mapping information for device '$devname'\n"
                if !$devinfo->{$devname}->{virtdev};
        }

        my $cfg = cfs_read_file('storage.cfg');

        # create empty/temp config
        if ($oldconf) {
            PVE::Tools::file_set_contents($conffile, "memory: 128\n");
            foreach_drive($oldconf, sub {
                my ($ds, $drive) = @_;

                return if drive_is_cdrom($drive);

                my $volid = $drive->{file};

                return if !$volid || $volid =~ m|^/|;

                my ($path, $owner) = PVE::Storage::path($cfg, $volid);
                return if !$path || !$owner || ($owner != $vmid);

                # Note: only delete disk we want to restore
                # other volumes will become unused
                if ($virtdev_hash->{$ds}) {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
            });
        }

        my $map = {};
        foreach my $virtdev (sort keys %$virtdev_hash) {
            my $d = $virtdev_hash->{$virtdev};
            # size reported by vma divided by 1024, rounded up
            my $alloc_size = int(($d->{size} + 1024 - 1)/1024);
            my $scfg = PVE::Storage::storage_config($cfg, $d->{storeid});

            # test if requested format is supported
            my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($cfg, $d->{storeid});
            my $supported = grep { $_ eq $d->{format} } @$validFormats;
            $d->{format} = $defFormat if !$supported;

            my $volid = PVE::Storage::vdisk_alloc($cfg, $d->{storeid}, $vmid,
                                                  $d->{format}, undef, $alloc_size);
            print STDERR "new volume ID is '$volid'\n";
            # remembered so that the error path can free the volume again
            $d->{volid} = $volid;
            my $path = PVE::Storage::path($cfg, $volid);

            my $write_zeros = 1;
            # fixme: what other storages types initialize volumes with zero?
            if ($scfg->{type} eq 'dir' || $scfg->{type} eq 'nfs' || $scfg->{type} eq 'glusterfs' ||
                $scfg->{type} eq 'sheepdog' || $scfg->{type} eq 'rbd') {
                $write_zeros = 0;
            }

            print $fifofh "${write_zeros}:$d->{devname}=$path\n";

            print "map '$d->{devname}' to '$path' (write zeros = ${write_zeros})\n";
            $map->{$virtdev} = $volid;
        }

        # second pass over the archived config: write the translated copy
        $fh->seek(0, 0) || die "seek failed - $!\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined(my $line = <$fh>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $fh->close();
        $outfd->close();
    };

    eval {
        # enable interrupts
        my $die_on_signal = sub {
            die "interrupted by signal\n";
        };
        local @SIG{qw(INT TERM QUIT HUP PIPE)} = ($die_on_signal) x 5;
        local $SIG{ALRM} = sub { die "got timeout\n"; };

        $oldtimeout = alarm($timeout);

        my $parser = sub {
            my $line = shift;

            print "$line\n";

            if ($line =~ m/^DEV:\sdev_id=(\d+)\ssize:\s(\d+)\sdevname:\s(\S+)$/) {
                my ($dev_id, $size, $devname) = ($1, $2, $3);
                $devinfo->{$devname} = { size => $size, dev_id => $dev_id };
            } elsif ($line =~ m/^CTIME: /) {
                # we correctly received the vma config, so we can disable
                # the timeout now for disk allocation (set to 10 minutes, so
                # that we always timeout if something goes wrong)
                alarm(600);
                &$print_devmap();
                print $fifofh "done\n";
                # restore the alarm that was pending when we were called
                my $tmp = $oldtimeout || 0;
                $oldtimeout = undef;
                alarm($tmp);
                close($fifofh);
            }
        };

        print "restore vma archive: $cmd\n";
        run_command($cmd, input => $input, outfunc => $parser, afterfork => $openfifo);
    };
    my $err = $@;

    alarm($oldtimeout) if $oldtimeout;

    unlink $mapfifo;

    if ($err) {
        rmtree $tmpdir;
        unlink $tmpfn;

        my $cfg = cfs_read_file('storage.cfg');
        foreach my $devname (keys %$devinfo) {
            my $volid = $devinfo->{$devname}->{volid};
            next if !$volid;
            eval {
                if ($volid =~ m|^/|) {
                    # parentheses are required: without them '||' binds to
                    # $volid and a failed unlink is never detected
                    unlink($volid) || die "unlink failed - $!\n";
                } else {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
                print STDERR "temporary volume '$volid' sucessfuly removed\n";
            };
            print STDERR "unable to cleanup '$volid' - $@" if $@;
        }
        die $err;
    }

    rmtree $tmpdir;

    rename($tmpfn, $conffile) ||
        die "unable to commit configuration file '$conffile'\n";

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
5255
# Restore VM $vmid from a tar based vzdump archive ($archive may be '-'
# for STDIN).
#
# For a file archive, the first member must be 'qemu-server.conf'. An
# existing VM is destroyed first (destroy_vm() is called with a true third
# argument). The archive is extracted through tar's --to-command, running
# /usr/lib/qemu-server/qmextract for every member; the volume mapping that
# it records in qmrestore.stat is then used to translate the archived
# config. On success the translated config replaces the VM config file and
# rescan() is run. On failure the temporary config is removed, the volumes
# listed in the statfile are cleaned up and the error is re-thrown.
#
# Options read from $opts: storage, pool, prealloc, info, unique. With
# 'info' set, nothing is read back after the extraction and no config is
# committed.
sub restore_tar_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    if ($archive ne '-') {
        my $firstfile = tar_archive_read_firstfile($archive);
        die "ERROR: file '$archive' dos not lock like a QemuServer vzdump backup\n"
            if $firstfile ne 'qemu-server.conf';
    }

    my $storecfg = cfs_read_file('storage.cfg');

    # destroy existing data - keep empty config
    my $vmcfgfn = config_file($vmid);
    destroy_vm($storecfg, $vmid, 1) if -f $vmcfgfn;

    my $tocmd = "/usr/lib/qemu-server/qmextract";

    $tocmd .= " --storage " . PVE::Tools::shellquote($opts->{storage}) if $opts->{storage};
    $tocmd .= " --pool " . PVE::Tools::shellquote($opts->{pool}) if $opts->{pool};
    $tocmd .= ' --prealloc' if $opts->{prealloc};
    $tocmd .= ' --info' if $opts->{info};

    # tar option "xf" does not autodetect compression when read from STDIN,
    # so we pipe to zcat
    my $cmd = "zcat -f|tar xf " . PVE::Tools::shellquote($archive) . " " .
        PVE::Tools::shellquote("--to-command=$tocmd");

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    mkpath $tmpdir;

    local $ENV{VZDUMP_TMPDIR} = $tmpdir;
    local $ENV{VZDUMP_VMID} = $vmid;
    local $ENV{VZDUMP_USER} = $user;

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # disable interrupts (always do cleanups)
    # Note: a hash slice is used so that all handlers are localized; with a
    # chained 'local $SIG{INT} = $SIG{TERM} = ...' only INT would be.
    my $ignore_signal = sub {
        print STDERR "got interrupt - ignored\n";
    };
    local @SIG{qw(INT TERM QUIT HUP)} = ($ignore_signal) x 4;

    eval {
        # enable interrupts
        my $die_on_signal = sub {
            die "interrupted by signal\n";
        };
        local @SIG{qw(INT TERM QUIT HUP PIPE)} = ($die_on_signal) x 5;

        if ($archive eq '-') {
            print "extracting archive from STDIN\n";
            run_command($cmd, input => "<&STDIN");
        } else {
            print "extracting archive '$archive'\n";
            run_command($cmd);
        }

        return if $opts->{info};

        # read new mapping
        my $map = {};
        my $statfile = "$tmpdir/qmrestore.stat";
        if (my $fd = IO::File->new($statfile, "r")) {
            while (defined (my $line = <$fd>)) {
                if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                    $map->{$1} = $2 if $1;
                } else {
                    print STDERR "unable to parse line in statfile - $line\n";
                }
            }
            $fd->close();
        }

        my $confsrc = "$tmpdir/qemu-server.conf";

        my $srcfd = IO::File->new($confsrc, "r") ||
            die "unable to open file '$confsrc'\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined (my $line = <$srcfd>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $srcfd->close();
        $outfd->close();
    };
    my $err = $@;

    if ($err) {

        unlink $tmpfn;

        tar_restore_cleanup($storecfg, "$tmpdir/qmrestore.stat") if !$opts->{info};

        die $err;
    }

    rmtree $tmpdir;

    # In info mode no config was written to $tmpfn, so there is nothing to
    # commit. The parentheses are required: without them '||' binds to
    # $conffile and a failed rename is never detected.
    if (!$opts->{info}) {
        rename($tmpfn, $conffile) ||
            die "unable to commit configuration file '$conffile'\n";
    }

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
5365
0d18dcfc
DM
5366
5367# Internal snapshots
5368
5369# NOTE: Snapshot create/delete involves several non-atomic
5370# action, and can take a long time.
5371# So we try to avoid locking the file and use 'lock' variable
5372# inside the config file instead.
5373
ef59d1ca
DM
# Copy all settings from $source to $dest, except snapshot bookkeeping
# (snapshots, snapstate, snaptime, vmstate), lock, digest, description
# and the unusedN entries. Existing keys in $dest are overwritten.
my $snapshot_copy_config = sub {
    my ($source, $dest) = @_;

    my %excluded = map { $_ => 1 }
        qw(snapshots snapstate snaptime vmstate lock digest description);

    foreach my $key (keys %$source) {
        next if $excluded{$key} || $key =~ m/^unused\d+$/;

        $dest->{$key} = $source->{$key};
    }
};
5390
# Build a new config from snapshot $snap: the snapshot list, the
# description and the unusedN entries are taken from the current $conf,
# everything else is copied from $snap by $snapshot_copy_config.
# Returns the new config hash; $conf itself is not modified.
my $snapshot_apply_config = sub {
    my ($conf, $snap) = @_;

    # copy snapshot list
    my $newconf = { snapshots => $conf->{snapshots} };

    # keep description and list of unused disks
    my @kept = grep { $_ eq 'description' || m/^unused\d+$/ } keys %$conf;
    foreach my $key (@kept) {
        $newconf->{$key} = $conf->{$key};
    }

    $snapshot_copy_config->($snap, $newconf);

    return $newconf;
};
5409
18bfb361
DM
# Call $func->($storeid) once for every storage referenced by a non CD-ROM
# drive of $conf, in sorted order. Drives that cannot be parsed and files
# that are not valid volume IDs are skipped.
sub foreach_writable_storage {
    my ($conf, $func) = @_;

    my %storage_ids;

    foreach my $ds (keys %$conf) {
        next if !valid_drivename($ds);

        my $drive = parse_drive($ds, $conf->{$ds});
        next if !$drive || drive_is_cdrom($drive);

        my ($sid) = PVE::Storage::parse_volume_id($drive->{file}, 1);
        $storage_ids{$sid} = 1 if $sid;
    }

    foreach my $sid (sort keys %storage_ids) {
        $func->($sid);
    }
}
5432
# Allocate the volume used to save the VM state of snapshot $snapname and
# return its volume ID.
#
# The target storage is chosen among the storages used by the VM's
# writable drives: shared storages are searched first, then non-shared
# ones; within a pass a storage with a 'path' setting (file based) wins
# over the ones seen before. 'local' is used when nothing was found.
my $alloc_vmstate_volid = sub {
    my ($storecfg, $vmid, $conf, $snapname) = @_;

    my $target;

    # one search pass, restricted to shared or to non-shared storages
    my $search = sub {
        my ($want_shared) = @_;

        foreach_writable_storage($conf, sub {
            my ($sid) = @_;
            my $scfg = PVE::Storage::storage_config($storecfg, $sid);
            return if $want_shared ? !$scfg->{shared} : $scfg->{shared};

            $target = $sid if !$target || $scfg->{path}; # prefer file based storage
        });
    };

    $search->(1);               # shared storage first
    $search->(0) if !$target;   # now search local storage

    $target = 'local' if !$target;

    # extra space reserved for the driver state, added to twice the
    # configured memory: live save is aborted after $conf->{memory}, so at
    # most twice that space is needed
    my $driver_state_size = 500;
    my $size = $conf->{memory}*2 + $driver_state_size;

    my $scfg = PVE::Storage::storage_config($storecfg, $target);
    my $name = "vm-$vmid-state-$snapname";
    $name .= ".raw" if $scfg->{path}; # add filename extension for file base storage

    return PVE::Storage::vdisk_alloc($storecfg, $target, $vmid, 'raw', $name, $size*1024);
};
5473
# First phase of snapshot creation, executed under lock_config().
#
# Sets the 'snapshot' lock, creates the entry $conf->{snapshots}->{$snapname}
# as a copy of the current config marked with snapstate 'prepare', and, if
# $save_vmstate is set and the VM is running, allocates the vmstate volume.
# Dies if the VM is a template, if the config is locked, if the name is
# already used or if the snapshot feature is not available.
# Returns the new snapshot entry.
my $snapshot_prepare = sub {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap;

    my $create_entry = sub {

        my $conf = load_config($vmid);

        if (is_template($conf)) {
            die "you can't take a snapshot if it's a template\n";
        }

        check_lock($conf);

        $conf->{lock} = 'snapshot';

        if (defined($conf->{snapshots}->{$snapname})) {
            die "snapshot name '$snapname' already used\n";
        }

        my $storecfg = PVE::Storage::config();
        if (!has_feature('snapshot', $conf, $storecfg)) {
            die "snapshot feature is not available";
        }

        $snap = {};
        $conf->{snapshots}->{$snapname} = $snap;

        if ($save_vmstate && check_running($vmid)) {
            $snap->{vmstate} = $alloc_vmstate_volid->($storecfg, $vmid, $conf, $snapname);
        }

        $snapshot_copy_config->($conf, $snap);

        $snap->{snapstate} = "prepare";
        $snap->{snaptime} = time();
        $snap->{description} = $comment if $comment;

        # always overwrite machine if we save vmstate. This makes sure we
        # can restore it later using correct machine type
        if ($snap->{vmstate}) {
            $snap->{machine} = get_current_qemu_machine($vmid);
        }

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $create_entry);

    return $snap;
};
5519
# Final phase of snapshot creation, executed under lock_config().
#
# Requires the 'snapshot' lock and a snapshot entry in state 'prepare'.
# Clears both, rebuilds the current config from the snapshot entry and
# records the snapshot as 'parent'. A 'machine' setting is only kept if
# the config had one before.
my $snapshot_commit = sub {
    my ($vmid, $snapname) = @_;

    my $finish_entry = sub {

        my $conf = load_config($vmid);

        my $lock = $conf->{lock};
        die "missing snapshot lock\n" if !($lock && $lock eq 'snapshot');

        my $has_machine_config = defined($conf->{machine});

        my $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        my $state = $snap->{snapstate};
        die "wrong snapshot state\n" if !($state && $state eq "prepare");

        delete $snap->{snapstate};
        delete $conf->{lock};

        my $newconf = $snapshot_apply_config->($conf, $snap);

        delete $newconf->{machine} if !$has_machine_config;

        $newconf->{parent} = $snapname;

        update_config_nolock($vmid, $newconf, 1);
    };

    lock_config($vmid, $finish_entry);
};
5553
22c377f0
DM
# Roll VM $vmid back to snapshot $snapname.
#
# Steps:
#  1. check that every non CD-ROM drive of the snapshot can be rolled back
#  2. under lock_config(): stop the VM and set the 'rollback' lock
#  3. roll back all volumes
#  4. under lock_config(): drop the lock, replace the current config with
#     the snapshot config and, if the snapshot has a vmstate, start the VM
#     from it
# Dies if the VM is a template, the snapshot does not exist or is
# incomplete, or if the VM is still running after the stop request.
sub snapshot_rollback {
    my ($vmid, $snapname) = @_;

    my $storecfg = PVE::Storage::config();

    my $conf = load_config($vmid);

    # look up the snapshot entry in the currently loaded $conf
    my $lookup_snapshot = sub {

        die "you can't rollback if vm is a template\n" if is_template($conf);

        my $entry = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($entry);

        return $entry;
    };

    my $snap = $lookup_snapshot->();

    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        PVE::Storage::volume_rollback_is_possible($storecfg, $drive->{file}, $snapname);
    });

    # Runs under lock_config(), which passes its extra argument through:
    # a true $prepare selects the first phase, a false one the final phase.
    my $updatefn = sub {
        my ($prepare) = @_;

        $conf = load_config($vmid);

        $snap = $lookup_snapshot->();

        die "unable to rollback to incomplete snapshot (snapstate = $snap->{snapstate})\n"
            if $snap->{snapstate};

        if ($prepare) {
            check_lock($conf);
            vm_stop($storecfg, $vmid, undef, undef, 5, undef, undef);
        }

        die "unable to rollback vm $vmid: vm is running\n"
            if check_running($vmid);

        my $forcemachine;

        if ($prepare) {
            $conf->{lock} = 'rollback';
        } else {
            die "got wrong lock\n" if !($conf->{lock} && $conf->{lock} eq 'rollback');
            delete $conf->{lock};

            my $has_machine_config = defined($conf->{machine});

            # copy snapshot config to current config
            $conf = $snapshot_apply_config->($conf, $snap);
            $conf->{parent} = $snapname;

            # Note: old code did not store 'machine', so we try to be smart
            # and guess the snapshot was generated with kvm 1.4 (pc-i440fx-1.4).
            $forcemachine = $conf->{machine} || 'pc-i440fx-1.4';
            # we remove the 'machine' configuration if not explicitly specified
            # in the original config.
            delete $conf->{machine} if $snap->{vmstate} && !$has_machine_config;
        }

        update_config_nolock($vmid, $conf, 1);

        if (!$prepare && $snap->{vmstate}) {
            my $statefile = PVE::Storage::path($storecfg, $snap->{vmstate});
            vm_start($storecfg, $vmid, $statefile, undef, undef, undef, $forcemachine);
        }
    };

    lock_config($vmid, $updatefn, 1);

    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        PVE::Storage::volume_snapshot_rollback($storecfg, $drive->{file}, $snapname);
    });

    lock_config($vmid, $updatefn, 0);
}
5651
9dcf4909
DM
# Poll "query-savevm" once per second until it reports status 'completed'.
# Dies if no status is reported or if the status is anything other than
# 'active' or 'completed'.
my $savevm_wait = sub {
    my ($vmid) = @_;

    while (1) {
        my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");
        my $status = $stat->{status};

        die "savevm not active\n" if !$status;
        last if $status eq 'completed';
        die "query-savevm returned status '$stat->{status}'\n" if $status ne 'active';

        sleep(1);
    }
};
5669
# Create snapshot $snapname of VM $vmid.
#
# After $snapshot_prepare, the volumes of all non CD-ROM drives are
# snapshotted. For a running VM this is bracketed by savevm-start and
# savevm-end; the RAM state is saved when a vmstate volume was allocated,
# otherwise the guest file systems are frozen first if the 'agent' option
# is set. On success the snapshot is committed. On failure the snapshots
# taken so far are deleted again and the error is re-thrown.
sub snapshot_create {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap = $snapshot_prepare->($vmid, $snapname, $save_vmstate, $comment);

    my $config = load_config($vmid);

    my $running = check_running($vmid);

    # freezing is not needed if we save RAM
    my $freezefs = $running && $config->{agent} && !$snap->{vmstate};

    # drives that already got their snapshot (needed for cleanup)
    my $drivehash = {};

    if ($freezefs) {
        eval { vm_mon_cmd($vmid, "guest-fsfreeze-freeze"); };
        warn "guest-fsfreeze-freeze problems - $@" if $@;
    }

    eval {
        # create internal snapshots of all drives

        my $storecfg = PVE::Storage::config();

        if ($running && $snap->{vmstate}) {
            my $path = PVE::Storage::path($storecfg, $snap->{vmstate});
            vm_mon_cmd($vmid, "savevm-start", statefile => $path);
            $savevm_wait->($vmid);
        } elsif ($running) {
            vm_mon_cmd($vmid, "savevm-start");
        }

        foreach_drive($snap, sub {
            my ($ds, $drive) = @_;

            return if drive_is_cdrom($drive);

            qemu_volume_snapshot($vmid, "drive-$ds", $storecfg, $drive->{file}, $snapname);
            $drivehash->{$ds} = 1;
        });
    };
    my $err = $@;

    if ($running) {
        eval { vm_mon_cmd($vmid, "savevm-end") };
        warn $@ if $@;

        if ($freezefs) {
            eval { vm_mon_cmd($vmid, "guest-fsfreeze-thaw"); };
            warn "guest-fsfreeze-thaw problems - $@" if $@;
        }

        # savevm-end is async, we need to wait
        while (1) {
            my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");
            last if !$stat->{bytes};

            print "savevm not yet finished\n";
            sleep(1);
        }
    }

    if ($err) {
        warn "snapshot create failed: starting cleanup\n";
        eval { snapshot_delete($vmid, $snapname, 0, $drivehash); };
        warn $@ if $@;
        die $err;
    }

    $snapshot_commit->($vmid, $snapname);
}
5751
# Delete snapshot $snapname of VM $vmid.
#
# The snapshot entry is first marked with snapstate 'delete'. Then the
# vmstate volume (if any) and the volume snapshots of all non CD-ROM
# drives are removed, and finally the entry is dropped from the config and
# parent references to it are re-linked to its own parent.
#
# With $force, errors while removing the vmstate volume or a volume
# snapshot are only warned about, and the per-volume config updates are
# skipped.
#
# Note: $drivehash is only set when called from snapshot_create. In that
# case only the drives listed in it are touched, the lock and template
# checks are skipped, and the config lock is removed at the end.
sub snapshot_delete {
    my ($vmid, $snapname, $force, $drivehash) = @_;

    # true until the final config update
    my $prepare = 1;

    my $snap;
    my $unused = [];

    # re-link (or drop) a 'parent' reference pointing to the deleted snapshot
    my $unlink_parent = sub {
        my ($confref, $new_parent) = @_;

        my $parent = $confref->{parent};
        return if !($parent && $parent eq $snapname);

        if ($new_parent) {
            $confref->{parent} = $new_parent;
        } else {
            delete $confref->{parent};
        }
    };

    # Runs under lock_config(). The optional argument names an entry to
    # remove from the snapshot: 'vmstate' or a drive name.
    my $updatefn = sub {
        my ($remove_drive) = @_;

        my $conf = load_config($vmid);

        if (!$drivehash) {
            check_lock($conf);
            die "you can't delete a snapshot if vm is a template\n"
                if is_template($conf);
        }

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        # remove parent refs
        if (!$prepare) {
            $unlink_parent->($conf, $snap->{parent});
            foreach my $sn (keys %{$conf->{snapshots}}) {
                next if $sn eq $snapname;
                $unlink_parent->($conf->{snapshots}->{$sn}, $snap->{parent});
            }
        }

        if ($remove_drive) {
            if ($remove_drive eq 'vmstate') {
                delete $snap->{$remove_drive};
            } else {
                # the drive's volume becomes an unused volume of the VM
                my $drive = parse_drive($remove_drive, $snap->{$remove_drive});
                my $volid = $drive->{file};
                delete $snap->{$remove_drive};
                add_unused_volume($conf, $volid);
            }
        }

        if ($prepare) {
            $snap->{snapstate} = 'delete';
        } else {
            delete $conf->{snapshots}->{$snapname};
            delete $conf->{lock} if $drivehash;
            foreach my $volid (@$unused) {
                add_unused_volume($conf, $volid);
            }
        }

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $updatefn);

    # now remove vmstate file

    my $storecfg = PVE::Storage::config();

    if ($snap->{vmstate}) {
        eval { PVE::Storage::vdisk_free($storecfg, $snap->{vmstate}); };
        if (my $err = $@) {
            die $err if !$force;
            warn $err;
        }
        # save changes (remove vmstate from snapshot)
        lock_config($vmid, $updatefn, 'vmstate') if !$force;
    }

    # now remove all internal snapshots
    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};

        if (!$drivehash || $drivehash->{$ds}) {
            eval { qemu_volume_snapshot_delete($vmid, "drive-$ds", $storecfg, $volid, $snapname); };
            if (my $err = $@) {
                die $err if !$force;
                warn $err;
            }
        }

        # save changes (remove drive from snapshot)
        lock_config($vmid, $updatefn, $ds) if !$force;
        push @$unused, $volid;
    });

    # now cleanup config
    $prepare = 0;
    lock_config($vmid, $updatefn);
}
5863
# Return 1 if every non-cdrom drive in $conf sits on a volume for which
# PVE::Storage::volume_has_feature() reports $feature (given $snapname and
# $running), otherwise 0. All drives are visited even after a failure.
sub has_feature {
    my ($feature, $conf, $storecfg, $snapname, $running) = @_;

    my $supported = 1;

    my $check_drive = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $ok = PVE::Storage::volume_has_feature($storecfg, $feature, $drive->{file}, $snapname, $running);
        $supported = 0 if !$ok;
    };
    foreach_drive($conf, $check_drive);

    return $supported;
}
04a69bb4
AD
5878
# Turn the drives of guest $vmid into base volumes.
#
# Every non-cdrom drive in $conf (or only the drive named $disk, if given)
# whose volume reports the 'template' storage feature is converted with
# PVE::Storage::vdisk_create_base(); the drive entry in $conf is rewritten
# to the new volume ID and the config is written out after each drive.
sub template_create {
    my ($vmid, $conf, $disk) = @_;

    my $storecfg = PVE::Storage::config();

    my $convert_drive = sub {
        my ($ds, $drive) = @_;

        # skip cdroms, and everything but $disk when a single disk was requested
        return if drive_is_cdrom($drive) || ($disk && $ds ne $disk);

        my $volid = $drive->{file};
        return unless PVE::Storage::volume_has_feature($storecfg, 'template', $volid);

        $drive->{file} = PVE::Storage::vdisk_create_base($storecfg, $volid);
        $conf->{$ds} = print_drive($vmid, $drive);
        update_config_nolock($vmid, $conf, 1);
    };

    foreach_drive($conf, $convert_drive);
}
5899
624361b3
AD
# Tell whether the guest configuration $conf describes a template.
#
# Returns 1 if $conf->{template} is defined and numerically equal to 1,
# and an explicit 0 otherwise. (Without the explicit false return the sub
# fell off its end and handed back the leftover value of the failed
# condition.)
sub is_template {
    my ($conf) = @_;

    return 1 if defined($conf->{template}) && $conf->{template} == 1;

    return 0;
}
5905
5133de42
AD
# Copy the content of volume $src_volid (optionally its snapshot $snapname)
# onto the already allocated volume $dst_volid using 'qemu-img convert'.
#
# $size is only used for the progress lines printed while qemu-img runs.
# Both volume IDs must be parseable by PVE::Storage::parse_volume_id();
# otherwise the function dies instead of silently skipping the copy and
# leaving the caller with an empty destination.
# Dies with "copy failed: ..." if qemu-img fails.
sub qemu_img_convert {
    my ($src_volid, $dst_volid, $size, $snapname) = @_;

    my $storecfg = PVE::Storage::config();
    my ($src_storeid, $src_volname) = PVE::Storage::parse_volume_id($src_volid, 1);
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid, 1);

    die "source '$src_volid' is not a valid volume ID for qemu-img convert\n"
        if !$src_storeid;
    die "destination '$dst_volid' is not a valid volume ID for qemu-img convert\n"
        if !$dst_storeid;

    my $src_scfg = PVE::Storage::storage_config($storecfg, $src_storeid);
    my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

    my $src_format = qemu_img_format($src_scfg, $src_volname);
    my $dst_format = qemu_img_format($dst_scfg, $dst_volname);

    my $src_path = PVE::Storage::path($storecfg, $src_volid, $snapname);
    my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

    my $cmd = [];
    push @$cmd, '/usr/bin/qemu-img', 'convert', '-t', 'writeback', '-p', '-n';
    # internal qcow2 snapshots are selected by name on the command line
    push @$cmd, '-s', $snapname if($snapname && $src_format eq "qcow2");
    push @$cmd, '-f', $src_format, '-O', $dst_format, $src_path, $dst_path;

    # translate qemu-img's "(NN.NN/100%)" progress output into byte counts
    my $parser = sub {
        my $line = shift;
        if($line =~ m/\((\S+)\/100\%\)/){
            my $percent = $1;
            my $transferred = int($size * $percent / 100);
            my $remaining = $size - $transferred;

            print "transferred: $transferred bytes remaining: $remaining bytes total: $size bytes progression: $percent %\n";
        }
    };

    eval { run_command($cmd, timeout => undef, outfunc => $parser); };
    my $err = $@;
    die "copy failed: $err" if $err;
}
5945
# Pick the qemu-img format name for volume $volname on storage $scfg:
#   - storages with a 'path' setting: the volume's file extension, if it is
#     one of raw/qcow2/qed/vmdk
#   - storages of type 'iscsi': "host_device"
#   - everything else: "raw"
sub qemu_img_format {
    my ($scfg, $volname) = @_;

    return $1 if $scfg->{path} && $volname =~ m/\.(raw|qcow2|qed|vmdk)$/;

    return $scfg->{type} eq 'iscsi' ? "host_device" : "raw";
}
5957
# Mirror the running guest's drive "drive-$drive" onto the already allocated
# volume $dst_volid via the QMP 'drive-mirror' block job and wait for it.
#
# Once source and target are in sync:
#   - $vmiddst == $vmid: the guest is switched to the new volume with
#     'block-job-complete'
#   - $vmiddst != $vmid: (cloning for another guest) the job is cancelled
#     with 'block-job-cancel', leaving the source drive in place
#
# If the job is at len == offset but cannot finish for more than $maxwait
# polling rounds, the guest is suspended so it stops writing. The guest is
# resumed again on every exit path, including errors.
#
# Dies with "mirroring error: ..." after trying to cancel the job.
sub qemu_drive_mirror {
    my ($vmid, $drive, $dst_volid, $vmiddst) = @_;

    my $count = 0;
    my $frozen = undef;
    my $maxwait = 120;

    my $storecfg = PVE::Storage::config();
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid);

    # result is not used below; the call is kept as in the original
    # (presumably it fails for an unknown storage - TODO confirm)
    my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

    my $format;
    if ($dst_volname =~ m/\.(raw|qcow2)$/){
        $format = $1;
    }

    my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

    my $opts = { timeout => 10, device => "drive-$drive", mode => "existing", sync => "full", target => $dst_path };
    $opts->{format} = $format if $format;

    #fixme : sometime drive-mirror timeout, but works fine after.
    # (I have see the problem with big volume > 200GB), so we need to eval
    eval { vm_mon_cmd($vmid, "drive-mirror", %$opts); };
    # ignore errors here

    eval {
        while (1) {
            my $stats = vm_mon_cmd($vmid, "query-block-jobs");
            my $stat = $stats->[0];
            die "mirroring job seem to have die. Maybe do you have bad sectors?" if !$stat;
            die "error job is not mirroring" if $stat->{type} ne "mirror";

            my $busy = $stat->{busy};

            if (my $total = $stat->{len}) {
                my $transferred = $stat->{offset} || 0;
                my $remaining = $total - $transferred;
                my $percent = sprintf "%.2f", ($transferred * 100 / $total);

                print "transferred: $transferred bytes remaining: $remaining bytes total: $total bytes progression: $percent % busy: $busy\n";
            }

            if ($stat->{len} == $stat->{offset}) {
                if ($busy eq 'false') {

                    last if $vmiddst != $vmid;

                    # try to switch the disk if source and destination are on the same guest
                    eval { vm_mon_cmd($vmid, "block-job-complete", device => "drive-$drive") };
                    last if !$@;
                    die $@ if $@ !~ m/cannot be completed/;
                }

                if ($count > $maxwait) {
                    # if too much writes to disk occurs at the end of migration
                    #the disk needs to be freezed to be able to complete the migration
                    vm_suspend($vmid,1);
                    $frozen = 1;
                }
                $count ++
            }
            sleep 1;
        }

        if ($frozen) {
            vm_resume($vmid, 1);
            $frozen = undef;
        }
    };
    my $err = $@;

    my $cancel_job = sub {
        vm_mon_cmd($vmid, "block-job-cancel", device => "drive-$drive");
        # wait until the job has disappeared from the job list
        while (1) {
            my $stats = vm_mon_cmd($vmid, "query-block-jobs");
            my $stat = $stats->[0];
            last if !$stat;
            sleep 1;
        }
    };

    if ($err) {
        # the loop died after suspending the guest (or the resume above
        # failed): never leave the guest paused because mirroring failed
        if ($frozen) {
            eval { vm_resume($vmid, 1); };
            warn "unable to resume VM $vmid after failed drive mirror: $@" if $@;
        }
        eval { &$cancel_job(); };
        die "mirroring error: $err";
    }

    if ($vmiddst != $vmid) {
        # if we clone a disk for a new target vm, we don't switch the disk
        &$cancel_job(); # so we call block-job-cancel
    }
}
6051
# Clone one drive of guest $vmid for guest $newvmid and return the drive
# description (hash ref) of the clone.
#
# $drive       - parsed drive description of the source (not modified)
# $snapname    - optional snapshot to clone from
# $storage     - optional target storage for full clones
# $format      - optional target format for full clones; falls back to the
#                drive's format, then to the storage default, and is replaced
#                by the storage default if the storage does not support it
# $full        - false: linked clone via vdisk_clone()
#                true:  allocate a new volume and copy the data, using
#                qemu_drive_mirror() when the guest is running and no
#                snapshot was requested, qemu_img_convert() otherwise
# $newvollist  - array ref; every newly created volume ID is pushed onto it
#
# The returned hash is a copy of $drive with 'file' set to the new volume,
# 'size' set to its size and 'format' reset to undef.
sub clone_disk {
    my ($storecfg, $vmid, $running, $drivename, $drive, $snapname,
        $newvmid, $storage, $format, $full, $newvollist) = @_;

    my $newvolid;

    if (!$full) {
        print "create linked clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_clone($storecfg, $drive->{file}, $newvmid, $snapname);
        push @$newvollist, $newvolid;
    } else {
        my ($storeid, $volname) = PVE::Storage::parse_volume_id($drive->{file});
        $storeid = $storage if $storage;

        my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($storecfg, $storeid);
        if (!$format) {
            $format = $drive->{format} || $defFormat;
        }

        # test if requested format is supported - else use default
        my $supported = grep { $_ eq $format } @$validFormats;
        $format = $defFormat if !$supported;

        my ($size) = PVE::Storage::volume_size_info($storecfg, $drive->{file}, 3);

        print "create full clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_alloc($storecfg, $storeid, $newvmid, $format, undef, ($size/1024));
        push @$newvollist, $newvolid;

        if (!$running || $snapname) {
            qemu_img_convert($drive->{file}, $newvolid, $size, $snapname);
        } else {
            qemu_drive_mirror($vmid, $drivename, $newvolid, $newvmid);
        }
    }

    my ($size) = PVE::Storage::volume_size_info($storecfg, $newvolid, 3);

    # work on a shallow copy: assigning the reference itself would rewrite
    # the caller's description of the source drive
    my $disk = { %$drive };
    $disk->{format} = undef;
    $disk->{file} = $newvolid;
    $disk->{size} = $size;

    return $disk;
}
6097
ff556cf2
DM
# Return the machine type name reported by the QMP 'query-machines' command
# for guest $vmid: the entry flagged 'is-current' if there is one, else the
# entry flagged 'is-default', else 'pc'.
# this only works if VM is running
sub get_current_qemu_machine {
    my ($vmid) = @_;

    my $machines = vm_qmp_command($vmid, { execute => 'query-machines', arguments => {} });

    # remember the name of the (last) entry carrying each flag
    my %name_of;
    for my $entry (@$machines) {
        for my $kind (qw(default current)) {
            $name_of{$kind} = $entry->{name} if $entry->{"is-$kind"};
        }
    }

    # fallback to the default machine if current is not supported by qemu
    return $name_of{current} || $name_of{default} || 'pc';
}
6114
4543ecf0
AD
# List the entries below "$pcisysfs/devices".
#
# Entry names are matched against DDDD:XX:YY.F (lowercase hex, single digit
# F). Returns a hash ref keyed by the "XX:YY" part; each value is an array
# ref with one { id => "XX:YY", function => F } hash per matching entry.
sub lspci {

    my %functions_of;

    my $collect = sub {
        # first argument (the entry name itself) is not needed
        my (undef, $slot, $fn) = @_;
        push @{$functions_of{$slot}}, { id => $slot, function => $fn };
    };

    dir_glob_foreach("$pcisysfs/devices", '[a-f0-9]{4}:([a-f0-9]{2}:[a-f0-9]{2})\.([0-9])', $collect);

    return \%functions_of;
}
6127
1e3baf05 61281;