]> git.proxmox.com Git - qemu-server.git/blame - PVE/QemuServer.pm
parse_vm_config: only allow 'delete' inside [PENDING]
[qemu-server.git] / PVE / QemuServer.pm
CommitLineData
1e3baf05
DM
1package PVE::QemuServer;
2
3use strict;
990fc5e2 4use warnings;
1e3baf05
DM
5use POSIX;
6use IO::Handle;
7use IO::Select;
8use IO::File;
9use IO::Dir;
10use IO::Socket::UNIX;
11use File::Basename;
12use File::Path;
13use File::stat;
14use Getopt::Long;
fc1ddcdc 15use Digest::SHA;
1e3baf05
DM
16use Fcntl ':flock';
17use Cwd 'abs_path';
18use IPC::Open3;
c971c4f2 19use JSON;
1e3baf05
DM
20use Fcntl;
21use PVE::SafeSyslog;
22use Storable qw(dclone);
23use PVE::Exception qw(raise raise_param_exc);
24use PVE::Storage;
4543ecf0 25use PVE::Tools qw(run_command lock_file lock_file_full file_read_firstline dir_glob_foreach);
b7ba6b79 26use PVE::JSONSchema qw(get_standard_option);
1e3baf05
DM
27use PVE::Cluster qw(cfs_register_file cfs_read_file cfs_write_file cfs_lock_file);
28use PVE::INotify;
29use PVE::ProcFSTools;
26f11676 30use PVE::QMPClient;
91bd6c90 31use PVE::RPCEnvironment;
6b64503e 32use Time::HiRes qw(gettimeofday);
1e3baf05 33
7f0b5beb 34my $cpuinfo = PVE::ProcFSTools::read_cpuinfo();
1e3baf05 35
# Note about locking: we use flock on the config file to protect
# against concurrent actions.
# Additionally, we have a 'lock' setting in the config file. This
# can be set to 'migrate', 'backup', 'snapshot' or 'rollback'. Most actions are not
# allowed when such a lock is set. But you can ignore this kind of
# lock with the --skiplock flag.
42
97d62eb7 43cfs_register_file('/qemu-server/',
1858638f
DM
44 \&parse_vm_config,
45 \&write_vm_config);
1e3baf05 46
3ea94c60
DM
47PVE::JSONSchema::register_standard_option('skiplock', {
48 description => "Ignore locks - only root is allowed to use this option.",
afdb31d5 49 type => 'boolean',
3ea94c60
DM
50 optional => 1,
51});
52
53PVE::JSONSchema::register_standard_option('pve-qm-stateuri', {
54 description => "Some command save/restore state from this location.",
55 type => 'string',
56 maxLength => 128,
57 optional => 1,
58});
59
8abd398b
DM
60PVE::JSONSchema::register_standard_option('pve-snapshot-name', {
61 description => "The name of the snapshot.",
62 type => 'string', format => 'pve-configid',
63 maxLength => 40,
64});
65
1e3baf05
DM
66#no warnings 'redefine';
67
# Define the fairsched syscall numbers and the KVM_GET_API_VERSION ioctl
# request as constant subs, unless they are already defined.
# The syscall numbers differ per architecture; loading dies on anything
# other than x86_64 and i386.
unless (defined(&_VZSYSCALLS_H_)) {
    eval 'sub _VZSYSCALLS_H_ () {1;}' unless defined(&_VZSYSCALLS_H_);
    require 'sys/syscall.ph';
    if (defined(&__x86_64__)) {
        eval 'sub __NR_fairsched_vcpus () {499;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_fairsched_mknod () {504;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {505;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {506;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {507;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {508;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_setluid () {501;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {502;}' unless defined(&__NR_setublimit);
    } elsif (defined(&__i386__)) {
        eval 'sub __NR_fairsched_mknod () {500;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {501;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {502;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {503;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {504;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_fairsched_vcpus () {505;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_setluid () {511;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {512;}' unless defined(&__NR_setublimit);
    } else {
        die("no fairsched syscall for this arch");
    }
    require 'asm/ioctl.ph';
    # ioctl request number 0x00 in the 0xAE ioctl group; written as a
    # complete hex literal instead of the bare '0x' prefix.
    eval 'sub KVM_GET_API_VERSION () { &_IO(0xAE, 0x00);}' unless defined(&KVM_GET_API_VERSION);
}
96
# Invoke the fairsched_mknod syscall.
# All three arguments are coerced to integers before being passed on.
# Returns the raw syscall() result (-1 on failure, with $! set).
sub fairsched_mknod {
    my ($parent, $weight, $desired) = @_;

    # call the constant sub with explicit parens so that our own @_ is
    # not implicitly forwarded to it
    return syscall(__NR_fairsched_mknod(), int($parent), int($weight), int($desired));
}
102
# Invoke the fairsched_rmnod syscall for the given id.
# The id is coerced to an integer.
# Returns the raw syscall() result (-1 on failure, with $! set).
sub fairsched_rmnod {
    my ($id) = @_;

    # explicit parens: do not forward our @_ to the constant sub
    return syscall(__NR_fairsched_rmnod(), int($id));
}
108
# Invoke the fairsched_mvpr syscall with a pid and a new id.
# Both arguments are coerced to integers.
# Returns the raw syscall() result (-1 on failure, with $! set).
sub fairsched_mvpr {
    my ($pid, $newid) = @_;

    # explicit parens: do not forward our @_ to the constant sub
    return syscall(__NR_fairsched_mvpr(), int($pid), int($newid));
}
114
# Invoke the fairsched_vcpus syscall with an id and a vcpu count.
# Both arguments are coerced to integers.
# Returns the raw syscall() result (-1 on failure, with $! set).
sub fairsched_vcpus {
    my ($id, $vcpus) = @_;

    # explicit parens: do not forward our @_ to the constant sub
    return syscall(__NR_fairsched_vcpus(), int($id), int($vcpus));
}
120
# Invoke the fairsched_rate syscall.
# $op selects the operation (fairsched_cpulimit passes FAIRSCHED_SET_RATE
# or FAIRSCHED_DROP_RATE); all arguments are coerced to integers.
# Returns the raw syscall() result (-1 on failure, with $! set).
sub fairsched_rate {
    my ($id, $op, $rate) = @_;

    # explicit parens: do not forward our @_ to the constant sub
    return syscall(__NR_fairsched_rate(), int($id), int($op), int($rate));
}
126
127use constant FAIRSCHED_SET_RATE => 0;
128use constant FAIRSCHED_DROP_RATE => 1;
129use constant FAIRSCHED_GET_RATE => 2;
130
# Set or drop the CPU rate limit for the given id.
# $limit is a percentage; it is scaled to units of 1/1024 and truncated
# to an integer. A scaled value of 0 drops the rate limit
# (FAIRSCHED_DROP_RATE), anything else sets it (FAIRSCHED_SET_RATE).
# Returns the result of fairsched_rate().
sub fairsched_cpulimit {
    my ($id, $limit) = @_;

    my $cpulim1024 = int($limit * 1024 / 100);
    my $op = $cpulim1024 ? FAIRSCHED_SET_RATE : FAIRSCHED_DROP_RATE;

    return fairsched_rate($id, $op, $cpulim1024);
}
139
140my $nodename = PVE::INotify::nodename();
141
142mkdir "/etc/pve/nodes/$nodename";
143my $confdir = "/etc/pve/nodes/$nodename/qemu-server";
144mkdir $confdir;
145
146my $var_run_tmpdir = "/var/run/qemu-server";
147mkdir $var_run_tmpdir;
148
149my $lock_dir = "/var/lock/qemu-server";
150mkdir $lock_dir;
151
152my $pcisysfs = "/sys/bus/pci";
153
1e3baf05 154my $confdesc = {
7183bd9a
AD
155 iothread => {
156 optional => 1,
157 type => 'boolean',
158 description => "Enable iothread dataplane.",
159 default => 0,
160 },
1e3baf05
DM
161 onboot => {
162 optional => 1,
163 type => 'boolean',
164 description => "Specifies whether a VM will be started during system bootup.",
165 default => 0,
166 },
167 autostart => {
168 optional => 1,
169 type => 'boolean',
170 description => "Automatic restart after crash (currently ignored).",
171 default => 0,
172 },
2ff09f52
DA
173 hotplug => {
174 optional => 1,
e8b9c17c 175 type => 'boolean',
6c52b679 176 description => "Allow hotplug for disk and network device",
2dbe827e 177 default => 0,
2ff09f52 178 },
1e3baf05
DM
179 reboot => {
180 optional => 1,
181 type => 'boolean',
182 description => "Allow reboot. If set to '0' the VM exit on reboot.",
183 default => 1,
184 },
185 lock => {
186 optional => 1,
187 type => 'string',
188 description => "Lock/unlock the VM.",
22c377f0 189 enum => [qw(migrate backup snapshot rollback)],
1e3baf05
DM
190 },
191 cpulimit => {
192 optional => 1,
193 type => 'integer',
194 description => "Limit of CPU usage in per cent. Note if the computer has 2 CPUs, it has total of 200% CPU time. Value '0' indicates no CPU limit.\n\nNOTE: This option is currently ignored.",
195 minimum => 0,
196 default => 0,
197 },
198 cpuunits => {
199 optional => 1,
200 type => 'integer',
201 description => "CPU weight for a VM. Argument is used in the kernel fair scheduler. The larger the number is, the more CPU time this VM gets. Number is relative to weights of all the other running VMs.\n\nNOTE: You can disable fair-scheduler configuration by setting this to 0.",
202 minimum => 0,
203 maximum => 500000,
204 default => 1000,
205 },
206 memory => {
207 optional => 1,
208 type => 'integer',
7878afeb 209 description => "Amount of RAM for the VM in MB. This is the maximum available memory when you use the balloon device.",
1e3baf05
DM
210 minimum => 16,
211 default => 512,
212 },
13a48620
DA
213 balloon => {
214 optional => 1,
215 type => 'integer',
8b1accf7
DM
216 description => "Amount of target RAM for the VM in MB. Using zero disables the ballon driver.",
217 minimum => 0,
218 },
219 shares => {
220 optional => 1,
221 type => 'integer',
222 description => "Amount of memory shares for auto-ballooning. The larger the number is, the more memory this VM gets. Number is relative to weights of all other running VMs. Using zero disables auto-ballooning",
223 minimum => 0,
224 maximum => 50000,
225 default => 1000,
13a48620 226 },
1e3baf05
DM
227 keyboard => {
228 optional => 1,
229 type => 'string',
230 description => "Keybord layout for vnc server. Default is read from the datacenter configuration file.",
e95fe75f 231 enum => PVE::Tools::kvmkeymaplist(),
1e3baf05
DM
232 default => 'en-us',
233 },
234 name => {
235 optional => 1,
7fabe17d 236 type => 'string', format => 'dns-name',
1e3baf05
DM
237 description => "Set a name for the VM. Only used on the configuration web interface.",
238 },
cdd20088
AD
239 scsihw => {
240 optional => 1,
241 type => 'string',
242 description => "scsi controller model",
5b952ff5 243 enum => [qw(lsi lsi53c810 virtio-scsi-pci megasas pvscsi)],
cdd20088
AD
244 default => 'lsi',
245 },
1e3baf05
DM
246 description => {
247 optional => 1,
248 type => 'string',
0581fe4f 249 description => "Description for the VM. Only used on the configuration web interface. This is saved as comment inside the configuration file.",
1e3baf05
DM
250 },
251 ostype => {
252 optional => 1,
253 type => 'string',
6b9d84cf 254 enum => [qw(other wxp w2k w2k3 w2k8 wvista win7 win8 l24 l26 solaris)],
1e3baf05
DM
255 description => <<EODESC,
256Used to enable special optimization/features for specific
257operating systems:
258
259other => unspecified OS
260wxp => Microsoft Windows XP
261w2k => Microsoft Windows 2000
262w2k3 => Microsoft Windows 2003
263w2k8 => Microsoft Windows 2008
264wvista => Microsoft Windows Vista
265win7 => Microsoft Windows 7
a70ebde3 266win8 => Microsoft Windows 8/2012
1e3baf05
DM
267l24 => Linux 2.4 Kernel
268l26 => Linux 2.6/3.X Kernel
6b9d84cf 269solaris => solaris/opensolaris/openindiania kernel
1e3baf05 270
6b9d84cf 271other|l24|l26|solaris ... no special behaviour
a70ebde3 272wxp|w2k|w2k3|w2k8|wvista|win7|win8 ... use --localtime switch
1e3baf05
DM
273EODESC
274 },
275 boot => {
276 optional => 1,
277 type => 'string',
278 description => "Boot on floppy (a), hard disk (c), CD-ROM (d), or network (n).",
279 pattern => '[acdn]{1,4}',
32baffb4 280 default => 'cdn',
1e3baf05
DM
281 },
282 bootdisk => {
283 optional => 1,
284 type => 'string', format => 'pve-qm-bootdisk',
285 description => "Enable booting from specified disk.",
03e480fc 286 pattern => '(ide|sata|scsi|virtio)\d+',
1e3baf05
DM
287 },
288 smp => {
289 optional => 1,
290 type => 'integer',
291 description => "The number of CPUs. Please use option -sockets instead.",
292 minimum => 1,
293 default => 1,
294 },
295 sockets => {
296 optional => 1,
297 type => 'integer',
298 description => "The number of CPU sockets.",
299 minimum => 1,
300 default => 1,
301 },
302 cores => {
303 optional => 1,
304 type => 'integer',
305 description => "The number of cores per socket.",
306 minimum => 1,
307 default => 1,
308 },
8a010eae
AD
309 numa => {
310 optional => 1,
311 type => 'boolean',
312 description => "Enable/disable Numa.",
313 default => 0,
314 },
3bd18e48
AD
315 maxcpus => {
316 optional => 1,
317 type => 'integer',
318 description => "Maximum cpus for hotplug.",
319 minimum => 1,
320 default => 1,
321 },
1e3baf05
DM
322 acpi => {
323 optional => 1,
324 type => 'boolean',
325 description => "Enable/disable ACPI.",
326 default => 1,
327 },
bc84dcca 328 agent => {
ab6a046f
AD
329 optional => 1,
330 type => 'boolean',
331 description => "Enable/disable Qemu GuestAgent.",
be79c214 332 default => 0,
ab6a046f 333 },
1e3baf05
DM
334 kvm => {
335 optional => 1,
336 type => 'boolean',
337 description => "Enable/disable KVM hardware virtualization.",
338 default => 1,
339 },
340 tdf => {
341 optional => 1,
342 type => 'boolean',
8c559505
DM
343 description => "Enable/disable time drift fix.",
344 default => 0,
1e3baf05 345 },
19672434 346 localtime => {
1e3baf05
DM
347 optional => 1,
348 type => 'boolean',
349 description => "Set the real time clock to local time. This is enabled by default if ostype indicates a Microsoft OS.",
350 },
351 freeze => {
352 optional => 1,
353 type => 'boolean',
354 description => "Freeze CPU at startup (use 'c' monitor command to start execution).",
355 },
356 vga => {
357 optional => 1,
358 type => 'string',
ef5e2be2 359 description => "Select VGA type. If you want to use high resolution modes (>= 1280x1024x16) then you should use option 'std' or 'vmware'. Default is 'std' for win8/win7/w2k8, and 'cirrur' for other OS types. Option 'qxl' enables the SPICE display sever. You can also run without any graphic card using a serial devive as terminal.",
2fa3151e 360 enum => [qw(std cirrus vmware qxl serial0 serial1 serial2 serial3 qxl2 qxl3 qxl4)],
1e3baf05 361 },
0ea9541d
DM
362 watchdog => {
363 optional => 1,
364 type => 'string', format => 'pve-qm-watchdog',
365 typetext => '[[model=]i6300esb|ib700] [,[action=]reset|shutdown|poweroff|pause|debug|none]',
366 description => "Create a virtual hardware watchdog device. Once enabled (by a guest action), the watchdog must be periodically polled by an agent inside the guest or else the guest will be restarted (or execute the action specified)",
367 },
1e3baf05
DM
368 startdate => {
369 optional => 1,
19672434 370 type => 'string',
1e3baf05
DM
371 typetext => "(now | YYYY-MM-DD | YYYY-MM-DDTHH:MM:SS)",
372 description => "Set the initial date of the real time clock. Valid format for date are: 'now' or '2006-06-17T16:01:21' or '2006-06-17'.",
373 pattern => '(now|\d{4}-\d{1,2}-\d{1,2}(T\d{1,2}:\d{1,2}:\d{1,2})?)',
374 default => 'now',
375 },
59411c4e
DM
376 startup => {
377 optional => 1,
378 type => 'string', format => 'pve-qm-startup',
379 typetext => '[[order=]\d+] [,up=\d+] [,down=\d+] ',
380 description => "Startup and shutdown behavior. Order is a non-negative number defining the general startup order. Shutdown in done with reverse ordering. Additionally you can set the 'up' or 'down' delay in seconds, which specifies a delay to wait before the next VM is started or stopped.",
381 },
68eda3ab
AD
382 template => {
383 optional => 1,
384 type => 'boolean',
385 description => "Enable/disable Template.",
386 default => 0,
387 },
1e3baf05
DM
388 args => {
389 optional => 1,
390 type => 'string',
391 description => <<EODESCR,
392Note: this option is for experts only. It allows you to pass arbitrary arguments to kvm, for example:
393
394args: -no-reboot -no-hpet
395EODESCR
396 },
397 tablet => {
398 optional => 1,
399 type => 'boolean',
400 default => 1,
5acbfe9e 401 description => "Enable/disable the usb tablet device. This device is usually needed to allow absolute mouse positioning with VNC. Else the mouse runs out of sync with normal VNC clients. If you're running lots of console-only guests on one host, you may consider disabling this to save some context switches. This is turned of by default if you use spice (vga=qxl).",
1e3baf05
DM
402 },
403 migrate_speed => {
404 optional => 1,
405 type => 'integer',
406 description => "Set maximum speed (in MB/s) for migrations. Value 0 is no limit.",
407 minimum => 0,
408 default => 0,
409 },
410 migrate_downtime => {
411 optional => 1,
04432191 412 type => 'number',
1e3baf05
DM
413 description => "Set maximum tolerated downtime (in seconds) for migrations.",
414 minimum => 0,
04432191 415 default => 0.1,
1e3baf05
DM
416 },
417 cdrom => {
418 optional => 1,
419 type => 'string', format => 'pve-qm-drive',
420 typetext => 'volume',
421 description => "This is an alias for option -ide2",
422 },
423 cpu => {
424 optional => 1,
425 description => "Emulated CPU type.",
426 type => 'string',
3aefd6fd 427 enum => [ qw(486 athlon pentium pentium2 pentium3 coreduo core2duo kvm32 kvm64 qemu32 qemu64 phenom Conroe Penryn Nehalem Westmere SandyBridge Haswell Broadwell Opteron_G1 Opteron_G2 Opteron_G3 Opteron_G4 Opteron_G5 host) ],
eac6899d 428 default => 'kvm64',
1e3baf05 429 },
b7ba6b79
DM
430 parent => get_standard_option('pve-snapshot-name', {
431 optional => 1,
432 description => "Parent snapshot name. This is used internally, and should not be modified.",
433 }),
982c7f12
DM
434 snaptime => {
435 optional => 1,
436 description => "Timestamp for snapshots.",
437 type => 'integer',
438 minimum => 0,
439 },
18bfb361
DM
440 vmstate => {
441 optional => 1,
442 type => 'string', format => 'pve-volume-id',
443 description => "Reference to a volume which stores the VM state. This is used internally for snapshots.",
444 },
3bafc510
DM
445 machine => {
446 description => "Specific the Qemu machine type.",
447 type => 'string',
448 pattern => '(pc|pc(-i440fx)?-\d+\.\d+|q35|pc-q35-\d+\.\d+)',
449 maxLength => 40,
450 optional => 1,
451 },
2796e7d5
DM
452 smbios1 => {
453 description => "Specify SMBIOS type 1 fields.",
454 type => 'string', format => 'pve-qm-smbios1',
455 typetext => "[manufacturer=str][,product=str][,version=str][,serial=str] [,uuid=uuid][,sku=str][,family=str]",
456 maxLength => 256,
457 optional => 1,
458 },
1e3baf05
DM
459};
460
461# what about other qemu settings ?
462#cpu => 'string',
463#machine => 'string',
464#fda => 'file',
465#fdb => 'file',
466#mtdblock => 'file',
467#sd => 'file',
468#pflash => 'file',
469#snapshot => 'bool',
470#bootp => 'file',
471##tftp => 'dir',
472##smb => 'dir',
473#kernel => 'file',
474#append => 'string',
475#initrd => 'file',
476##soundhw => 'string',
477
478while (my ($k, $v) = each %$confdesc) {
479 PVE::JSONSchema::register_standard_option("pve-qm-$k", $v);
480}
481
482my $MAX_IDE_DISKS = 4;
f62db2a4 483my $MAX_SCSI_DISKS = 14;
a2650619 484my $MAX_VIRTIO_DISKS = 16;
cdb0931f 485my $MAX_SATA_DISKS = 6;
1e3baf05 486my $MAX_USB_DEVICES = 5;
5bdcf937 487my $MAX_NETS = 32;
1e3baf05 488my $MAX_UNUSED_DISKS = 8;
5cffb2d2 489my $MAX_HOSTPCI_DEVICES = 4;
bae179aa 490my $MAX_SERIAL_PORTS = 4;
1989a89c 491my $MAX_PARALLEL_PORTS = 3;
2ed5d572
AD
492my $MAX_NUMA = 8;
493
494my $numadesc = {
495 optional => 1,
496 type => 'string', format => 'pve-qm-numanode',
497 typetext => "cpus=<id[-id],memory=<mb>[[,hostnodes=<id[-id]>][,policy=<preferred|bind|interleave>]]",
498 description => "numa topology",
499};
500PVE::JSONSchema::register_standard_option("pve-qm-numanode", $numadesc);
501
502for (my $i = 0; $i < $MAX_NUMA; $i++) {
503 $confdesc->{"numa$i"} = $numadesc;
504}
1e3baf05
DM
505
506my $nic_model_list = ['rtl8139', 'ne2k_pci', 'e1000', 'pcnet', 'virtio',
e4c6e0b8 507 'ne2k_isa', 'i82551', 'i82557b', 'i82559er', 'vmxnet3'];
6b64503e 508my $nic_model_list_txt = join(' ', sort @$nic_model_list);
1e3baf05 509
1e3baf05
DM
510my $netdesc = {
511 optional => 1,
512 type => 'string', format => 'pve-qm-net',
a9410357 513 typetext => "MODEL=XX:XX:XX:XX:XX:XX [,bridge=<dev>][,queues=<nbqueues>][,rate=<mbps>][,tag=<vlanid>][,firewall=0|1]",
1e3baf05 514 description => <<EODESCR,
19672434 515Specify network devices.
1e3baf05
DM
516
517MODEL is one of: $nic_model_list_txt
518
19672434 519XX:XX:XX:XX:XX:XX should be an unique MAC address. This is
1e3baf05
DM
520automatically generated if not specified.
521
522The bridge parameter can be used to automatically add the interface to a bridge device. The Proxmox VE standard bridge is called 'vmbr0'.
523
524Option 'rate' is used to limit traffic bandwidth from and to this interface. It is specified as floating point number, unit is 'Megabytes per second'.
525
526If you specify no bridge, we create a kvm 'user' (NATed) network device, which provides DHCP and DNS services. The following addresses are used:
527
52810.0.2.2 Gateway
52910.0.2.3 DNS Server
53010.0.2.4 SMB Server
531
532The DHCP server assign addresses to the guest starting from 10.0.2.15.
533
534EODESCR
535};
536PVE::JSONSchema::register_standard_option("pve-qm-net", $netdesc);
537
538for (my $i = 0; $i < $MAX_NETS; $i++) {
539 $confdesc->{"net$i"} = $netdesc;
540}
541
542my $drivename_hash;
19672434 543
1e3baf05
DM
544my $idedesc = {
545 optional => 1,
546 type => 'string', format => 'pve-qm-drive',
8d87f8aa 547 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
3c770faa 548 description => "Use volume as IDE hard disk or CD-ROM (n is 0 to " .($MAX_IDE_DISKS -1) . ").",
1e3baf05
DM
549};
550PVE::JSONSchema::register_standard_option("pve-qm-ide", $idedesc);
551
552my $scsidesc = {
553 optional => 1,
554 type => 'string', format => 'pve-qm-drive',
8d87f8aa 555 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
3c770faa 556 description => "Use volume as SCSI hard disk or CD-ROM (n is 0 to " . ($MAX_SCSI_DISKS - 1) . ").",
1e3baf05
DM
557};
558PVE::JSONSchema::register_standard_option("pve-qm-scsi", $scsidesc);
559
cdb0931f
DA
560my $satadesc = {
561 optional => 1,
562 type => 'string', format => 'pve-qm-drive',
8d87f8aa 563 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
3c770faa 564 description => "Use volume as SATA hard disk or CD-ROM (n is 0 to " . ($MAX_SATA_DISKS - 1). ").",
cdb0931f
DA
565};
566PVE::JSONSchema::register_standard_option("pve-qm-sata", $satadesc);
567
1e3baf05
DM
568my $virtiodesc = {
569 optional => 1,
570 type => 'string', format => 'pve-qm-drive',
8d87f8aa 571 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
3c770faa 572 description => "Use volume as VIRTIO hard disk (n is 0 to " . ($MAX_VIRTIO_DISKS - 1) . ").",
1e3baf05
DM
573};
574PVE::JSONSchema::register_standard_option("pve-qm-virtio", $virtiodesc);
575
576my $usbdesc = {
577 optional => 1,
578 type => 'string', format => 'pve-qm-usb-device',
80401dd8 579 typetext => 'host=HOSTUSBDEVICE|spice',
1e3baf05 580 description => <<EODESCR,
2fe1a152 581Configure an USB device (n is 0 to 4). This can be used to
1e3baf05
DM
582pass-through usb devices to the guest. HOSTUSBDEVICE syntax is:
583
19672434 584'bus-port(.port)*' (decimal numbers) or
1e3baf05
DM
585'vendor_id:product_id' (hexadeciaml numbers)
586
19672434 587You can use the 'lsusb -t' command to list existing usb devices.
1e3baf05
DM
588
589Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
590
80401dd8
DM
591The value 'spice' can be used to add a usb redirection devices for spice.
592
1e3baf05
DM
593EODESCR
594};
595PVE::JSONSchema::register_standard_option("pve-qm-usb", $usbdesc);
596
040b06b7
DA
597my $hostpcidesc = {
598 optional => 1,
599 type => 'string', format => 'pve-qm-hostpci',
2e3b7e2a 600 typetext => "[host=]HOSTPCIDEVICE [,driver=kvm|vfio] [,rombar=on|off] [,pcie=0|1] [,x-vga=on|off]",
040b06b7
DA
601 description => <<EODESCR,
602Map host pci devices. HOSTPCIDEVICE syntax is:
603
604'bus:dev.func' (hexadecimal numbers)
605
606You can us the 'lspci' command to list existing pci devices.
607
0cea6a01
DM
608The 'rombar' option determines whether or not the device's ROM will be visible in the guest's memory map (default is 'on').
609
040b06b7
DA
610Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
611
612Experimental: user reported problems with this option.
613EODESCR
614};
615PVE::JSONSchema::register_standard_option("pve-qm-hostpci", $hostpcidesc);
616
bae179aa
DA
617my $serialdesc = {
618 optional => 1,
ca0cef26 619 type => 'string',
1b0b51ed 620 pattern => '(/dev/.+|socket)',
bae179aa 621 description => <<EODESCR,
1b0b51ed 622Create a serial device inside the VM (n is 0 to 3), and pass through a host serial device (i.e. /dev/ttyS0), or create a unix socket on the host side (use 'qm terminal' to open a terminal connection).
bae179aa
DA
623
624Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
625
626Experimental: user reported problems with this option.
627EODESCR
628};
bae179aa 629
1989a89c
DA
630my $paralleldesc= {
631 optional => 1,
ca0cef26 632 type => 'string',
9ecc8431 633 pattern => '/dev/parport\d+|/dev/usb/lp\d+',
1989a89c 634 description => <<EODESCR,
19672434 635Map host parallel devices (n is 0 to 2).
1989a89c
DA
636
637Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
638
639Experimental: user reported problems with this option.
640EODESCR
641};
1989a89c
DA
642
643for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
644 $confdesc->{"parallel$i"} = $paralleldesc;
645}
646
bae179aa
DA
647for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
648 $confdesc->{"serial$i"} = $serialdesc;
649}
650
040b06b7
DA
651for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
652 $confdesc->{"hostpci$i"} = $hostpcidesc;
653}
1e3baf05
DM
654
655for (my $i = 0; $i < $MAX_IDE_DISKS; $i++) {
656 $drivename_hash->{"ide$i"} = 1;
657 $confdesc->{"ide$i"} = $idedesc;
658}
659
cdb0931f
DA
660for (my $i = 0; $i < $MAX_SATA_DISKS; $i++) {
661 $drivename_hash->{"sata$i"} = 1;
662 $confdesc->{"sata$i"} = $satadesc;
663}
664
1e3baf05
DM
665for (my $i = 0; $i < $MAX_SCSI_DISKS; $i++) {
666 $drivename_hash->{"scsi$i"} = 1;
667 $confdesc->{"scsi$i"} = $scsidesc ;
668}
669
670for (my $i = 0; $i < $MAX_VIRTIO_DISKS; $i++) {
671 $drivename_hash->{"virtio$i"} = 1;
672 $confdesc->{"virtio$i"} = $virtiodesc;
673}
674
675for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
676 $confdesc->{"usb$i"} = $usbdesc;
677}
678
679my $unuseddesc = {
680 optional => 1,
681 type => 'string', format => 'pve-volume-id',
682 description => "Reference to unused volumes.",
683};
684
685for (my $i = 0; $i < $MAX_UNUSED_DISKS; $i++) {
686 $confdesc->{"unused$i"} = $unuseddesc;
687}
688
# Cached result of kvm_version(); 0 means "not determined yet".
my $kvm_api_version = 0;

# Return the value obtained from the KVM_GET_API_VERSION ioctl on /dev/kvm.
# The value is cached after the first successful query. Returns 0 if
# /dev/kvm cannot be opened or the ioctl does not yield a true value.
sub kvm_version {

    return $kvm_api_version if $kvm_api_version;

    # pass the open mode as a separate argument instead of encoding it
    # into the file name
    my $fh = IO::File->new("/dev/kvm", "r") ||
        return 0;

    if (my $v = $fh->ioctl(KVM_GET_API_VERSION(), 0)) {
        $kvm_api_version = $v;
    }

    $fh->close();

    return $kvm_api_version;
}
706
# Cached result of kvm_user_version().
my $kvm_user_version;

# Return the version of the 'kvm' binary as printed in the first line of
# 'kvm -help' (for example '2.1' or '2.1.3'), or the string 'unknown' if
# that output does not start with the expected banner. The result is
# cached, so the command is executed at most once per process.
sub kvm_user_version {

    return $kvm_user_version if $kvm_user_version;

    $kvm_user_version = 'unknown';

    my $tmp = `kvm -help 2>/dev/null`;

    # backticks may yield undef when nothing could be executed
    if (defined($tmp) &&
        $tmp =~ m/^QEMU(?: PC)? emulator version (\d+\.\d+(?:\.\d+)?)[,\s]/) {
        $kvm_user_version = $1;
    }

    return $kvm_user_version;
}
724
725my $kernel_has_vhost_net = -c '/dev/vhost-net';
726
# Return the list of all valid disk option names (ide0.., scsi0..,
# virtio0.., sata0..), each bus limited by its $MAX_*_DISKS setting.
sub disknames {
    # order is important - used to autoselect boot disk
    return ((map { "ide$_" } (0 .. ($MAX_IDE_DISKS - 1))),
            (map { "scsi$_" } (0 .. ($MAX_SCSI_DISKS - 1))),
            (map { "virtio$_" } (0 .. ($MAX_VIRTIO_DISKS - 1))),
            (map { "sata$_" } (0 .. ($MAX_SATA_DISKS - 1))));
}
734
# Return true if $dev is a known drive name, i.e. a key registered in
# $drivename_hash (ideN, sataN, scsiN, virtioN).
sub valid_drivename {
    my $dev = shift;

    return defined($drivename_hash->{$dev});
}
740
# Return true if $key is a known VM configuration option, i.e. it has
# an entry in $confdesc.
sub option_exists {
    my $key = shift;

    return defined($confdesc->{$key});
}
1e3baf05
DM
745
# Return the array reference holding the supported NIC model names.
# Note: this is the shared list itself, not a copy.
sub nic_models {
    return $nic_model_list;
}
749
# Return a hash reference mapping ostype identifiers to human readable
# operating system names. A new hash is built on every call.
sub os_list_description {

    return {
        other => 'Other',
        wxp => 'Windows XP',
        w2k => 'Windows 2000',
        w2k3 => 'Windows 2003',
        w2k8 => 'Windows 2008',
        wvista => 'Windows Vista',
        win7 => 'Windows 7',
        win8 => 'Windows 8/2012',
        l24 => 'Linux 2.4',
        l26 => 'Linux 2.6',
    };
}
765
1e3baf05
DM
# Cached result of get_cdrom_path().
my $cdrom_path;

# Return the first of /dev/cdrom, /dev/cdrom1 and /dev/cdrom2 that exists
# as a symbolic link, or undef if none does. A found path is cached.
sub get_cdrom_path {

    return $cdrom_path if $cdrom_path;

    foreach my $candidate (qw(/dev/cdrom /dev/cdrom1 /dev/cdrom2)) {
        return $cdrom_path = $candidate if -l $candidate;
    }

    # make the "nothing found" result explicit instead of relying on the
    # value of the last evaluated file test
    return undef;
}
776
# Resolve a cdrom specification to a path:
#   'cdrom'         -> result of get_cdrom_path()
#   'none'          -> empty string
#   absolute path   -> returned unchanged
#   anything else   -> resolved via PVE::Storage::path() using $storecfg
# $vmid is accepted but not used here.
sub get_iso_path {
    my ($storecfg, $vmid, $cdrom) = @_;

    if ($cdrom eq 'cdrom') {
        return get_cdrom_path();
    } elsif ($cdrom eq 'none') {
        return '';
    } elsif ($cdrom =~ m|^/|) {
        return $cdrom;
    } else {
        return PVE::Storage::path($storecfg, $cdrom);
    }
}
790
# try to convert old style file names to volume IDs
#
# 'none', 'cdrom', '/dev/...' paths and values that already look like
# 'storage:volume' are returned unchanged. A plain file name is mapped
# to 'local:iso/<file>' when $media is 'cdrom', else 'local:<vmid>/<file>'.
# Any other value containing a '/' cannot be converted: returns undef.
sub filename_to_volume_id {
    my ($vmid, $file, $media) = @_;

    my $keep_as_is = $file eq 'none' || $file eq 'cdrom' ||
        $file =~ m|^/dev/.+| || $file =~ m/^([^:]+):(.+)$/;

    return $file if $keep_as_is;

    return undef if $file =~ m|/|;

    if ($media && $media eq 'cdrom') {
        return "local:iso/$file";
    }

    return "local:$vmid/$file";
}
809
# Check that the storage content type $vtype matches the drive's media
# setting: media 'disk' expects 'images', media 'cdrom' expects 'iso'.
# Returns without doing anything if $media is not set. Dies with
# "internal error" for any other media value, and raises a parameter
# exception keyed by $opt when the types do not match.
sub verify_media_type {
    my ($opt, $vtype, $media) = @_;

    return if !$media;

    my $expected_type = {
        disk => 'images',
        cdrom => 'iso',
    };

    my $etype = $expected_type->{$media};
    die "internal error" if !defined($etype);

    return if ($vtype eq $etype);

    raise_param_exc({ $opt => "unexpected media type ($vtype != $etype)" });
}
828
# Normalize the 'file' and 'media' entries of a parsed drive hash in place.
#
# If $drive->{file} is a filesystem path (not 'cdrom'/'none', not a /dev/
# path, not a 'storage:volume' id and not a plain number), it is converted
# to a volume id via PVE::Storage::path_to_volume_id(). A parameter
# exception keyed by $opt is raised when no storage matches the path or
# the content type contradicts the media setting. The media defaults to
# 'cdrom' for iso volumes and for the special files 'cdrom' and 'none'.
sub cleanup_drive_path {
    my ($opt, $storecfg, $drive) = @_;

    # try to convert filesystem paths to volume IDs

    if (($drive->{file} !~ m/^(cdrom|none)$/) &&
        ($drive->{file} !~ m|^/dev/.+|) &&
        ($drive->{file} !~ m/^([^:]+):(.+)$/) &&
        ($drive->{file} !~ m/^\d+$/)) {
        my ($vtype, $volid) = PVE::Storage::path_to_volume_id($storecfg, $drive->{file});
        raise_param_exc({ $opt => "unable to associate path '$drive->{file}' to any storage"}) if !$vtype;
        $drive->{media} = 'cdrom' if !$drive->{media} && $vtype eq 'iso';
        verify_media_type($opt, $vtype, $drive->{media});
        $drive->{file} = $volid;
    }

    $drive->{media} = 'cdrom' if !$drive->{media} && $drive->{file} =~ m/^(cdrom|none)$/;
}
847
# Write a new configuration file for VM $vmid from the $settings hash,
# without taking any lock.
#
# Dies if the configuration file already exists. Missing 'name' and
# 'memory' settings are filled in ("vm$vmid" and the default memory);
# note that this modifies the caller's $settings hash. Only options known
# to $confdesc are written, one "key: value" line each, sorted by key.
sub create_conf_nolock {
    my ($vmid, $settings) = @_;

    my $filename = config_file($vmid);

    die "configuration file '$filename' already exists\n" if -f $filename;

    my $defaults = load_defaults();

    $settings->{name} = "vm$vmid" if !$settings->{name};
    $settings->{memory} = $defaults->{memory} if !$settings->{memory};

    my $data = '';
    foreach my $opt (sort keys %$settings) {
        next if !$confdesc->{$opt};

        my $value = $settings->{$opt};
        # skip unset/empty values only - an explicit 0 (for example
        # 'acpi: 0' or 'balloon: 0') is a meaningful setting and must
        # be written
        next if !defined($value) || $value eq '';

        $data .= "$opt: $value\n";
    }

    PVE::Tools::file_set_contents($filename, $data);
}
872
f36ed4f4
DM
# Parse a size string such as '512', '1.5M' or '4G' into a number of
# bytes. The optional suffix K, M or G multiplies by 1024, 1024^2 or
# 1024^3; the result is truncated to an integer. Returns undef if the
# value is undefined or does not match that format.
my $parse_size = sub {
    my ($value) = @_;

    return undef if !defined($value);
    return undef if $value !~ m/^(\d+(?:\.\d+)?)([KMG])?$/;
    my ($size, $unit) = ($1, $2);

    my $factor = {
        K => 1024,
        M => 1024 * 1024,
        G => 1024 * 1024 * 1024,
    };

    $size = $size * $factor->{$unit} if $unit;

    return int($size);
};
889
# Format a byte count using the largest of the units K, M, G (powers of
# 1024) that represents it exactly; a count that is not a multiple of
# 1024 is returned as a plain number. The input is truncated to an
# integer first.
my $format_size = sub {
    my ($size) = @_;

    $size = int($size);

    my $unit = '';
    foreach my $next_unit (qw(K M G)) {
        my $scaled = int($size / 1024);
        # stop as soon as the next larger unit would lose precision
        return "$size$unit" if $scaled * 1024 != $size;
        ($size, $unit) = ($scaled, $next_unit);
    }

    return "$size$unit";
};
906
1e3baf05
DM
# ideX = [volume=]volume-id[,media=disk|cdrom][,cyls=c,heads=h,secs=s[,trans=none|lba|auto]]
#        [,snapshot=on|off][,cache=off|none|writethrough|writeback|unsafe|directsync]
#        [,format=f][,backup=yes|no][,size=n[K|M|G]]
#        [,rerror=ignore|report|stop][,werror=enospc|ignore|report|stop]
#        [,aio=native|threads][,discard=ignore|on]
#        [,mbps*=n][,bps*=n][,iops*=n]
#
# Parse a drive property string into a hash reference.
#
# $key is the option name (e.g. 'virtio0'); it is split into {interface}
# and {index}. $key may be undef, which is used to verify JSON parameters.
# 'volume' is stored as {file}; bps, bps_rd and bps_wr are converted to
# the corresponding mbps* key (value in MB, three decimals). {size} is
# converted to bytes.
#
# Returns undef on any syntax or consistency error, including an option
# that is given twice (also when the same limit is given both as bps*
# and as mbps*).
sub parse_drive {
    my ($key, $data) = @_;

    my $res = {};

    # $key may be undefined - used to verify JSON parameters
    if (!defined($key)) {
        $res->{interface} = 'unknown'; # should not harm when used to verify parameters
        $res->{index} = 0;
    } elsif ($key =~ m/^([^\d]+)(\d+)$/) {
        $res->{interface} = $1;
        $res->{index} = $2;
    } else {
        return undef;
    }

    foreach my $p (split (/,/, $data)) {
        next if $p =~ m/^\s*$/;

        if ($p =~ m/^(file|volume|cyls|heads|secs|trans|media|snapshot|cache|format|rerror|werror|backup|aio|bps|mbps|mbps_max|bps_rd|mbps_rd|mbps_rd_max|bps_wr|mbps_wr|mbps_wr_max|iops|iops_max|iops_rd|iops_rd_max|iops_wr|iops_wr_max|size|discard)=(.+)$/) {
            my ($k, $v) = ($1, $2);

            $k = 'file' if $k eq 'volume';

            # Normalize bytes/s to MB/s *before* the duplicate check, so
            # that "mbps=..,bps=.." is detected as the same option.
            if ($k eq 'bps' || $k eq 'bps_rd' || $k eq 'bps_wr') {
                return undef if !$v || $v !~ m/^\d+(?:\.\d+)?$/;
                $k = "m$k";
                $v = sprintf("%.3f", $v / (1024*1024));
            }

            return undef if defined $res->{$k};

            $res->{$k} = $v;
        } else {
            # a bare word (no '=') is the volume, but only once
            if (!$res->{file} && $p !~ m/=/) {
                $res->{file} = $p;
            } else {
                return undef;
            }
        }
    }

    return undef if !$res->{file};

    # a known image file extension overrides any explicit format
    if ($res->{file} =~ m/\.(raw|cow|qcow|qcow2|vmdk|cloop)$/) {
        $res->{format} = $1;
    }

    my $integer_re = qr/^\d+$/;
    my $number_re = qr/^\d+(\.\d+)?$/;

    # allowed values per option; false values ('' or 0) are not checked
    my %value_pattern = (
        cache => qr/^(off|none|writethrough|writeback|unsafe|directsync)$/,
        snapshot => qr/^(on|off)$/,
        cyls => $integer_re,
        heads => $integer_re,
        secs => $integer_re,
        media => qr/^(disk|cdrom)$/,
        trans => qr/^(none|lba|auto)$/,
        format => qr/^(raw|cow|qcow|qcow2|vmdk|cloop)$/,
        rerror => qr/^(ignore|report|stop)$/,
        werror => qr/^(enospc|ignore|report|stop)$/,
        backup => qr/^(yes|no)$/,
        aio => qr/^(native|threads)$/,
        discard => qr/^(ignore|on)$/,
        mbps => $number_re,
        mbps_max => $number_re,
        mbps_rd => $number_re,
        mbps_rd_max => $number_re,
        mbps_wr => $number_re,
        mbps_wr_max => $number_re,
        iops => $integer_re,
        iops_max => $integer_re,
        iops_rd => $integer_re,
        iops_rd_max => $integer_re,
        iops_wr => $integer_re,
        iops_wr_max => $integer_re,
    );

    foreach my $opt (keys %value_pattern) {
        my $v = $res->{$opt};
        return undef if $v && $v !~ $value_pattern{$opt};
    }

    # a total limit excludes separate read/write limits
    return undef if $res->{mbps_rd} && $res->{mbps};
    return undef if $res->{mbps_wr} && $res->{mbps};
    return undef if $res->{iops_rd} && $res->{iops};
    return undef if $res->{iops_wr} && $res->{iops};

    if ($res->{size}) {
        return undef if !defined($res->{size} = $parse_size->($res->{size}));
    }

    if ($res->{media} && ($res->{media} eq 'cdrom')) {
        return undef if $res->{snapshot} || $res->{trans} || $res->{format};
        return undef if $res->{heads} || $res->{secs} || $res->{cyls};
        return undef if $res->{interface} eq 'virtio';
    }

    # rerror does not work with scsi drives
    if ($res->{rerror}) {
        return undef if $res->{interface} eq 'scsi';
    }

    return $res;
}
1013
my @qemu_drive_options = qw(heads secs cyls trans media format cache snapshot rerror werror aio discard iops iops_rd iops_wr iops_max iops_rd_max iops_wr_max);

# Serialize a parsed drive hash back into its configuration string:
# the volume ({file}) followed by ",option=value" for every option that
# has a true value, then ",size=..." formatted with $format_size.
# $vmid is accepted but not used here.
sub print_drive {
    my ($vmid, $drive) = @_;

    my @config_only_options = qw(mbps mbps_rd mbps_wr mbps_max mbps_rd_max mbps_wr_max backup);

    my @parts = ($drive->{file});
    foreach my $name (@qemu_drive_options, @config_only_options) {
        push @parts, "$name=$drive->{$name}" if $drive->{$name};
    }

    push @parts, "size=" . $format_size->($drive->{size}) if $drive->{size};

    return join(',', @parts);
}
1030
28ef82d3
DM
# Send a SCSI INQUIRY to the device behind file handle $fh using the
# SG_IO ioctl.
#
# Returns a hash reference with the keys vendor, product, revision,
# removable (0/1) and type, all taken from the 36 byte inquiry response.
# On failure the function dies, or returns undef if $noerr is true.
sub scsi_inquiry {
    my($fh, $noerr) = @_;

    my $SG_IO = 0x2285;
    my $SG_GET_VERSION_NUM = 0x2282;

    my $versionbuf = "\x00" x 8;
    my $ret = ioctl($fh, $SG_GET_VERSION_NUM, $versionbuf);
    if (!$ret) {
        die "scsi ioctl SG_GET_VERSION_NUM failed - $!\n" if !$noerr;
        return undef;
    }
    my $version = unpack("I", $versionbuf);
    if ($version < 30000) {
        die "scsi generic interface too old\n"  if !$noerr;
        return undef;
    }

    my $buf = "\x00" x 36;
    my $sensebuf = "\x00" x 8;
    # 6 byte command block: opcode 0x12, allocation length 36 in byte 4
    my $cmd = pack("C x3 C x1", 0x12, 36);

    # see /usr/include/scsi/sg.h
    my $sg_io_hdr_t = "i i C C s I P P P I I i P C C C C S S i I I";

    my $packet = pack($sg_io_hdr_t, ord('S'), -3, length($cmd),
                      length($sensebuf), 0, length($buf), $buf,
                      $cmd, $sensebuf, 6000);

    $ret = ioctl($fh, $SG_IO, $packet);
    if (!$ret) {
        die "scsi ioctl SG_IO failed - $!\n" if !$noerr;
        return undef;
    }

    # fields 17 and 18 are the two 'S' entries of the template above
    # (host_status/driver_status in sg.h - TODO confirm against header)
    my @res = unpack($sg_io_hdr_t, $packet);
    if ($res[17] || $res[18]) {
        die "scsi ioctl SG_IO status error - $!\n" if !$noerr;
        return undef;
    }

    my $res = {};
    (my $byte0, my $byte1, $res->{vendor},
     $res->{product}, $res->{revision}) = unpack("C C x6 A8 A16 A4", $buf);

    # bit 7 of byte 1 is the removable flag, low 5 bits of byte 0 the type
    $res->{removable} = $byte1 & 128 ? 1 : 0;
    $res->{type} = $byte0 & 31;

    return $res;
}
1081
# Open $path read/write and run scsi_inquiry() on it without raising
# errors. Returns the inquiry hash, or undef if the path cannot be
# opened or the inquiry fails.
sub path_is_scsi {
    my ($path) = @_;

    # Pass the mode separately: with "+<$path" the path went through
    # 2-arg open parsing, which strips surrounding whitespace from it.
    my $fh = IO::File->new($path, '+<') || return undef;
    my $res = scsi_inquiry($fh, 1);
    close($fh);

    return $res;
}
1091
db656e5f
DM
# Return 1 if the VM's 'machine' setting contains "q35", otherwise 0.
sub machine_type_is_q35 {
    my ($conf) = @_;

    my $machine = $conf->{machine};
    return 0 if !$machine;

    return ($machine =~ m/q35/) ? 1 : 0;
}
1097
# Build the device string for the USB tablet. The tablet is attached to
# the "ehci" bus on q35 machines and to "uhci" otherwise.
sub print_tabletdevice_full {
    my ($conf) = @_;

    # we use uhci for old VMs because tablet driver was buggy in older qemu
    my $bus = machine_type_is_q35($conf) ? "ehci" : "uhci";

    return "usb-tablet,id=tablet,bus=${bus}.0,port=1";
}
1108
# Build the device description string for one drive.
#
# The result depends on $drive->{interface}:
#   virtio - virtio-blk-pci with the address from print_pci_addr()
#   scsi   - scsi-hd/cd/block/generic, addressed differently for lsi
#            and non-lsi controllers ($conf->{scsihw})
#   ide    - ide-hd or ide-cd, two units per controller
#   sata   - ide-drive on an ahci bus, $MAX_SATA_DISKS per controller
# Any other interface is a fatal error. ",bootindex=N" is appended when
# the drive has a boot index.
sub print_drivedevice_full {
    my ($storecfg, $conf, $vmid, $drive, $bridges) = @_;

    my $interface = $drive->{interface};
    my $index = $drive->{index};
    my $drive_id = "${interface}${index}";

    my $device = '';

    if ($interface eq 'virtio') {
        my $pciaddr = print_pci_addr($drive_id, $bridges);
        $device = "virtio-blk-pci,drive=drive-$drive_id,id=$drive_id$pciaddr";
        $device .= ",iothread=iothread0" if $conf->{iothread};
    } elsif ($interface eq 'scsi') {
        # lsi (the default) takes 7 units per controller, others 256
        my $is_lsi = !$conf->{scsihw} || ($conf->{scsihw} =~ m/^lsi/);
        my $maxdev = $is_lsi ? 7 : 256;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;

        my $devicetype = 'hd';
        if (drive_is_cdrom($drive)) {
            $devicetype = 'cd';
        } else {
            my $file = $drive->{file};
            my $path = ($file =~ m|^/|) ? $file : PVE::Storage::path($storecfg, $file);

            if ($path =~ m/^iscsi\:\/\//) {
                $devicetype = 'generic';
            } elsif (my $info = path_is_scsi($path)) {
                if ($info->{type} == 0) {
                    $devicetype = 'block';
                } elsif ($info->{type} == 1) { # tape
                    $devicetype = 'generic';
                }
            }
        }

        if ($is_lsi) {
            $device = "scsi-$devicetype,bus=scsihw$controller.0,scsi-id=$unit,drive=drive-$drive_id,id=$drive_id";
        } else {
            $device = "scsi-$devicetype,bus=scsihw$controller.0,channel=0,scsi-id=0,lun=$index,drive=drive-$drive_id,id=$drive_id";
        }
    } elsif ($interface eq 'ide') {
        my $maxdev = 2;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;
        my $devicetype = ($drive->{media} && $drive->{media} eq 'cdrom') ? "cd" : "hd";

        $device = "ide-$devicetype,bus=ide.$controller,unit=$unit,drive=drive-$drive_id,id=$drive_id";
    } elsif ($interface eq 'sata') {
        my $controller = int($index / $MAX_SATA_DISKS);
        my $unit = $index % $MAX_SATA_DISKS;
        $device = "ide-drive,bus=ahci$controller.$unit,drive=drive-$drive_id,id=$drive_id";
    } elsif ($interface eq 'usb') {
        die "implement me";
        # -device ide-drive,bus=ide.1,unit=0,drive=drive-ide0-1-0,id=ide0-1-0
    } else {
        die "unsupported interface type";
    }

    $device .= ",bootindex=$drive->{bootindex}" if $drive->{bootindex};

    return $device;
}
1175
# Return the value of the first "InitiatorName = ..." line found in
# /etc/iscsi/initiatorname.iscsi. Returns undef if the file cannot be
# opened or contains no such line.
sub get_initiator_name {
    my $fh = IO::File->new('/etc/iscsi/initiatorname.iscsi');
    return undef if !$fh;

    my $initiator;
    while (defined(my $line = <$fh>)) {
        if ($line =~ m/^\s*InitiatorName\s*=\s*([\.\-:\w]+)/) {
            $initiator = $1;
            last;
        }
    }
    $fh->close();

    return $initiator;
}
1189
1e3baf05
DM
# Build the drive definition string (file=...,if=none,id=drive-...) for
# one drive.
#
# All set options from @qemu_drive_options are passed through, the
# mbps/mbps_rd/mbps_wr limits are converted back to bytes per second,
# aio defaults to "native", and non-cdrom drives get cache=none (unless
# a cache mode is set) plus a detect-zeroes setting that depends on
# 'discard'. The "file=" part is omitted when no path is resolved.
sub print_drive_full {
    my ($storecfg, $vmid, $drive) = @_;

    my $is_cdrom = drive_is_cdrom($drive);

    my @opts = map { "$_=$drive->{$_}" }
        grep { $_ ne 'bootindex' && $drive->{$_} } @qemu_drive_options;

    foreach my $limit (qw(bps bps_rd bps_wr)) {
        my $mbytes = $drive->{"m$limit"};
        push @opts, "$limit=" . int($mbytes*1024*1024) if $mbytes;
    }

    # use linux-aio by default (qemu default is threads)
    push @opts, "aio=native" if !$drive->{aio};

    my $volid = $drive->{file};
    my $path;
    if ($is_cdrom) {
        $path = get_iso_path($storecfg, $vmid, $volid);
    } elsif ($volid =~ m|^/|) {
        $path = $volid;
    } else {
        $path = PVE::Storage::path($storecfg, $volid);
    }

    if (!$is_cdrom) {
        push @opts, "cache=none" if !$drive->{cache};
        push @opts, "detect-zeroes=" . ($drive->{discard} ? "unmap" : "on");
    }

    my $pathinfo = $path ? "file=$path," : '';
    my $opts = join('', map { ",$_" } @opts);

    return "${pathinfo}if=none,id=drive-$drive->{interface}$drive->{index}$opts";
}
1228
# Build the device string for network device $netid.
#
# The 'virtio' model is mapped to the device name "virtio-net-pci",
# other models are used as they are. "romfile=," is added unless the
# boot order contains 'n'. Multiqueue virtio devices additionally get
# vectors/mq options, and ",bootindex=N" is appended when set.
sub print_netdevice_full {
    my ($vmid, $conf, $net, $netid, $bridges) = @_;

    my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};

    my $is_virtio = $net->{model} eq 'virtio';
    my $device = $is_virtio ? 'virtio-net-pci' : $net->{model};

    # qemu > 0.15 always try to boot from network - we disable that by
    # not loading the pxe rom file
    my $extra = ($bootorder =~ m/n/) ? '' : "romfile=,";

    my $pciaddr = print_pci_addr("$netid", $bridges);

    my $tmpstr = "$device,${extra}mac=$net->{macaddr},netdev=$netid$pciaddr,id=$netid";

    if ($net->{queues} && $net->{queues} > 1 && $is_virtio) {
        # Consider we have N queues, the number of vectors needed is
        # 2*N + 2 (plus one config interrupt and control vq)
        my $vectors = $net->{queues} * 2 + 2;
        $tmpstr .= ",vectors=$vectors,mq=on";
    }

    if ($net->{bootindex}) {
        $tmpstr .= ",bootindex=$net->{bootindex}";
    }

    return $tmpstr;
}
1252
# Build the netdev backend string for network device $netid.
#
# $netid must have the form "netN" with N below $MAX_NETS; anything
# else is a fatal error. Bridged devices become a tap backend named
# "tap<vmid>i<N>" that uses the pve-bridge scripts; devices without a
# bridge use the "user" backend. For virtio models, vhost (when
# $kernel_has_vhost_net is set) and the queue count are added.
sub print_netdev_full {
    my ($vmid, $conf, $net, $netid) = @_;

    # Reject ids that are not 'netN' outright. Previously such an id left
    # the index empty, which slipped through the numeric range check.
    my $i;
    if (defined($netid) && $netid =~ m/^net(\d+)$/) {
        $i = int($1);
    }
    if (!defined($i)) {
        my $shown = defined($netid) ? $netid : '';
        die "got strange net id '$shown'\n";
    }

    die "got strange net id '$i'\n" if $i >= ${MAX_NETS};

    my $ifname = "tap${vmid}i$i";

    # kvm uses TUNSETIFF ioctl, and that limits ifname length
    die "interface name '$ifname' is too long (max 15 character)\n"
        if length($ifname) >= 16;

    my $vhostparam = '';
    $vhostparam = ',vhost=on' if $kernel_has_vhost_net && $net->{model} eq 'virtio';

    my $vmname = $conf->{name} || "vm$vmid";

    my $netdev = "";

    if ($net->{bridge}) {
        $netdev = "type=tap,id=$netid,ifname=${ifname},script=/var/lib/qemu-server/pve-bridge,downscript=/var/lib/qemu-server/pve-bridgedown$vhostparam";
    } else {
        $netdev = "type=user,id=$netid,hostname=$vmname";
    }

    $netdev .= ",queues=$net->{queues}" if ($net->{queues} && $net->{model} eq 'virtio');

    return $netdev;
}
1e3baf05
DM
1286
# True if $drive is defined and its 'media' setting is 'cdrom'.
# A missing drive or media setting yields that false value itself.
sub drive_is_cdrom {
    my ($drive) = @_;

    return $drive if !$drive;

    my $media = $drive->{media};
    return $media if !$media;

    return $media eq 'cdrom';
}
1293
2ed5d572
AD
# Parse a comma separated numa property string. Recognized settings:
#   memory=<value>, policy=preferred|bind|interleave,
#   cpus=<n>[-<m>], hostnodes=<n>[-<m>]
# cpus and hostnodes are stored as { start => n, end => m } where 'end'
# is undef for a single value. Returns undef on any other setting.
sub parse_numa {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        if ($kvp =~ m/^(memory)=(\S+)$/ ||
            $kvp =~ m/^(policy)=(preferred|bind|interleave)$/) {
            $res->{$1} = $2;
            next;
        }

        if ($kvp =~ m/^(cpus|hostnodes)=(\d+)(?:-(\d+))?$/) {
            $res->{$1} = { start => $2, end => $3 };
            next;
        }

        return undef;
    }

    return $res;
}
1318
040b06b7
DA
# Parse a hostpci property string.
#
# A device is given as [host=]BB:DD[.F]. With a function number the
# entry is appended to the {pciid} list; without one, {pciid} is set
# from the lspci() result for that id. Further settings: driver=kvm|vfio,
# rombar=on|off, x-vga=on|off and pcie=1. Unknown settings only produce
# a warning. Returns undef for an empty value or if no device was given.
sub parse_hostpci {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};
    my $found;

    foreach my $kv (split(/,/, $value)) {
        if ($kv =~ m/^(?:host=)?([a-f0-9]{2}:[a-f0-9]{2})(?:\.([a-f0-9]))?$/) {
            my ($id, $function) = ($1, $2);
            $found = 1;
            if (defined($function)) {
                push @{$res->{pciid}}, { id => $id, function => $function };
            } else {
                my $pcidevices = lspci($id);
                $res->{pciid} = $pcidevices->{$id};
            }
        } elsif ($kv =~ m/^driver=(kvm|vfio)$/) {
            $res->{driver} = $1;
        } elsif ($kv =~ m/^(rombar|x-vga)=(on|off)$/) {
            $res->{$1} = $2;
        } elsif ($kv =~ m/^pcie=(\d+)$/) {
            $res->{pcie} = 1 if $1 == 1;
        } else {
            warn "unknown hostpci setting '$kv'\n";
        }
    }

    return $found ? $res : undef;
}
1357
1e3baf05
DM
# netX: e1000=XX:XX:XX:XX:XX:XX,bridge=vmbr0,rate=<mbps>
#
# Parse a network property string. The model (optionally with
# "=<mac address>") is mandatory; the model is stored in lower case and
# the MAC in upper case. A missing MAC is replaced by
# PVE::Tools::random_ether_addr(). Optional settings are bridge, queues,
# rate, tag and firewall. Returns undef on unknown settings or when no
# model is given.
sub parse_net {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        if ($kvp =~ m/^(ne2k_pci|e1000|rtl8139|pcnet|virtio|ne2k_isa|i82551|i82557b|i82559er|vmxnet3)(?:=([0-9a-f]{2}(?::[0-9a-f]{2}){5}))?$/i) {
            my ($model, $mac) = ($1, $2);
            $res->{model} = lc($model);
            $res->{macaddr} = defined($mac) ? uc($mac) : PVE::Tools::random_ether_addr();
        } elsif ($kvp =~ m/^bridge=(\S+)$/) {
            $res->{bridge} = $1;
        } elsif ($kvp =~ m/^rate=(\d+(?:\.\d+)?)$/) {
            $res->{rate} = $1;
        } elsif ($kvp =~ m/^(queues|tag|firewall)=(\d+)$/) {
            $res->{$1} = $2;
        } else {
            return undef;
        }
    }

    return $res->{model} ? $res : undef;
}
1391
# Serialize a parsed network hash (see parse_net) back into its
# property string: "model[=mac]" followed by the bridge, rate, tag,
# firewall and queues settings that have a true value.
sub print_net {
    my $net = shift;

    my $res = "$net->{model}";
    $res .= "=$net->{macaddr}" if $net->{macaddr};
    $res .= ",bridge=$net->{bridge}" if $net->{bridge};
    $res .= ",rate=$net->{rate}" if $net->{rate};
    $res .= ",tag=$net->{tag}" if $net->{tag};
    $res .= ",firewall=$net->{firewall}" if $net->{firewall};
    # parse_net() accepts 'queues', so it has to be printed as well -
    # otherwise it is lost whenever a setting is parsed and re-printed
    $res .= ",queues=$net->{queues}" if $net->{queues};

    return $res;
}
1404
# Re-write every parsable netX entry of $settings through
# parse_net()/print_net(). parse_net() fills in a random MAC address
# where none is given, so afterwards each such entry carries one.
# Entries that fail to parse are left untouched.
sub add_random_macs {
    my ($settings) = @_;

    foreach my $opt (grep { m/^net(\d+)$/ } keys %$settings) {
        my $net = parse_net($settings->{$opt}) or next;
        $settings->{$opt} = print_net($net);
    }
}
1415
# Record $volid in the lowest free "unusedN" slot of $config and return
# that key. If the volume is already listed in one of the slots, nothing
# is changed and the function returns without a value. Dies when all
# $MAX_UNUSED_DISKS slots are taken.
sub add_unused_volume {
    my ($config, $volid) = @_;

    my $key;
    # walk downwards so that $key ends up as the lowest free index
    for (my $ind = $MAX_UNUSED_DISKS - 1; $ind >= 0; $ind--) {
        my $test = "unused$ind";
        if (my $vid = $config->{$test}) {
            return if $vid eq $volid; # do not add duplicates
        } else {
            $key = $test;
        }
    }

    die "Too many unused volumes - please delete them first.\n" if !$key;

    $config->{$key} = $volid;

    return $key;
}
1435
2796e7d5
DM
# Allowed smbios type 1 options, each mapped to the regular expression
# (as string) its value has to match completely.
my $valid_smbios1_options = {
    manufacturer => '\S+',
    product => '\S+',
    version => '\S+',
    serial => '\S+',
    uuid => '[a-fA-F0-9]{8}(?:-[a-fA-F0-9]{4}){3}-[a-fA-F0-9]{12}',
    sku => '\S+',
    family => '\S+',
};

# smbios: [manufacturer=str][,product=str][,version=str][,serial=str][,uuid=uuid][,sku=str][,family=str]
#
# Parse an smbios1 property string into a hash reference. Returns undef
# if an entry is not of the form key=value, uses an unknown key, or has
# a value that does not match the pattern for its key.
sub parse_smbios1 {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        return undef if $kvp !~ m/^(\S+)=(.+)$/;
        # split on the first '=' only, so that a value containing '='
        # is kept complete instead of being silently truncated
        my ($k, $v) = split(/=/, $kvp, 2);
        return undef if !defined($k) || !defined($v);
        return undef if !$valid_smbios1_options->{$k};
        return undef if $v !~ m/^$valid_smbios1_options->{$k}$/;
        $res->{$k} = $v;
    }

    return $res;
}
1463
cd11416f
DM
# Serialize an smbios1 hash into a "key=value,key=value" string.
# Entries with an undefined value or a key that is not listed in
# $valid_smbios1_options are left out.
sub print_smbios1 {
    my ($smbios1) = @_;

    my @pairs = map { "$_=$smbios1->{$_}" }
        grep { defined($smbios1->{$_}) && $valid_smbios1_options->{$_} }
        keys %$smbios1;

    return join(',', @pairs);
}
1476
2796e7d5
DM
PVE::JSONSchema::register_format('pve-qm-smbios1', \&verify_smbios1);

# Format checker for 'pve-qm-smbios1': returns $value unchanged if
# parse_smbios1() accepts it. Otherwise returns undef when $noerr is
# set, and dies when it is not.
sub verify_smbios1 {
    my ($value, $noerr) = @_;

    if (!parse_smbios1($value)) {
        return undef if $noerr;
        die "unable to parse smbios (type 1) options\n";
    }

    return $value;
}
1487
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-bootdisk', \&verify_bootdisk);

# Format checker for 'pve-qm-bootdisk': returns $value unchanged if
# valid_drivename() accepts it. Otherwise returns undef when $noerr is
# set, and dies when it is not.
sub verify_bootdisk {
    my ($value, $noerr) = @_;

    if (!valid_drivename($value)) {
        return undef if $noerr;
        die "invalid boot disk '$value'\n";
    }

    return $value;
}
1498
2ed5d572
AD
PVE::JSONSchema::register_format('pve-qm-numanode', \&verify_numa);

# Format checker for 'pve-qm-numanode': returns $value unchanged if
# parse_numa() accepts it. Otherwise returns undef when $noerr is set,
# and dies when it is not.
sub verify_numa {
    my ($value, $noerr) = @_;

    if (!parse_numa($value)) {
        return undef if $noerr;
        die "unable to parse numa options\n";
    }

    return $value;
}
1509
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-net', \&verify_net);

# Format checker for 'pve-qm-net': returns $value unchanged if
# parse_net() accepts it. Otherwise returns undef when $noerr is set,
# and dies when it is not.
sub verify_net {
    my ($value, $noerr) = @_;

    if (!parse_net($value)) {
        return undef if $noerr;
        die "unable to parse network options\n";
    }

    return $value;
}
1520
PVE::JSONSchema::register_format('pve-qm-drive', \&verify_drive);

# Format checker for 'pve-qm-drive': returns $value unchanged if
# parse_drive() accepts it (called without a key). Otherwise returns
# undef when $noerr is set, and dies when it is not.
sub verify_drive {
    my ($value, $noerr) = @_;

    if (!parse_drive(undef, $value)) {
        return undef if $noerr;
        die "unable to parse drive options\n";
    }

    return $value;
}
1531
PVE::JSONSchema::register_format('pve-qm-hostpci', \&verify_hostpci);

# Format checker for 'pve-qm-hostpci': returns $value unchanged if
# parse_hostpci() accepts it. Otherwise returns undef when $noerr is
# set, and dies when it is not.
sub verify_hostpci {
    my ($value, $noerr) = @_;

    if (!parse_hostpci($value)) {
        return undef if $noerr;
        die "unable to parse pci id\n";
    }

    return $value;
}
1542
0ea9541d
DM
PVE::JSONSchema::register_format('pve-qm-watchdog', \&verify_watchdog);

# Format checker for 'pve-qm-watchdog': returns $value unchanged if
# parse_watchdog() accepts it. Otherwise returns undef when $noerr is
# set, and dies when it is not.
sub verify_watchdog {
    my ($value, $noerr) = @_;

    if (!parse_watchdog($value)) {
        return undef if $noerr;
        die "unable to parse watchdog options\n";
    }

    return $value;
}
1553
# Parse a watchdog property string of the form
# "[model=]i6300esb|ib700[,[action=]reset|shutdown|poweroff|pause|debug|none]".
# Blank entries are skipped. Returns a hash with the keys 'model' and
# 'action' as far as given, or undef for an empty value or an unknown
# entry.
sub parse_watchdog {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};

    foreach my $p (grep { $_ !~ m/^\s*$/ } split(/,/, $value)) {
        if ($p =~ m/^(?:model=)?(i6300esb|ib700)$/) {
            $res->{model} = $1;
        } elsif ($p =~ m/^(?:action=)?(reset|shutdown|poweroff|pause|debug|none)$/) {
            $res->{action} = $1;
        } else {
            return undef;
        }
    }

    return $res;
}
1575
59411c4e
DM
PVE::JSONSchema::register_format('pve-qm-startup', \&verify_startup);

# Format checker for 'pve-qm-startup': returns $value unchanged if
# parse_startup() accepts it. Otherwise returns undef when $noerr is
# set, and dies when it is not.
sub verify_startup {
    my ($value, $noerr) = @_;

    if (!parse_startup($value)) {
        return undef if $noerr;
        die "unable to parse startup options\n";
    }

    return $value;
}
1586
# Parse a startup property string of the form
# "[order=]<n>[,up=<n>][,down=<n>]". Blank entries are skipped.
# Returns a hash with the keys 'order', 'up' and 'down' as far as
# given, or undef for a false value or an unknown entry.
sub parse_startup {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};

    foreach my $p (grep { $_ !~ m/^\s*$/ } split(/,/, $value)) {
        if ($p =~ m/^(?:order=)?(\d+)$/) {
            $res->{order} = $1;
        } elsif ($p =~ m/^(up|down)=(\d+)$/) {
            $res->{$1} = $2;
        } else {
            return undef;
        }
    }

    return $res;
}
1610
1e3baf05
DM
# Parse a usb device property string. Accepted entries:
#   host=[0x]VVVV:[0x]PPPP  -> {vendorid}, {productid} (4 hex digits each)
#   host=<bus>-<port[.port...]> -> {hostbus}, {hostport}
#   spice                   -> {spice} = 1
# Returns undef for an empty value, for any other entry, or when the
# value contains no entry at all.
sub parse_usb_device {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};
    my $found;

    foreach my $v (split(/,/, $value)) {
        if ($v =~ m/^host=(?:0x)?([0-9A-Fa-f]{4}):(?:0x)?([0-9A-Fa-f]{4})$/) {
            @{$res}{qw(vendorid productid)} = ($1, $2);
        } elsif ($v =~ m/^host=(\d+)\-(\d+(?:\.\d+)*)$/) {
            @{$res}{qw(hostbus hostport)} = ($1, $2);
        } elsif ($v =~ m/^spice$/) {
            $res->{spice} = 1;
        } else {
            return undef;
        }
        # every accepted entry counts as a device specification
        $found = 1;
    }

    return $found ? $res : undef;
}
19672434 1640
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-usb-device', \&verify_usb_device);

# Format checker for 'pve-qm-usb-device': returns $value unchanged if
# parse_usb_device() accepts it. Otherwise returns undef when $noerr is
# set, and dies when it is not.
sub verify_usb_device {
    my ($value, $noerr) = @_;

    if (!parse_usb_device($value)) {
        return undef if $noerr;
        die "unable to parse usb device\n";
    }

    return $value;
}
1651
1e3baf05
DM
# add JSON properties for create and set function
#
# Copies every option description from $confdesc into $prop, except
# for 'parent', 'snaptime' and 'vmstate', and returns $prop.
sub json_config_properties {
    my $prop = shift;

    my %skip = map { $_ => 1 } qw(parent snaptime vmstate);

    foreach my $opt (grep { !$skip{$_} } keys %$confdesc) {
        $prop->{$opt} = $confdesc->{$opt};
    }

    return $prop;
}
1663
# Check $value against the type declared for option $key in $confdesc
# and return the normalized value:
#   boolean - 1 or 0 (accepts 1/on/yes/true and 0/off/no/false)
#   integer - the value as integer (digits only)
#   number  - the value itself (digits with optional fraction)
#   string  - the value itself; drive formats are checked with
#             parse_drive(), other formats with
#             PVE::JSONSchema::check_format(); strings without a format
#             have one pair of enclosing double quotes removed
# Dies for unknown options, undefined values, values that contain a
# line feed or carriage return, and failed checks.
sub check_type {
    my ($key, $value) = @_;

    my $desc = $confdesc->{$key};
    die "unknown setting '$key'\n" if !$desc;

    my $type = $desc->{type};

    die "got undefined value\n" if !defined($value);
    die "property contains a line feed\n" if $value =~ m/[\n\r]/;

    if ($type eq 'boolean') {
        return 1 if $value eq '1' || $value =~ m/^(on|yes|true)$/i;
        return 0 if $value eq '0' || $value =~ m/^(off|no|false)$/i;
        die "type check ('boolean') failed - got '$value'\n";
    }

    if ($type eq 'integer') {
        return int($1) if $value =~ m/^(\d+)$/;
        die "type check ('integer') failed - got '$value'\n";
    }

    if ($type eq 'number') {
        return $value if $value =~ m/^(\d+)(\.\d+)?$/;
        die "type check ('number') failed - got '$value'\n";
    }

    if ($type eq 'string') {
        my $fmt = $desc->{format};

        if (!$fmt) {
            $value =~ s/^\"(.*)\"$/$1/;
            return $value;
        }

        if ($fmt eq 'pve-qm-drive') {
            # special case - we need to pass $key to parse_drive()
            my $drive = parse_drive($key, $value);
            return $value if $drive;
            die "unable to parse drive options\n";
        }

        PVE::JSONSchema::check_format($fmt, $value);
        return $value;
    }

    die "internal error"
}
1706
191435c6
DM
# Run $code->(@param) via lock_file() on the lock file of VM $vmid,
# passing $timeout through. Re-throws any error left in $@ and returns
# the result of lock_file().
sub lock_config_full {
    my ($vmid, $timeout, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);
    my $result = lock_file($lockfile, $timeout, $code, @param);

    if ($@) {
        die $@;
    }

    return $result;
}
1718
4e4f83fe
DM
# Like lock_config_full(), but uses lock_file_full() and passes the
# additional $shared argument through to it.
sub lock_config_mode {
    my ($vmid, $timeout, $shared, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);
    my $result = lock_file_full($lockfile, $timeout, $shared, $code, @param);

    if ($@) {
        die $@;
    }

    return $result;
}
1730
191435c6
DM
# Run $code->(@param) under the config lock of VM $vmid, using
# lock_config_full() with a timeout value of 10.
sub lock_config {
    my ($vmid, $code, @param) = @_;

    my $timeout = 10;

    return lock_config_full($vmid, $timeout, $code, @param);
}
1736
# Return the config file path of VM $vmid relative to the cluster file
# system, i.e. "nodes/<node>/qemu-server/<vmid>.conf". $node defaults to
# $nodename.
sub cfs_config_path {
    my ($vmid, $node) = @_;

    my $owner = $node || $nodename;

    return "nodes/${owner}/qemu-server/${vmid}.conf";
}
1743
040b06b7
DA
# Report whether IOMMU support is available.
#
# fixme : need to check IOMMU support - no check is implemented yet, so
# this always returns 1.
# http://www.linux-kvm.org/page/How_to_assign_devices_with_VT-d_in_KVM
sub check_iommu_support {
    return 1;
}
1752
# Return the config file name of VM $vmid below /etc/pve, using
# cfs_config_path() for the relative part.
sub config_file {
    my ($vmid, $node) = @_;

    return "/etc/pve/" . cfs_config_path($vmid, $node);
}
1759
# Return the name of the lock file for VM $vmid inside $lock_dir.
sub config_file_lock {
    my ($vmid) = @_;

    return "${lock_dir}/lock-${vmid}.conf";
}
1765
# Set access and modification time of the VM's config file to the
# current time.
sub touch_config {
    my ($vmid) = @_;

    my $filename = config_file($vmid);

    utime(undef, undef, $filename);
}
1772
# Destroy VM $vmid.
#
# After check_lock() on the loaded configuration, every non-cdrom drive
# volume that is managed by a storage (not an absolute path) and whose
# owner is this VM is freed. The config file is then removed, or
# replaced by a minimal one if $keep_empty_config is set. Finally all
# volumes that vdisk_list() reports for this VM are freed as well;
# errors in that last step are only reported as warnings.
sub destroy_vm {
    my ($storecfg, $vmid, $keep_empty_config) = @_;

    my $conffile = config_file($vmid);

    my $conf = load_config($vmid);

    check_lock($conf);

    # only remove disks owned by this VM
    my $free_owned_volume = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};

        return if !$volid || $volid =~ m|^/|;

        my ($path, $owner) = PVE::Storage::path($storecfg, $volid);
        return if !$path || !$owner || ($owner != $vmid);

        PVE::Storage::vdisk_free($storecfg, $volid);
    };
    foreach_drive($conf, $free_owned_volume);

    if (!$keep_empty_config) {
        unlink $conffile;
    } else {
        PVE::Tools::file_set_contents($conffile, "memory: 128\n");
    }

    # also remove unused disk
    my $free_volume = sub {
        my ($volid, $sid, $volname, $d) = @_;
        PVE::Storage::vdisk_free($storecfg, $volid);
    };
    eval {
        my $dl = PVE::Storage::vdisk_list($storecfg, undef, $vmid);

        eval {
            PVE::Storage::foreach_volid($dl, $free_volume);
        };
        warn $@ if $@;

    };
    warn $@ if $@;
}
1819
# Read the configuration of VM $vmid (on $node, if given) with
# PVE::Cluster::cfs_read_file(). Dies if no configuration is returned.
sub load_config {
    my ($vmid, $node) = @_;

    my $conf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid, $node));

    if (!defined($conf)) {
        die "no such VM ('$vmid')\n";
    }

    return $conf;
}
1e3baf05
DM
1831
# Parse the raw text of a VM configuration file.
#
# $filename must end in "/qemu-server/<vmid>.conf", otherwise the
# function dies. Returns undef if $raw is undefined, else a hash
# reference holding the current settings plus
#   digest    - SHA1 hex digest of $raw
#   snapshots - one settings hash per "[name]" section
#   pending   - settings of the "[PENDING]" section; a "delete:" line
#               there is collected into {del}
# Comment lines and "description:" lines are collected into the
# 'description' of the section they belong to. Values that fail
# check_type() are skipped with a warning. Drive volumes are normalized
# via filename_to_volume_id(), and 'cdrom' is stored as 'ide2'.
sub parse_vm_config {
    my ($filename, $raw) = @_;

    return undef if !defined($raw);

    my $res = {
        digest => Digest::SHA::sha1_hex($raw),
        snapshots => {},
        pending => {},
    };

    $filename =~ m|/qemu-server/(\d+)\.conf$|
        || die "got strange filename '$filename'";

    my $vmid = $1;

    # $conf always points to the section that is currently being filled
    my $conf = $res;
    my $descr = '';
    my $section = '';

    my @lines = split(/\n/, $raw);
    foreach my $line (@lines) {
        next if $line =~ m/^\s*$/;

        if ($line =~ m/^\[PENDING\]\s*$/i) {
            $section = 'pending';
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{$section} = {};
            next;

        } elsif ($line =~ m/^\[([a-z][a-z0-9_\-]+)\]\s*$/i) {
            $section = $1;
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{snapshots}->{$section} = {};
            next;
        }

        if ($line =~ m/^\#(.*)\s*$/) {
            $descr .= PVE::Tools::decode_text($1) . "\n";
            next;
        }

        if ($line =~ m/^(description):\s*(.*\S)\s*$/) {
            $descr .= PVE::Tools::decode_text($2);
        } elsif ($line =~ m/^snapstate:\s*(prepare|delete)\s*$/) {
            # anchored at line start - otherwise any line that merely
            # ends in "snapstate: delete" (e.g. an 'args:' line) would
            # be taken as snapshot state
            $conf->{snapstate} = $1;
        } elsif ($line =~ m/^(args):\s*(.*\S)\s*$/) {
            my $key = $1;
            my $value = $2;
            $conf->{$key} = $value;
        } elsif (($section eq 'pending') && ($line =~ m/^delete:\s*(.*\S)\s*$/)) {
            my $value = $1;
            foreach my $opt (split(/,/, $value)) {
                $conf->{del}->{$opt} = 1;
            }
        } elsif ($line =~ m/^([a-z][a-z_]*\d*):\s*(\S+)\s*$/) {
            my $key = $1;
            my $value = $2;
            eval { $value = check_type($key, $value); };
            if ($@) {
                warn "vm $vmid - unable to parse value of '$key' - $@";
            } else {
                my $fmt = $confdesc->{$key}->{format};
                if ($fmt && $fmt eq 'pve-qm-drive') {
                    my $v = parse_drive($key, $value);
                    if (my $volid = filename_to_volume_id($vmid, $v->{file}, $v->{media})) {
                        $v->{file} = $volid;
                        $value = print_drive($vmid, $v);
                    } else {
                        warn "vm $vmid - unable to parse value of '$key'\n";
                        next;
                    }
                }

                if ($key eq 'cdrom') {
                    $conf->{ide2} = $value;
                } else {
                    $conf->{$key} = $value;
                }
            }
        }
    }

    $conf->{description} = $descr if $descr;

    delete $res->{snapstate}; # just to be sure

    return $res;
}
1923
1858638f
DM
# Serialize a VM configuration hash into the raw text of a config file.
#
# $filename is accepted but not used here. $conf is the configuration hash
# (main section plus an optional {snapshots} hash); it is normalized in
# place before being rendered:
#  - 'snapstate' is removed from the main section
#  - 'cdrom' is stored as 'ide2' (dies if both are set)
#  - the legacy 'smp' option is converted to 'sockets'
#  - 'sockets' is removed when 'maxcpus' is set
#  - every value is run through check_type() (dies on invalid values)
#  - 'unusedX' entries whose volume is referenced by a drive are removed
#
# Returns the raw text: the main section followed by one "[name]" section
# per snapshot, each with its description rendered as leading '#' lines.
sub write_vm_config {
    my ($filename, $conf) = @_;

    delete $conf->{snapstate}; # just to be sure

    if (my $cdrom = $conf->{cdrom}) {
        die "option ide2 conflicts with cdrom\n" if $conf->{ide2};
        $conf->{ide2} = $cdrom;
        delete $conf->{cdrom};
    }

    # we do not use 'smp' any longer: fold it into 'sockets' when that is
    # the only one set, then drop it whenever 'sockets' is in effect
    if (!$conf->{sockets} && $conf->{smp}) {
        $conf->{sockets} = $conf->{smp};
        delete $conf->{cores};
    }
    delete $conf->{smp} if $conf->{sockets};

    delete $conf->{sockets} if $conf->{maxcpus} && $conf->{sockets};

    # volumes referenced by a drive of the main section
    my %volid_in_use;

    my %no_check = map { $_ => 1 } qw(digest description snapshots snapstate);

    # validate all values of one section; drive volumes are only recorded
    # for the main section (no $snapname)
    my $normalize_section = sub {
        my ($section, $snapname) = @_;

        foreach my $opt (keys %$section) {
            next if $no_check{$opt};

            my $checked = eval { check_type($opt, $section->{$opt}) };
            die "unable to parse value of '$opt' - $@" if $@;

            $section->{$opt} = $checked;

            next if $snapname || !valid_drivename($opt);

            my $drive = parse_drive($opt, $checked);
            $volid_in_use{$drive->{file}} = 1 if $drive && $drive->{file};
        }
    };

    $normalize_section->($conf);
    foreach my $snapname (keys %{$conf->{snapshots}}) {
        $normalize_section->($conf->{snapshots}->{$snapname}, $snapname);
    }

    # remove 'unusedX' settings if we re-add a volume
    foreach my $opt (grep { m/^unused/ } keys %$conf) {
        delete $conf->{$opt} if $volid_in_use{$conf->{$opt}};
    }

    my %not_rendered = map { $_ => 1 } qw(digest description snapshots);

    # render one section as text
    my $render_section = sub {
        my ($section) = @_;

        # add description as comment to top of file
        my @lines = map { '#' . PVE::Tools::encode_text($_) . "\n" }
            split(/\n/, $section->{description} || '');

        push @lines, map { "$_: $section->{$_}\n" }
            grep { !$not_rendered{$_} } sort keys %$section;

        return join('', @lines);
    };

    my $raw = $render_section->($conf);
    foreach my $snapname (sort keys %{$conf->{snapshots}}) {
        $raw .= "\n[$snapname]\n" . $render_section->($conf->{snapshots}->{$snapname});
    }

    return $raw;
}
1e3baf05 2008
1858638f
DM
# Write $conf as the configuration of VM $vmid without taking the config
# file lock. Unless $skiplock is set, check_lock() is called first and dies
# if the configuration carries a 'lock' entry.
sub update_config_nolock {
    my ($vmid, $conf, $skiplock) = @_;

    check_lock($conf) unless $skiplock;

    my $path = cfs_config_path($vmid);

    return PVE::Cluster::cfs_write_file($path, $conf);
}
1e3baf05 2018
1858638f
DM
# Write $conf as the configuration of VM $vmid while holding the VM's
# config lock. $skiplock is forwarded to update_config_nolock().
#
# The worker is passed as a closure. The previous '&update_config_nolock'
# (no backslash) was not a code reference: it *called* the function with
# the current @_ before lock_config() ran, i.e. outside the lock, and
# handed its return value to lock_config() as the "code" argument.
#
# NOTE(review): assumes lock_config($vmid, $code, @param) runs $code while
# the lock is held and returns its result - confirm against lock_config().
sub update_config {
    my ($vmid, $conf, $skiplock) = @_;

    return lock_config($vmid, sub {
        return update_config_nolock($vmid, $conf, $skiplock);
    });
}
2024
# Build a hash of default option values.
#
# Every option in $confdesc that declares a 'default' contributes that
# value; a 'keyboard' setting from datacenter.cfg, if set, overrides the
# schema default. Returns a hash reference.
sub load_defaults {

    my %defaults;

    # we use static defaults from our JSON schema configuration
    for my $opt (keys %$confdesc) {
        my $value = $confdesc->{$opt}->{default};
        next if !defined($value);
        $defaults{$opt} = $value;
    }

    my $dc_conf = PVE::Cluster::cfs_read_file('datacenter.cfg');
    if (my $keyboard = $dc_conf->{keyboard}) {
        $defaults{keyboard} = $keyboard;
    }

    return \%defaults;
}
2041
# List the VMs from the cluster VM list that are located on node $nodename
# and are of type 'qemu'.
# Returns a hash reference of the form { $vmid => { exists => 1 }, ... };
# it is empty when no VM list (or no 'ids' entry) is available.
sub config_list {
    my $vmlist = PVE::Cluster::get_vmlist();
    my $found = {};

    my $ids = $vmlist && $vmlist->{ids};
    return $found if !$ids;

    for my $vmid (keys %$ids) {
        my $entry = $ids->{$vmid};

        my $on_this_node = $entry->{node} && $entry->{node} eq $nodename;
        next if !$on_this_node;

        my $is_qemu = $entry->{type} && $entry->{type} eq 'qemu';
        next if !$is_qemu;

        $found->{$vmid} = { exists => 1 };
    }

    return $found;
}
2056
64e13401
DM
# Test whether a VM configuration uses local resources (to prevent
# migration).
#
# A VM counts as using local resources when it has the old-style 'hostusb'
# or 'hostpci' options set, or any usbN, hostpciN, serialN or parallelN
# option. usb* entries whose value is 'spice' are ignored.
#
# Returns 1 or 0. Dies with "VM uses local resources" when the result is 1
# and $noerr is not set.
sub check_local_resources {
    my ($conf, $noerr) = @_;

    # old syntax
    my $uses_local = ($conf->{hostusb} || $conf->{hostpci}) ? 1 : 0;

    for my $opt (keys %$conf) {
        my $is_spice_usb = ($opt =~ m/^usb/) && ($conf->{$opt} eq 'spice');
        next if $is_spice_usb;

        if ($opt =~ m/^(usb|hostpci|serial|parallel)\d+$/) {
            $uses_local = 1;
        }
    }

    if ($uses_local && !$noerr) {
        die "VM uses local resources\n";
    }

    return $uses_local;
}
2075
# Check that the storages used by the VM's drives are available on the
# local node and on $node (used by migrate).
#
# Drives without a 'file' entry, or whose volume ID cannot be parsed into
# a storage ID, are skipped. The check itself is delegated to
# PVE::Storage::storage_check_node().
sub check_storage_availability {
    my ($storecfg, $conf, $node) = @_;

    my $check_drive = sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($sid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        # check if storage is available on both nodes
        PVE::Storage::storage_check_node($storecfg, $sid);
        PVE::Storage::storage_check_node($storecfg, $sid, $node);
    };

    foreach_drive($conf, $check_drive);
}
2094
719893a9
DM
# List nodes where all VM images are available (used by has_feature API).
#
# Starts with all cluster nodes and narrows the set per drive volume:
#  - a disabled storage leaves no node at all
#  - a storage restricted to certain nodes removes all other nodes
#  - a non-shared storage removes every node but the local one
# Returns a hash reference { $node => 1, ... }.
sub shared_nodes {
    my ($conf, $storecfg) = @_;

    my $nodelist = PVE::Cluster::get_nodelist();
    my $nodehash = { map { $_ => 1 } @$nodelist };
    my $localnode = PVE::INotify::nodename();

    my $restrict_by_drive = sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($storeid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        my $scfg = PVE::Storage::storage_config($storecfg, $storeid);

        if ($scfg->{disable}) {
            $nodehash = {};
            return;
        }

        if (my $avail = $scfg->{nodes}) {
            delete @{$nodehash}{ grep { !$avail->{$_} } keys %$nodehash };
        } elsif (!$scfg->{shared}) {
            delete @{$nodehash}{ grep { $_ ne $localnode } keys %$nodehash };
        }
    };

    foreach_drive($conf, $restrict_by_drive);

    return $nodehash;
}
2128
1e3baf05
DM
# Die with "VM is locked (<lock>)" if the configuration carries a 'lock'
# entry with a true value; do nothing otherwise.
sub check_lock {
    my ($conf) = @_;

    if (my $lock = $conf->{lock}) {
        die "VM is locked ($lock)\n";
    }
}
2134
# Check whether process $pid looks like the kvm/qemu process that belongs
# to $pidfile.
#
# Reads /proc/$pid/cmdline and returns 1 only if the command name ends in
# 'kvm' or 'qemu-system-x86_64' and the argument following the first
# '-pidfile' / '--pidfile' option equals $pidfile. Returns a false value
# in every other case (including an unreadable or empty cmdline).
sub check_cmdline {
    my ($pidfile, $pid) = @_;

    my $fh = IO::File->new("/proc/$pid/cmdline", "r");
    return undef if !defined($fh);

    my $cmdline = <$fh>;
    $fh->close;
    return undef if !$cmdline;

    # arguments are separated by NUL bytes
    my @argv = split(/\0/, $cmdline);

    my $binary = $argv[0];
    return if !$binary;
    return if !($binary =~ m|kvm$| || $binary =~ m|qemu-system-x86_64$|);

    foreach my $idx (0 .. $#argv) {
        my $arg = $argv[$idx];
        next if !$arg;
        next if ($arg ne '-pidfile') && ($arg ne '--pidfile');

        # only the first pidfile option is considered
        my $value = $argv[$idx + 1];
        return ($value && ($value eq $pidfile)) ? 1 : undef;
    }

    return undef;
}
2160
# Check whether VM $vmid is running.
#
# Unless $nocheck is set, dies if the VM's configuration file (looked up
# via config_file($vmid, $node)) does not exist. Then reads the pid from
# the VM's pid file and returns it when check_cmdline() accepts the process
# as belonging to that pid file and
# PVE::ProcFSTools::check_process_running() confirms it.
# Returns undef otherwise.
sub check_running {
    my ($vmid, $nocheck, $node) = @_;

    my $filename = config_file($vmid, $node);

    die "unable to find configuration file for VM $vmid - no such machine\n"
        if !$nocheck && ! -f $filename;

    my $pidfile = pidfile_name($vmid);

    # explicit read mode instead of encoding the mode in the file name
    my $fd = IO::File->new($pidfile, 'r');
    return undef if !$fd;

    my $st = stat($fd);
    my $line = <$fd>;
    close($fd);

    # the timestamp belongs to the pid file, so that is the file to name
    # in the warning (not the configuration file)
    if ($st && $st->mtime > time()) {
        warn "file '$pidfile' modified in future\n";
    }

    # an empty pid file yields no line at all
    return undef if !defined($line);

    if ($line =~ m/^(\d+)$/) {
        my $pid = $1;
        if (check_cmdline($pidfile, $pid)) {
            if (my $pinfo = PVE::ProcFSTools::check_process_running($pid)) {
                return $pid;
            }
        }
    }

    return undef;
}
2193
# Return the VM list from config_list(), with a 'pid' entry added for each
# listed VM that has a "<vmid>.pid" file in $var_run_tmpdir and for which
# check_running() returns a pid.
# If the directory cannot be opened the plain list is returned.
sub vzlist {

    my $vms = config_list();

    my $dir = IO::Dir->new($var_run_tmpdir);
    return $vms if !$dir;

    while (defined(my $entry = $dir->read)) {
        next if $entry !~ m/^(\d+)\.pid$/;
        my $vmid = $1;

        # ignore pid files of VMs not in the list
        next if !defined($vms->{$vmid});

        my $pid = check_running($vmid);
        $vms->{$vmid}->{pid} = $pid if $pid;
    }

    return $vms;
}
2211
1e3baf05
DM
# Return the 'size' property of the VM's boot disk as found in the parsed
# drive configuration.
#
# Returns undef when no valid 'bootdisk' is configured, when that drive
# is not configured or cannot be parsed, when it is a cdrom, or when it
# has no 'file' entry. $storecfg is accepted but not used.
sub disksize {
    my ($storecfg, $conf) = @_;

    my $bootdisk = $conf->{bootdisk};
    return undef
        if !($bootdisk && valid_drivename($bootdisk) && $conf->{$bootdisk});

    my $drive = parse_drive($bootdisk, $conf->{$bootdisk});
    return undef
        if !defined($drive) || drive_is_cdrom($drive) || !$drive->{file};

    return $drive->{size};
}
2231
# per-pid CPU accounting sample from the previous vmstatus() call
my $last_proc_pid_stat;

# get VM status information
# This must be fast and should not block ($full == false)
# We only query KVM using QMP if $full == true (this can be slow)
#
# $opt_vmid optionally restricts the result to a single VM.
# Returns a hash reference { $vmid => { status, pid, cpus, maxmem, ... } }.
sub vmstatus {
    my ($opt_vmid, $full) = @_;

    my $res = {};

    my $storecfg = PVE::Storage::config();

    my $list = vzlist();
    my ($uptime) = PVE::ProcFSTools::read_proc_uptime(1);

    my $cpucount = $cpuinfo->{cpus} || 1;

    # static information taken from the configuration
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);

        my $cfspath = cfs_config_path($vmid);
        my $conf = PVE::Cluster::cfs_read_file($cfspath) || {};

        my $pid = $list->{$vmid}->{pid};
        my $size = disksize($storecfg, $conf);

        # never report more cpus than the host has
        my $cpus = ($conf->{sockets} || 1) * ($conf->{cores} || 1);
        $cpus = $cpucount if $cpus > $cpucount;

        my $d = {
            pid => $pid,
            # fixme: better status?
            status => $pid ? 'running' : 'stopped',
            disk => 0, # no info available
            maxdisk => defined($size) ? $size : 0,
            cpus => $cpus,
            name => $conf->{name} || "VM $vmid",
            maxmem => $conf->{memory} ? $conf->{memory}*(1024*1024) : 0,
            uptime => 0,
            cpu => 0,
            mem => 0,
            netout => 0,
            netin => 0,
            diskread => 0,
            diskwrite => 0,
        };

        if ($conf->{balloon}) {
            $d->{balloon_min} = $conf->{balloon}*(1024*1024);
            $d->{shares} = defined($conf->{shares}) ? $conf->{shares} : 1000;
        }

        $d->{template} = is_template($conf);

        $res->{$vmid} = $d;
    }

    # network counters of the tap devices; what the tap device receives
    # is accounted as 'netout', what it transmits as 'netin'
    my $netdev = PVE::ProcFSTools::read_proc_net_dev();
    foreach my $dev (keys %$netdev) {
        next if $dev !~ m/^tap([1-9]\d*)i/;
        my $d = $res->{$1};
        next if !$d;

        my $counters = $netdev->{$dev};
        $d->{netout} += $counters->{receive};
        $d->{netin} += $counters->{transmit};
    }

    my $ctime = gettimeofday;

    # uptime, memory and cpu usage from /proc/<pid>/stat
    foreach my $vmid (keys %$list) {

        my $d = $res->{$vmid};
        my $pid = $d->{pid};
        next if !$pid;

        my $pstat = PVE::ProcFSTools::read_proc_pid_stat($pid);
        next if !$pstat; # not running

        my $used = $pstat->{utime} + $pstat->{stime};

        $d->{uptime} = int(($uptime - $pstat->{starttime})/$cpuinfo->{user_hz});

        if ($pstat->{vsize}) {
            $d->{mem} = int(($pstat->{rss}/$pstat->{vsize})*$d->{maxmem});
        }

        my $old = $last_proc_pid_stat->{$pid};
        if (!$old) {
            # first sample for this pid - nothing to compare against yet
            $last_proc_pid_stat->{$pid} = {
                time => $ctime,
                used => $used,
                cpu => 0,
            };
            next;
        }

        my $dtime = ($ctime - $old->{time}) * $cpucount * $cpuinfo->{user_hz};

        if (!($dtime > 1000)) {
            # interval too short - reuse the previously computed value
            $d->{cpu} = $old->{cpu};
            next;
        }

        my $dutime = $used - $old->{used};

        $d->{cpu} = (($dutime/$dtime)* $cpucount) / $d->{cpus};
        $last_proc_pid_stat->{$pid} = {
            time => $ctime,
            used => $used,
            cpu => $d->{cpu},
        };
    }

    return $res if !$full;

    my $qmpclient = PVE::QMPClient->new();

    my $ballooncb = sub {
        my ($vmid, $resp) = @_;

        my $info = $resp->{'return'};
        return if !$info->{max_mem};

        my $d = $res->{$vmid};

        # use memory assigned to VM
        $d->{maxmem} = $info->{max_mem};
        $d->{balloon} = $info->{actual};

        if (defined($info->{total_mem}) && defined($info->{free_mem})) {
            $d->{mem} = $info->{total_mem} - $info->{free_mem};
            $d->{freemem} = $info->{free_mem};
        }
    };

    my $blockstatscb = sub {
        my ($vmid, $resp) = @_;

        my $data = $resp->{'return'} || [];

        # sum up the counters of all block devices
        my ($rd_total, $wr_total) = (0, 0);
        foreach my $blockstat (@$data) {
            $rd_total += $blockstat->{stats}->{rd_bytes};
            $wr_total += $blockstat->{stats}->{wr_bytes};
        }

        $res->{$vmid}->{diskread} = $rd_total;
        $res->{$vmid}->{diskwrite} = $wr_total;
    };

    my $statuscb = sub {
        my ($vmid, $resp) = @_;

        $qmpclient->queue_cmd($vmid, $blockstatscb, 'query-blockstats');
        # this fails if the balloon driver is not loaded, so this must be
        # the last command (following commands are aborted if this fails).
        $qmpclient->queue_cmd($vmid, $ballooncb, 'query-balloon');

        my $status = $resp->{'return'}->{status};
        if (!defined($status)) {
            warn "unable to get VM status\n";
            return;
        }

        $res->{$vmid}->{qmpstatus} = $status;
    };

    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        next if !$res->{$vmid}->{pid}; # not running
        $qmpclient->queue_cmd($vmid, $statuscb, 'query-status');
    }

    $qmpclient->queue_execute(undef, 1);

    # fall back to the basic status where QMP delivered none
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        $res->{$vmid}->{qmpstatus} ||= $res->{$vmid}->{status};
    }

    return $res;
}
2420
# Call $func->($drivename, $drive) for every entry of $conf whose key is a
# valid drive name and whose value parse_drive() can parse.
sub foreach_drive {
    my ($conf, $func) = @_;

    for my $ds (keys %$conf) {
        if (valid_drivename($ds)) {
            my $drive = parse_drive($ds, $conf->{$ds});
            $func->($ds, $drive) if $drive;
        }
    }
}
2433
d5769dc2
DM
# Call $func->($volid, $is_cdrom) once for every distinct volume referenced
# by the configuration: the drives of the main section, and for each
# snapshot its 'vmstate' volume and its drives.
# $is_cdrom is the drive_is_cdrom() result (or 0); if a volume is
# referenced more than once, the value recorded last is passed.
sub foreach_volid {
    my ($conf, $func) = @_;

    my %is_cdrom_of;

    my $record = sub {
        my ($volid, $is_cdrom) = @_;

        return if !$volid;

        $is_cdrom_of{$volid} = $is_cdrom || 0;
    };

    # shared callback for the drives of the main section and the snapshots
    my $record_drive = sub {
        my ($ds, $drive) = @_;
        $record->($drive->{file}, drive_is_cdrom($drive));
    };

    foreach_drive($conf, $record_drive);

    foreach my $snapname (keys %{$conf->{snapshots}}) {
        my $snap = $conf->{snapshots}->{$snapname};
        $record->($snap->{vmstate}, 0);
        foreach_drive($snap, $record_drive);
    }

    foreach my $volid (keys %is_cdrom_of) {
        $func->($volid, $is_cdrom_of{$volid});
    }
}
2465
86b8228b
DM
# Interpret a 'vga' setting with respect to qxl.
# Returns 0 unless $vga is 'qxl', 'qxl2', 'qxl3' or 'qxl4'; otherwise
# returns the trailing digit, or 1 for plain 'qxl'.
sub vga_conf_has_spice {
    my ($vga) = @_;

    if ($vga && $vga =~ m/^qxl([234])?$/) {
        return $1 || 1;
    }

    return 0;
}
2473
1e3baf05 2474sub config_to_command {
952958bc 2475 my ($storecfg, $vmid, $conf, $defaults, $forcemachine) = @_;
1e3baf05
DM
2476
2477 my $cmd = [];
8c559505
DM
2478 my $globalFlags = [];
2479 my $machineFlags = [];
2480 my $rtcFlags = [];
519ed28c 2481 my $cpuFlags = [];
5bdcf937 2482 my $devices = [];
b78ebef7 2483 my $pciaddr = '';
5bdcf937 2484 my $bridges = {};
1e3baf05
DM
2485 my $kvmver = kvm_user_version();
2486 my $vernum = 0; # unknown
a3c52213
DM
2487 if ($kvmver =~ m/^(\d+)\.(\d+)$/) {
2488 $vernum = $1*1000000+$2*1000;
2489 } elsif ($kvmver =~ m/^(\d+)\.(\d+)\.(\d+)$/) {
1e3baf05
DM
2490 $vernum = $1*1000000+$2*1000+$3;
2491 }
2492
a3c52213 2493 die "detected old qemu-kvm binary ($kvmver)\n" if $vernum < 15000;
1e3baf05
DM
2494
2495 my $have_ovz = -f '/proc/vz/vestat';
2496
db656e5f
DM
2497 my $q35 = machine_type_is_q35($conf);
2498
1e3baf05
DM
2499 push @$cmd, '/usr/bin/kvm';
2500
2501 push @$cmd, '-id', $vmid;
2502
2503 my $use_virtio = 0;
2504
c971c4f2
AD
2505 my $qmpsocket = qmp_socket($vmid);
2506 push @$cmd, '-chardev', "socket,id=qmp,path=$qmpsocket,server,nowait";
2507 push @$cmd, '-mon', "chardev=qmp,mode=control";
2508
7b7c6d1b 2509 my $socket = vnc_socket($vmid);
1e3baf05
DM
2510 push @$cmd, '-vnc', "unix:$socket,x509,password";
2511
6b64503e 2512 push @$cmd, '-pidfile' , pidfile_name($vmid);
19672434 2513
1e3baf05
DM
2514 push @$cmd, '-daemonize';
2515
2796e7d5
DM
2516 if ($conf->{smbios1}) {
2517 push @$cmd, '-smbios', "type=1,$conf->{smbios1}";
2518 }
2519
7183bd9a
AD
2520 push @$cmd, '-object', "iothread,id=iothread0" if $conf->{iothread};
2521
db656e5f 2522 if ($q35) {
b467f79a 2523 # the q35 chipset support native usb2, so we enable usb controller
db656e5f 2524 # by default for this machine type
f8e83f05 2525 push @$devices, '-readconfig', '/usr/share/qemu-server/pve-q35.cfg';
db656e5f 2526 } else {
f8e83f05
AD
2527 $pciaddr = print_pci_addr("piix3", $bridges);
2528 push @$devices, '-device', "piix3-usb-uhci,id=uhci$pciaddr.0x2";
24f0d39a 2529
f8e83f05 2530 my $use_usb2 = 0;
db656e5f
DM
2531 for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
2532 next if !$conf->{"usb$i"};
2533 $use_usb2 = 1;
2534 }
2535 # include usb device config
2536 push @$devices, '-readconfig', '/usr/share/qemu-server/pve-usb.cfg' if $use_usb2;
fcc573ab 2537 }
19672434 2538
5acbfe9e 2539 my $vga = $conf->{vga};
2fa3151e 2540
590e698c
DM
2541 my $qxlnum = vga_conf_has_spice($vga);
2542 $vga = 'qxl' if $qxlnum;
2fa3151e 2543
5acbfe9e 2544 if (!$vga) {
264e519f
DM
2545 if ($conf->{ostype} && ($conf->{ostype} eq 'win8' ||
2546 $conf->{ostype} eq 'win7' ||
5acbfe9e
DM
2547 $conf->{ostype} eq 'w2k8')) {
2548 $vga = 'std';
2549 } else {
2550 $vga = 'cirrus';
2551 }
2552 }
2553
1e3baf05 2554 # enable absolute mouse coordinates (needed by vnc)
5acbfe9e
DM
2555 my $tablet;
2556 if (defined($conf->{tablet})) {
2557 $tablet = $conf->{tablet};
2558 } else {
2559 $tablet = $defaults->{tablet};
590e698c 2560 $tablet = 0 if $qxlnum; # disable for spice because it is not needed
ef5e2be2 2561 $tablet = 0 if $vga =~ m/^serial\d+$/; # disable if we use serial terminal (no vga card)
5acbfe9e
DM
2562 }
2563
db656e5f 2564 push @$devices, '-device', print_tabletdevice_full($conf) if $tablet;
b467f79a 2565
1e3baf05 2566 # host pci devices
040b06b7 2567 for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
2e3b7e2a
AD
2568 my $d = parse_hostpci($conf->{"hostpci$i"});
2569 next if !$d;
2570
2571 my $pcie = $d->{pcie};
2572 if($pcie){
2573 die "q35 machine model is not enabled" if !$q35;
2574 $pciaddr = print_pcie_addr("hostpci$i");
2575 }else{
2576 $pciaddr = print_pci_addr("hostpci$i", $bridges);
2577 }
2578
2579 my $rombar = $d->{rombar} && $d->{rombar} eq 'off' ? ",rombar=0" : "";
2580 my $driver = $d->{driver} && $d->{driver} eq 'vfio' ? "vfio-pci" : "pci-assign";
2581 my $xvga = $d->{'x-vga'} && $d->{'x-vga'} eq 'on' ? ",x-vga=on" : "";
137483c0
AD
2582 if ($xvga && $xvga ne '') {
2583 push @$cpuFlags, 'kvm=off';
2584 $vga = 'none';
2585 }
2e3b7e2a 2586 $driver = "vfio-pci" if $xvga ne '';
4543ecf0
AD
2587 my $pcidevices = $d->{pciid};
2588 my $multifunction = 1 if @$pcidevices > 1;
2e3b7e2a 2589
4543ecf0
AD
2590 my $j=0;
2591 foreach my $pcidevice (@$pcidevices) {
2e3b7e2a 2592
4543ecf0
AD
2593 my $id = "hostpci$i";
2594 $id .= ".$j" if $multifunction;
2595 my $addr = $pciaddr;
2596 $addr .= ".$j" if $multifunction;
2597 my $devicestr = "$driver,host=$pcidevice->{id}.$pcidevice->{function},id=$id$addr";
2598
2599 if($j == 0){
2600 $devicestr .= "$rombar$xvga";
2601 $devicestr .= ",multifunction=on" if $multifunction;
2602 }
2603
2604 push @$devices, '-device', $devicestr;
2605 $j++;
2606 }
1e3baf05
DM
2607 }
2608
2609 # usb devices
2610 for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
2611 my $d = parse_usb_device($conf->{"usb$i"});
2612 next if !$d;
2613 if ($d->{vendorid} && $d->{productid}) {
5bdcf937 2614 push @$devices, '-device', "usb-host,vendorid=0x$d->{vendorid},productid=0x$d->{productid}";
1e3baf05 2615 } elsif (defined($d->{hostbus}) && defined($d->{hostport})) {
5bdcf937 2616 push @$devices, '-device', "usb-host,hostbus=$d->{hostbus},hostport=$d->{hostport}";
80401dd8
DM
2617 } elsif ($d->{spice}) {
2618 # usb redir support for spice
2619 push @$devices, '-chardev', "spicevmc,id=usbredirchardev$i,name=usbredir";
2620 push @$devices, '-device', "usb-redir,chardev=usbredirchardev$i,id=usbredirdev$i,bus=ehci.0";
1e3baf05
DM
2621 }
2622 }
2623
1e3baf05 2624 # serial devices
bae179aa 2625 for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
34978be3 2626 if (my $path = $conf->{"serial$i"}) {
9f9d2fb2
DM
2627 if ($path eq 'socket') {
2628 my $socket = "/var/run/qemu-server/${vmid}.serial$i";
2629 push @$devices, '-chardev', "socket,id=serial$i,path=$socket,server,nowait";
2630 push @$devices, '-device', "isa-serial,chardev=serial$i";
2631 } else {
2632 die "no such serial device\n" if ! -c $path;
2633 push @$devices, '-chardev', "tty,id=serial$i,path=$path";
2634 push @$devices, '-device', "isa-serial,chardev=serial$i";
2635 }
34978be3 2636 }
1e3baf05
DM
2637 }
2638
2639 # parallel devices
1989a89c 2640 for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
34978be3 2641 if (my $path = $conf->{"parallel$i"}) {
19672434 2642 die "no such parallel device\n" if ! -c $path;
32e69805 2643 my $devtype = $path =~ m!^/dev/usb/lp! ? 'tty' : 'parport';
4c5dbaf6 2644 push @$devices, '-chardev', "$devtype,id=parallel$i,path=$path";
5bdcf937 2645 push @$devices, '-device', "isa-parallel,chardev=parallel$i";
34978be3 2646 }
1e3baf05
DM
2647 }
2648
2649 my $vmname = $conf->{name} || "vm$vmid";
2650
2651 push @$cmd, '-name', $vmname;
19672434 2652
1e3baf05
DM
2653 my $sockets = 1;
2654 $sockets = $conf->{smp} if $conf->{smp}; # old style - no longer iused
2655 $sockets = $conf->{sockets} if $conf->{sockets};
2656
2657 my $cores = $conf->{cores} || 1;
3bd18e48
AD
2658 my $maxcpus = $conf->{maxcpus} if $conf->{maxcpus};
2659
76267728
WL
2660 my $total_cores = $sockets * $cores;
2661 my $allowed_cores = $cpuinfo->{cpus};
2662
f34ebd52 2663 die "MAX $allowed_cores cores allowed per VM on this node\n"
76267728
WL
2664 if ($allowed_cores < $total_cores);
2665
264e519f 2666 if ($maxcpus) {
3bd18e48 2667 push @$cmd, '-smp', "cpus=$cores,maxcpus=$maxcpus";
264e519f 2668 } else {
3bd18e48
AD
2669 push @$cmd, '-smp', "sockets=$sockets,cores=$cores";
2670 }
1e3baf05 2671
1e3baf05
DM
2672 push @$cmd, '-nodefaults';
2673
32baffb4 2674 my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};
3b408e82 2675
0888fdce
DM
2676 my $bootindex_hash = {};
2677 my $i = 1;
2678 foreach my $o (split(//, $bootorder)) {
2679 $bootindex_hash->{$o} = $i*100;
2680 $i++;
afdb31d5 2681 }
3b408e82
DM
2682
2683 push @$cmd, '-boot', "menu=on";
1e3baf05 2684
6b64503e 2685 push @$cmd, '-no-acpi' if defined($conf->{acpi}) && $conf->{acpi} == 0;
1e3baf05 2686
6b64503e 2687 push @$cmd, '-no-reboot' if defined($conf->{reboot}) && $conf->{reboot} == 0;
1e3baf05 2688
ef5e2be2 2689 push @$cmd, '-vga', $vga if $vga && $vga !~ m/^serial\d+$/; # for kvm 77 and later
1e3baf05
DM
2690
2691 # time drift fix
6b64503e 2692 my $tdf = defined($conf->{tdf}) ? $conf->{tdf} : $defaults->{tdf};
1e3baf05 2693
6b64503e 2694 my $nokvm = defined($conf->{kvm}) && $conf->{kvm} == 0 ? 1 : 0;
8c559505 2695 my $useLocaltime = $conf->{localtime};
1e3baf05
DM
2696
2697 if (my $ost = $conf->{ostype}) {
6b9d84cf 2698 # other, wxp, w2k, w2k3, w2k8, wvista, win7, win8, l24, l26, solaris
1e3baf05
DM
2699
2700 if ($ost =~ m/^w/) { # windows
8c559505 2701 $useLocaltime = 1 if !defined($conf->{localtime});
1e3baf05 2702
8c559505 2703 # use time drift fix when acpi is enabled
6b64503e 2704 if (!(defined($conf->{acpi}) && $conf->{acpi} == 0)) {
8c559505 2705 $tdf = 1 if !defined($conf->{tdf});
1e3baf05
DM
2706 }
2707 }
2708
be190583 2709 if ($ost eq 'win7' || $ost eq 'win8' || $ost eq 'w2k8' ||
a70ebde3 2710 $ost eq 'wvista') {
8c559505 2711 push @$globalFlags, 'kvm-pit.lost_tick_policy=discard';
b7e0c8bf 2712 push @$cmd, '-no-hpet';
462e8d19
AD
2713 #push @$cpuFlags , 'hv_vapic" if !$nokvm; #fixme, my win2008R2 hang at boot with this
2714 push @$cpuFlags , 'hv_spinlocks=0xffff' if !$nokvm;
2715 }
2716
2717 if ($ost eq 'win7' || $ost eq 'win8') {
2718 push @$cpuFlags , 'hv_relaxed' if !$nokvm;
b7e0c8bf 2719 }
1e3baf05
DM
2720 }
2721
8c559505
DM
2722 push @$rtcFlags, 'driftfix=slew' if $tdf;
2723
7f0b5beb 2724 if ($nokvm) {
8c559505 2725 push @$machineFlags, 'accel=tcg';
7f0b5beb
DM
2726 } else {
2727 die "No accelerator found!\n" if !$cpuinfo->{hvm};
2728 }
1e3baf05 2729
952958bc
DM
2730 my $machine_type = $forcemachine || $conf->{machine};
2731 if ($machine_type) {
2732 push @$machineFlags, "type=${machine_type}";
3bafc510
DM
2733 }
2734
8c559505
DM
2735 if ($conf->{startdate}) {
2736 push @$rtcFlags, "base=$conf->{startdate}";
2737 } elsif ($useLocaltime) {
2738 push @$rtcFlags, 'base=localtime';
2739 }
1e3baf05 2740
519ed28c
AD
2741 my $cpu = $nokvm ? "qemu64" : "kvm64";
2742 $cpu = $conf->{cpu} if $conf->{cpu};
2743
4dc339e7
AD
2744 push @$cpuFlags , '+lahf_lm' if $cpu eq 'kvm64';
2745
6b9d84cf
AD
2746 push @$cpuFlags , '+x2apic' if !$nokvm && $conf->{ostype} ne 'solaris';
2747
2748 push @$cpuFlags , '-x2apic' if $conf->{ostype} eq 'solaris';
519ed28c 2749
2e1a5389
AD
2750 push @$cpuFlags, '+sep' if $cpu eq 'kvm64' || $cpu eq 'kvm32';
2751
be190583 2752 $cpu .= "," . join(',', @$cpuFlags) if scalar(@$cpuFlags);
519ed28c 2753
c0efd8cd
DM
2754 # Note: enforce needs kernel 3.10, so we do not use it for now
2755 # push @$cmd, '-cpu', "$cpu,enforce";
2756 push @$cmd, '-cpu', $cpu;
519ed28c 2757
67fb9de6 2758 my $memory = $conf->{memory} || $defaults->{memory};
8a010eae
AD
2759 push @$cmd, '-m', $memory;
2760
67fb9de6 2761 if ($conf->{numa}) {
8a010eae 2762
2ed5d572
AD
2763 my $numa_totalmemory = undef;
2764 for (my $i = 0; $i < $MAX_NUMA; $i++) {
2765 next if !$conf->{"numa$i"};
2766 my $numa = parse_numa($conf->{"numa$i"});
2767 next if !$numa;
67fb9de6
DM
2768 # memory
2769 die "missing numa node$i memory value\n" if !$numa->{memory};
2ed5d572
AD
2770 my $numa_memory = $numa->{memory};
2771 $numa_totalmemory += $numa_memory;
2772 my $numa_object = "memory-backend-ram,id=ram-node$i,size=$numa_memory"."M";
2773
67fb9de6 2774 # cpus
2ed5d572 2775 my $cpus_start = $numa->{cpus}->{start};
67fb9de6 2776 die "missing numa node$i cpus\n" if !defined($cpus_start);
2ed5d572
AD
2777 my $cpus_end = $numa->{cpus}->{end} if defined($numa->{cpus}->{end});
2778 my $cpus = $cpus_start;
2779 if (defined($cpus_end)) {
2780 $cpus .= "-$cpus_end";
67fb9de6 2781 die "numa node$i : cpu range $cpus is incorrect\n" if $cpus_end <= $cpus_start;
2ed5d572 2782 }
8a010eae 2783
67fb9de6 2784 # hostnodes
2ed5d572
AD
2785 my $hostnodes_start = $numa->{hostnodes}->{start};
2786 if (defined($hostnodes_start)) {
2787 my $hostnodes_end = $numa->{hostnodes}->{end} if defined($numa->{hostnodes}->{end});
2788 my $hostnodes = $hostnodes_start;
2789 if (defined($hostnodes_end)) {
2790 $hostnodes .= "-$hostnodes_end";
67fb9de6 2791 die "host node $hostnodes range is incorrect\n" if $hostnodes_end <= $hostnodes_start;
2ed5d572 2792 }
8a010eae 2793
2ed5d572
AD
2794 my $hostnodes_end_range = defined($hostnodes_end) ? $hostnodes_end : $hostnodes_start;
2795 for (my $i = $hostnodes_start; $i <= $hostnodes_end_range; $i++ ) {
67fb9de6 2796 die "host numa node$i don't exist\n" if ! -d "/sys/devices/system/node/node$i/";
2ed5d572 2797 }
8a010eae 2798
67fb9de6 2799 # policy
2ed5d572 2800 my $policy = $numa->{policy};
67fb9de6
DM
2801 die "you need to define a policy for hostnode $hostnodes\n" if !$policy;
2802 $numa_object .= ",host-nodes=$hostnodes,policy=$policy";
2ed5d572
AD
2803 }
2804
2805 push @$cmd, '-object', $numa_object;
8a010eae
AD
2806 push @$cmd, '-numa', "node,nodeid=$i,cpus=$cpus,memdev=ram-node$i";
2807 }
67fb9de6
DM
2808
2809 die "total memory for NUMA nodes must be equal to vm memory\n"
2810 if $numa_totalmemory && $numa_totalmemory != $memory;
2ed5d572
AD
2811
2812 #if no custom tology, we split memory and cores across numa nodes
2813 if(!$numa_totalmemory) {
2814
67fb9de6 2815 my $numa_memory = ($memory / $sockets) . "M";
2ed5d572
AD
2816
2817 for (my $i = 0; $i < $sockets; $i++) {
2818
2819 my $cpustart = ($cores * $i);
2820 my $cpuend = ($cpustart + $cores - 1) if $cores && $cores > 1;
2821 my $cpus = $cpustart;
2822 $cpus .= "-$cpuend" if $cpuend;
2823
2824 push @$cmd, '-object', "memory-backend-ram,size=$numa_memory,id=ram-node$i";
2825 push @$cmd, '-numa', "node,nodeid=$i,cpus=$cpus,memdev=ram-node$i";
2826 }
2827 }
8a010eae
AD
2828 }
2829
1e3baf05
DM
2830 push @$cmd, '-S' if $conf->{freeze};
2831
2832 # set keyboard layout
2833 my $kb = $conf->{keyboard} || $defaults->{keyboard};
2834 push @$cmd, '-k', $kb if $kb;
2835
2836 # enable sound
2837 #my $soundhw = $conf->{soundhw} || $defaults->{soundhw};
2838 #push @$cmd, '-soundhw', 'es1370';
2839 #push @$cmd, '-soundhw', $soundhw if $soundhw;
ab6a046f 2840
bc84dcca 2841 if($conf->{agent}) {
7a6c2150 2842 my $qgasocket = qmp_socket($vmid, 1);
ab6a046f
AD
2843 my $pciaddr = print_pci_addr("qga0", $bridges);
2844 push @$devices, '-chardev', "socket,path=$qgasocket,server,nowait,id=qga0";
2845 push @$devices, '-device', "virtio-serial,id=qga0$pciaddr";
2846 push @$devices, '-device', 'virtserialport,chardev=qga0,name=org.qemu.guest_agent.0';
2847 }
2848
1d794448 2849 my $spice_port;
2fa3151e 2850
590e698c
DM
2851 if ($qxlnum) {
2852 if ($qxlnum > 1) {
2853 if ($conf->{ostype} && $conf->{ostype} =~ m/^w/){
2854 for(my $i = 1; $i < $qxlnum; $i++){
2855 my $pciaddr = print_pci_addr("vga$i", $bridges);
2856 push @$cmd, '-device', "qxl,id=vga$i,ram_size=67108864,vram_size=33554432$pciaddr";
2857 }
2858 } else {
2859 # assume other OS works like Linux
2860 push @$cmd, '-global', 'qxl-vga.ram_size=134217728';
2861 push @$cmd, '-global', 'qxl-vga.vram_size=67108864';
2fa3151e
AD
2862 }
2863 }
2864
1011b570 2865 my $pciaddr = print_pci_addr("spice", $bridges);
95a4b4a9 2866
cd339d1f 2867 $spice_port = PVE::Tools::next_spice_port();
943340a6 2868
d2da6d9b 2869 push @$devices, '-spice', "tls-port=${spice_port},addr=127.0.0.1,tls-ciphers=DES-CBC3-SHA,seamless-migration=on";
1011b570 2870
d2da6d9b
AD
2871 push @$devices, '-device', "virtio-serial,id=spice$pciaddr";
2872 push @$devices, '-chardev', "spicevmc,id=vdagent,name=vdagent";
2873 push @$devices, '-device', "virtserialport,chardev=vdagent,name=com.redhat.spice.0";
1011b570
DM
2874 }
2875
8d9ae0d2
DM
2876 # enable balloon by default, unless explicitly disabled
2877 if (!defined($conf->{balloon}) || $conf->{balloon}) {
2878 $pciaddr = print_pci_addr("balloon0", $bridges);
2879 push @$devices, '-device', "virtio-balloon-pci,id=balloon0$pciaddr";
2880 }
1e3baf05 2881
0ea9541d
DM
2882 if ($conf->{watchdog}) {
2883 my $wdopts = parse_watchdog($conf->{watchdog});
5bdcf937 2884 $pciaddr = print_pci_addr("watchdog", $bridges);
0a40e8ea 2885 my $watchdog = $wdopts->{model} || 'i6300esb';
5bdcf937
AD
2886 push @$devices, '-device', "$watchdog$pciaddr";
2887 push @$devices, '-watchdog-action', $wdopts->{action} if $wdopts->{action};
0ea9541d
DM
2888 }
2889
1e3baf05 2890 my $vollist = [];
941e0c42 2891 my $scsicontroller = {};
26ee04b6 2892 my $ahcicontroller = {};
cdd20088 2893 my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : $defaults->{scsihw};
1e3baf05 2894
5881b913
DM
2895 # Add iscsi initiator name if available
2896 if (my $initiator = get_initiator_name()) {
2897 push @$devices, '-iscsi', "initiator-name=$initiator";
2898 }
2899
1e3baf05
DM
2900 foreach_drive($conf, sub {
2901 my ($ds, $drive) = @_;
2902
ff1a2432 2903 if (PVE::Storage::parse_volume_id($drive->{file}, 1)) {
1e3baf05 2904 push @$vollist, $drive->{file};
ff1a2432 2905 }
afdb31d5 2906
1e3baf05 2907 $use_virtio = 1 if $ds =~ m/^virtio/;
3b408e82
DM
2908
2909 if (drive_is_cdrom ($drive)) {
2910 if ($bootindex_hash->{d}) {
2911 $drive->{bootindex} = $bootindex_hash->{d};
2912 $bootindex_hash->{d} += 1;
2913 }
2914 } else {
2915 if ($bootindex_hash->{c}) {
2916 $drive->{bootindex} = $bootindex_hash->{c} if $conf->{bootdisk} && ($conf->{bootdisk} eq $ds);
2917 $bootindex_hash->{c} += 1;
2918 }
2919 }
2920
941e0c42 2921 if ($drive->{interface} eq 'scsi') {
cdd20088 2922
5b952ff5 2923 my $maxdev = ($scsihw !~ m/^lsi/) ? 256 : 7;
cdd20088 2924 my $controller = int($drive->{index} / $maxdev);
5bdcf937
AD
2925 $pciaddr = print_pci_addr("scsihw$controller", $bridges);
2926 push @$devices, '-device', "$scsihw,id=scsihw$controller$pciaddr" if !$scsicontroller->{$controller};
cdd20088 2927 $scsicontroller->{$controller}=1;
941e0c42 2928 }
3b408e82 2929
26ee04b6
DA
2930 if ($drive->{interface} eq 'sata') {
2931 my $controller = int($drive->{index} / $MAX_SATA_DISKS);
5bdcf937
AD
2932 $pciaddr = print_pci_addr("ahci$controller", $bridges);
2933 push @$devices, '-device', "ahci,id=ahci$controller,multifunction=on$pciaddr" if !$ahcicontroller->{$controller};
26ee04b6
DA
2934 $ahcicontroller->{$controller}=1;
2935 }
46f58b5f 2936
15b21acc
MR
2937 my $drive_cmd = print_drive_full($storecfg, $vmid, $drive);
2938 push @$devices, '-drive',$drive_cmd;
46f58b5f 2939 push @$devices, '-device', print_drivedevice_full($storecfg, $conf, $vmid, $drive, $bridges);
1e3baf05
DM
2940 });
2941
cc4d6182 2942 for (my $i = 0; $i < $MAX_NETS; $i++) {
5f0c4c32 2943 next if !$conf->{"net$i"};
cc4d6182
DA
2944 my $d = parse_net($conf->{"net$i"});
2945 next if !$d;
1e3baf05 2946
cc4d6182 2947 $use_virtio = 1 if $d->{model} eq 'virtio';
1e3baf05 2948
cc4d6182
DA
2949 if ($bootindex_hash->{n}) {
2950 $d->{bootindex} = $bootindex_hash->{n};
2951 $bootindex_hash->{n} += 1;
2952 }
1e3baf05 2953
cc4d6182 2954 my $netdevfull = print_netdev_full($vmid,$conf,$d,"net$i");
5bdcf937
AD
2955 push @$devices, '-netdev', $netdevfull;
2956
2957 my $netdevicefull = print_netdevice_full($vmid,$conf,$d,"net$i",$bridges);
2958 push @$devices, '-device', $netdevicefull;
2959 }
1e3baf05 2960
db656e5f
DM
2961 if (!$q35) {
2962 # add pci bridges
f8e83f05
AD
2963 while (my ($k, $v) = each %$bridges) {
2964 $pciaddr = print_pci_addr("pci.$k");
2965 unshift @$devices, '-device', "pci-bridge,id=pci.$k,chassis_nr=$k$pciaddr" if $k > 0;
2966 }
19672434
DM
2967 }
2968
1e3baf05
DM
2969 # hack: virtio with fairsched is unreliable, so we do not use fairsched
2970 # when the VM uses virtio devices.
19672434
DM
2971 if (!$use_virtio && $have_ovz) {
2972
6b64503e 2973 my $cpuunits = defined($conf->{cpuunits}) ?
1e3baf05
DM
2974 $conf->{cpuunits} : $defaults->{cpuunits};
2975
2976 push @$cmd, '-cpuunits', $cpuunits if $cpuunits;
2977
2978 # fixme: cpulimit is currently ignored
2979 #push @$cmd, '-cpulimit', $conf->{cpulimit} if $conf->{cpulimit};
2980 }
2981
2982 # add custom args
2983 if ($conf->{args}) {
3ada46c9 2984 my $aa = PVE::Tools::split_args($conf->{args});
1e3baf05
DM
2985 push @$cmd, @$aa;
2986 }
2987
5bdcf937 2988 push @$cmd, @$devices;
be190583 2989 push @$cmd, '-rtc', join(',', @$rtcFlags)
8c559505 2990 if scalar(@$rtcFlags);
be190583 2991 push @$cmd, '-machine', join(',', @$machineFlags)
8c559505
DM
2992 if scalar(@$machineFlags);
2993 push @$cmd, '-global', join(',', @$globalFlags)
2994 if scalar(@$globalFlags);
2995
1d794448 2996 return wantarray ? ($cmd, $vollist, $spice_port) : $cmd;
1e3baf05 2997}
19672434 2998
1e3baf05
DM
# Return the path of the VNC socket file used for VM $vmid.
sub vnc_socket {
    my ($vmid) = @_;

    my $socket_path = "${var_run_tmpdir}/$vmid.vnc";

    return $socket_path;
}
3003
# Query the VM via the 'query-spice' monitor command and return its spice
# port. The 'tls-port' entry is preferred over 'port'; dies when the reply
# contains neither.
sub spice_port {
    my ($vmid) = @_;

    my $info = vm_mon_cmd($vmid, 'query-spice');

    my $port = $info->{'tls-port'} || $info->{'port'};
    die "no spice port\n" if !$port;

    return $port;
}
3011
# Return the path of the monitor socket of VM $vmid. With a true $qga the
# path of the '.qga' socket is returned, else the '.qmp' socket.
sub qmp_socket {
    my ($vmid, $qga) = @_;

    my $suffix = 'qmp';
    $suffix = 'qga' if $qga;

    return "${var_run_tmpdir}/$vmid.$suffix";
}
3017
1e3baf05
DM
# Return the path of the pid file used for VM $vmid.
sub pidfile_name {
    my ($vmid) = @_;

    my $pidfile = "${var_run_tmpdir}/$vmid.pid";

    return $pidfile;
}
3022
86fdcfb2
DA
# Collect the ids of the devices currently known to the running VM.
#
# Returns a hash reference mapping each id to 1. Ids come from two monitor
# queries: the 'qdev_id' of every PCI device ('query-pci') and, for every
# block device named 'drive-<id>' ('query-block'), the '<id>' part.
sub vm_devices_list {
    my ($vmid) = @_;

    my $pci_info = vm_mon_cmd($vmid, 'query-pci');

    my $found = {};
    foreach my $bus (@$pci_info) {
        foreach my $dev (@{$bus->{devices}}) {
            my $id = $dev->{'qdev_id'};
            $found->{$id} = 1 if $id;
        }
    }

    my $block_info = vm_mon_cmd($vmid, 'query-block');
    foreach my $blk (@$block_info) {
        next if $blk->{device} !~ m/^drive-(\S+)/;
        $found->{$1} = 1;
    }

    return $found;
}
3045
# Hot-plug device $deviceid into VM $vmid.
#
# Returns 1 on success and also when there is nothing to do (VM not running,
# hotplug disabled in $conf, device already present). Returns undef when the
# device could not be added. The 'tablet' device is added even when hotplug
# is disabled.
#
# Handled device ids: virtioN, scsihwN, scsiN, netN and (unless the machine
# type is q35) pci.N bridges. Any other id is accepted without action.
sub vm_deviceplug {
    my ($storecfg, $conf, $vmid, $deviceid, $device) = @_;

    return 1 if !check_running($vmid);

    my $q35 = machine_type_is_q35($conf);

    if ($deviceid eq 'tablet') {
        qemu_deviceadd($vmid, print_tabletdevice_full($conf));
        return 1;
    }

    return 1 if !$conf->{hotplug};

    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$deviceid});

    # add bridge if we need it for the device
    qemu_bridgeadd($storecfg, $conf, $vmid, $deviceid);

    if ($deviceid =~ m/^(virtio)(\d+)$/) {

        return undef if !qemu_driveadd($storecfg, $vmid, $device);

        my $drivedev = print_drivedevice_full($storecfg, $conf, $vmid, $device);
        qemu_deviceadd($vmid, $drivedev);

        # roll back the drive if the device did not show up
        if (!qemu_deviceaddverify($vmid, $deviceid)) {
            qemu_drivedel($vmid, $deviceid);
            return undef;
        }

    } elsif ($deviceid =~ m/^(scsihw)(\d+)$/) {

        my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : "lsi";
        my $pciaddr = print_pci_addr($deviceid);

        qemu_deviceadd($vmid, "$scsihw,id=$deviceid$pciaddr");
        return undef if !qemu_deviceaddverify($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        return undef if !qemu_findorcreatescsihw($storecfg,$conf, $vmid, $device);
        return undef if !qemu_driveadd($storecfg, $vmid, $device);

        my $drivedev = print_drivedevice_full($storecfg, $conf, $vmid, $device);
        if (!qemu_deviceadd($vmid, $drivedev)) {
            qemu_drivedel($vmid, $deviceid);
            return undef;
        }

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        return undef if !qemu_netdevadd($vmid, $conf, $device, $deviceid);

        my $netdev = print_netdevice_full($vmid, $conf, $device, $deviceid);
        qemu_deviceadd($vmid, $netdev);

        # roll back the netdev if the device did not show up
        if (!qemu_deviceaddverify($vmid, $deviceid)) {
            qemu_netdevdel($vmid, $deviceid);
            return undef;
        }

    } elsif (!$q35 && $deviceid =~ m/^(pci\.)(\d+)$/) {

        my $bridgeid = $2;
        my $pciaddr = print_pci_addr($deviceid);

        qemu_deviceadd($vmid, "pci-bridge,id=pci.$bridgeid,chassis_nr=$bridgeid$pciaddr");
        return undef if !qemu_deviceaddverify($vmid, $deviceid);
    }

    return 1;
}
3114
# Hot-unplug device $deviceid from VM $vmid.
#
# Returns 1 on success and also when there is nothing to do (VM not running,
# hotplug disabled in $conf, device not present). Returns undef when a
# removal step failed. Dies when asked to unplug the configured boot disk.
# The 'tablet' device is removed even when hotplug is disabled.
#
# SCSI controllers hot-plugged by vm_deviceplug use the id 'scsihwN'; the
# older 'lsiN' naming is still accepted here.
sub vm_deviceunplug {
    my ($vmid, $conf, $deviceid) = @_;

    return 1 if !check_running ($vmid);

    if ($deviceid eq 'tablet') {
        qemu_devicedel($vmid, $deviceid);
        return 1;
    }

    return 1 if !$conf->{hotplug};

    my $devices_list = vm_devices_list($vmid);
    return 1 if !defined($devices_list->{$deviceid});

    die "can't unplug bootdisk" if $conf->{bootdisk} && $conf->{bootdisk} eq $deviceid;

    if ($deviceid =~ m/^(virtio)(\d+)$/) {
        qemu_devicedel($vmid, $deviceid);
        # device_del is asynchronous - wait until the device is really gone
        return undef if !qemu_devicedelverify($vmid, $deviceid);
        return undef if !qemu_drivedel($vmid, $deviceid);
    }

    # SCSI controller: match the ids created by vm_deviceplug ('scsihwN')
    # as well as the legacy 'lsiN' ids.
    if ($deviceid =~ m/^(lsi|scsihw)(\d+)$/) {
        return undef if !qemu_devicedel($vmid, $deviceid);
    }

    if ($deviceid =~ m/^(scsi)(\d+)$/) {
        return undef if !qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_drivedel($vmid, $deviceid);
    }

    if ($deviceid =~ m/^(net)(\d+)$/) {
        qemu_devicedel($vmid, $deviceid);
        # device_del is asynchronous - wait until the device is really gone
        return undef if !qemu_devicedelverify($vmid, $deviceid);
        return undef if !qemu_netdevdel($vmid, $deviceid);
    }

    return 1;
}
3155
# Add a device to the running VM using the 'device_add' monitor command.
#
# $devicefull is a qemu device description ("<driver>,key=value,..."). It is
# prefixed with "driver=" and split on '=' and ',' into the key/value
# arguments of the command. Always returns 1.
sub qemu_deviceadd {
    my ($vmid, $devicefull) = @_;

    my %args = split(/[=,]/, "driver=" . $devicefull);

    vm_mon_cmd($vmid, "device_add" , %args);

    return 1;
}
afdb31d5 3165
5e5dcb73
DA
# Remove device $deviceid from the running VM using the 'device_del' monitor
# command. The command result is ignored; always returns 1.
sub qemu_devicedel {
    my ($vmid, $deviceid) = @_;

    vm_mon_cmd($vmid, "device_del", id => $deviceid);

    return 1;
}
3171
# Add the drive described by $device to the running VM using the human
# monitor command 'drive_add'.
#
# Returns 1 when the monitor answers "OK"; otherwise the answer is logged to
# syslog and undef is returned.
sub qemu_driveadd {
    my ($storecfg, $vmid, $device) = @_;

    my $drive_desc = print_drive_full($storecfg, $vmid, $device);
    my $answer = vm_human_monitor_command($vmid, "drive_add auto $drive_desc");

    # If the command succeeds qemu prints: "OK"
    return 1 if $answer =~ m/OK/s;

    syslog("err", "adding drive failed: $answer");
    return undef;
}
afdb31d5 3184
5e5dcb73
DA
# Remove drive 'drive-$deviceid' from the running VM using the human monitor
# command 'drive_del'.
#
# Returns 1 when the monitor answers with nothing but whitespace, or with a
# "Device '...' not found" message. Any other answer is logged to syslog and
# undef is returned.
sub qemu_drivedel {
    my ($vmid, $deviceid) = @_;

    my $answer = vm_human_monitor_command($vmid, "drive_del drive-$deviceid");
    $answer =~ s/^\s+//;

    # NB: device not found errors mean the drive was auto-deleted and we
    # ignore the error
    return 1 if $answer =~ m/Device \'.*?\' not found/s;

    return 1 if $answer eq "";

    syslog("err", "deleting drive $deviceid failed : $answer");
    return undef;
}
f19d1c47 3199
5e5dcb73
DA
# Wait until device $deviceid shows up in the device list of the VM.
#
# The list is checked up to six times with a one second pause after each
# unsuccessful check. Returns 1 as soon as the device is listed; otherwise
# logs an error to syslog and returns undef.
sub qemu_deviceaddverify {
    my ($vmid, $deviceid) = @_;

    foreach my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if defined($present->{$deviceid});
        sleep 1;
    }

    syslog("err", "error on hotplug device $deviceid");
    return undef;
}
afdb31d5 3211
5e5dcb73
DA
3212
# Wait until device $deviceid has disappeared from the device list of the VM.
#
# device_del is asynchronous and its empty reply is not reliable, so the
# list is checked up to six times with a one second pause after each
# unsuccessful check. Returns 1 as soon as the device is gone; otherwise
# logs an error to syslog and returns undef.
sub qemu_devicedelverify {
    my ($vmid, $deviceid) = @_;

    foreach my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if !defined($present->{$deviceid});
        sleep 1;
    }

    syslog("err", "error on hot-unplugging device $deviceid");
    return undef;
}
3225
# Make sure the SCSI controller needed by drive $device exists in the
# running VM, hot-plugging it when it is missing.
#
# The controller number is the drive index divided by the number of drives
# per controller: 7 when no 'scsihw' is configured or it starts with 'lsi',
# 256 otherwise. Returns 1 on success, undef when plugging the controller
# failed.
sub qemu_findorcreatescsihw {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $hwtype = $conf->{scsihw};
    my $maxdev = ($hwtype && ($hwtype !~ m/^lsi/)) ? 256 : 7;

    my $controller = int($device->{index} / $maxdev);
    my $scsihwid = "scsihw$controller";

    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$scsihwid});

    return undef if !vm_deviceplug($storecfg, $conf, $vmid, $scsihwid);

    return 1;
}
3239
40f28a9f
AD
# Hot-plug the PCI bridge required by device $device, if any.
#
# print_pci_addr() is called with an empty hash and the bridge id is taken
# from the keys it leaves in that hash (the last one in iteration order).
# Returns nothing when no bridge with an id >= 1 is needed, undef when
# plugging the bridge failed and 1 otherwise.
sub qemu_bridgeadd {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $bridges = {};
    print_pci_addr($device, $bridges);

    # same element a 'while each' loop would end on; undef for an empty hash
    my $bridgeid = (keys %$bridges)[-1];

    return if !$bridgeid || $bridgeid < 1;

    my $bridge = "pci.$bridgeid";

    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$bridge});

    return undef if !vm_deviceplug($storecfg, $conf, $vmid, $bridge);

    return 1;
}
3259
2630d2a9
DA
# Add the network backend for $deviceid to the running VM using the
# 'netdev_add' monitor command.
#
# The description produced by print_netdev_full() is split on '=' and ','
# into the key/value arguments of the command. Always returns 1.
sub qemu_netdevadd {
    my ($vmid, $conf, $device, $deviceid) = @_;

    my $netdev_desc = print_netdev_full($vmid, $conf, $device, $deviceid);
    my %args = split(/[=,]/, $netdev_desc);

    vm_mon_cmd($vmid, "netdev_add", %args);

    return 1;
}
3269
# Remove the network backend $deviceid from the running VM using the
# 'netdev_del' monitor command. Always returns 1.
sub qemu_netdevdel {
    my ($vmid, $deviceid) = @_;

    my %args = (id => $deviceid);
    vm_mon_cmd($vmid, "netdev_del", %args);

    return 1;
}
3276
838776ab
AD
# Hot-plug CPU cores into VM $vmid until it has $cores cores.
#
# Dies when $cores is not set, when it exceeds $conf->{maxcpus}, or when
# 'cores' / 'maxcpus' are missing from $conf. Raises a parameter exception
# when $cores is lower than the configured value (unplug is not possible) or
# when the number of CPUs reported by the VM differs from the configuration.
# Returns without doing anything when the VM is not running.
sub qemu_cpu_hotplug {
    my ($vmid, $conf, $cores) = @_;

    die "new cores config is not defined" if !$cores;
    die "you can't add more cores than maxcpus"
        if $conf->{maxcpus} && ($cores > $conf->{maxcpus});
    return if !check_running($vmid);

    # Note: do not combine 'my' with a statement modifier - the behaviour of
    # a conditionally declared lexical is undefined in Perl.
    my $currentcores = $conf->{cores};
    die "current cores is not defined" if !$currentcores;
    die "maxcpus is not defined" if !$conf->{maxcpus};
    raise_param_exc({ 'cores' => "online cpu unplug is not yet possible" })
        if($cores < $currentcores);

    my $currentrunningcores = vm_mon_cmd($vmid, "query-cpus");
    raise_param_exc({ 'cores' => "cores number if running vm is different than configuration" })
        if scalar (@{$currentrunningcores}) != $currentcores;

    # cpu ids start at 0, so the first id to add equals the current count
    for(my $i = $currentcores; $i < $cores; $i++) {
        vm_mon_cmd($vmid, "cpu-add", id => int($i));
    }
}
3299
affd2f88
AD
# Apply I/O throttling limits to block device $deviceid of the running VM
# using the 'block_set_io_throttle' monitor command. All limits are passed
# as integers. Does nothing when the VM is not running.
sub qemu_block_set_io_throttle {
    my ($vmid, $deviceid, $bps, $bps_rd, $bps_wr, $iops, $iops_rd, $iops_wr) = @_;

    return if !check_running($vmid) ;

    my @limits = (
        bps     => int($bps),
        bps_rd  => int($bps_rd),
        bps_wr  => int($bps_wr),
        iops    => int($iops),
        iops_rd => int($iops_rd),
        iops_wr => int($iops_wr),
    );

    vm_mon_cmd($vmid, "block_set_io_throttle", device => $deviceid, @limits);
}
3308
# old code, only used to shutdown old VM after update
#
# Read from monitor handle $fh until a chunk ends with the "(qemu) " prompt
# or end-of-file is reached, and return everything read (without the prompt).
# Each wait for data is limited to $timeout seconds; dies with
# "monitor read timeout" when no data arrives in time, and with the system
# error message when reading fails.
sub __read_avail {
    my ($fh, $timeout) = @_;

    my $select = IO::Select->new();
    $select->add($fh);

    my $collected = '';
    my $chunk;

    my @ready;
    while (scalar (@ready = $select->can_read($timeout))) {
        my $nread = $fh->sysread($chunk, 8192);

        # undef signals a read error
        die "$!\n" if !defined($nread);

        # 0 bytes means end-of-file
        last if !$nread;

        if ($chunk =~ /^(.*)\(qemu\) $/s) {
            # prompt seen - the answer is complete
            $collected .= $1;
            last;
        }

        $collected .= $chunk;
    }

    die "monitor read timeout\n" if !scalar(@ready);

    return $collected;
}
3341
# old code, only used to shutdown old VM after update
#
# Send $cmdstr to the human monitor socket ('<vmid>.mon') of VM $vmid and
# return the answer, with the echoed command line removed. Returns undef for
# the 'q' and 'quit' commands, which are sent without waiting for an answer.
# Any error is logged to syslog and re-thrown.
sub vm_monitor_command {
    my ($vmid, $cmdstr, $nocheck) = @_;

    my $res;

    # hack: migrate sometime blocks the monitor (when migrate_downtime
    # is set)
    my $is_migrate_cmd = ($cmdstr =~ m/^(info\s+migrate|migrate\s)/) ? 1 : 0;

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);

        my $sname = "${var_run_tmpdir}/$vmid.mon";

        my $sock = IO::Socket::UNIX->new( Peer => $sname ) ||
            die "unable to connect to VM $vmid socket - $!\n";

        my $timeout = $is_migrate_cmd ? 60*60 : 3; # 1 hour for migrate

        # read banner;
        my $banner = __read_avail($sock, $timeout);
        die "got unexpected qemu monitor banner\n"
            if $banner !~ m/^QEMU\s+(\S+)\s+monitor\s/;

        my $select = IO::Select->new();
        $select->add($sock);

        my @writable = $select->can_write($timeout);
        die "monitor write error - timeout" if !scalar(@writable);

        my $fullcmd = "$cmdstr\r";

        # syslog('info', "VM $vmid monitor command: $cmdstr");

        my $written = $sock->syswrite($fullcmd);
        die "monitor write error - $!"
            if !$written || ($written != length($fullcmd));

        # the VM terminates on quit - there is no answer to wait for
        return if ($cmdstr eq 'q') || ($cmdstr eq 'quit');

        if ($is_migrate_cmd) {
            $timeout = 60*60; # 1 hour
        } elsif ($cmdstr =~ m/^(eject|change)/) {
            $timeout = 60; # note: cdrom mount command is slow
        } else {
            $timeout = 20;
        }

        if ($res = __read_avail($sock, $timeout)) {

            my @lines = split("\r?\n", $res);

            shift @lines if $lines[0] !~ m/^unknown command/; # skip echo

            $res = join("\n", @lines);
            $res .= "\n";
        }
    };

    if (my $err = $@) {
        syslog("err", "VM $vmid monitor command failed - $err");
        die $err;
    }

    return $res;
}
3416
c1175c92
AD
# Resize volume $volid to $size through the storage layer and, when the VM
# is running, tell qemu about the new size of block device $deviceid
# ('block_resize' monitor command). Stops early when the storage layer
# returns a false value.
sub qemu_block_resize {
    my ($vmid, $deviceid, $storecfg, $volid, $size) = @_;

    my $is_running = check_running($vmid);

    my $continue = PVE::Storage::volume_resize($storecfg, $volid, $size, $is_running);
    return if !$continue;

    return if !$is_running;

    vm_mon_cmd($vmid, "block_resize", device => $deviceid, size => int($size));
}
3429
1ab0057c
AD
# Create snapshot $snap of volume $volid through the storage layer and, when
# the VM is running, also send the 'snapshot-drive' monitor command for
# block device $deviceid. Stops early when the storage layer returns a false
# value.
sub qemu_volume_snapshot {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $is_running = check_running($vmid);

    my $continue = PVE::Storage::volume_snapshot($storecfg, $volid, $snap, $is_running);
    return if !$continue;

    return if !$is_running;

    vm_mon_cmd($vmid, "snapshot-drive", device => $deviceid, name => $snap);
}
3442
fc46aff9
AD
# Delete snapshot $snap of volume $volid through the storage layer and, when
# the VM is running, also send the 'delete-drive-snapshot' monitor command
# for block device $deviceid. Stops early when the storage layer returns a
# false value.
sub qemu_volume_snapshot_delete {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $is_running = check_running($vmid);

    my $continue = PVE::Storage::volume_snapshot_delete($storecfg, $volid, $snap, $is_running);
    return if !$continue;

    return if !$is_running;

    vm_mon_cmd($vmid, "delete-drive-snapshot", device => $deviceid, name => $snap);
}
3454
264e519f
DM
# Set the migration capabilities of VM $vmid.
#
# Every capability reported by 'query-migrate-capabilities' is sent back via
# 'migrate-set-capabilities', switched on only when it is marked with a true
# value in the table below (currently just 'auto-converge').
sub set_migration_caps {
    my ($vmid) = @_;

    my $enabled_cap = {
        "auto-converge" => 1,
        "xbzrle" => 0,
        "x-rdma-pin-all" => 0,
        "zero-blocks" => 0,
    };

    my $supported = vm_mon_cmd_nocheck($vmid, "query-migrate-capabilities");

    my $cap_ref = [];
    foreach my $entry (@$supported) {
        my $name = $entry->{capability};
        my $state = $enabled_cap->{$name} ? JSON::true : JSON::false;
        push @$cap_ref, { capability => $name, state => $state };
    }

    vm_mon_cmd_nocheck($vmid, "migrate-set-capabilities", capabilities => $cap_ref);
}
a89fded1 3478
# Start VM $vmid while holding the config lock.
#
# $statefile    - 'tcp' to wait for an incoming migration, otherwise a state
#                 file to load; unset for a normal start
# $skiplock     - do not check the 'lock' setting of the VM config
# $migratedfrom - passed to load_config/check_running, exported to the
#                 network script as PVE_MIGRATED_FROM
# $paused       - start the VM stopped (-S) when no state file is given
# $forcemachine - passed through to config_to_command
# $spice_ticket - spice password to set after an incoming migration
#
# Dies when the VM is a template, is locked, is already running, when a
# host PCI device cannot be prepared or when the kvm command fails.
sub vm_start {
    my ($storecfg, $vmid, $statefile, $skiplock, $migratedfrom, $paused, $forcemachine, $spice_ticket) = @_;

    lock_config($vmid, sub {
        my $conf = load_config($vmid, $migratedfrom);

        die "you can't start a vm if it's a template\n" if is_template($conf);

        check_lock($conf) if !$skiplock;

        die "VM $vmid already running\n" if check_running($vmid, undef, $migratedfrom);

        my $defaults = load_defaults();

        # set environment variable useful inside network script
        $ENV{PVE_MIGRATED_FROM} = $migratedfrom if $migratedfrom;

        my ($cmd, $vollist, $spice_port) = config_to_command($storecfg, $vmid, $conf, $defaults, $forcemachine);

        my $migrate_uri;
        if ($statefile && $statefile eq 'tcp') {
            # listen on localhost unless unsecure migration is enabled
            my $localip = "localhost";
            my $datacenterconf = PVE::Cluster::cfs_read_file('datacenter.cfg');
            if ($datacenterconf->{migration_unsecure}) {
                my $nodename = PVE::INotify::nodename();
                $localip = PVE::Cluster::remote_node_ip($nodename, 1);
            }
            my $migrate_port = PVE::Tools::next_migrate_port();
            $migrate_uri = "tcp:${localip}:${migrate_port}";
            push @$cmd, '-incoming', $migrate_uri;
            push @$cmd, '-S';
        } elsif ($statefile) {
            push @$cmd, '-loadstate', $statefile;
        } elsif ($paused) {
            push @$cmd, '-S';
        }

        # host pci devices
        foreach my $i (0 .. $MAX_HOSTPCI_DEVICES - 1) {
            my $d = parse_hostpci($conf->{"hostpci$i"});
            next if !$d;

            my $use_vfio = $d->{driver} && $d->{driver} eq "vfio";

            foreach my $pcidevice (@{$d->{pciid}}) {
                my $pciid = $pcidevice->{id}.".".$pcidevice->{function};

                my $info = pci_device_info("0000:$pciid");
                die "IOMMU not present\n" if !check_iommu_support();
                die "no pci device info for device '$pciid'\n" if !$info;

                if ($use_vfio) {
                    die "can't unbind/bind pci group to vfio '$pciid'\n" if !pci_dev_group_bind_to_vfio($pciid);
                } else {
                    die "can't unbind/bind to stub pci device '$pciid'\n" if !pci_dev_bind_to_stub($info);
                }

                die "can't reset pci device '$pciid'\n" if $info->{has_fl_reset} and !pci_dev_reset($info);
            }
        }

        PVE::Storage::activate_volumes($storecfg, $vollist);

        # no timeout when a state has to be loaded / migrated in
        my $start_timeout = $statefile ? undef : 30;
        eval { run_command($cmd, timeout => $start_timeout, umask => 0077); };
        if (my $err = $@) {
            die "start failed: $err";
        }

        print "migration listens on $migrate_uri\n" if $migrate_uri;

        if ($statefile && $statefile ne 'tcp') {
            eval { vm_mon_cmd_nocheck($vmid, "cont"); };
            warn $@ if $@;
        }

        if ($migratedfrom) {

            eval {
                PVE::QemuServer::set_migration_caps($vmid);
            };
            warn $@ if $@;

            if ($spice_port) {
                print "spice listens on port $spice_port\n";
                if ($spice_ticket) {
                    PVE::QemuServer::vm_mon_cmd_nocheck($vmid, "set_password", protocol => 'spice', password => $spice_ticket);
                    PVE::QemuServer::vm_mon_cmd_nocheck($vmid, "expire_password", protocol => 'spice', time => "+30");
                }
            }

        } else {

            # balloon is enabled unless explicitly set to 0
            my $balloon_enabled = !defined($conf->{balloon}) || $conf->{balloon};

            if (!$statefile && $balloon_enabled) {
                vm_mon_cmd_nocheck($vmid, "balloon", value => $conf->{balloon}*1024*1024)
                    if $conf->{balloon};
                vm_mon_cmd_nocheck($vmid, 'qom-set',
                                   path => "machine/peripheral/balloon0",
                                   property => "guest-stats-polling-interval",
                                   value => 2);
            }
        }
    });
}
3583
0eedc444
AD
# Run QMP command $execute with the named arguments %params on VM $vmid and
# return the result of vm_qmp_command().
sub vm_mon_cmd {
    my ($vmid, $execute, %params) = @_;

    my $request = {
        execute => $execute,
        arguments => \%params,
    };

    return vm_qmp_command($vmid, $request);
}
3590
# Same as vm_mon_cmd(), but passes a true $nocheck flag on to
# vm_qmp_command().
sub vm_mon_cmd_nocheck {
    my ($vmid, $execute, %params) = @_;

    my $request = {
        execute => $execute,
        arguments => \%params,
    };

    return vm_qmp_command($vmid, $request, 1);
}
3597
# Execute the QMP command $cmd on VM $vmid and return its result.
#
# $cmd is a hash with the keys 'execute' and (optionally) 'arguments'. A
# 'timeout' entry inside the arguments is removed and used as the timeout of
# the QMP client instead of being sent to qemu.
#
# VMs that only have the old human monitor socket ('<vmid>.mon') can only
# run commands without arguments; in that case the command is sent with
# vm_monitor_command() and undef is returned.
#
# Any error is logged to syslog and re-thrown.
sub vm_qmp_command {
    my ($vmid, $cmd, $nocheck) = @_;

    my $res;

    my $timeout;
    if ($cmd->{arguments} && $cmd->{arguments}->{timeout}) {
        $timeout = delete $cmd->{arguments}->{timeout};
    }

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);
        my $sname = qmp_socket($vmid);
        if (-e $sname) { # test if VM is reasonably new and supports qmp/qga
            my $qmpclient = PVE::QMPClient->new();

            $res = $qmpclient->cmd($vmid, $cmd, $timeout);
        } elsif (-e "${var_run_tmpdir}/$vmid.mon") {
            # 'arguments' is optional (see vm_stop) - dereferencing a
            # missing entry here would die under 'use strict'
            die "can't execute complex command on old monitor - stop/start your vm to fix the problem\n"
                if $cmd->{arguments} && scalar(%{$cmd->{arguments}});
            vm_monitor_command($vmid, $cmd->{execute}, $nocheck);
        } else {
            die "unable to open monitor socket\n";
        }
    };
    if (my $err = $@) {
        syslog("err", "VM $vmid qmp command failed - $err");
        die $err;
    }

    return $res;
}
3631
9df5cbcc
DM
# Run the human monitor command line $cmdline on VM $vmid through the QMP
# command 'human-monitor-command' and return the result.
sub vm_human_monitor_command {
    my ($vmid, $cmdline) = @_;

    my $arguments = { 'command-line' => $cmdline};

    return vm_qmp_command($vmid, {
        execute => 'human-monitor-command',
        arguments => $arguments,
    });
}
3644
1e3baf05
DM
# Return the command line that would be used to start VM $vmid, as a single
# string with the arguments joined by spaces.
sub vm_commandline {
    my ($storecfg, $vmid) = @_;

    my $conf = load_config($vmid);
    my $defaults = load_defaults();

    # scalar context: only the command array reference is wanted
    my $argv = config_to_command($storecfg, $vmid, $conf, $defaults);

    my $cmdline = join(' ', @$argv);

    return $cmdline;
}
3656
# Reset VM $vmid ('system_reset' monitor command) while holding the config
# lock. The 'lock' setting of the VM is checked unless $skiplock is set.
sub vm_reset {
    my ($vmid, $skiplock) = @_;

    my $do_reset = sub {
        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        vm_mon_cmd($vmid, "system_reset");
    };

    lock_config($vmid, $do_reset);
}
3669
# Return an array reference with the volume ids used in $conf.
#
# Entries starting with '/' (absolute paths) and entries that
# PVE::Storage::parse_volume_id() cannot resolve to a storage id are left out.
sub get_vm_volumes {
    my ($conf) = @_;

    my @volumes;

    foreach_volid($conf, sub {
        my ($volid, $is_cdrom) = @_;

        # absolute paths are not storage volumes
        return if $volid =~ m|^/|;

        my ($storeid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        push @volumes, $volid;
    });

    return \@volumes;
}
3687
# Clean up after VM $vmid has stopped: remove its fairsched group,
# deactivate its volumes (unless $keepActive is set) and unlink its
# mon/qmp/pid/vnc/qga files below /var/run/qemu-server.
#
# Errors are only reported as warnings.
sub vm_stop_cleanup {
    my ($storecfg, $vmid, $conf, $keepActive) = @_;

    eval {
        fairsched_rmnod($vmid); # try to destroy group

        if (!$keepActive) {
            my $volumes = get_vm_volumes($conf);
            PVE::Storage::deactivate_volumes($storecfg, $volumes);
        }

        unlink "/var/run/qemu-server/${vmid}.$_" foreach qw(mon qmp pid vnc qga);
    };
    warn $@ if $@; # avoid errors - just warn
}
3705
# Stop VM $vmid.
#
# Note: use $nocheck to skip tests if VM configuration file exists.
# We need that when migrating VMs to other nodes (files already moved)
# Note: we set $keepActive in vzdump stop mode - volumes need to stay active
#
# With $shutdown the guest is asked to power down (through the guest agent
# when one is configured), otherwise qemu is told to quit. The VM then gets
# $timeout seconds to terminate (default: the 'down' value of the startup
# option when shutting down, else 60). With $force (default when not
# shutting down) the process is sent SIGTERM after a failure or timeout and
# SIGKILL after ten more seconds; without it the function dies instead.
#
# With $migratedfrom the process is simply sent SIGTERM and cleaned up,
# without taking the config lock.
sub vm_stop {
    my ($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive, $migratedfrom) = @_;

    $force = 1 if !defined($force) && !$shutdown;

    if ($migratedfrom){
        my $pid = check_running($vmid, $nocheck, $migratedfrom);
        kill 15, $pid if $pid;
        my $conf = load_config($vmid, $migratedfrom);
        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive);
        return;
    }

    # Poll once per second while the VM is running, for at most $limit
    # seconds. Returns the number of seconds waited.
    my $wait_for_exit = sub {
        my ($limit) = @_;

        my $elapsed = 0;
        while (($elapsed < $limit) && check_running($vmid, $nocheck)) {
            $elapsed++;
            sleep 1;
        }
        return $elapsed;
    };

    lock_config($vmid, sub {

        my $pid = check_running($vmid, $nocheck);
        return if !$pid;

        my $conf;
        if (!$nocheck) {
            $conf = load_config($vmid);
            check_lock($conf) if !$skiplock;
            if (!defined($timeout) && $shutdown && $conf->{startup}) {
                my $opts = parse_startup($conf->{startup});
                $timeout = $opts->{down} if $opts->{down};
            }
        }

        $timeout = 60 if !defined($timeout);

        eval {
            my $qmp_cmd = "quit";
            if ($shutdown) {
                $qmp_cmd = (!$nocheck && $conf->{agent}) ? "guest-shutdown" : "system_powerdown";
            }
            vm_qmp_command($vmid, { execute => $qmp_cmd }, $nocheck);
        };
        my $err = $@;

        if ($err) {
            die "VM quit/powerdown failed\n" if !$force;

            warn "VM quit/powerdown failed - terminating now with SIGTERM\n";
            kill 15, $pid;
        } else {
            my $waited = $wait_for_exit->($timeout);

            if ($waited < $timeout) {
                # VM terminated in time
                vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
                return;
            }

            die "VM quit/powerdown failed - got timeout\n" if !$force;

            warn "VM still running - terminating now with SIGTERM\n";
            kill 15, $pid;
        }

        # wait again
        $timeout = 10;

        if ($wait_for_exit->($timeout) >= $timeout) {
            warn "VM still running - terminating now with SIGKILL\n";
            kill 9, $pid;
            sleep 1;
        }

        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
    });
}
3797
# Suspend VM $vmid ('stop' monitor command) while holding the config lock.
# The 'lock' setting of the VM is checked unless $skiplock is set or the
# lock is 'backup'.
sub vm_suspend {
    my ($vmid, $skiplock) = @_;

    my $do_suspend = sub {
        my $conf = load_config($vmid);

        my $backup_locked = $conf->{lock} && $conf->{lock} eq 'backup';
        check_lock($conf) if !$skiplock && !$backup_locked;

        vm_mon_cmd($vmid, "stop");
    };

    lock_config($vmid, $do_suspend);
}
3810
# Resume VM $vmid ('cont' monitor command) while holding the config lock.
# The 'lock' setting of the VM is checked unless $skiplock is set or the
# lock is 'backup'.
sub vm_resume {
    my ($vmid, $skiplock) = @_;

    my $do_resume = sub {
        my $conf = load_config($vmid);

        my $backup_locked = $conf->{lock} && $conf->{lock} eq 'backup';
        check_lock($conf) if !$skiplock && !$backup_locked;

        vm_mon_cmd($vmid, "cont");
    };

    lock_config($vmid, $do_resume);
}
3823
5fdbe4f0
DM
# Send key $key to VM $vmid while holding the config lock. The VM config is
# loaded first, but $skiplock is not evaluated here.
sub vm_sendkey {
    my ($vmid, $skiplock, $key) = @_;

    my $do_sendkey = sub {
        my $conf = load_config($vmid);

        # there is no qmp command, so we use the human monitor command
        vm_human_monitor_command($vmid, "sendkey $key");
    };

    lock_config($vmid, $do_sendkey);
}
3835
# Destroy VM $vmid while holding the config lock. The 'lock' setting of the
# VM is checked unless $skiplock is set. Dies when the VM is still running.
sub vm_destroy {
    my ($storecfg, $vmid, $skiplock) = @_;

    my $do_destroy = sub {
        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        die "VM $vmid is running - destroy failed\n" if check_running($vmid);

        fairsched_rmnod($vmid); # try to destroy group
        destroy_vm($storecfg, $vmid);
    };

    lock_config($vmid, $do_destroy);
}
3853
1e3baf05
DM
3854# pci helpers
3855
# Write $buf to $filename (opened for writing, truncating existing content).
#
# Returns 1 on success and undef if the file could not be opened, or if
# writing or closing the handle failed.
sub file_write {
    my ($filename, $buf) = @_;

    my $fh = IO::File->new($filename, "w");
    return undef if !$fh;

    my $written = print {$fh} $buf;

    # The handle is buffered, so the data usually reaches the file only
    # when the handle is closed. A write error therefore shows up as a
    # failed close() - do not ignore it.
    my $closed = $fh->close();

    return ($written && $closed) ? 1 : undef;
}
3868
# Collect information about PCI device $name ("dddd:bb:ss.f", lowercase
# hex) from the sysfs tree below $pcisysfs.
#
# Returns a hash reference with the keys name, vendor, product (both with
# the leading "0x" stripped), domain, bus, slot, func, irq and
# has_fl_reset, or undef if the name does not match or one of the sysfs
# attributes cannot be read/parsed.
sub pci_device_info {
    my ($name) = @_;

    return undef if $name !~ m/^([a-f0-9]{4}):([a-f0-9]{2}):([a-f0-9]{2})\.([a-f0-9])$/;
    my ($domain, $bus, $slot, $func) = ($1, $2, $3, $4);

    my $devdir = "$pcisysfs/devices/$name";

    my $irq = file_read_firstline("$devdir/irq");
    return undef if !defined($irq) || $irq !~ m/^\d+$/;

    # the substitutions strip the "0x" prefix; a value without it is rejected
    my $vendor = file_read_firstline("$devdir/vendor");
    return undef if !defined($vendor) || $vendor !~ s/^0x//;

    my $product = file_read_firstline("$devdir/device");
    return undef if !defined($product) || $product !~ s/^0x//;

    return {
        name => $name,
        vendor => $vendor,
        product => $product,
        domain => $domain,
        bus => $bus,
        slot => $slot,
        func => $func,
        irq => $irq,
        has_fl_reset => -f "$devdir/reset" || 0,
    };
}
3900
# Write "1" to the sysfs 'reset' attribute of PCI device $dev (a hash as
# returned by pci_device_info). Returns the result of file_write().
sub pci_dev_reset {
    my ($dev) = @_;

    my $reset_attr = "$pcisysfs/devices/$dev->{name}/reset";

    return file_write($reset_attr, "1");
}
3910
# Bind PCI device $dev (a hash as returned by pci_device_info) to the
# pci-stub driver.
#
# Returns true if the device shows up below the pci-stub driver directory
# afterwards (or already did), and undef if one of the sysfs writes failed.
sub pci_dev_bind_to_stub {
    my ($dev) = @_;

    my $name = $dev->{name};

    my $stubdir = "$pcisysfs/drivers/pci-stub";
    my $bound = "$stubdir/$name";
    return 1 if -d $bound;

    # register the vendor/product id with the driver
    file_write("$stubdir/new_id", "$dev->{vendor} $dev->{product}")
        or return undef;

    # unbind from the current driver; a failed write is only an error
    # if the unbind attribute actually exists
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    if (!-d $bound) {
        file_write("$stubdir/bind", $name) or return undef;
    }

    return -d $bound;
}
3934
000fc0a2
SP
# Bind PCI device $dev (a hash as returned by pci_device_info) to the
# vfio-pci driver, trying to load the module first if its driver
# directory is missing.
#
# Dies if the vfio-pci driver directory does not exist after modprobe.
# Returns true if the device shows up below the driver directory
# afterwards (or already did), and undef if one of the sysfs writes failed.
sub pci_dev_bind_to_vfio {
    my ($dev) = @_;

    my $name = $dev->{name};

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null") if !-d $vfio_basedir;
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    my $bound = "$vfio_basedir/$name";
    return 1 if -d $bound;

    # register the vendor/product id with the driver
    file_write("$vfio_basedir/new_id", "$dev->{vendor} $dev->{product}")
        or return undef;

    # unbind from the current driver; a failed write is only an error
    # if the unbind attribute actually exists
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    if (!-d $bound) {
        file_write("$vfio_basedir/bind", $name) or return undef;
    }

    return -d $bound;
}
3965
# Bind every device of the IOMMU group of PCI device 0000:$pciid to the
# vfio-pci driver, trying to load the module first if its driver
# directory is missing.
#
# Returns 1 on success. Dies if the module is not available, the IOMMU
# group cannot be read, a device id is malformed, no device info can be
# obtained, or binding a device fails.
sub pci_dev_group_bind_to_vfio {
    my ($pciid) = @_;

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    if (!-d $vfio_basedir) {
        system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null");
    }
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    # get IOMMU group devices
    my $groupdir = "$pcisysfs/devices/0000:$pciid/iommu_group/devices/";
    opendir(my $D, $groupdir) || die "Cannot open iommu_group: $!\n";
    my @devs = grep /^0000:/, readdir($D);
    closedir($D);

    foreach my $devid (@devs) {
        $devid =~ m/^([:\.\da-f]+)$/ or die "PCI ID $devid not valid!\n";
        my $info = pci_device_info($1);

        # Without this check an undef $info makes pci_dev_bind_to_vfio()
        # test the driver directory itself and report success without
        # binding anything.
        die "Cannot get PCI device info for $devid\n" if !$info;

        pci_dev_bind_to_vfio($info) || die "Cannot bind $devid to vfio\n";
    }

    return 1;
}
3989
# Return the ",bus=pci.<bus>,addr=<hex addr>" suffix for the device with
# the given $id, or an empty string if no PCI slot is assigned to $id.
#
# If $bridges (a hash reference) is passed, the bus number of the device
# is recorded in it as key with value 1.
sub print_pci_addr {
    my ($id, $bridges) = @_;

    # devices on bus 0
    my $devices = {
        piix3 => { bus => 0, addr => 1 },
        #addr2 : first videocard
        balloon0 => { bus => 0, addr => 3 },
        watchdog => { bus => 0, addr => 4 },
        scsihw0 => { bus => 0, addr => 5 },
        scsihw1 => { bus => 0, addr => 6 },
        ahci0 => { bus => 0, addr => 7 },
        qga0 => { bus => 0, addr => 8 },
        spice => { bus => 0, addr => 9 },
        virtio0 => { bus => 0, addr => 10 },
        virtio1 => { bus => 0, addr => 11 },
        virtio2 => { bus => 0, addr => 12 },
        virtio3 => { bus => 0, addr => 13 },
        virtio4 => { bus => 0, addr => 14 },
        virtio5 => { bus => 0, addr => 15 },
        hostpci0 => { bus => 0, addr => 16 },
        hostpci1 => { bus => 0, addr => 17 },
        net0 => { bus => 0, addr => 18 },
        net1 => { bus => 0, addr => 19 },
        net2 => { bus => 0, addr => 20 },
        net3 => { bus => 0, addr => 21 },
        net4 => { bus => 0, addr => 22 },
        net5 => { bus => 0, addr => 23 },
        vga1 => { bus => 0, addr => 24 },
        vga2 => { bus => 0, addr => 25 },
        vga3 => { bus => 0, addr => 26 },
        hostpci2 => { bus => 0, addr => 27 },
        hostpci3 => { bus => 0, addr => 28 },
        #addr29 : usb-host (pve-usb.cfg)
        'pci.1' => { bus => 0, addr => 30 },
        'pci.2' => { bus => 0, addr => 31 },
    };

    # net6 .. net31 occupy addr 1 .. 26 on bus 1
    $devices->{"net$_"} = { bus => 1, addr => $_ - 5 } for 6 .. 31;

    # virtio6 .. virtio15 occupy addr 1 .. 10 on bus 2
    $devices->{"virtio$_"} = { bus => 2, addr => $_ - 5 } for 6 .. 15;

    my $slot = $devices->{$id};
    return '' if !(defined($slot->{bus}) && defined($slot->{addr}));

    my $bus = $slot->{bus};
    $bridges->{$bus} = 1 if $bridges;

    return sprintf(",bus=pci.%s,addr=0x%x", $bus, $slot->{addr});
}
4073
2e3b7e2a
AD
# Return the ",bus=<pcie port>,addr=<hex addr>" suffix for the device with
# the given $id (hostpci0 .. hostpci3), or an empty string for any other id.
sub print_pcie_addr {
    my ($id) = @_;

    # hostpciN is attached to ich9-pcie-port-(N+1), always at addr 0
    my $devices = {
        map { ("hostpci$_" => { bus => "ich9-pcie-port-" . ($_ + 1), addr => 0 }) } 0 .. 3
    };

    my $slot = $devices->{$id};
    return '' if !(defined($slot->{bus}) && defined($slot->{addr}));

    return sprintf(",bus=%s,addr=0x%x", $slot->{bus}, $slot->{addr});
}
4093
3e16d5fc
DM
# vzdump restore implementation
4095
# Return the name of the first member listed by "tar tf" for $archive.
#
# Dies if $archive is not a regular file, if tar cannot be started, or if
# the listing is empty.
sub tar_archive_read_firstfile {
    my $archive = shift;

    die "ERROR: file '$archive' does not exist\n" if ! -f $archive;

    # try to detect archive type first
    # Note: list form of open - the file name is passed to tar as a single
    # argument and never interpreted by a shell (names containing quotes
    # or other shell meta characters are safe).
    my $pid = open(my $fh, '-|', 'tar', 'tf', $archive) ||
        die "unable to open file '$archive'\n";
    my $firstfile = <$fh>;

    # we only need the first line - stop tar instead of reading the rest
    kill 15, $pid;
    close $fh;

    die "ERROR: archive contaions no data\n" if !$firstfile;
    chomp $firstfile;

    return $firstfile;
}
4113
ed221350
DM
# Remove all volumes recorded in the restore stat file $statfile.
#
# Each "vzdump:<dev>:<volid>" line names one volume: absolute paths are
# unlinked, everything else is released with PVE::Storage::vdisk_free
# using $storecfg. Failures are reported on STDERR and do not stop the
# cleanup. Nothing is done if $statfile cannot be opened.
sub tar_restore_cleanup {
    my ($storecfg, $statfile) = @_;

    print STDERR "starting cleanup\n";

    if (my $fd = IO::File->new($statfile, "r")) {
        while (defined(my $line = <$fd>)) {
            if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                my $volid = $2;
                eval {
                    if ($volid =~ m|^/|) {
                        # parentheses are required: 'unlink $volid || die'
                        # parses as unlink($volid || die ...) and never dies
                        unlink($volid) || die "unlink failed - $!\n";
                    } else {
                        PVE::Storage::vdisk_free($storecfg, $volid);
                    }
                    print STDERR "temporary volume '$volid' sucessfuly removed\n";
                };
                print STDERR "unable to cleanup '$volid' - $@" if $@;
            } else {
                print STDERR "unable to parse line in statfile - $line";
            }
        }
        $fd->close();
    }
}
4139
# Restore VM $vmid from backup $archive on behalf of $user.
#
# The archive format ('tar' or 'vma') is taken from $opts->{format} if
# set, else derived from the file name extension (default: 'vma'). The
# compression method (gzip/lzop) is derived from the extension only.
# Dispatches to restore_tar_archive() or restore_vma_archive() and
# returns their result.
sub restore_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    my $format = $opts->{format};
    my $comp;

    if ($archive =~ m/\.tgz$/ || $archive =~ m/\.tar\.gz$/) {
        $format = 'tar' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.tar$/) {
        $format = 'tar' if !$format;
    } elsif ($archive =~ m/\.tar\.lzo$/) {
        # dots must be escaped, else names like 'xtar-lzo' would match too
        $format = 'tar' if !$format;
        $comp = 'lzop';
    } elsif ($archive =~ m/\.vma$/) {
        $format = 'vma' if !$format;
    } elsif ($archive =~ m/\.vma\.gz$/) {
        $format = 'vma' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.vma\.lzo$/) {
        $format = 'vma' if !$format;
        $comp = 'lzop';
    } else {
        $format = 'vma' if !$format; # default
    }

    # Note: $comp is only used for vma archives
    if ($format eq 'tar') {
        return restore_tar_archive($archive, $vmid, $user, $opts);
    } else {
        return restore_vma_archive($archive, $vmid, $user, $opts, $comp);
    }
}
4173
# Filter/convert a single config line from a backup and print the result
# to $outfd.
#
#  $outfd   output file handle for the new config
#  $cookie  state shared between calls; {netcount} is the next free net index
#  $vmid    id of the restored VM (passed to print_drive)
#  $map     hash: drive name => volume restored for that drive
#  $line    the config line (including the trailing newline)
#  $unique  if true, assign new random MAC addresses
sub restore_update_config_line {
    my ($outfd, $cookie, $vmid, $map, $line, $unique) = @_;

    # lines which are never copied to the restored config
    # (a restored VM is never a template)
    my @dropped = (
        qr/^\#qmdump\#/,
        qr/^\#vzdump\#/,
        qr/^lock:/,
        qr/^unused\d+:/,
        qr/^parent:/,
        qr/^template:/,
    );
    foreach my $re (@dropped) {
        return if $line =~ $re;
    }

    if ($line =~ m/^(vlan(\d+)):\s*(\S+)\s*$/) {
        # try to convert old 1.X settings
        my ($ind, $ethcfg) = ($2, $3);
        foreach my $devconfig (PVE::Tools::split_list($ethcfg)) {
            my ($model, $macaddr) = split(/\=/, $devconfig);
            $macaddr = PVE::Tools::random_ether_addr() if !$macaddr || $unique;

            my $netstr = print_net({
                model => $model,
                bridge => "vmbr$ind",
                macaddr => $macaddr,
            });

            print $outfd "net$cookie->{netcount}: $netstr\n";
            $cookie->{netcount}++;
        }
    } elsif (($line =~ m/^(net\d+):\s*(\S+)\s*$/) && $unique) {
        my ($id, $netstr) = ($1, $2);
        my $net = parse_net($netstr);
        $net->{macaddr} = PVE::Tools::random_ether_addr() if $net->{macaddr};
        $netstr = print_net($net);
        print $outfd "$id: $netstr\n";
    } elsif ($line =~ m/^((ide|scsi|virtio|sata)\d+):\s*(\S+)\s*$/) {
        my ($virtdev, $value) = ($1, $3);
        if ($line =~ m/backup=no/) {
            # drive was excluded from the backup - keep it as comment only
            print $outfd "#$line";
        } elsif ($virtdev && $map->{$virtdev}) {
            my $di = parse_drive($virtdev, $value);
            delete $di->{format}; # format can change on restore
            $di->{file} = $map->{$virtdev};
            $value = print_drive($vmid, $di);
            print $outfd "$virtdev: $value\n";
        } else {
            print $outfd $line;
        }
    } else {
        print $outfd $line;
    }
}
4224
# List the volumes PVE::Storage::vdisk_list reports for $vmid (all VMs if
# $vmid is undef) using storage configuration $cfg.
#
# Returns a hash reference: volume id => volume info, where each info
# hash additionally gets a 'path' entry. Entries without volid or size
# are skipped.
sub scan_volids {
    my ($cfg, $vmid) = @_;

    my $info = PVE::Storage::vdisk_list($cfg, undef, $vmid);

    my $volid_hash = {};
    foreach my $storeid (keys %$info) {
        my $volumes = $info->{$storeid};
        foreach my $item (@$volumes) {
            my $volid = $item->{volid};
            next if !($volid && $item->{size});
            $item->{path} = PVE::Storage::path($cfg, $volid);
            $volid_hash->{$volid} = $item;
        }
    }

    return $volid_hash;
}
4241
a8e2f942
DM
# Count how often each disk path is referenced by the drives in $conf.
#
#  $scan_snapshots  also scan all snapshot configs in $conf->{snapshots}
#  $skip_drive      drive name to ignore in the current config (it is
#                   still counted inside snapshots)
#
# Returns a hash reference: path => number of references. CD-ROM drives
# and volumes on unknown storages are ignored.
sub get_used_paths {
    my ($vmid, $storecfg, $conf, $scan_snapshots, $skip_drive) = @_;

    my $used_path = {};

    my $scan_config = sub {
        my ($cref, $snapname) = @_;

        foreach my $key (keys %$cref) {
            next if !valid_drivename($key);
            next if $skip_drive && $key eq $skip_drive;

            my $drive = parse_drive($key, $cref->{$key});
            next if !$drive || !$drive->{file} || drive_is_cdrom($drive);

            my $file = $drive->{file};
            if ($file =~ m!^/!) {
                # absolute path - used as is
                $used_path->{$file}++;
                next;
            }

            my ($storeid, $volname) = PVE::Storage::parse_volume_id($file, 1);
            next if !$storeid;

            my $scfg = PVE::Storage::storage_config($storecfg, $storeid, 1);
            next if !$scfg;

            my $path = PVE::Storage::path($storecfg, $file, $snapname);
            $used_path->{$path}++;
        }
    };

    $scan_config->($conf);

    # $skip_drive only applies to the current config, not to snapshots
    undef $skip_drive;

    if ($scan_snapshots) {
        my $snapshots = $conf->{snapshots};
        foreach my $snapname (keys %$snapshots) {
            $scan_config->($snapshots->{$snapname}, $snapname);
        }
    }

    return $used_path;
}
4282
91bd6c90
DM
# Synchronize config $conf of VM $vmid with the volumes in $volid_hash
# (volume id => info hash with 'size' and 'path', see scan_volids):
#
#  - update the size of all non-CD-ROM drives found in $volid_hash
#  - remove 'unusedX' entries for volumes which are used by a drive
#  - add unreferenced volumes as unused (except vm-$vmid-state-* volumes)
#
# $conf is modified in place. Returns 1 if anything changed, else undef.
sub update_disksize {
    my ($vmid, $conf, $volid_hash) = @_;

    my $changes;

    my $used = {};

    # Note: it is allowed to define multiple storages with same path (alias), so
    # we need to check both 'volid' and real 'path' (two different volid can point
    # to the same path).

    my $usedpath = {};

    # update size info
    foreach my $opt (keys %$conf) {
        if (valid_drivename($opt)) {
            my $drive = parse_drive($opt, $conf->{$opt});
            my $volid = $drive->{file};
            next if !$volid;

            $used->{$volid} = 1;
            my $info = $volid_hash->{$volid};
            if ($info && $info->{path}) {
                $usedpath->{$info->{path}} = 1;
            }

            next if drive_is_cdrom($drive);
            next if !$info;

            $drive->{size} = $info->{size};
            my $new = print_drive($vmid, $drive);
            if ($new ne $conf->{$opt}) {
                $changes = 1;
                $conf->{$opt} = $new;
            }
        }
    }

    # remove 'unusedX' entry if volume is used
    foreach my $opt (keys %$conf) {
        next if $opt !~ m/^unused\d+$/;
        my $volid = $conf->{$opt};
        # Note: do not use 'my $path = ... if COND;' here - the behaviour
        # of 'my' combined with a statement modifier is undefined (perlsyn)
        my $path = $volid_hash->{$volid} ? $volid_hash->{$volid}->{path} : undef;
        if ($used->{$volid} || ($path && $usedpath->{$path})) {
            $changes = 1;
            delete $conf->{$opt};
        }
    }

    foreach my $volid (sort keys %$volid_hash) {
        next if $volid =~ m/vm-$vmid-state-/;
        next if $used->{$volid};
        my $path = $volid_hash->{$volid}->{path};
        next if !$path; # just to be sure
        next if $usedpath->{$path};
        $changes = 1;
        add_unused_volume($conf, $volid);
        $usedpath->{$path} = 1; # avoid to add more than once (aliases)
    }

    return $changes;
}
4345
# Rescan the storages and update the disk sizes / unused volume lists in
# the config of VM $vmid, or of all VMs returned by config_list() if
# $vmid is undef.
#
# Each config is updated under lock_config() unless $nolock is set.
# Dies (via check_lock) if a config has the 'lock' setting.
sub rescan {
    my ($vmid, $nolock) = @_;

    my $cfg = PVE::Cluster::cfs_read_file("storage.cfg");

    my $volid_hash = scan_volids($cfg, $vmid);

    my $updatefn = sub {
        my ($id) = @_;

        my $conf = load_config($id);

        check_lock($conf);

        # only consider volumes owned by this VM
        my $vm_volids = {};
        foreach my $volid (keys %$volid_hash) {
            my $info = $volid_hash->{$volid};
            next if !($info->{vmid} && $info->{vmid} == $id);
            $vm_volids->{$volid} = $info;
        }

        my $changes = update_disksize($id, $conf, $vm_volids);

        update_config_nolock($id, $conf, 1) if $changes;
    };

    my @vmids = defined($vmid) ? ($vmid) : keys %{config_list()};

    foreach my $id (@vmids) {
        if ($nolock) {
            $updatefn->($id);
        } else {
            lock_config($id, $updatefn, $id);
        }
    }
}
4388
# Restore VM $vmid from the vma archive $archive ('-' means STDIN).
#
#  $user  user the restore runs for; unless it is 'root@pam', the
#         permission 'Datastore.AllocateSpace' is checked on each target
#         storage
#  $opts  hash with optional 'storage' (target storage for all disks),
#         'pool' and 'unique' (passed to restore_update_config_line)
#  $comp  compression of the archive: 'gzip', 'lzop' or undef
#
# 'vma extract' reads the device map from a fifo. As soon as it printed
# the archive header (the line starting with "CTIME:"), the volumes are
# allocated, the map is written to the fifo and the new config is written
# to a temporary file which gets renamed to the real config at the end.
# On error, all volumes allocated so far are removed again and the error
# is re-thrown.
sub restore_vma_archive {
    my ($archive, $vmid, $user, $opts, $comp) = @_;

    my $input = $archive eq '-' ? "<&STDIN" : undef;

    # $cmd is a single command string, so the file name needs quoting
    my $readfrom = $archive eq '-' ? '-' : PVE::Tools::shellquote($archive);

    my $uncomp = '';
    if ($comp) {
        $readfrom = '-';
        my $qarchive = PVE::Tools::shellquote($archive);
        if ($comp eq 'gzip') {
            $uncomp = "zcat $qarchive|";
        } elsif ($comp eq 'lzop') {
            $uncomp = "lzop -d -c $qarchive|";
        } else {
            die "unknown compression method '$comp'\n";
        }
    }

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    rmtree $tmpdir;

    # disable interrupts (always do cleanups)
    # Note: each handler needs its own 'local' - a chained assignment
    # (local $SIG{INT} = $SIG{TERM} = ...) only localizes the first one
    my $ignore_signal = sub {
        warn "got interrupt - ignored\n";
    };
    local $SIG{INT} = $ignore_signal;
    local $SIG{TERM} = $ignore_signal;
    local $SIG{QUIT} = $ignore_signal;
    local $SIG{HUP} = $ignore_signal;

    my $mapfifo = "/var/tmp/vzdumptmp$$.fifo";
    # NOTE(review): the result of mkfifo is not checked
    POSIX::mkfifo($mapfifo, 0600);
    my $fifofh;

    my $openfifo = sub {
        open($fifofh, '>', $mapfifo) || die $!;
    };

    my $cmd = "${uncomp}vma extract -v -r $mapfifo $readfrom $tmpdir";

    my $oldtimeout;
    my $timeout = 5;

    my $devinfo = {};

    my $rpcenv = PVE::RPCEnvironment::get();

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # Note: $oldconf is undef if VM does not exists
    my $oldconf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid));

    my $print_devmap = sub {
        my $virtdev_hash = {};

        my $cfgfn = "$tmpdir/qemu-server.conf";

        # we can read the config - that is already extracted
        my $fh = IO::File->new($cfgfn, "r") ||
            die "unable to read qemu-server.conf - $!\n";

        while (defined(my $line = <$fh>)) {
            if ($line =~ m/^\#qmdump\#map:(\S+):(\S+):(\S*):(\S*):$/) {
                my ($virtdev, $devname, $storeid, $format) = ($1, $2, $3, $4);
                die "archive does not contain data for drive '$virtdev'\n"
                    if !$devinfo->{$devname};
                if (defined($opts->{storage})) {
                    $storeid = $opts->{storage} || 'local';
                } elsif (!$storeid) {
                    $storeid = 'local';
                }
                $format = 'raw' if !$format;
                $devinfo->{$devname}->{devname} = $devname;
                $devinfo->{$devname}->{virtdev} = $virtdev;
                $devinfo->{$devname}->{format} = $format;
                $devinfo->{$devname}->{storeid} = $storeid;

                # check permission on storage
                my $pool = $opts->{pool}; # todo: do we need that?
                if ($user ne 'root@pam') {
                    $rpcenv->check($user, "/storage/$storeid", ['Datastore.AllocateSpace']);
                }

                $virtdev_hash->{$virtdev} = $devinfo->{$devname};
            }
        }

        foreach my $devname (keys %$devinfo) {
            die "found no device mapping information for device '$devname'\n"
                if !$devinfo->{$devname}->{virtdev};
        }

        my $cfg = cfs_read_file('storage.cfg');

        # create empty/temp config
        if ($oldconf) {
            PVE::Tools::file_set_contents($conffile, "memory: 128\n");
            foreach_drive($oldconf, sub {
                my ($ds, $drive) = @_;

                return if drive_is_cdrom($drive);

                my $volid = $drive->{file};

                return if !$volid || $volid =~ m|^/|;

                my ($path, $owner) = PVE::Storage::path($cfg, $volid);
                return if !$path || !$owner || ($owner != $vmid);

                # Note: only delete disk we want to restore
                # other volumes will become unused
                if ($virtdev_hash->{$ds}) {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
            });
        }

        my $map = {};
        foreach my $virtdev (sort keys %$virtdev_hash) {
            my $d = $virtdev_hash->{$virtdev};
            # round up to the next multiple of 1024
            my $alloc_size = int(($d->{size} + 1024 - 1)/1024);
            my $scfg = PVE::Storage::storage_config($cfg, $d->{storeid});

            # test if requested format is supported
            my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($cfg, $d->{storeid});
            my $supported = grep { $_ eq $d->{format} } @$validFormats;
            $d->{format} = $defFormat if !$supported;

            my $volid = PVE::Storage::vdisk_alloc($cfg, $d->{storeid}, $vmid,
                                                  $d->{format}, undef, $alloc_size);
            print STDERR "new volume ID is '$volid'\n";
            $d->{volid} = $volid;
            my $path = PVE::Storage::path($cfg, $volid);

            my $write_zeros = 1;
            # fixme: what other storages types initialize volumes with zero?
            if ($scfg->{type} eq 'dir' || $scfg->{type} eq 'nfs' || $scfg->{type} eq 'glusterfs' ||
                $scfg->{type} eq 'sheepdog' || $scfg->{type} eq 'rbd') {
                $write_zeros = 0;
            }

            print $fifofh "${write_zeros}:$d->{devname}=$path\n";

            print "map '$d->{devname}' to '$path' (write zeros = ${write_zeros})\n";
            $map->{$virtdev} = $volid;
        }

        # read the extracted config a second time to write the new config
        $fh->seek(0, 0) || die "seek failed - $!\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined(my $line = <$fh>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $fh->close();
        $outfd->close();
    };

    eval {
        # enable interrupts
        my $abort_on_signal = sub {
            die "interrupted by signal\n";
        };
        local $SIG{INT} = $abort_on_signal;
        local $SIG{TERM} = $abort_on_signal;
        local $SIG{QUIT} = $abort_on_signal;
        local $SIG{HUP} = $abort_on_signal;
        local $SIG{PIPE} = $abort_on_signal;
        local $SIG{ALRM} = sub { die "got timeout\n"; };

        $oldtimeout = alarm($timeout);

        my $parser = sub {
            my $line = shift;

            print "$line\n";

            if ($line =~ m/^DEV:\sdev_id=(\d+)\ssize:\s(\d+)\sdevname:\s(\S+)$/) {
                my ($dev_id, $size, $devname) = ($1, $2, $3);
                $devinfo->{$devname} = { size => $size, dev_id => $dev_id };
            } elsif ($line =~ m/^CTIME: /) {
                # we correctly received the vma config, so we can disable
                # the timeout now for disk allocation (set to 10 minutes, so
                # that we always timeout if something goes wrong)
                alarm(600);
                &$print_devmap();
                print $fifofh "done\n";
                my $tmp = $oldtimeout || 0;
                $oldtimeout = undef;
                alarm($tmp);
                close($fifofh);
            }
        };

        print "restore vma archive: $cmd\n";
        run_command($cmd, input => $input, outfunc => $parser, afterfork => $openfifo);
    };
    my $err = $@;

    alarm($oldtimeout) if $oldtimeout;

    unlink $mapfifo;

    if ($err) {
        rmtree $tmpdir;
        unlink $tmpfn;

        my $cfg = cfs_read_file('storage.cfg');
        foreach my $devname (keys %$devinfo) {
            my $volid = $devinfo->{$devname}->{volid};
            next if !$volid;
            eval {
                if ($volid =~ m|^/|) {
                    # parentheses are required: 'unlink $volid || die'
                    # parses as unlink($volid || die ...) and never dies
                    unlink($volid) || die "unlink failed - $!\n";
                } else {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
                print STDERR "temporary volume '$volid' sucessfuly removed\n";
            };
            print STDERR "unable to cleanup '$volid' - $@" if $@;
        }
        die $err;
    }

    rmtree $tmpdir;

    rename($tmpfn, $conffile) ||
        die "unable to commit configuration file '$conffile'\n";

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
4620
# Restore VM $vmid from the tar archive $archive ('-' means STDIN).
#
#  $user  user the restore runs for (exported as VZDUMP_USER)
#  $opts  hash with optional 'storage', 'pool', 'prealloc' and 'info'
#         (passed to qmextract) and 'unique' (passed to
#         restore_update_config_line)
#
# An existing VM with the same id is destroyed first (the config file is
# kept). The archive members are extracted with qmextract, which records
# the allocated volumes in a stat file below the temporary directory; the
# new config is written to a temporary file which gets renamed to the
# real config at the end. On error, the recorded volumes are removed
# again and the error is re-thrown.
sub restore_tar_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    if ($archive ne '-') {
        my $firstfile = tar_archive_read_firstfile($archive);
        die "ERROR: file '$archive' dos not lock like a QemuServer vzdump backup\n"
            if $firstfile ne 'qemu-server.conf';
    }

    my $storecfg = cfs_read_file('storage.cfg');

    # destroy existing data - keep empty config
    my $vmcfgfn = PVE::QemuServer::config_file($vmid);
    destroy_vm($storecfg, $vmid, 1) if -f $vmcfgfn;

    my $tocmd = "/usr/lib/qemu-server/qmextract";

    $tocmd .= " --storage " . PVE::Tools::shellquote($opts->{storage}) if $opts->{storage};
    $tocmd .= " --pool " . PVE::Tools::shellquote($opts->{pool}) if $opts->{pool};
    $tocmd .= ' --prealloc' if $opts->{prealloc};
    $tocmd .= ' --info' if $opts->{info};

    # tar option "xf" does not autodetect compression when read from STDIN,
    # so we pipe to zcat
    my $cmd = "zcat -f|tar xf " . PVE::Tools::shellquote($archive) . " " .
        PVE::Tools::shellquote("--to-command=$tocmd");

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    mkpath $tmpdir;

    local $ENV{VZDUMP_TMPDIR} = $tmpdir;
    local $ENV{VZDUMP_VMID} = $vmid;
    local $ENV{VZDUMP_USER} = $user;

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # disable interrupts (always do cleanups)
    # Note: each handler needs its own 'local' - a chained assignment
    # (local $SIG{INT} = $SIG{TERM} = ...) only localizes the first one
    my $ignore_signal = sub {
        print STDERR "got interrupt - ignored\n";
    };
    local $SIG{INT} = $ignore_signal;
    local $SIG{TERM} = $ignore_signal;
    local $SIG{QUIT} = $ignore_signal;
    local $SIG{HUP} = $ignore_signal;

    eval {
        # enable interrupts
        my $abort_on_signal = sub {
            die "interrupted by signal\n";
        };
        local $SIG{INT} = $abort_on_signal;
        local $SIG{TERM} = $abort_on_signal;
        local $SIG{QUIT} = $abort_on_signal;
        local $SIG{HUP} = $abort_on_signal;
        local $SIG{PIPE} = $abort_on_signal;

        if ($archive eq '-') {
            print "extracting archive from STDIN\n";
            run_command($cmd, input => "<&STDIN");
        } else {
            print "extracting archive '$archive'\n";
            run_command($cmd);
        }

        # Note: this only leaves the eval block
        return if $opts->{info};

        # read new mapping
        my $map = {};
        my $statfile = "$tmpdir/qmrestore.stat";
        if (my $fd = IO::File->new($statfile, "r")) {
            while (defined (my $line = <$fd>)) {
                if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                    $map->{$1} = $2 if $1;
                } else {
                    print STDERR "unable to parse line in statfile - $line\n";
                }
            }
            $fd->close();
        }

        my $confsrc = "$tmpdir/qemu-server.conf";

        my $srcfd = IO::File->new($confsrc, "r") ||
            die "unable to open file '$confsrc'\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined (my $line = <$srcfd>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $srcfd->close();
        $outfd->close();
    };
    my $err = $@;

    if ($err) {

        unlink $tmpfn;

        tar_restore_cleanup($storecfg, "$tmpdir/qmrestore.stat") if !$opts->{info};

        # the stat file is not needed anymore - do not leave the
        # temporary directory behind
        rmtree $tmpdir;

        die $err;
    }

    rmtree $tmpdir;

    # Note: no new config is written in 'info' mode, so there is nothing
    # to commit. The parentheses are required, because
    # 'rename $a, $b || die' parses as rename($a, ($b || die ...)) and
    # never detects a failed rename.
    if (!$opts->{info}) {
        rename($tmpfn, $conffile) ||
            die "unable to commit configuration file '$conffile'\n";
    }

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
4730
0d18dcfc
DM
4731
4732# Internal snapshots
4733
# NOTE: Snapshot create/delete involves several non-atomic
# actions, and can take a long time.
# So we try to avoid locking the file and use the 'lock' variable
# inside the config file instead.
4738
ef59d1ca
DM
# Copy all settings from hash $source to hash $dest, except the ones
# which describe snapshot/runtime state (snapshots, snapstate, snaptime,
# vmstate, lock, digest), the description and the unusedX entries.
my $snapshot_copy_config = sub {
    my ($source, $dest) = @_;

    my %skip = map { $_ => 1 }
        qw(snapshots snapstate snaptime vmstate lock digest description);

    foreach my $k (keys %$source) {
        next if $skip{$k} || $k =~ m/^unused\d+$/;

        $dest->{$k} = $source->{$k};
    }
};
4755
# Build a new config from snapshot $snap: the snapshot list, the
# description and the unusedX entries are taken from the current config
# $conf, everything else is copied from $snap (see $snapshot_copy_config).
#
# Returns the new config hash; $conf and $snap are not modified.
my $snapshot_apply_config = sub {
    my ($conf, $snap) = @_;

    # copy snapshot list
    my $newconf = { snapshots => $conf->{snapshots} };

    # keep description and list of unused disks
    my @kept = grep { m/^unused\d+$/ || $_ eq 'description' } keys %$conf;
    foreach my $k (@kept) {
        $newconf->{$k} = $conf->{$k};
    }

    $snapshot_copy_config->($snap, $newconf);

    return $newconf;
};
4774
18bfb361
DM
# Call $func->($storeid) once for each storage which is referenced by a
# non-CD-ROM drive in $conf, in sorted order of the storage ids.
sub foreach_writable_storage {
    my ($conf, $func) = @_;

    my %seen;

    foreach my $ds (keys %$conf) {
        next if !valid_drivename($ds);

        my $drive = parse_drive($ds, $conf->{$ds});
        next if !$drive || drive_is_cdrom($drive);

        my ($sid, $volname) = PVE::Storage::parse_volume_id($drive->{file}, 1);
        $seen{$sid} = 1 if $sid;
    }

    foreach my $sid (sort keys %seen) {
        $func->($sid);
    }
}
4797
# Allocate a raw volume named "vm-$vmid-state-$snapname" to save the VM
# state of snapshot $snapname, and return its volume id.
#
# The target storage is selected among the storages used by the drives
# in $conf (see foreach_writable_storage); 'local' is used if none is
# found.
my $alloc_vmstate_volid = sub {
    my ($storecfg, $vmid, $conf, $snapname) = @_;

    # Note: we try to be smart when selecting a $target storage

    my $target;

    # pick a storage whose 'shared' flag matches $want_shared
    my $select_target = sub {
        my ($want_shared) = @_;

        foreach_writable_storage($conf, sub {
            my ($sid) = @_;
            my $scfg = PVE::Storage::storage_config($storecfg, $sid);
            return if ($scfg->{shared} ? 1 : 0) != $want_shared;

            $target = $sid if !$target || $scfg->{path}; # prefer file based storage
        });
    };

    # search shared storage first
    $select_target->(1);

    # now search local storage
    $select_target->(0) if !$target;

    $target = 'local' if !$target;

    # extra space for the driver state
    # NOTE(review): the previous comment said "assume 32MB is enough",
    # but the value is 500 (presumably MB, like 'memory') - confirm
    my $driver_state_size = 500;
    # we abort live save after $conf->{memory}, so we need at max twice that space
    # NOTE(review): $conf->{memory} is used as is - confirm it is always set
    my $size = $conf->{memory}*2 + $driver_state_size;

    my $name = "vm-$vmid-state-$snapname";
    my $scfg = PVE::Storage::storage_config($storecfg, $target);
    $name .= ".raw" if $scfg->{path}; # add filename extension for file base storage

    return PVE::Storage::vdisk_alloc($storecfg, $target, $vmid, 'raw', $name, $size*1024);
};
4838
# First step of taking snapshot $snapname of VM $vmid: set the config
# lock to 'snapshot' and add a new snapshot entry in state "prepare"
# holding a copy of the current config.
#
#  $save_vmstate  also allocate a volume for the VM state (only if the
#                 VM is running)
#  $comment       optional snapshot description
#
# Runs under lock_config(). Dies if the VM is a template, the config is
# locked, the name is already used, or snapshots are not supported.
# Returns the new snapshot entry.
my $snapshot_prepare = sub {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap;

    my $prepare = sub {

        my $conf = load_config($vmid);

        die "you can't take a snapshot if it's a template\n"
            if is_template($conf);

        check_lock($conf);

        $conf->{lock} = 'snapshot';

        die "snapshot name '$snapname' already used\n"
            if defined($conf->{snapshots}->{$snapname});

        my $storecfg = PVE::Storage::config();
        die "snapshot feature is not available" if !has_feature('snapshot', $conf, $storecfg);

        $snap = {};
        $conf->{snapshots}->{$snapname} = $snap;

        if ($save_vmstate && check_running($vmid)) {
            $snap->{vmstate} = $alloc_vmstate_volid->($storecfg, $vmid, $conf, $snapname);
        }

        $snapshot_copy_config->($conf, $snap);

        $snap->{snapstate} = "prepare";
        $snap->{snaptime} = time();
        $snap->{description} = $comment if $comment;

        # always overwrite machine if we save vmstate. This makes sure we
        # can restore it later using correct machine type
        $snap->{machine} = get_current_qemu_machine($vmid) if $snap->{vmstate};

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $prepare);

    return $snap;
};
4884
# Final phase of snapshot creation.
#
# Under the VM config lock: requires the 'snapshot' lock and a snapshot
# section in state 'prepare', clears both markers, re-applies the snapshot
# config on top of the current config, sets 'parent' to $snapname and
# writes the result. A 'machine' entry is only kept if the current config
# already had one before the snapshot config was applied.
my $snapshot_commit = sub {
    my ($vmid, $snapname) = @_;

    my $commit_config = sub {
        my $conf = load_config($vmid);

        my $lock = $conf->{lock};
        die "missing snapshot lock\n" unless $lock && $lock eq 'snapshot';

        my $has_machine_config = defined($conf->{machine});

        my $snap = $conf->{snapshots}->{$snapname};
        if (!defined($snap)) {
            die "snapshot '$snapname' does not exist\n";
        }

        my $state = $snap->{snapstate};
        die "wrong snapshot state\n" unless $state && $state eq "prepare";

        delete $snap->{snapstate};
        delete $conf->{lock};

        my $newconf = $snapshot_apply_config->($conf, $snap);

        if (!$has_machine_config) {
            delete $newconf->{machine};
        }

        $newconf->{parent} = $snapname;

        update_config_nolock($vmid, $newconf, 1);
    };

    lock_config($vmid, $commit_config);
};
4918
22c377f0
DM
# Roll VM $vmid back to snapshot $snapname.
#
# The same closure ($updatefn) is run twice under the config lock:
#   1. prepare ($prepare = 1): check the lock, stop the VM, set the
#      'rollback' lock;
#   2. commit ($prepare = 0): require the 'rollback' lock, replace the
#      current config with the snapshot config and, if the snapshot has a
#      saved vmstate, start the VM from that state file.
# Between the two passes every non-cdrom volume of the snapshot is rolled
# back on the storage layer.
#
# Dies if the VM is a template, the snapshot does not exist or is
# incomplete (snapstate set), or the VM is still running after the stop.
sub snapshot_rollback {
    my ($vmid, $snapname) = @_;

    my $snap;

    my $prepare = 1;

    my $storecfg = PVE::Storage::config();

    my $updatefn = sub {

        my $conf = load_config($vmid);

        die "you can't rollback if vm is a template\n" if is_template($conf);

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        die "unable to rollback to incomplete snapshot (snapstate = $snap->{snapstate})\n"
            if $snap->{snapstate};

        if ($prepare) {
            check_lock($conf);
            vm_stop($storecfg, $vmid, undef, undef, 5, undef, undef);
        }

        die "unable to rollback vm $vmid: vm is running\n"
            if check_running($vmid);

        if ($prepare) {
            $conf->{lock} = 'rollback';
        } else {
            die "got wrong lock\n" if !($conf->{lock} && $conf->{lock} eq 'rollback');
            delete $conf->{lock};
        }

        my $forcemachine;

        if (!$prepare) {
            my $has_machine_config = defined($conf->{machine});

            # copy snapshot config to current config
            $conf = $snapshot_apply_config->($conf, $snap);
            $conf->{parent} = $snapname;

            # Note: old code did not store 'machine', so we try to be smart
            # and guess the snapshot was generated with kvm 1.4 (pc-i440fx-1.4).
            $forcemachine = $conf->{machine} || 'pc-i440fx-1.4';
            # we remove the 'machine' configuration if not explicitly specified
            # in the original config.
            delete $conf->{machine} if $snap->{vmstate} && !$has_machine_config;
        }

        update_config_nolock($vmid, $conf, 1);

        if (!$prepare && $snap->{vmstate}) {
            my $statefile = PVE::Storage::path($storecfg, $snap->{vmstate});
            vm_start($storecfg, $vmid, $statefile, undef, undef, undef, $forcemachine);
        }
    };

    lock_config($vmid, $updatefn);

    # roll back every disk volume referenced by the snapshot
    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};

        PVE::Storage::volume_snapshot_rollback($storecfg, $volid, $snapname);
    });

    $prepare = 0;
    lock_config($vmid, $updatefn);
}
4997
9dcf4909
DM
# Poll 'query-savevm' once per second until it reports 'completed'.
# Dies if no status is reported or if the status is anything other than
# 'active' or 'completed'.
my $savevm_wait = sub {
    my ($vmid) = @_;

    while (1) {
        my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");

        die "savevm not active\n" if !$stat->{status};

        last if $stat->{status} eq 'completed';

        if ($stat->{status} ne 'active') {
            die "query-savevm returned status '$stat->{status}'\n";
        }

        # still active - check again shortly
        sleep(1);
    }
};
5015
# Create snapshot $snapname of VM $vmid.
#
# Parameters:
#   $vmid         - VM id
#   $snapname     - name of the new snapshot
#   $save_vmstate - if true (and the VM is running) also save the RAM state
#   $comment      - optional description stored with the snapshot
#
# Flow: prepare the config (sets the 'snapshot' lock), optionally freeze
# guest filesystems through the agent, snapshot all non-cdrom drives,
# finish/thaw, then commit the config. On any failure the partially
# created snapshot is removed again via snapshot_delete() and the original
# error is re-thrown.
sub snapshot_create {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap = $snapshot_prepare->($vmid, $snapname, $save_vmstate, $comment);

    my $config = load_config($vmid);

    my $running = check_running($vmid);

    my $freezefs = $running && $config->{agent};
    $freezefs = 0 if $snap->{vmstate}; # not needed if we save RAM

    # drives that actually got a snapshot - used to limit cleanup on failure
    my $drivehash = {};

    if ($freezefs) {
        eval { vm_mon_cmd($vmid, "guest-fsfreeze-freeze"); };
        warn "guest-fsfreeze-freeze problems - $@" if $@;
    }

    eval {
        # create internal snapshots of all drives

        my $storecfg = PVE::Storage::config();

        if ($running) {
            if ($snap->{vmstate}) {
                my $path = PVE::Storage::path($storecfg, $snap->{vmstate});
                vm_mon_cmd($vmid, "savevm-start", statefile => $path);
                $savevm_wait->($vmid);
            } else {
                vm_mon_cmd($vmid, "savevm-start");
            }
        }

        foreach_drive($snap, sub {
            my ($ds, $drive) = @_;

            return if drive_is_cdrom($drive);

            my $volid = $drive->{file};
            my $device = "drive-$ds";

            qemu_volume_snapshot($vmid, $device, $storecfg, $volid, $snapname);
            $drivehash->{$ds} = 1;
        });
    };
    my $err = $@;

    if ($running) {
        eval { vm_mon_cmd($vmid, "savevm-end") };
        warn $@ if $@;

        if ($freezefs) {
            eval { vm_mon_cmd($vmid, "guest-fsfreeze-thaw"); };
            warn "guest-fsfreeze-thaw problems - $@" if $@;
        }

        # savevm-end is async, we need to wait.
        # The polling is wrapped in eval so that a failing monitor command
        # still leads to the cleanup below instead of leaving the config
        # locked with a half-prepared snapshot.
        eval {
            while (1) {
                my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");
                last if !$stat->{bytes};

                print "savevm not yet finished\n";
                sleep(1);
            }
        };
        if (my $wait_err = $@) {
            if ($err) {
                # keep the first error as the one we report
                warn $wait_err;
            } else {
                $err = $wait_err;
            }
        }
    }

    if ($err) {
        warn "snapshot create failed: starting cleanup\n";
        eval { snapshot_delete($vmid, $snapname, 0, $drivehash); };
        warn $@ if $@;
        die $err;
    }

    $snapshot_commit->($vmid, $snapname);
}
5097
# Delete snapshot $snapname of VM $vmid.
#
# $force     - if true, storage errors are only warned about and the
#              intermediate per-volume config updates are skipped.
# $drivehash - only set when called from snapshot_create (cleanup of a
#              failed snapshot): lock and template checks are skipped, only
#              the drives listed in it have their volume snapshot removed,
#              and the config lock is dropped at the end.
#
# The config is first marked (snapstate 'delete'), then the vmstate volume
# and the per-drive snapshots are removed, and finally the snapshot section
# is dropped and parent references pointing to it are rewired.
sub snapshot_delete {
    my ($vmid, $snapname, $force, $drivehash) = @_;

    my $prepare = 1;

    my $snap;
    my $unused = [];

    # If $confref has the deleted snapshot as parent, point it at
    # $new_parent instead (or drop the entry when there is none).
    my $unlink_parent = sub {
        my ($confref, $new_parent) = @_;

        my $parent = $confref->{parent};
        return if !($parent && $parent eq $snapname);

        if ($new_parent) {
            $confref->{parent} = $new_parent;
        } else {
            delete $confref->{parent};
        }
    };

    # Config update step; runs under the config lock. With $remove_drive
    # set, that key ('vmstate' or a drive name) is removed from the snapshot.
    my $updatefn = sub {
        my ($remove_drive) = @_;

        my $conf = load_config($vmid);

        if (!$drivehash) {
            check_lock($conf);
            if (is_template($conf)) {
                die "you can't delete a snapshot if vm is a template\n";
            }
        }

        $snap = $conf->{snapshots}->{$snapname};

        if (!defined($snap)) {
            die "snapshot '$snapname' does not exist\n";
        }

        # final pass only: rewire parent references to our own parent
        if (!$prepare) {
            my $new_parent = $snap->{parent};
            $unlink_parent->($conf, $new_parent);
            for my $other (keys %{$conf->{snapshots}}) {
                next if $other eq $snapname;
                $unlink_parent->($conf->{snapshots}->{$other}, $new_parent);
            }
        }

        if ($remove_drive) {
            if ($remove_drive eq 'vmstate') {
                delete $snap->{$remove_drive};
            } else {
                my $drive = parse_drive($remove_drive, $snap->{$remove_drive});
                my $volid = $drive->{file};
                delete $snap->{$remove_drive};
                add_unused_volume($conf, $volid);
            }
        }

        if ($prepare) {
            $snap->{snapstate} = 'delete';
        } else {
            delete $conf->{snapshots}->{$snapname};
            if ($drivehash) {
                delete $conf->{lock};
            }
            for my $volid (@$unused) {
                add_unused_volume($conf, $volid);
            }
        }

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $updatefn);

    my $storecfg = PVE::Storage::config();

    # remove the saved RAM state volume, if there is one
    if ($snap->{vmstate}) {
        eval { PVE::Storage::vdisk_free($storecfg, $snap->{vmstate}); };
        if (my $err = $@) {
            die $err if !$force;
            warn $err;
        }
        # persist the removal of 'vmstate' from the snapshot section
        if (!$force) {
            lock_config($vmid, $updatefn, 'vmstate');
        }
    }

    # remove the volume snapshot of every drive
    my $delete_drive_snapshot = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};
        my $device = "drive-$ds";

        if (!$drivehash || $drivehash->{$ds}) {
            eval { qemu_volume_snapshot_delete($vmid, $device, $storecfg, $volid, $snapname); };
            if (my $err = $@) {
                die $err if !$force;
                warn $err;
            }
        }

        # persist the removal of this drive from the snapshot section
        if (!$force) {
            lock_config($vmid, $updatefn, $ds);
        }
        push @$unused, $volid;
    };
    foreach_drive($snap, $delete_drive_snapshot);

    # final pass: drop the snapshot section from the config
    $prepare = 0;
    lock_config($vmid, $updatefn);
}
5209
# Returns 1 if every non-cdrom drive in $conf supports $feature according
# to PVE::Storage::volume_has_feature(), otherwise 0.
# $snapname and $running are passed through to the storage layer unchanged.
sub has_feature {
    my ($feature, $conf, $storecfg, $snapname, $running) = @_;

    my $all_supported = 1;

    my $check_drive = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};
        if (!PVE::Storage::volume_has_feature($storecfg, $feature, $volid, $snapname, $running)) {
            $all_supported = 0;
        }
    };
    foreach_drive($conf, $check_drive);

    return $all_supported;
}
04a69bb4
AD
5224
# Convert the disks of VM $vmid into base volumes.
#
# For every non-cdrom drive in $conf (or only drive $disk, when given)
# whose volume supports the 'template' feature, a base volume is created,
# the drive entry in $conf is rewritten to point at it, and the config is
# written out immediately.
sub template_create {
    my ($vmid, $conf, $disk) = @_;

    my $storecfg = PVE::Storage::config();

    my $convert_drive = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);
        return if $disk && $ds ne $disk;

        my $volid = $drive->{file};
        return unless PVE::Storage::volume_has_feature($storecfg, 'template', $volid);

        $drive->{file} = PVE::Storage::vdisk_create_base($storecfg, $volid);
        $conf->{$ds} = print_drive($vmid, $drive);
        update_config_nolock($vmid, $conf, 1);
    };

    foreach_drive($conf, $convert_drive);
}
5245
624361b3
AD
# Returns 1 if $conf has 'template' set to 1, otherwise 0.
#
# The result is always an explicit 1 or 0 rather than whatever the
# condition happened to evaluate to last.
sub is_template {
    my ($conf) = @_;

    return (defined($conf->{template}) && $conf->{template} == 1) ? 1 : 0;
}
5251
5133de42
AD
# Copy volume $src_volid (optionally its snapshot $snapname) onto the
# already existing volume $dst_volid using 'qemu-img convert'.
#
# $size is only used to print progress information. Nothing is done unless
# both volume ids parse to a storage id. Dies with "copy failed: ..." if
# the command fails.
sub qemu_img_convert {
    my ($src_volid, $dst_volid, $size, $snapname) = @_;

    my $storecfg = PVE::Storage::config();
    my ($src_storeid, $src_volname) = PVE::Storage::parse_volume_id($src_volid, 1);
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid, 1);

    if ($src_storeid && $dst_storeid) {
        my $src_scfg = PVE::Storage::storage_config($storecfg, $src_storeid);
        my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

        my $src_format = qemu_img_format($src_scfg, $src_volname);
        my $dst_format = qemu_img_format($dst_scfg, $dst_volname);

        my $src_path = PVE::Storage::path($storecfg, $src_volid, $snapname);
        my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

        my @cmd = ('/usr/bin/qemu-img', 'convert', '-t', 'writeback', '-p', '-n');
        if ($snapname && $src_format eq "qcow2") {
            push @cmd, '-s', $snapname;
        }
        push @cmd, '-f', $src_format, '-O', $dst_format, $src_path, $dst_path;

        # turn qemu-img's "(NN/100%)" progress output into a status line
        my $report_progress = sub {
            my ($line) = @_;

            return if $line !~ m/\((\S+)\/100\%\)/;

            my $percent = $1;
            my $transferred = int($size * $percent / 100);
            my $remaining = $size - $transferred;

            print "transferred: $transferred bytes remaining: $remaining bytes total: $size bytes progression: $percent %\n";
        };

        eval { run_command(\@cmd, timeout => undef, outfunc => $report_progress); };
        if (my $err = $@) {
            die "copy failed: $err";
        }
    }
}
5291
# Determine the qemu-img format name for a volume.
#
# - storage with a 'path' and a volume name ending in .raw, .qcow2, .qed
#   or .vmdk: that extension
# - otherwise storage of type 'iscsi': "host_device"
# - anything else: "raw"
sub qemu_img_format {
    my ($scfg, $volname) = @_;

    return $1 if $scfg->{path} && $volname =~ m/\.(raw|qcow2|qed|vmdk)$/;

    return "host_device" if $scfg->{type} eq 'iscsi';

    return "raw";
}
5303
# Mirror drive $drive of running VM $vmid onto the existing volume
# $dst_volid using the QMP 'drive-mirror' block job.
#
# If $vmiddst equals $vmid the guest is switched over to the new volume
# ('block-job-complete'); otherwise (clone for another VM) the job is
# cancelled once source and target are in sync, leaving the guest on its
# original disk.
#
# If the job cannot converge within $maxwait polls after reaching the end,
# the guest is suspended so the mirror can finish; it is resumed afterwards,
# including on the error path.
#
# Dies with "mirroring error: ..." if the job fails.
sub qemu_drive_mirror {
    my ($vmid, $drive, $dst_volid, $vmiddst) = @_;

    my $count = 0;
    my $frozen = undef;
    my $maxwait = 120;

    my $storecfg = PVE::Storage::config();
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid);

    # result is not used below; call kept as in the original
    # (presumably it validates that the target storage exists - TODO confirm)
    my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

    my $format;
    if ($dst_volname =~ m/\.(raw|qcow2)$/){
        $format = $1;
    }

    my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

    my $opts = { timeout => 10, device => "drive-$drive", mode => "existing", sync => "full", target => $dst_path };
    $opts->{format} = $format if $format;

    #fixme : sometime drive-mirror timeout, but works fine after.
    # (I have see the problem with big volume > 200GB), so we need to eval
    eval { vm_mon_cmd($vmid, "drive-mirror", %$opts); };
    # ignore errors here

    eval {
        while (1) {
            my $stats = vm_mon_cmd($vmid, "query-block-jobs");
            my $stat = $stats->[0];
            die "mirroring job seem to have die. Maybe do you have bad sectors?" if !$stat;
            die "error job is not mirroring" if $stat->{type} ne "mirror";

            my $busy = $stat->{busy};

            if (my $total = $stat->{len}) {
                my $transferred = $stat->{offset} || 0;
                my $remaining = $total - $transferred;
                my $percent = sprintf "%.2f", ($transferred * 100 / $total);

                print "transferred: $transferred bytes remaining: $remaining bytes total: $total bytes progression: $percent % busy: $busy\n";
            }

            if ($stat->{len} == $stat->{offset}) {
                if ($busy eq 'false') {

                    last if $vmiddst != $vmid;

                    # try to switch the disk if source and destination are on the same guest
                    eval { vm_mon_cmd($vmid, "block-job-complete", device => "drive-$drive") };
                    last if !$@;
                    die $@ if $@ !~ m/cannot be completed/;
                }

                if ($count > $maxwait) {
                    # if too much writes to disk occurs at the end of migration
                    # the disk needs to be freezed to be able to complete the migration
                    vm_suspend($vmid,1);
                    $frozen = 1;
                }
                $count++;
            }
            sleep 1;
        }

        vm_resume($vmid, 1) if $frozen;

    };
    my $err = $@;

    # cancel the block job and wait until it is gone from the job list
    my $cancel_job = sub {
        vm_mon_cmd($vmid, "block-job-cancel", device => "drive-$drive");
        while (1) {
            my $stats = vm_mon_cmd($vmid, "query-block-jobs");
            my $stat = $stats->[0];
            last if !$stat;
            sleep 1;
        }
    };

    if ($err) {
        eval { $cancel_job->(); };

        # The loop above may have died after suspending the guest; make
        # sure we do not leave it paused.
        if ($frozen) {
            eval { vm_resume($vmid, 1); };
            warn "unable to resume vm $vmid after failed mirror - $@" if $@;
        }

        die "mirroring error: $err";
    }

    if ($vmiddst != $vmid) {
        # if we clone a disk for a new target vm, we don't switch the disk
        $cancel_job->(); # so we call block-job-cancel
    }
}
5397
# Clone one drive of VM $vmid for VM $newvmid.
#
# Without $full a linked clone is created via the storage layer. With
# $full a new volume is allocated (on $storage if given, else on the
# source storage; in $format if supported there, else in the storage
# default format) and the data is copied - offline with qemu-img, or with
# a drive mirror when the VM is running and no snapshot is cloned.
#
# Every newly created volume id is appended to @$newvollist.
#
# Returns the drive hash describing the clone. Note that this is the very
# same hash as $drive: the caller's hash is modified in place (format
# cleared, file and size updated).
sub clone_disk {
    my ($storecfg, $vmid, $running, $drivename, $drive, $snapname,
        $newvmid, $storage, $format, $full, $newvollist) = @_;

    my $newvolid;

    if ($full) {
        my ($storeid, $volname) = PVE::Storage::parse_volume_id($drive->{file});
        if ($storage) {
            $storeid = $storage;
        }

        my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($storecfg, $storeid);
        $format ||= $drive->{format} || $defFormat;

        # fall back to the default if the requested format is not supported
        my $supported = grep { $_ eq $format } @$validFormats;
        if (!$supported) {
            $format = $defFormat;
        }

        my ($size) = PVE::Storage::volume_size_info($storecfg, $drive->{file}, 3);

        print "create full clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_alloc($storecfg, $storeid, $newvmid, $format, undef, ($size/1024));
        push @$newvollist, $newvolid;

        if ($running && !$snapname) {
            qemu_drive_mirror($vmid, $drivename, $newvolid, $newvmid);
        } else {
            qemu_img_convert($drive->{file}, $newvolid, $size, $snapname);
        }
    } else {
        print "create linked clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_clone($storecfg, $drive->{file}, $newvmid, $snapname);
        push @$newvollist, $newvolid;
    }

    my ($newsize) = PVE::Storage::volume_size_info($storecfg, $newvolid, 3);

    # describe the clone by updating the passed-in drive hash in place
    $drive->{format} = undef;
    $drive->{file} = $newvolid;
    $drive->{size} = $newsize;

    return $drive;
}
5443
ff556cf2
DM
# Ask the running VM $vmid (via QMP 'query-machines') which machine type it
# uses. This only works if the VM is running.
#
# Returns the name of the entry flagged 'is-current'; if there is none, the
# name of the entry flagged 'is-default'; if that is missing too, 'pc'.
sub get_current_qemu_machine {
    my ($vmid) = @_;

    my $res = PVE::QemuServer::vm_qmp_command(
        $vmid,
        { execute => 'query-machines', arguments => {} },
    );

    my $current;
    my $default;
    for my $machine (@$res) {
        if ($machine->{'is-default'}) {
            $default = $machine->{name};
        }
        if ($machine->{'is-current'}) {
            $current = $machine->{name};
        }
    }

    # prefer the current machine, then qemu's default, then plain 'pc'
    return $current if $current;
    return $default if $default;
    return 'pc';
}
5460
4543ecf0
AD
# Scan "$pcisysfs/devices" for entries named like DDDD:BB:SS.F.
#
# Returns a hash reference keyed by the "BB:SS" part of the name; each
# value is an array reference holding one { id, function } hash per
# matching entry.
sub lspci {
    my %functions_by_id;

    my $record_entry = sub {
        my (undef, $id, $function) = @_;

        push @{ $functions_by_id{$id} }, { id => $id, function => $function };
    };

    dir_glob_foreach(
        "$pcisysfs/devices",
        '[a-f0-9]{4}:([a-f0-9]{2}:[a-f0-9]{2})\.([0-9])',
        $record_entry,
    );

    return \%functions_by_id;
}
5473
1e3baf05 54741;