]> git.proxmox.com Git - qemu-server.git/blame - PVE/QemuServer.pm
bump version to 3.3-7
[qemu-server.git] / PVE / QemuServer.pm
CommitLineData
1e3baf05
DM
1package PVE::QemuServer;
2
3use strict;
990fc5e2 4use warnings;
1e3baf05
DM
5use POSIX;
6use IO::Handle;
7use IO::Select;
8use IO::File;
9use IO::Dir;
10use IO::Socket::UNIX;
11use File::Basename;
12use File::Path;
13use File::stat;
14use Getopt::Long;
fc1ddcdc 15use Digest::SHA;
1e3baf05
DM
16use Fcntl ':flock';
17use Cwd 'abs_path';
18use IPC::Open3;
c971c4f2 19use JSON;
1e3baf05
DM
20use Fcntl;
21use PVE::SafeSyslog;
22use Storable qw(dclone);
23use PVE::Exception qw(raise raise_param_exc);
24use PVE::Storage;
4543ecf0 25use PVE::Tools qw(run_command lock_file lock_file_full file_read_firstline dir_glob_foreach);
b7ba6b79 26use PVE::JSONSchema qw(get_standard_option);
1e3baf05
DM
27use PVE::Cluster qw(cfs_register_file cfs_read_file cfs_write_file cfs_lock_file);
28use PVE::INotify;
29use PVE::ProcFSTools;
26f11676 30use PVE::QMPClient;
91bd6c90 31use PVE::RPCEnvironment;
6b64503e 32use Time::HiRes qw(gettimeofday);
1e3baf05 33
7f0b5beb 34my $cpuinfo = PVE::ProcFSTools::read_cpuinfo();
1e3baf05 35
# Note about locking: we use flock on the config file to protect
# against concurrent actions.
# Additionally, we have a 'lock' setting in the config file. This
# can be set to 'migrate', 'backup', 'snapshot' or 'rollback'. Most actions are not
# allowed when such lock is set. But you can ignore this kind of
# lock with the --skiplock flag.
42
97d62eb7 43cfs_register_file('/qemu-server/',
1858638f
DM
44 \&parse_vm_config,
45 \&write_vm_config);
1e3baf05 46
3ea94c60
DM
47PVE::JSONSchema::register_standard_option('skiplock', {
48 description => "Ignore locks - only root is allowed to use this option.",
afdb31d5 49 type => 'boolean',
3ea94c60
DM
50 optional => 1,
51});
52
53PVE::JSONSchema::register_standard_option('pve-qm-stateuri', {
54 description => "Some command save/restore state from this location.",
55 type => 'string',
56 maxLength => 128,
57 optional => 1,
58});
59
8abd398b
DM
60PVE::JSONSchema::register_standard_option('pve-snapshot-name', {
61 description => "The name of the snapshot.",
62 type => 'string', format => 'pve-configid',
63 maxLength => 40,
64});
65
1e3baf05
DM
66#no warnings 'redefine';
67
# Define the fairsched/setluid syscall numbers and the KVM_GET_API_VERSION
# ioctl request number, unless they are already defined.
# Each constant is installed through a string eval guarded by
# "unless defined(...)", so an existing definition is never overridden.
# Dies if the architecture is neither x86_64 nor i386.
unless (defined(&_VZSYSCALLS_H_)) {
    # marker checked by the enclosing condition
    eval 'sub _VZSYSCALLS_H_ () {1;}' unless defined(&_VZSYSCALLS_H_);
    require 'sys/syscall.ph';
    if (defined(&__x86_64__)) {
        eval 'sub __NR_fairsched_vcpus () {499;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_fairsched_mknod () {504;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {505;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {506;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {507;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {508;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_setluid () {501;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {502;}' unless defined(&__NR_setublimit);
    } elsif (defined(&__i386__)) {
        eval 'sub __NR_fairsched_mknod () {500;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {501;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {502;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {503;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {504;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_fairsched_vcpus () {505;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_setluid () {511;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {512;}' unless defined(&__NR_setublimit);
    } else {
        die("no fairsched syscall for this arch");
    }
    require 'asm/ioctl.ph';
    # request number written out in full (0x00) rather than a bare "0x" prefix
    eval 'sub KVM_GET_API_VERSION () { &_IO(0xAE, 0x00);}' unless defined(&KVM_GET_API_VERSION);
}
96
# Invoke the fairsched_mknod syscall.
# All three arguments are truncated with int() before the call.
# Returns the raw result of syscall().
sub fairsched_mknod {
    my ($parent, $weight, $desired) = @_;

    my @int_args = map { int($_) } ($parent, $weight, $desired);

    return syscall(&__NR_fairsched_mknod, @int_args);
}
102
# Invoke the fairsched_rmnod syscall with the integer value of $id.
# Returns the raw result of syscall().
sub fairsched_rmnod {
    my ($id) = @_;

    my $node_id = int($id);

    return syscall(&__NR_fairsched_rmnod, $node_id);
}
108
# Invoke the fairsched_mvpr syscall.
# Both arguments are truncated with int() before the call.
# Returns the raw result of syscall().
sub fairsched_mvpr {
    my ($pid, $newid) = @_;

    my @int_args = map { int($_) } ($pid, $newid);

    return syscall(&__NR_fairsched_mvpr, @int_args);
}
114
# Invoke the fairsched_vcpus syscall.
# Both arguments are truncated with int() before the call.
# Returns the raw result of syscall().
sub fairsched_vcpus {
    my ($id, $vcpus) = @_;

    my @int_args = map { int($_) } ($id, $vcpus);

    return syscall(&__NR_fairsched_vcpus, @int_args);
}
120
# Invoke the fairsched_rate syscall.
# $op is one of the FAIRSCHED_*_RATE constants; every argument is
# truncated with int() before the call.
# Returns the raw result of syscall().
sub fairsched_rate {
    my ($id, $op, $rate) = @_;

    my @int_args = map { int($_) } ($id, $op, $rate);

    return syscall(&__NR_fairsched_rate, @int_args);
}
126
127use constant FAIRSCHED_SET_RATE => 0;
128use constant FAIRSCHED_DROP_RATE => 1;
129use constant FAIRSCHED_GET_RATE => 2;
130
# Apply a CPU limit, given in percent, to fairsched node $id.
# The percentage is rescaled to 1/1024 units; a resulting value of zero
# drops the rate limit, any other value sets it.
# Returns the result of fairsched_rate().
sub fairsched_cpulimit {
    my ($id, $limit) = @_;

    my $cpulim1024 = int($limit * 1024 / 100);

    return fairsched_rate($id, FAIRSCHED_DROP_RATE, $cpulim1024) if !$cpulim1024;

    return fairsched_rate($id, FAIRSCHED_SET_RATE, $cpulim1024);
}
139
140my $nodename = PVE::INotify::nodename();
141
142mkdir "/etc/pve/nodes/$nodename";
143my $confdir = "/etc/pve/nodes/$nodename/qemu-server";
144mkdir $confdir;
145
146my $var_run_tmpdir = "/var/run/qemu-server";
147mkdir $var_run_tmpdir;
148
149my $lock_dir = "/var/lock/qemu-server";
150mkdir $lock_dir;
151
152my $pcisysfs = "/sys/bus/pci";
153
1e3baf05 154my $confdesc = {
7183bd9a
AD
155 iothread => {
156 optional => 1,
157 type => 'boolean',
158 description => "Enable iothread dataplane.",
159 default => 0,
160 },
1e3baf05
DM
161 onboot => {
162 optional => 1,
163 type => 'boolean',
164 description => "Specifies whether a VM will be started during system bootup.",
165 default => 0,
166 },
167 autostart => {
168 optional => 1,
169 type => 'boolean',
170 description => "Automatic restart after crash (currently ignored).",
171 default => 0,
172 },
2ff09f52
DA
173 hotplug => {
174 optional => 1,
e8b9c17c 175 type => 'boolean',
6c52b679 176 description => "Allow hotplug for disk and network device",
2dbe827e 177 default => 0,
2ff09f52 178 },
1e3baf05
DM
179 reboot => {
180 optional => 1,
181 type => 'boolean',
182 description => "Allow reboot. If set to '0' the VM exit on reboot.",
183 default => 1,
184 },
185 lock => {
186 optional => 1,
187 type => 'string',
188 description => "Lock/unlock the VM.",
22c377f0 189 enum => [qw(migrate backup snapshot rollback)],
1e3baf05
DM
190 },
191 cpulimit => {
192 optional => 1,
193 type => 'integer',
194 description => "Limit of CPU usage in per cent. Note if the computer has 2 CPUs, it has total of 200% CPU time. Value '0' indicates no CPU limit.\n\nNOTE: This option is currently ignored.",
195 minimum => 0,
196 default => 0,
197 },
198 cpuunits => {
199 optional => 1,
200 type => 'integer',
201 description => "CPU weight for a VM. Argument is used in the kernel fair scheduler. The larger the number is, the more CPU time this VM gets. Number is relative to weights of all the other running VMs.\n\nNOTE: You can disable fair-scheduler configuration by setting this to 0.",
202 minimum => 0,
203 maximum => 500000,
204 default => 1000,
205 },
206 memory => {
207 optional => 1,
208 type => 'integer',
7878afeb 209 description => "Amount of RAM for the VM in MB. This is the maximum available memory when you use the balloon device.",
1e3baf05
DM
210 minimum => 16,
211 default => 512,
212 },
13a48620
DA
213 balloon => {
214 optional => 1,
215 type => 'integer',
8b1accf7
DM
216 description => "Amount of target RAM for the VM in MB. Using zero disables the ballon driver.",
217 minimum => 0,
218 },
219 shares => {
220 optional => 1,
221 type => 'integer',
222 description => "Amount of memory shares for auto-ballooning. The larger the number is, the more memory this VM gets. Number is relative to weights of all other running VMs. Using zero disables auto-ballooning",
223 minimum => 0,
224 maximum => 50000,
225 default => 1000,
13a48620 226 },
1e3baf05
DM
227 keyboard => {
228 optional => 1,
229 type => 'string',
230 description => "Keybord layout for vnc server. Default is read from the datacenter configuration file.",
e95fe75f 231 enum => PVE::Tools::kvmkeymaplist(),
1e3baf05
DM
232 default => 'en-us',
233 },
234 name => {
235 optional => 1,
7fabe17d 236 type => 'string', format => 'dns-name',
1e3baf05
DM
237 description => "Set a name for the VM. Only used on the configuration web interface.",
238 },
cdd20088
AD
239 scsihw => {
240 optional => 1,
241 type => 'string',
242 description => "scsi controller model",
5b952ff5 243 enum => [qw(lsi lsi53c810 virtio-scsi-pci megasas pvscsi)],
cdd20088
AD
244 default => 'lsi',
245 },
1e3baf05
DM
246 description => {
247 optional => 1,
248 type => 'string',
0581fe4f 249 description => "Description for the VM. Only used on the configuration web interface. This is saved as comment inside the configuration file.",
1e3baf05
DM
250 },
251 ostype => {
252 optional => 1,
253 type => 'string',
6b9d84cf 254 enum => [qw(other wxp w2k w2k3 w2k8 wvista win7 win8 l24 l26 solaris)],
1e3baf05
DM
255 description => <<EODESC,
256Used to enable special optimization/features for specific
257operating systems:
258
259other => unspecified OS
260wxp => Microsoft Windows XP
261w2k => Microsoft Windows 2000
262w2k3 => Microsoft Windows 2003
263w2k8 => Microsoft Windows 2008
264wvista => Microsoft Windows Vista
265win7 => Microsoft Windows 7
a70ebde3 266win8 => Microsoft Windows 8/2012
1e3baf05
DM
267l24 => Linux 2.4 Kernel
268l26 => Linux 2.6/3.X Kernel
6b9d84cf 269solaris => solaris/opensolaris/openindiania kernel
1e3baf05 270
6b9d84cf 271other|l24|l26|solaris ... no special behaviour
a70ebde3 272wxp|w2k|w2k3|w2k8|wvista|win7|win8 ... use --localtime switch
1e3baf05
DM
273EODESC
274 },
275 boot => {
276 optional => 1,
277 type => 'string',
278 description => "Boot on floppy (a), hard disk (c), CD-ROM (d), or network (n).",
279 pattern => '[acdn]{1,4}',
32baffb4 280 default => 'cdn',
1e3baf05
DM
281 },
282 bootdisk => {
283 optional => 1,
284 type => 'string', format => 'pve-qm-bootdisk',
285 description => "Enable booting from specified disk.",
03e480fc 286 pattern => '(ide|sata|scsi|virtio)\d+',
1e3baf05
DM
287 },
288 smp => {
289 optional => 1,
290 type => 'integer',
291 description => "The number of CPUs. Please use option -sockets instead.",
292 minimum => 1,
293 default => 1,
294 },
295 sockets => {
296 optional => 1,
297 type => 'integer',
298 description => "The number of CPU sockets.",
299 minimum => 1,
300 default => 1,
301 },
302 cores => {
303 optional => 1,
304 type => 'integer',
305 description => "The number of cores per socket.",
306 minimum => 1,
307 default => 1,
308 },
8a010eae
AD
309 numa => {
310 optional => 1,
311 type => 'boolean',
312 description => "Enable/disable Numa.",
313 default => 0,
314 },
3bd18e48
AD
315 maxcpus => {
316 optional => 1,
317 type => 'integer',
318 description => "Maximum cpus for hotplug.",
319 minimum => 1,
320 default => 1,
321 },
1e3baf05
DM
322 acpi => {
323 optional => 1,
324 type => 'boolean',
325 description => "Enable/disable ACPI.",
326 default => 1,
327 },
bc84dcca 328 agent => {
ab6a046f
AD
329 optional => 1,
330 type => 'boolean',
331 description => "Enable/disable Qemu GuestAgent.",
be79c214 332 default => 0,
ab6a046f 333 },
1e3baf05
DM
334 kvm => {
335 optional => 1,
336 type => 'boolean',
337 description => "Enable/disable KVM hardware virtualization.",
338 default => 1,
339 },
340 tdf => {
341 optional => 1,
342 type => 'boolean',
8c559505
DM
343 description => "Enable/disable time drift fix.",
344 default => 0,
1e3baf05 345 },
19672434 346 localtime => {
1e3baf05
DM
347 optional => 1,
348 type => 'boolean',
349 description => "Set the real time clock to local time. This is enabled by default if ostype indicates a Microsoft OS.",
350 },
351 freeze => {
352 optional => 1,
353 type => 'boolean',
354 description => "Freeze CPU at startup (use 'c' monitor command to start execution).",
355 },
356 vga => {
357 optional => 1,
358 type => 'string',
ef5e2be2 359 description => "Select VGA type. If you want to use high resolution modes (>= 1280x1024x16) then you should use option 'std' or 'vmware'. Default is 'std' for win8/win7/w2k8, and 'cirrur' for other OS types. Option 'qxl' enables the SPICE display sever. You can also run without any graphic card using a serial devive as terminal.",
2fa3151e 360 enum => [qw(std cirrus vmware qxl serial0 serial1 serial2 serial3 qxl2 qxl3 qxl4)],
1e3baf05 361 },
0ea9541d
DM
362 watchdog => {
363 optional => 1,
364 type => 'string', format => 'pve-qm-watchdog',
365 typetext => '[[model=]i6300esb|ib700] [,[action=]reset|shutdown|poweroff|pause|debug|none]',
366 description => "Create a virtual hardware watchdog device. Once enabled (by a guest action), the watchdog must be periodically polled by an agent inside the guest or else the guest will be restarted (or execute the action specified)",
367 },
1e3baf05
DM
368 startdate => {
369 optional => 1,
19672434 370 type => 'string',
1e3baf05
DM
371 typetext => "(now | YYYY-MM-DD | YYYY-MM-DDTHH:MM:SS)",
372 description => "Set the initial date of the real time clock. Valid format for date are: 'now' or '2006-06-17T16:01:21' or '2006-06-17'.",
373 pattern => '(now|\d{4}-\d{1,2}-\d{1,2}(T\d{1,2}:\d{1,2}:\d{1,2})?)',
374 default => 'now',
375 },
59411c4e
DM
376 startup => {
377 optional => 1,
378 type => 'string', format => 'pve-qm-startup',
379 typetext => '[[order=]\d+] [,up=\d+] [,down=\d+] ',
380 description => "Startup and shutdown behavior. Order is a non-negative number defining the general startup order. Shutdown in done with reverse ordering. Additionally you can set the 'up' or 'down' delay in seconds, which specifies a delay to wait before the next VM is started or stopped.",
381 },
68eda3ab
AD
382 template => {
383 optional => 1,
384 type => 'boolean',
385 description => "Enable/disable Template.",
386 default => 0,
387 },
1e3baf05
DM
388 args => {
389 optional => 1,
390 type => 'string',
391 description => <<EODESCR,
392Note: this option is for experts only. It allows you to pass arbitrary arguments to kvm, for example:
393
394args: -no-reboot -no-hpet
395EODESCR
396 },
397 tablet => {
398 optional => 1,
399 type => 'boolean',
400 default => 1,
5acbfe9e 401 description => "Enable/disable the usb tablet device. This device is usually needed to allow absolute mouse positioning with VNC. Else the mouse runs out of sync with normal VNC clients. If you're running lots of console-only guests on one host, you may consider disabling this to save some context switches. This is turned of by default if you use spice (vga=qxl).",
1e3baf05
DM
402 },
403 migrate_speed => {
404 optional => 1,
405 type => 'integer',
406 description => "Set maximum speed (in MB/s) for migrations. Value 0 is no limit.",
407 minimum => 0,
408 default => 0,
409 },
410 migrate_downtime => {
411 optional => 1,
04432191 412 type => 'number',
1e3baf05
DM
413 description => "Set maximum tolerated downtime (in seconds) for migrations.",
414 minimum => 0,
04432191 415 default => 0.1,
1e3baf05
DM
416 },
417 cdrom => {
418 optional => 1,
419 type => 'string', format => 'pve-qm-drive',
420 typetext => 'volume',
421 description => "This is an alias for option -ide2",
422 },
423 cpu => {
424 optional => 1,
425 description => "Emulated CPU type.",
426 type => 'string',
3aefd6fd 427 enum => [ qw(486 athlon pentium pentium2 pentium3 coreduo core2duo kvm32 kvm64 qemu32 qemu64 phenom Conroe Penryn Nehalem Westmere SandyBridge Haswell Broadwell Opteron_G1 Opteron_G2 Opteron_G3 Opteron_G4 Opteron_G5 host) ],
eac6899d 428 default => 'kvm64',
1e3baf05 429 },
b7ba6b79
DM
430 parent => get_standard_option('pve-snapshot-name', {
431 optional => 1,
432 description => "Parent snapshot name. This is used internally, and should not be modified.",
433 }),
982c7f12
DM
434 snaptime => {
435 optional => 1,
436 description => "Timestamp for snapshots.",
437 type => 'integer',
438 minimum => 0,
439 },
18bfb361
DM
440 vmstate => {
441 optional => 1,
442 type => 'string', format => 'pve-volume-id',
443 description => "Reference to a volume which stores the VM state. This is used internally for snapshots.",
444 },
3bafc510
DM
445 machine => {
446 description => "Specific the Qemu machine type.",
447 type => 'string',
448 pattern => '(pc|pc(-i440fx)?-\d+\.\d+|q35|pc-q35-\d+\.\d+)',
449 maxLength => 40,
450 optional => 1,
451 },
2796e7d5
DM
452 smbios1 => {
453 description => "Specify SMBIOS type 1 fields.",
454 type => 'string', format => 'pve-qm-smbios1',
455 typetext => "[manufacturer=str][,product=str][,version=str][,serial=str] [,uuid=uuid][,sku=str][,family=str]",
456 maxLength => 256,
457 optional => 1,
458 },
1e3baf05
DM
459};
460
461# what about other qemu settings ?
462#cpu => 'string',
463#machine => 'string',
464#fda => 'file',
465#fdb => 'file',
466#mtdblock => 'file',
467#sd => 'file',
468#pflash => 'file',
469#snapshot => 'bool',
470#bootp => 'file',
471##tftp => 'dir',
472##smb => 'dir',
473#kernel => 'file',
474#append => 'string',
475#initrd => 'file',
476##soundhw => 'string',
477
478while (my ($k, $v) = each %$confdesc) {
479 PVE::JSONSchema::register_standard_option("pve-qm-$k", $v);
480}
481
482my $MAX_IDE_DISKS = 4;
f62db2a4 483my $MAX_SCSI_DISKS = 14;
a2650619 484my $MAX_VIRTIO_DISKS = 16;
cdb0931f 485my $MAX_SATA_DISKS = 6;
1e3baf05 486my $MAX_USB_DEVICES = 5;
5bdcf937 487my $MAX_NETS = 32;
1e3baf05 488my $MAX_UNUSED_DISKS = 8;
5cffb2d2 489my $MAX_HOSTPCI_DEVICES = 4;
bae179aa 490my $MAX_SERIAL_PORTS = 4;
1989a89c 491my $MAX_PARALLEL_PORTS = 3;
2ed5d572
AD
492my $MAX_NUMA = 8;
493
# Schema shared by every numaN option (N is 0 to $MAX_NUMA - 1); it is
# also registered as the standard option 'pve-qm-numanode'.
my $numadesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-numanode',
    # the closing '>' after the cpus id range was missing
    typetext => "cpus=<id[-id]>,memory=<mb>[[,hostnodes=<id[-id]>][,policy=<preferred|bind|interleave>]]",
    description => "numa topology",
};
PVE::JSONSchema::register_standard_option("pve-qm-numanode", $numadesc);

for (my $i = 0; $i < $MAX_NUMA; $i++) {
    $confdesc->{"numa$i"} = $numadesc;
}
1e3baf05
DM
505
506my $nic_model_list = ['rtl8139', 'ne2k_pci', 'e1000', 'pcnet', 'virtio',
e4c6e0b8 507 'ne2k_isa', 'i82551', 'i82557b', 'i82559er', 'vmxnet3'];
6b64503e 508my $nic_model_list_txt = join(' ', sort @$nic_model_list);
1e3baf05 509
1e3baf05
DM
510my $netdesc = {
511 optional => 1,
512 type => 'string', format => 'pve-qm-net',
a9410357 513 typetext => "MODEL=XX:XX:XX:XX:XX:XX [,bridge=<dev>][,queues=<nbqueues>][,rate=<mbps>][,tag=<vlanid>][,firewall=0|1]",
1e3baf05 514 description => <<EODESCR,
19672434 515Specify network devices.
1e3baf05
DM
516
517MODEL is one of: $nic_model_list_txt
518
19672434 519XX:XX:XX:XX:XX:XX should be an unique MAC address. This is
1e3baf05
DM
520automatically generated if not specified.
521
522The bridge parameter can be used to automatically add the interface to a bridge device. The Proxmox VE standard bridge is called 'vmbr0'.
523
524Option 'rate' is used to limit traffic bandwidth from and to this interface. It is specified as floating point number, unit is 'Megabytes per second'.
525
526If you specify no bridge, we create a kvm 'user' (NATed) network device, which provides DHCP and DNS services. The following addresses are used:
527
52810.0.2.2 Gateway
52910.0.2.3 DNS Server
53010.0.2.4 SMB Server
531
532The DHCP server assign addresses to the guest starting from 10.0.2.15.
533
534EODESCR
535};
536PVE::JSONSchema::register_standard_option("pve-qm-net", $netdesc);
537
538for (my $i = 0; $i < $MAX_NETS; $i++) {
539 $confdesc->{"net$i"} = $netdesc;
540}
541
542my $drivename_hash;
19672434 543
1e3baf05
DM
# Schema for the ideN drive options, also registered as 'pve-qm-ide'.
my $idedesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    # typetext used to start with '[volume=]volume,]' (stray ',]')
    typetext => '[volume=]volume [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
    description => "Use volume as IDE hard disk or CD-ROM (n is 0 to " . ($MAX_IDE_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-ide", $idedesc);
551
# Schema for the scsiN drive options, also registered as 'pve-qm-scsi'.
my $scsidesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    # typetext used to start with '[volume=]volume,]' (stray ',]')
    typetext => '[volume=]volume [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
    description => "Use volume as SCSI hard disk or CD-ROM (n is 0 to " . ($MAX_SCSI_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-scsi", $scsidesc);
559
cdb0931f
DA
# Schema for the sataN drive options, also registered as 'pve-qm-sata'.
my $satadesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    # typetext used to start with '[volume=]volume,]' (stray ',]')
    typetext => '[volume=]volume [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
    description => "Use volume as SATA hard disk or CD-ROM (n is 0 to " . ($MAX_SATA_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-sata", $satadesc);
567
1e3baf05
DM
# Schema for the virtioN drive options, also registered as 'pve-qm-virtio'.
my $virtiodesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    # typetext used to start with '[volume=]volume,]' (stray ',]')
    typetext => '[volume=]volume [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]',
    description => "Use volume as VIRTIO hard disk (n is 0 to " . ($MAX_VIRTIO_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-virtio", $virtiodesc);
575
576my $usbdesc = {
577 optional => 1,
578 type => 'string', format => 'pve-qm-usb-device',
80401dd8 579 typetext => 'host=HOSTUSBDEVICE|spice',
1e3baf05 580 description => <<EODESCR,
2fe1a152 581Configure an USB device (n is 0 to 4). This can be used to
1e3baf05
DM
582pass-through usb devices to the guest. HOSTUSBDEVICE syntax is:
583
19672434 584'bus-port(.port)*' (decimal numbers) or
1e3baf05
DM
585'vendor_id:product_id' (hexadeciaml numbers)
586
19672434 587You can use the 'lsusb -t' command to list existing usb devices.
1e3baf05
DM
588
589Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
590
80401dd8
DM
591The value 'spice' can be used to add a usb redirection devices for spice.
592
1e3baf05
DM
593EODESCR
594};
595PVE::JSONSchema::register_standard_option("pve-qm-usb", $usbdesc);
596
040b06b7
DA
597my $hostpcidesc = {
598 optional => 1,
599 type => 'string', format => 'pve-qm-hostpci',
2e3b7e2a 600 typetext => "[host=]HOSTPCIDEVICE [,driver=kvm|vfio] [,rombar=on|off] [,pcie=0|1] [,x-vga=on|off]",
040b06b7
DA
601 description => <<EODESCR,
602Map host pci devices. HOSTPCIDEVICE syntax is:
603
604'bus:dev.func' (hexadecimal numbers)
605
606You can us the 'lspci' command to list existing pci devices.
607
0cea6a01
DM
608The 'rombar' option determines whether or not the device's ROM will be visible in the guest's memory map (default is 'on').
609
040b06b7
DA
610Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
611
612Experimental: user reported problems with this option.
613EODESCR
614};
615PVE::JSONSchema::register_standard_option("pve-qm-hostpci", $hostpcidesc);
616
bae179aa
DA
617my $serialdesc = {
618 optional => 1,
ca0cef26 619 type => 'string',
1b0b51ed 620 pattern => '(/dev/.+|socket)',
bae179aa 621 description => <<EODESCR,
1b0b51ed 622Create a serial device inside the VM (n is 0 to 3), and pass through a host serial device (i.e. /dev/ttyS0), or create a unix socket on the host side (use 'qm terminal' to open a terminal connection).
bae179aa
DA
623
624Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
625
626Experimental: user reported problems with this option.
627EODESCR
628};
bae179aa 629
1989a89c
DA
630my $paralleldesc= {
631 optional => 1,
ca0cef26 632 type => 'string',
9ecc8431 633 pattern => '/dev/parport\d+|/dev/usb/lp\d+',
1989a89c 634 description => <<EODESCR,
19672434 635Map host parallel devices (n is 0 to 2).
1989a89c
DA
636
637Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
638
639Experimental: user reported problems with this option.
640EODESCR
641};
1989a89c
DA
642
643for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
644 $confdesc->{"parallel$i"} = $paralleldesc;
645}
646
bae179aa
DA
647for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
648 $confdesc->{"serial$i"} = $serialdesc;
649}
650
040b06b7
DA
651for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
652 $confdesc->{"hostpci$i"} = $hostpcidesc;
653}
1e3baf05
DM
654
655for (my $i = 0; $i < $MAX_IDE_DISKS; $i++) {
656 $drivename_hash->{"ide$i"} = 1;
657 $confdesc->{"ide$i"} = $idedesc;
658}
659
cdb0931f
DA
660for (my $i = 0; $i < $MAX_SATA_DISKS; $i++) {
661 $drivename_hash->{"sata$i"} = 1;
662 $confdesc->{"sata$i"} = $satadesc;
663}
664
1e3baf05
DM
665for (my $i = 0; $i < $MAX_SCSI_DISKS; $i++) {
666 $drivename_hash->{"scsi$i"} = 1;
667 $confdesc->{"scsi$i"} = $scsidesc ;
668}
669
670for (my $i = 0; $i < $MAX_VIRTIO_DISKS; $i++) {
671 $drivename_hash->{"virtio$i"} = 1;
672 $confdesc->{"virtio$i"} = $virtiodesc;
673}
674
675for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
676 $confdesc->{"usb$i"} = $usbdesc;
677}
678
679my $unuseddesc = {
680 optional => 1,
681 type => 'string', format => 'pve-volume-id',
682 description => "Reference to unused volumes.",
683};
684
685for (my $i = 0; $i < $MAX_UNUSED_DISKS; $i++) {
686 $confdesc->{"unused$i"} = $unuseddesc;
687}
688
# cached result of kvm_version(); 0 means "not determined yet"
my $kvm_api_version = 0;

# Return the KVM API version reported by the KVM_GET_API_VERSION ioctl on
# /dev/kvm. A non-zero result is cached for later calls.
# Returns 0 when /dev/kvm cannot be opened or the ioctl yields a false value.
sub kvm_version {
    return $kvm_api_version if $kvm_api_version;

    my $fh = IO::File->new("</dev/kvm");
    return 0 if !$fh;

    my $v = $fh->ioctl(KVM_GET_API_VERSION(), 0);
    $kvm_api_version = $v if $v;

    $fh->close();

    return $kvm_api_version;
}
706
# cached result of kvm_user_version()
my $kvm_user_version;

# Return the version string printed at the start of the "kvm -help" output,
# or 'unknown' when that output does not begin with the expected banner.
# The result is cached after the first call.
sub kvm_user_version {
    return $kvm_user_version if $kvm_user_version;

    my $help_text = `kvm -help 2>/dev/null`;

    # the second capture group holds the version number
    my (undef, $version) = $help_text =~ m/^QEMU( PC)? emulator version (\d+\.\d+(\.\d+)?)[,\s]/;

    $kvm_user_version = defined($version) ? $version : 'unknown';

    return $kvm_user_version;
}
724
725my $kernel_has_vhost_net = -c '/dev/vhost-net';
726
# Return the list of all drive option names (ide0.., scsi0.., virtio0..,
# sata0..), numbered from 0 up to the respective $MAX_*_DISKS - 1.
sub disknames {
    my $enumerate = sub {
        my ($bus, $count) = @_;
        return map { "$bus$_" } (0 .. ($count - 1));
    };

    # order is important - used to autoselect boot disk
    return ($enumerate->('ide', $MAX_IDE_DISKS),
            $enumerate->('scsi', $MAX_SCSI_DISKS),
            $enumerate->('virtio', $MAX_VIRTIO_DISKS),
            $enumerate->('sata', $MAX_SATA_DISKS));
}
734
# Return true if $dev is one of the drive names recorded in $drivename_hash.
sub valid_drivename {
    my ($dev) = @_;

    my $known = $drivename_hash->{$dev};

    return defined($known);
}
740
# Return true if $key has an entry in the $confdesc option schema.
sub option_exists {
    my ($key) = @_;

    my $schema = $confdesc->{$key};

    return defined($schema);
}
1e3baf05
DM
745
# Return the array reference holding the supported NIC model names.
# The shared reference itself is returned, not a copy.
sub nic_models {
    return $nic_model_list;
}
749
# Return a hash reference mapping ostype identifiers to human readable
# operating system names.
sub os_list_description {

    return {
        other => 'Other',
        wxp => 'Windows XP',
        w2k => 'Windows 2000',
        w2k3 => 'Windows 2003', # stray comma after '=>' removed
        w2k8 => 'Windows 2008',
        wvista => 'Windows Vista',
        win7 => 'Windows 7',
        win8 => 'Windows 8/2012',
        l24 => 'Linux 2.4',
        l26 => 'Linux 2.6',
    };
}
765
1e3baf05
DM
# cached result of get_cdrom_path()
my $cdrom_path;

# Return the first of /dev/cdrom, /dev/cdrom1, /dev/cdrom2 that is a
# symbolic link, caching the answer for later calls.
# Returns undef when none of them is a symlink (previously the sub fell off
# its end and returned the leftover value of the last file test).
sub get_cdrom_path {

    return $cdrom_path if $cdrom_path;

    foreach my $candidate (qw(/dev/cdrom /dev/cdrom1 /dev/cdrom2)) {
        return $cdrom_path = $candidate if -l $candidate;
    }

    return undef;
}
776
# Resolve the file setting of a CD-ROM drive to a path:
#   'cdrom'       -> result of get_cdrom_path()
#   'none'        -> empty string
#   absolute path -> returned unchanged
#   anything else -> resolved through PVE::Storage::path()
sub get_iso_path {
    my ($storecfg, $vmid, $cdrom) = @_;

    return get_cdrom_path() if $cdrom eq 'cdrom';
    return '' if $cdrom eq 'none';
    return $cdrom if $cdrom =~ m|^/|;

    return PVE::Storage::path($storecfg, $cdrom);
}
790
# Try to convert old style file names to volume IDs.
# 'none', 'cdrom', /dev/... paths and values already shaped like
# "storage:volume" are returned unchanged. Any other value containing a
# slash yields undef. Plain names become "local:iso/NAME" for cdrom media
# and "local:VMID/NAME" otherwise.
sub filename_to_volume_id {
    my ($vmid, $file, $media) = @_;

    return $file if $file eq 'none' || $file eq 'cdrom';
    return $file if $file =~ m|^/dev/.+|;
    return $file if $file =~ m/^([^:]+):(.+)$/;

    return undef if $file =~ m|/|;

    my $is_cdrom = $media && $media eq 'cdrom';

    return $is_cdrom ? "local:iso/$file" : "local:$vmid/$file";
}
809
# Check that volume type $vtype fits the drive's media setting:
# media 'disk' expects 'images', media 'cdrom' expects 'iso'.
# Returns silently when $media is unset or the types agree, dies with
# "internal error" for any other media value, and raises a parameter
# exception keyed by $opt on a mismatch.
sub verify_media_type {
    my ($opt, $vtype, $media) = @_;

    return if !$media;

    my %expected_type_for = (
        disk => 'images',
        cdrom => 'iso',
    );

    my $etype = $expected_type_for{$media};
    die "internal error" if !defined($etype);

    return if $vtype eq $etype;

    raise_param_exc({ $opt => "unexpected media type ($vtype != $etype)" });
}
828
# Normalise the 'file' and 'media' entries of the drive hash $drive in place.
# A file value that is not 'cdrom'/'none', not a /dev/ path, not shaped like
# "storage:volume" and not purely numeric is mapped to a volume ID through
# PVE::Storage::path_to_volume_id(); a parameter exception keyed by $opt is
# raised when no storage matches. Media defaults to 'cdrom' for iso volumes
# and for the 'cdrom'/'none' keywords.
sub cleanup_drive_path {
    my ($opt, $storecfg, $drive) = @_;

    my $file = $drive->{file};

    # try to convert filesystem paths to volume IDs
    my $is_fs_path = $file !~ m/^(cdrom|none)$/
        && $file !~ m|^/dev/.+|
        && $file !~ m/^([^:]+):(.+)$/
        && $file !~ m/^\d+$/;

    if ($is_fs_path) {
        my ($vtype, $volid) = PVE::Storage::path_to_volume_id($storecfg, $file);
        raise_param_exc({ $opt => "unable to associate path '$drive->{file}' to any storage"}) if !$vtype;
        $drive->{media} = 'cdrom' if !$drive->{media} && $vtype eq 'iso';
        verify_media_type($opt, $vtype, $drive->{media});
        $drive->{file} = $volid;
    }

    $drive->{media} = 'cdrom' if !$drive->{media} && $drive->{file} =~ m/^(cdrom|none)$/;
}
# Write a new configuration file for $vmid from the $settings hash without
# taking any lock. Dies if the file already exists.
# 'name' falls back to "vm$vmid" and 'memory' to the loaded default when
# unset. Only options known to $confdesc that have a true value are written,
# one "key: value" line each. $settings is modified in place.
sub create_conf_nolock {
    my ($vmid, $settings) = @_;

    my $filename = config_file($vmid);

    die "configuration file '$filename' already exists\n" if -f $filename;

    my $defaults = load_defaults();

    $settings->{name} ||= "vm$vmid";
    $settings->{memory} ||= $defaults->{memory};

    # skip unknown options and options whose value is false
    my @writable = grep { $confdesc->{$_} && $settings->{$_} } keys %$settings;

    my $data = join('', map { "$_: $settings->{$_}\n" } @writable);

    PVE::Tools::file_set_contents($filename, $data);
}
872
f36ed4f4
DM
# Parse a size such as "512", "1.5M" or "4G" into an integer.
# The optional suffix K, M or G multiplies by 1024, 1024^2 or 1024^3;
# the result is truncated with int().
# Returns undef when the value does not match the expected format.
my $parse_size = sub {
    my ($value) = @_;

    my %factor_for = (
        K => 1024,
        M => 1024 * 1024,
        G => 1024 * 1024 * 1024,
    );

    return undef if $value !~ m/^(\d+(\.\d+)?)([KMG])?$/;
    my ($size, $unit) = ($1, $3);

    $size = $size * $factor_for{$unit} if $unit;

    return int($size);
};
889
# Format an integer size using the largest of the suffixes K, M, G that
# divides it evenly by 1024 at every step. Values that are not a multiple
# of 1024 are returned as plain integers.
my $format_size = sub {
    my ($size) = @_;

    my $amount = int($size);
    my $suffix = '';

    foreach my $unit (qw(K M G)) {
        my $scaled = int($amount / 1024);
        # stop as soon as the next unit would lose precision
        last if $scaled * 1024 != $amount;
        ($amount, $suffix) = ($scaled, $unit);
    }

    return $suffix eq '' ? $amount : "${amount}${suffix}";
};
906
1e3baf05
DM
# ideX = [volume=]volume-id[,media=disk|cdrom][,cyls=c,heads=h,secs=s[,trans=none|lba|auto]]
#        [,snapshot=on|off][,cache=off|none|writethrough|writeback|unsafe|directsync]
#        [,format=f][,backup=yes|no]
#        [,rerror=ignore|report|stop][,werror=enospc|ignore|report|stop]
#        [,aio=native|threads][,discard=ignore|on][,size=n[K|M|G]]
#        [,mbps=..][,mbps_rd=..][,mbps_wr=..][,iops=..][,iops_rd=..][,iops_wr=..]
#        (plus the corresponding *_max settings)
#
# Parse a drive property string.
#
# $key  - option name (e.g. 'ide0'); split into {interface} and {index}. May
#         be undef when the string is only verified as JSON parameter.
# $data - comma separated list of settings as shown above. The legacy
#         settings bps, bps_rd and bps_wr (bytes per second) are converted to
#         the corresponding mbps settings.
#
# Returns a hash ref with the parsed settings, or undef if $key or $data is
# not valid.
sub parse_drive {
    my ($key, $data) = @_;

    my $res = {};

    # $key may be undefined - used to verify JSON parameters
    if (!defined($key)) {
        $res->{interface} = 'unknown'; # should not harm when used to verify parameters
        $res->{index} = 0;
    } elsif ($key =~ m/^([^\d]+)(\d+)$/) {
        $res->{interface} = $1;
        $res->{index} = $2;
    } else {
        return undef;
    }

    foreach my $p (split (/,/, $data)) {
        next if $p =~ m/^\s*$/;

        if ($p =~ m/^(file|volume|cyls|heads|secs|trans|media|snapshot|cache|format|rerror|werror|backup|aio|bps|mbps|mbps_max|bps_rd|mbps_rd|mbps_rd_max|bps_wr|mbps_wr|mbps_wr_max|iops|iops_max|iops_rd|iops_rd_max|iops_wr|iops_wr_max|size|discard)=(.+)$/) {
            my ($k, $v) = ($1, $2);

            $k = 'file' if $k eq 'volume';

            if ($k eq 'bps' || $k eq 'bps_rd' || $k eq 'bps_wr') {
                # the whole value must be a positive integer (bytes per second)
                return undef if !$v || $v !~ m/^\d+$/;
                $k = "m$k";
                $v = sprintf("%.3f", $v / (1024*1024));
            }

            # check for duplicates after the key was normalized, so that
            # 'volume'/'file' and 'bps'/'mbps' can not overwrite each other
            return undef if defined $res->{$k};

            $res->{$k} = $v;
        } else {
            # a setting without '=' is the volume, but only once
            if (!$res->{file} && $p !~ m/=/) {
                $res->{file} = $p;
            } else {
                return undef;
            }
        }
    }

    return undef if !$res->{file};

    # a known file extension determines the format
    if ($res->{file} =~ m/\.(raw|cow|qcow|qcow2|vmdk|cloop)$/) {
        $res->{format} = $1;
    }

    my %allowed_values = (
        cache => qr/^(off|none|writethrough|writeback|unsafe|directsync)$/,
        snapshot => qr/^(on|off)$/,
        media => qr/^(disk|cdrom)$/,
        trans => qr/^(none|lba|auto)$/,
        format => qr/^(raw|cow|qcow|qcow2|vmdk|cloop)$/,
        rerror => qr/^(ignore|report|stop)$/,
        werror => qr/^(enospc|ignore|report|stop)$/,
        backup => qr/^(yes|no)$/,
        aio => qr/^(native|threads)$/,
        discard => qr/^(ignore|on)$/,
    );
    foreach my $opt (keys %allowed_values) {
        return undef if $res->{$opt} && $res->{$opt} !~ $allowed_values{$opt};
    }

    foreach my $opt (qw(cyls heads secs)) {
        return undef if $res->{$opt} && $res->{$opt} !~ m/^\d+$/;
    }

    # the combined limit excludes the separate read/write limits
    return undef if $res->{mbps_rd} && $res->{mbps};
    return undef if $res->{mbps_wr} && $res->{mbps};

    foreach my $opt (qw(mbps mbps_max mbps_rd mbps_rd_max mbps_wr mbps_wr_max)) {
        return undef if $res->{$opt} && $res->{$opt} !~ m/^\d+(\.\d+)?$/;
    }

    return undef if $res->{iops_rd} && $res->{iops};
    return undef if $res->{iops_wr} && $res->{iops};

    foreach my $opt (qw(iops iops_max iops_rd iops_rd_max iops_wr iops_wr_max)) {
        return undef if $res->{$opt} && $res->{$opt} !~ m/^\d+$/;
    }

    if ($res->{size}) {
        $res->{size} = $parse_size->($res->{size});
        return undef if !defined($res->{size});
    }

    if ($res->{media} && ($res->{media} eq 'cdrom')) {
        return undef if $res->{snapshot} || $res->{trans} || $res->{format};
        return undef if $res->{heads} || $res->{secs} || $res->{cyls};
        return undef if $res->{interface} eq 'virtio';
    }

    # rerror does not work with scsi drives
    if ($res->{rerror}) {
        return undef if $res->{interface} eq 'scsi';
    }

    return $res;
}
1013
# Drive settings that are written as "name=value" both to the configuration
# (print_drive) and to the qemu drive definition (print_drive_full).
my @qemu_drive_options = qw(heads secs cyls trans media format cache snapshot rerror werror aio discard iops iops_rd iops_wr iops_max iops_rd_max iops_wr_max);

# Serialize a parsed drive hash into the property string used in the
# configuration: the volume followed by all settings with a true value.
# $vmid is not used.
sub print_drive {
    my ($vmid, $drive) = @_;

    my @option_names = (
        @qemu_drive_options,
        'mbps', 'mbps_rd', 'mbps_wr', 'mbps_max', 'mbps_rd_max', 'mbps_wr_max', 'backup',
    );

    my @parts = map { ",$_=$drive->{$_}" } grep { $drive->{$_} } @option_names;

    if ($drive->{size}) {
        push @parts, ",size=" . $format_size->($drive->{size});
    }

    return join('', "$drive->{file}", @parts);
}
1030
28ef82d3
DM
# Send a SCSI INQUIRY command to an open device using the SCSI generic
# (SG_IO) ioctl interface.
#
# $fh    - open file handle of the device
# $noerr - if true, return undef on errors instead of raising an exception
#
# Returns a hash ref with the keys vendor, product, revision, removable (0/1)
# and type (lower 5 bits of the first byte of the response).
sub scsi_inquiry {
    my($fh, $noerr) = @_;

    my $SG_IO = 0x2285;
    my $SG_GET_VERSION_NUM = 0x2282;

    my $versionbuf = "\x00" x 8;
    my $ret = ioctl($fh, $SG_GET_VERSION_NUM, $versionbuf);
    if (!$ret) {
        die "scsi ioctl SG_GET_VERSION_NUM failed - $!\n" if !$noerr;
        return undef;
    }
    my $version = unpack("I", $versionbuf);
    if ($version < 30000) {
        die "scsi generic interface too old\n" if !$noerr;
        return undef;
    }

    # 6 byte command block: opcode 0x12 with an allocation length of 36 bytes
    my $buf = "\x00" x 36;
    my $sensebuf = "\x00" x 8;
    my $cmd = pack("C x3 C x1", 0x12, 36);

    # see /usr/include/scsi/sg.h
    my $sg_io_hdr_t = "i i C C s I P P P I I i P C C C C S S i I I";

    my $packet = pack($sg_io_hdr_t, ord('S'), -3, length($cmd),
                      length($sensebuf), 0, length($buf), $buf,
                      $cmd, $sensebuf, 6000);

    $ret = ioctl($fh, $SG_IO, $packet);
    if (!$ret) {
        die "scsi ioctl SG_IO failed - $!\n" if !$noerr;
        return undef;
    }

    # fields 17 and 18 of the header are the two 'S' values following the
    # four status bytes (presumably host_status and driver_status in sg.h)
    my @res = unpack($sg_io_hdr_t, $packet);
    if ($res[17] || $res[18]) {
        die "scsi ioctl SG_IO status error - $!\n" if !$noerr;
        return undef;
    }

    my ($byte0, $byte1, $vendor, $product, $revision) =
        unpack("C C x6 A8 A16 A4", $buf);

    my $res = {
        vendor => $vendor,
        product => $product,
        revision => $revision,
    };

    $res->{removable} = $byte1 & 128 ? 1 : 0;
    $res->{type} = $byte0 & 31;

    return $res;
}
1081
# Test if $path is a SCSI device by sending an inquiry to it.
#
# Returns the result of scsi_inquiry() (a hash ref), or undef if the path
# can't be opened for read/write or the inquiry fails.
sub path_is_scsi {
    my ($path) = @_;

    # pass the mode as separate argument, so that $path is used verbatim and
    # never parsed for mode characters or stripped of whitespace
    my $fh = IO::File->new($path, '+<') || return undef;
    my $res = scsi_inquiry($fh, 1);
    close($fh);

    return $res;
}
1091
db656e5f
DM
# Returns 1 if the 'machine' setting of $conf contains 'q35', else 0.
sub machine_type_is_q35 {
    my ($conf) = @_;

    my $machine = $conf->{machine};

    return 1 if $machine && ($machine =~ m/q35/);

    return 0;
}
1097
# Returns the qemu device string for the USB tablet. The tablet is attached
# to the ehci bus on q35 machines, and to the uhci bus on all others.
sub print_tabletdevice_full {
    my ($conf) = @_;

    # we use uhci for old VMs because tablet driver was buggy in older qemu
    my $usbbus = "uhci";
    $usbbus = "ehci" if machine_type_is_q35($conf);

    return "usb-tablet,id=tablet,bus=$usbbus.0,port=1";
}
1108
# Returns the qemu device string for a drive.
#
# $storecfg - storage configuration, used to resolve volume ids of scsi drives
# $conf     - VM configuration (the settings 'iothread' and 'scsihw' are used)
# $vmid     - not used
# $drive    - parsed drive hash (see parse_drive)
# $bridges  - passed to print_pci_addr for virtio drives
#
# Dies for 'usb' drives (not implemented) and unknown interface types.
sub print_drivedevice_full {
    my ($storecfg, $conf, $vmid, $drive, $bridges) = @_;

    my $interface = $drive->{interface};
    my $index = $drive->{index};
    my $id = "$interface$index";

    my $device = '';

    if ($interface eq 'virtio') {
        my $pciaddr = print_pci_addr($id, $bridges);
        $device = "virtio-blk-pci,drive=drive-$id,id=$id$pciaddr";
        $device .= ",iothread=iothread0" if $conf->{iothread};
    } elsif ($interface eq 'scsi') {
        # no controller type configured means lsi
        my $is_lsi = !$conf->{scsihw} || ($conf->{scsihw} =~ m/^lsi/);
        my $maxdev = $is_lsi ? 7 : 256;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;

        my $devicetype = 'hd';
        if (drive_is_cdrom($drive)) {
            $devicetype = 'cd';
        } else {
            my $path = ($drive->{file} =~ m|^/|)
                ? $drive->{file}
                : PVE::Storage::path($storecfg, $drive->{file});

            if ($path =~ m/^iscsi\:\/\//) {
                $devicetype = 'generic';
            } elsif (my $info = path_is_scsi($path)) {
                if ($info->{type} == 0) {
                    $devicetype = 'block';
                } elsif ($info->{type} == 1) { # tape
                    $devicetype = 'generic';
                }
            }
        }

        if ($is_lsi) {
            $device = "scsi-$devicetype,bus=scsihw$controller.0,scsi-id=$unit,drive=drive-$id,id=$id";
        } else {
            $device = "scsi-$devicetype,bus=scsihw$controller.0,channel=0,scsi-id=0,lun=$index,drive=drive-$id,id=$id";
        }
    } elsif ($interface eq 'ide') {
        my $maxdev = 2;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;

        my $devicetype = "hd";
        $devicetype = "cd" if $drive->{media} && $drive->{media} eq 'cdrom';

        $device = "ide-$devicetype,bus=ide.$controller,unit=$unit,drive=drive-$id,id=$id";
    } elsif ($interface eq 'sata') {
        my $controller = int($index / $MAX_SATA_DISKS);
        my $unit = $index % $MAX_SATA_DISKS;
        $device = "ide-drive,bus=ahci$controller.$unit,drive=drive-$id,id=$id";
    } elsif ($interface eq 'usb') {
        die "implement me";
        # -device ide-drive,bus=ide.1,unit=0,drive=drive-ide0-1-0,id=ide0-1-0
    } else {
        die "unsupported interface type";
    }

    if ($drive->{bootindex}) {
        $device .= ",bootindex=$drive->{bootindex}";
    }

    return $device;
}
1175
# Read the iSCSI initiator name from /etc/iscsi/initiatorname.iscsi.
#
# Returns the value of the first 'InitiatorName=' line, or undef if the file
# can't be opened or contains no such line.
sub get_initiator_name {
    my $fh = IO::File->new('/etc/iscsi/initiatorname.iscsi') || return undef;

    my $initiator;
    while (defined(my $line = <$fh>)) {
        if ($line =~ m/^\s*InitiatorName\s*=\s*([\.\-:\w]+)/) {
            $initiator = $1;
            last;
        }
    }

    $fh->close();

    return $initiator;
}
1189
1e3baf05
DM
# Returns the qemu drive definition (without the leading option name) for a
# parsed drive hash.
#
# $storecfg - storage configuration, used to resolve the volume id
# $vmid     - passed to get_iso_path for cdrom drives
# $drive    - parsed drive hash (see parse_drive)
sub print_drive_full {
    my ($storecfg, $vmid, $drive) = @_;

    my $is_cdrom = drive_is_cdrom($drive);

    my @opts;
    foreach my $o (@qemu_drive_options) {
        next if $o eq 'bootindex';
        push @opts, ",$o=$drive->{$o}" if $drive->{$o};
    }

    # the limits are stored in MB/s, but passed in bytes/s
    foreach my $o (qw(bps bps_rd bps_wr)) {
        my $v = $drive->{"m$o"};
        push @opts, ",$o=" . int($v*1024*1024) if $v;
    }

    # use linux-aio by default (qemu default is threads)
    push @opts, ",aio=native" if !$drive->{aio};

    my $volid = $drive->{file};
    my $path;
    if ($is_cdrom) {
        $path = get_iso_path($storecfg, $vmid, $volid);
    } elsif ($volid =~ m|^/|) {
        $path = $volid;
    } else {
        $path = PVE::Storage::path($storecfg, $volid);
    }

    if (!$is_cdrom) {
        push @opts, ",cache=none" if !$drive->{cache};

        my $detectzeroes = $drive->{discard} ? "unmap" : "on";
        push @opts, ",detect-zeroes=$detectzeroes";
    }

    my $pathinfo = $path ? "file=$path," : '';

    return join('', "${pathinfo}if=none,id=drive-$drive->{interface}$drive->{index}", @opts);
}
1228
# Returns the qemu device string for a network device.
#
# $vmid    - not used
# $conf    - VM configuration (only the 'boot' setting is used)
# $net     - parsed network hash (see parse_net)
# $netid   - device id (e.g. 'net0')
# $bridges - passed to print_pci_addr
sub print_netdevice_full {
    my ($vmid, $conf, $net, $netid, $bridges) = @_;

    my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};

    my $is_virtio = $net->{model} eq 'virtio';
    my $device = $is_virtio ? 'virtio-net-pci' : $net->{model};

    # qemu > 0.15 always try to boot from network - we disable that by
    # not loading the pxe rom file
    my $extra = '';
    $extra = "romfile=," if $bootorder !~ m/n/;

    my $pciaddr = print_pci_addr("$netid", $bridges);

    my $tmpstr = "$device,${extra}mac=$net->{macaddr},netdev=$netid$pciaddr,id=$netid";

    if ($net->{queues} && $net->{queues} > 1 && $is_virtio) {
        #Consider we have N queues, the number of vectors needed is 2*N + 2 (plus one config interrupt and control vq)
        my $vectors = $net->{queues} * 2 + 2;
        $tmpstr .= ",vectors=$vectors,mq=on";
    }

    if ($net->{bootindex}) {
        $tmpstr .= ",bootindex=$net->{bootindex}";
    }

    return $tmpstr;
}
1252
# Returns the qemu netdev definition for a network device.
#
# $vmid  - id of the VM, used for the name of the tap interface
# $conf  - VM configuration (only the 'name' setting is used)
# $net   - parsed network hash (see parse_net)
# $netid - device id, must be of the form 'netN' with N < $MAX_NETS
#
# Dies if $netid is not valid or the resulting interface name is too long.
sub print_netdev_full {
    my ($vmid, $conf, $net, $netid) = @_;

    # reject malformed ids - else we would silently generate an interface
    # name without index
    die "got strange net id '$netid'\n" if $netid !~ m/^net(\d+)$/;
    my $i = int($1);

    die "got strange net id '$i'\n" if $i >= ${MAX_NETS};

    my $ifname = "tap${vmid}i$i";

    # kvm uses TUNSETIFF ioctl, and that limits ifname length
    die "interface name '$ifname' is too long (max 15 character)\n"
        if length($ifname) >= 16;

    my $vhostparam = '';
    $vhostparam = ',vhost=on' if $kernel_has_vhost_net && $net->{model} eq 'virtio';

    my $vmname = $conf->{name} || "vm$vmid";

    my $netdev = "";

    if ($net->{bridge}) {
        $netdev = "type=tap,id=$netid,ifname=${ifname},script=/var/lib/qemu-server/pve-bridge,downscript=/var/lib/qemu-server/pve-bridgedown$vhostparam";
    } else {
        $netdev = "type=user,id=$netid,hostname=$vmname";
    }

    $netdev .= ",queues=$net->{queues}" if ($net->{queues} && $net->{model} eq 'virtio');

    return $netdev;
}
1e3baf05
DM
1286
# Returns a true value if $drive is defined and its media type is 'cdrom'.
sub drive_is_cdrom {
    my ($drive) = @_;

    return $drive if !$drive;

    my $media = $drive->{media};
    return $media if !$media;

    return $media eq 'cdrom';
}
1293
2ed5d572
AD
# Parse a numa property string with the settings memory=<value>,
# policy=preferred|bind|interleave, cpus=<start>[-<end>] and
# hostnodes=<start>[-<end>].
#
# Returns a hash ref (cpus and hostnodes are hash refs with the keys 'start'
# and 'end'), or undef if a setting is unknown or malformed.
sub parse_numa {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        if ($kvp =~ m/^memory=(\S+)$/) {
            $res->{memory} = $1;
            next;
        }
        if ($kvp =~ m/^policy=(preferred|bind|interleave)$/) {
            $res->{policy} = $1;
            next;
        }
        if ($kvp =~ m/^cpus=(\d+)(-(\d+))?$/) {
            my ($start, $end) = ($1, $3);
            $res->{cpus}->{start} = $start;
            $res->{cpus}->{end} = $end;
            next;
        }
        if ($kvp =~ m/^hostnodes=(\d+)(-(\d+))?$/) {
            my ($start, $end) = ($1, $3);
            $res->{hostnodes}->{start} = $start;
            $res->{hostnodes}->{end} = $end;
            next;
        }

        return undef;
    }

    return $res;
}
1318
040b06b7
DA
# Parse a hostpci property string:
#   [host=]<bus:slot>[.<function>][,driver=kvm|vfio][,rombar=on|off]
#   [,x-vga=on|off][,pcie=<number>]
#
# Without a function, the device list is looked up with lspci(). Unknown
# settings only produce a warning.
#
# Returns a hash ref, or undef if $value is empty or contains no device.
sub parse_hostpci {
    my ($value) = @_;

    return undef if !$value;

    my $found;
    my $res = {};

    foreach my $kv (split(/,/, $value)) {
        if ($kv =~ m/^(host=)?([a-f0-9]{2}:[a-f0-9]{2})(\.([a-f0-9]))?$/) {
            my ($id, $function) = ($2, $4);
            $found = 1;
            if (defined($function)) {
                push @{$res->{pciid}}, { id => $id , function => $function };
            } else {
                my $pcidevices = lspci($id);
                $res->{pciid} = $pcidevices->{$id};
            }
        } elsif ($kv =~ m/^driver=(kvm|vfio)$/) {
            $res->{driver} = $1;
        } elsif ($kv =~ m/^rombar=(on|off)$/) {
            $res->{rombar} = $1;
        } elsif ($kv =~ m/^x-vga=(on|off)$/) {
            $res->{'x-vga'} = $1;
        } elsif ($kv =~ m/^pcie=(\d+)$/) {
            $res->{pcie} = 1 if $1 == 1;
        } else {
            warn "unknown hostpci setting '$kv'\n";
        }
    }

    return $found ? $res : undef;
}
1357
1e3baf05
DM
# netX: e1000=XX:XX:XX:XX:XX:XX,bridge=vmbr0,rate=<mbps>
#
# Parse a network property string. Beside the model (with optional MAC
# address), the settings bridge, queues, rate, tag and firewall are known.
# A random MAC address is generated if none is specified.
#
# Returns a hash ref, or undef if a setting is unknown or the model is missing.
sub parse_net {
    my ($data) = @_;

    my %net;

    foreach my $kvp (split(/,/, $data)) {
        if ($kvp =~ m/^(ne2k_pci|e1000|rtl8139|pcnet|virtio|ne2k_isa|i82551|i82557b|i82559er|vmxnet3)(=([0-9a-f]{2}(:[0-9a-f]{2}){5}))?$/i) {
            my ($model, $mac) = ($1, $3);
            $net{model} = lc($model);
            $net{macaddr} = defined($mac) ? uc($mac) : PVE::Tools::random_ether_addr();
            next;
        }
        if ($kvp =~ m/^bridge=(\S+)$/) {
            $net{bridge} = $1;
            next;
        }
        if ($kvp =~ m/^queues=(\d+)$/) {
            $net{queues} = $1;
            next;
        }
        if ($kvp =~ m/^rate=(\d+(\.\d+)?)$/) {
            $net{rate} = $1;
            next;
        }
        if ($kvp =~ m/^tag=(\d+)$/) {
            $net{tag} = $1;
            next;
        }
        if ($kvp =~ m/^firewall=(\d+)$/) {
            $net{firewall} = $1;
            next;
        }

        return undef;
    }

    return undef if !$net{model};

    return \%net;
}
1391
# Serialize a parsed network hash (see parse_net) into a property string.
# Settings with a false value are omitted.
sub print_net {
    my $net = shift;

    my $res = "$net->{model}";
    $res .= "=$net->{macaddr}" if $net->{macaddr};
    $res .= ",bridge=$net->{bridge}" if $net->{bridge};
    $res .= ",rate=$net->{rate}" if $net->{rate};
    $res .= ",tag=$net->{tag}" if $net->{tag};
    $res .= ",firewall=$net->{firewall}" if $net->{firewall};
    # parse_net knows 'queues', so we must not lose it when a string is
    # parsed and printed again (add_random_macs)
    $res .= ",queues=$net->{queues}" if $net->{queues};

    return $res;
}
1404
# Parse and print all netX settings in $settings again (in place). parse_net
# generates a MAC address for devices without one. Settings which can't be
# parsed are left unchanged.
sub add_random_macs {
    my ($settings) = @_;

    foreach my $opt (grep { $_ =~ m/^net(\d+)$/ } keys %$settings) {
        if (my $net = parse_net($settings->{$opt})) {
            $settings->{$opt} = print_net($net);
        }
    }
}
1415
# Record $volid in the free 'unusedN' setting with the lowest index.
#
# Returns the name of the setting. Returns nothing (and does not change
# $config) if the volume is already recorded as unused. Dies if there is no
# free setting left.
sub add_unused_volume {
    my ($config, $volid) = @_;

    my $key;
    foreach my $ind (0 .. $MAX_UNUSED_DISKS - 1) {
        my $test = "unused$ind";
        my $vid = $config->{$test};

        if ($vid) {
            return if $vid eq $volid; # do not add duplicates
            next;
        }

        $key = $test if !defined($key);
    }

    die "To many unused volume - please delete them first.\n" if !$key;

    $config->{$key} = $volid;

    return $key;
}
1435
2796e7d5
DM
# Known smbios (type 1) settings, with the regular expression (as string) the
# whole value has to match.
my $valid_smbios1_options = {
    manufacturer => '\S+',
    product => '\S+',
    version => '\S+',
    serial => '\S+',
    uuid => '[a-fA-F0-9]{8}(?:-[a-fA-F0-9]{4}){3}-[a-fA-F0-9]{12}',
    sku => '\S+',
    family => '\S+',
};

# smbios: [manufacturer=str][,product=str][,version=str][,serial=str][,uuid=uuid][,sku=str][,family=str]
#
# Parse a smbios (type 1) property string.
#
# Returns a hash ref with the settings, or undef if a setting is unknown or
# its value is not valid.
sub parse_smbios1 {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        return undef if $kvp !~ m/^(\S+)=(.+)$/;
        # split at the first '=' only - else values containing '=' are truncated
        my ($k, $v) = split(/=/, $kvp, 2);
        return undef if !defined($k) || !defined($v);
        return undef if !$valid_smbios1_options->{$k};
        return undef if $v !~ m/^$valid_smbios1_options->{$k}$/;
        $res->{$k} = $v;
    }

    return $res;
}
1463
cd11416f
DM
# Serialize a smbios (type 1) hash into a comma separated list of key=value
# pairs. Undefined values and unknown settings are skipped.
sub print_smbios1 {
    my ($smbios1) = @_;

    my @known = grep {
        defined($smbios1->{$_}) && $valid_smbios1_options->{$_}
    } keys %$smbios1;

    return join(',', map { "$_=$smbios1->{$_}" } @known);
}
1476
2796e7d5
DM
PVE::JSONSchema::register_format('pve-qm-smbios1', \&verify_smbios1);

# Format check for 'pve-qm-smbios1'. Returns $value if it can be parsed.
# Else it returns undef if $noerr is set, and dies otherwise.
sub verify_smbios1 {
    my ($value, $noerr) = @_;

    if (!parse_smbios1($value)) {
        die "unable to parse smbios (type 1) options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1487
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-bootdisk', \&verify_bootdisk);

# Format check for 'pve-qm-bootdisk'. Returns $value if it is a valid drive
# name. Else it returns undef if $noerr is set, and dies otherwise.
sub verify_bootdisk {
    my ($value, $noerr) = @_;

    if (!valid_drivename($value)) {
        die "invalid boot disk '$value'\n" if !$noerr;
        return undef;
    }

    return $value;
}
1498
2ed5d572
AD
PVE::JSONSchema::register_format('pve-qm-numanode', \&verify_numa);

# Format check for 'pve-qm-numanode'. Returns $value if it can be parsed.
# Else it returns undef if $noerr is set, and dies otherwise.
sub verify_numa {
    my ($value, $noerr) = @_;

    if (!parse_numa($value)) {
        die "unable to parse numa options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1509
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-net', \&verify_net);

# Format check for 'pve-qm-net'. Returns $value if it can be parsed.
# Else it returns undef if $noerr is set, and dies otherwise.
sub verify_net {
    my ($value, $noerr) = @_;

    if (!parse_net($value)) {
        die "unable to parse network options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1520
PVE::JSONSchema::register_format('pve-qm-drive', \&verify_drive);

# Format check for 'pve-qm-drive'. The value is parsed without a drive name.
# Returns $value if it can be parsed. Else it returns undef if $noerr is set,
# and dies otherwise.
sub verify_drive {
    my ($value, $noerr) = @_;

    if (!parse_drive(undef, $value)) {
        die "unable to parse drive options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1531
PVE::JSONSchema::register_format('pve-qm-hostpci', \&verify_hostpci);

# Format check for 'pve-qm-hostpci'. Returns $value if it can be parsed.
# Else it returns undef if $noerr is set, and dies otherwise.
sub verify_hostpci {
    my ($value, $noerr) = @_;

    if (!parse_hostpci($value)) {
        die "unable to parse pci id\n" if !$noerr;
        return undef;
    }

    return $value;
}
1542
0ea9541d
DM
PVE::JSONSchema::register_format('pve-qm-watchdog', \&verify_watchdog);

# Format check for 'pve-qm-watchdog'. Returns $value if it can be parsed.
# Else it returns undef if $noerr is set, and dies otherwise.
sub verify_watchdog {
    my ($value, $noerr) = @_;

    if (!parse_watchdog($value)) {
        die "unable to parse watchdog options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1553
# Parse a watchdog property string:
#   [model=]i6300esb|ib700[,[action=]reset|shutdown|poweroff|pause|debug|none]
#
# Returns a hash ref with the keys 'model' and 'action' (as far as
# specified), or undef if $value is empty or contains an unknown setting.
sub parse_watchdog {
    my ($value) = @_;

    return undef if !$value;

    my %watchdog;

    foreach my $p (split(/,/, $value)) {
        next if $p =~ m/^\s*$/;

        if ($p =~ m/^(model=)?(i6300esb|ib700)$/) {
            $watchdog{model} = $2;
            next;
        }
        if ($p =~ m/^(action=)?(reset|shutdown|poweroff|pause|debug|none)$/) {
            $watchdog{action} = $2;
            next;
        }

        return undef;
    }

    return \%watchdog;
}
1575
59411c4e
DM
PVE::JSONSchema::register_format('pve-qm-startup', \&verify_startup);

# Format check for 'pve-qm-startup'. Returns $value if it can be parsed.
# Else it returns undef if $noerr is set, and dies otherwise.
sub verify_startup {
    my ($value, $noerr) = @_;

    if (!parse_startup($value)) {
        die "unable to parse startup options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1586
# Parse a startup property string: [[order=]<number>][,up=<number>][,down=<number>]
#
# Returns a hash ref with the keys 'order', 'up' and 'down' (as far as
# specified), or undef if $value is false or contains an unknown setting.
sub parse_startup {
    my ($value) = @_;

    return undef if !$value;

    my %startup;

    foreach my $p (split(/,/, $value)) {
        next if $p =~ m/^\s*$/;

        if ($p =~ m/^(order=)?(\d+)$/) {
            $startup{order} = $2;
            next;
        }
        if ($p =~ m/^up=(\d+)$/) {
            $startup{up} = $1;
            next;
        }
        if ($p =~ m/^down=(\d+)$/) {
            $startup{down} = $1;
            next;
        }

        return undef;
    }

    return \%startup;
}
1610
1e3baf05
DM
# Parse a usb device property string. Known settings are:
#   host=[0x]<vendorid>:[0x]<productid>  (4 hex digits each)
#   host=<bus>-<port>[.<port>...]
#   spice
#
# Returns a hash ref (keys vendorid/productid, hostbus/hostport or spice),
# or undef if $value is empty or contains an unknown setting.
sub parse_usb_device {
    my ($value) = @_;

    return undef if !$value;

    my $found;
    my %usb;

    foreach my $v (split(/,/, $value)) {
        if ($v =~ m/^host=(0x)?([0-9A-Fa-f]{4}):(0x)?([0-9A-Fa-f]{4})$/) {
            @usb{qw(vendorid productid)} = ($2, $4);
        } elsif ($v =~ m/^host=(\d+)\-(\d+(\.\d+)*)$/) {
            @usb{qw(hostbus hostport)} = ($1, $2);
        } elsif ($v =~ m/^spice$/) {
            $usb{spice} = 1;
        } else {
            return undef;
        }
        $found = 1;
    }

    return undef if !$found;

    return \%usb;
}
19672434 1640
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-usb-device', \&verify_usb_device);

# Format check for 'pve-qm-usb-device'. Returns $value if it can be parsed.
# Else it returns undef if $noerr is set, and dies otherwise.
sub verify_usb_device {
    my ($value, $noerr) = @_;

    if (!parse_usb_device($value)) {
        die "unable to parse usb device\n" if !$noerr;
        return undef;
    }

    return $value;
}
1651
1e3baf05
DM
# add JSON properties for create and set function
#
# Copies all option descriptions from $confdesc into $prop, except 'parent',
# 'snaptime' and 'vmstate'. Returns $prop.
sub json_config_properties {
    my $prop = shift;

    my %skip = map { $_ => 1 } ('parent', 'snaptime', 'vmstate');

    foreach my $opt (grep { !$skip{$_} } keys %$confdesc) {
        $prop->{$opt} = $confdesc->{$opt};
    }

    return $prop;
}
1663
# Verify the value of the configuration setting $key using the type (and
# format) from $confdesc.
#
# Returns the normalized value: 1/0 for booleans, an integer for type
# 'integer', and the value itself for numbers and strings (strings without a
# format get surrounding double quotes removed).
#
# Dies if the setting is unknown, the value is undefined or contains a line
# feed, or the value does not match the type.
sub check_type {
    my ($key, $value) = @_;

    my $desc = $confdesc->{$key};
    die "unknown setting '$key'\n" if !$desc;

    die "got undefined value\n" if !defined($value);

    die "property contains a line feed\n" if $value =~ m/[\n\r]/;

    my $type = $desc->{type};

    if ($type eq 'boolean') {
        return 1 if ($value eq '1') || ($value =~ m/^(on|yes|true)$/i);
        return 0 if ($value eq '0') || ($value =~ m/^(off|no|false)$/i);
        die "type check ('boolean') failed - got '$value'\n";
    }

    if ($type eq 'integer') {
        return int($1) if $value =~ m/^(\d+)$/;
        die "type check ('integer') failed - got '$value'\n";
    }

    if ($type eq 'number') {
        return $value if $value =~ m/^(\d+)(\.\d+)?$/;
        die "type check ('number') failed - got '$value'\n";
    }

    if ($type eq 'string') {
        my $fmt = $desc->{format};

        if (!$fmt) {
            $value =~ s/^\"(.*)\"$/$1/;
            return $value;
        }

        if ($fmt eq 'pve-qm-drive') {
            # special case - we need to pass $key to parse_drive()
            my $drive = parse_drive($key, $value);
            return $value if $drive;
            die "unable to parse drive options\n";
        }

        PVE::JSONSchema::check_format($fmt, $value);
        return $value;
    }

    die "internal error";
}
1706
191435c6
DM
# Run $code (with @param passed on) via lock_file() on the lock file of the
# VM, using the given $timeout.
#
# Returns the result of lock_file(). Errors left in $@ are raised again.
sub lock_config_full {
    my ($vmid, $timeout, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);

    my $res = lock_file($lockfile, $timeout, $code, @param);

    if ($@) {
        die $@;
    }

    return $res;
}
1718
4e4f83fe
DM
# Like lock_config_full(), but uses lock_file_full() and passes the $shared
# flag on to it.
#
# Returns the result of lock_file_full(). Errors left in $@ are raised again.
sub lock_config_mode {
    my ($vmid, $timeout, $shared, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);

    my $res = lock_file_full($lockfile, $timeout, $shared, $code, @param);

    if ($@) {
        die $@;
    }

    return $res;
}
1730
191435c6
DM
# Run $code while holding the lock of the VM, using lock_config_full() with
# a timeout value of 10.
sub lock_config {
    my ($vmid, $code, @param) = @_;

    my $timeout = 10;

    return lock_config_full($vmid, $timeout, $code, @param);
}
1736
# Returns the path of the VM configuration file, relative to the cluster
# file system. $nodename is used if $node is not specified.
sub cfs_config_path {
    my ($vmid, $node) = @_;

    $node ||= $nodename;

    return "nodes/$node/qemu-server/$vmid.conf";
}
1743
040b06b7
DA
# Placeholder - no real check is implemented, so this always returns 1.
sub check_iommu_support {
    #fixme : need to check IOMMU support
    #http://www.linux-kvm.org/page/How_to_assign_devices_with_VT-d_in_KVM

    return 1;
}
1752
# Returns the absolute path (below /etc/pve) of the VM configuration file.
# $node is passed on to cfs_config_path().
sub config_file {
    my ($vmid, $node) = @_;

    return "/etc/pve/" . cfs_config_path($vmid, $node);
}
1759
# Returns the path of the lock file (inside $lock_dir) of the VM.
sub config_file_lock {
    my ($vmid) = @_;

    return join('/', $lock_dir, "lock-$vmid.conf");
}
1765
# Set access and modification time of the VM configuration file to the
# current time.
sub touch_config {
    my ($vmid) = @_;

    my $filename = config_file($vmid);

    return utime(undef, undef, $filename);
}
1772
# Destroy a VM: free its disks and remove the configuration file.
#
# $storecfg          - storage configuration
# $vmid              - id of the VM
# $keep_empty_config - if true, the configuration file is not removed, but
#                      replaced by one containing the memory setting only
#
# Dies if the configuration can't be loaded or check_lock() fails. Errors
# while freeing the remaining volumes of the VM only produce warnings.
sub destroy_vm {
    my ($storecfg, $vmid, $keep_empty_config) = @_;

    my $conffile = config_file($vmid);

    my $conf = load_config($vmid);

    check_lock($conf);

    my $free_owned_volume = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};

        # absolute paths are not managed by the storage layer
        return if !$volid || $volid =~ m|^/|;

        my ($path, $owner) = PVE::Storage::path($storecfg, $volid);
        return if !$path || !$owner || ($owner != $vmid);

        PVE::Storage::vdisk_free($storecfg, $volid);
    };

    # only remove disks owned by this VM
    foreach_drive($conf, $free_owned_volume);

    if (!$keep_empty_config) {
        unlink $conffile;
    } else {
        PVE::Tools::file_set_contents($conffile, "memory: 128\n");
    }

    my $free_volume = sub {
        my ($volid, $sid, $volname, $d) = @_;
        PVE::Storage::vdisk_free($storecfg, $volid);
    };

    # also remove unused disk
    eval {
        my $dl = PVE::Storage::vdisk_list($storecfg, undef, $vmid);

        eval {
            PVE::Storage::foreach_volid($dl, $free_volume);
        };
        warn $@ if $@;

    };
    warn $@ if $@;
}
1819
# Read the configuration of a VM using PVE::Cluster::cfs_read_file().
# $node is passed on to cfs_config_path().
#
# Returns the configuration. Dies if there is no configuration for $vmid.
sub load_config {
    my ($vmid, $node) = @_;

    my $cfspath = cfs_config_path($vmid, $node);
    my $conf = PVE::Cluster::cfs_read_file($cfspath);

    if (!defined($conf)) {
        die "no such VM ('$vmid')\n";
    }

    return $conf;
}
1e3baf05
DM
1831
# Parse the raw content of a VM configuration file.
#
# $filename - name of the file, has to end with /qemu-server/<vmid>.conf
# $raw      - content of the file (undef if there is no such file)
#
# The file starts with the current configuration, optionally followed by
# '[<snapname>]' sections. Lines starting with '#' are collected as
# description of the section they belong to.
#
# Returns undef if $raw is undefined. Else returns a hash ref with the
# current settings, the 'digest' of the raw data, and the hash 'snapshots'
# (snapshot name => settings). Values which can't be parsed are skipped with
# a warning. Dies if $filename has an unexpected format.
sub parse_vm_config {
    my ($filename, $raw) = @_;

    return undef if !defined($raw);

    my $res = {
        digest => Digest::SHA::sha1_hex($raw),
        snapshots => {},
    };

    $filename =~ m|/qemu-server/(\d+)\.conf$|
        || die "got strange filename '$filename'";

    my $vmid = $1;

    # the section we currently parse - $res itself, or one of the snapshots
    my $conf = $res;
    my $descr = '';

    my @lines = split(/\n/, $raw);
    foreach my $line (@lines) {
        next if $line =~ m/^\s*$/;

        if ($line =~ m/^\[([a-z][a-z0-9_\-]+)\]\s*$/i) {
            my $snapname = $1;
            # store the description of the previous section
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{snapshots}->{$snapname} = {};
            next;
        }

        if ($line =~ m/^\#(.*)\s*$/) {
            $descr .= PVE::Tools::decode_text($1) . "\n";
            next;
        }

        if ($line =~ m/^(description):\s*(.*\S)\s*$/) {
            $descr .= PVE::Tools::decode_text($2);
        } elsif ($line =~ m/^snapstate:\s*(prepare|delete)\s*$/) {
            # anchored, so that other lines ending with such text do not match
            $conf->{snapstate} = $1;
        } elsif ($line =~ m/^(args):\s*(.*\S)\s*$/) {
            my $key = $1;
            my $value = $2;
            $conf->{$key} = $value;
        } elsif ($line =~ m/^([a-z][a-z_]*\d*):\s*(\S+)\s*$/) {
            my $key = $1;
            my $value = $2;
            eval { $value = check_type($key, $value); };
            if ($@) {
                warn "vm $vmid - unable to parse value of '$key' - $@";
            } else {
                my $fmt = $confdesc->{$key}->{format};
                if ($fmt && $fmt eq 'pve-qm-drive') {
                    # store drives in normalized form, using volume ids
                    my $v = parse_drive($key, $value);
                    if (my $volid = filename_to_volume_id($vmid, $v->{file}, $v->{media})) {
                        $v->{file} = $volid;
                        $value = print_drive($vmid, $v);
                    } else {
                        warn "vm $vmid - unable to parse value of '$key'\n";
                        next;
                    }
                }

                # 'cdrom' is stored as 'ide2'
                if ($key eq 'cdrom') {
                    $conf->{ide2} = $value;
                } else {
                    $conf->{$key} = $value;
                }
            }
        }
    }

    $conf->{description} = $descr if $descr;

    delete $res->{snapstate}; # just to be sure

    return $res;
}
1909
1858638f
DM
# Serialize a VM configuration hash into the raw text of its config file.
#
# Parameters:
#   $filename - accepted, but not used by this function
#   $conf     - configuration hash; it is normalized IN PLACE before rendering
#
# Normalization steps (in this order):
#   - 'snapstate' is dropped from the main section
#   - legacy 'cdrom' is moved to 'ide2' (dies if both are set)
#   - legacy 'smp' is folded into 'sockets'
#   - 'sockets' is dropped when 'maxcpus' is set as well
#   - every option value (main section and snapshots) goes through check_type()
#   - 'unusedX' entries whose volume is referenced by a drive of the main
#     section are removed
#
# Returns the raw text: the main section followed by one "[name]" section per
# snapshot. Dies if a value is rejected by check_type().
sub write_vm_config {
    my ($filename, $conf) = @_;

    # just to be sure
    delete $conf->{snapstate};

    if ($conf->{cdrom}) {
        die "option ide2 conflicts with cdrom\n" if $conf->{ide2};
        $conf->{ide2} = delete $conf->{cdrom};
    }

    # we do not use 'smp' any longer
    if ($conf->{sockets}) {
        delete $conf->{smp};
    } elsif ($conf->{smp}) {
        $conf->{sockets} = delete $conf->{smp};
        delete $conf->{cores};
    }

    delete $conf->{sockets} if $conf->{maxcpus} && $conf->{sockets};

    # keys that are not regular options and therefore skip type checking
    my %not_an_option = map { $_ => 1 } qw(digest description snapshots snapstate);

    # volume IDs referenced by drives of the main section
    my $volids_in_use = {};

    # type-check all options of one section; for the main section (no
    # $snapname) also record which volumes are in use
    my $normalize_section = sub {
        my ($section, $snapname) = @_;

        for my $opt (keys %$section) {
            next if $not_an_option{$opt};

            my $checked = $section->{$opt};
            eval { $checked = check_type($opt, $checked); };
            die "unable to parse value of '$opt' - $@" if $@;

            $section->{$opt} = $checked;

            next if $snapname || !valid_drivename($opt);

            my $drive = parse_drive($opt, $checked);
            $volids_in_use->{$drive->{file}} = 1 if $drive && $drive->{file};
        }
    };

    $normalize_section->($conf);
    for my $snapname (keys %{$conf->{snapshots}}) {
        $normalize_section->($conf->{snapshots}->{$snapname}, $snapname);
    }

    # remove 'unusedX' settings if we re-add a volume
    for my $opt (keys %$conf) {
        next if $opt !~ m/^unused/;
        delete $conf->{$opt} if $volids_in_use->{$conf->{$opt}};
    }

    # render one section: description as '#' comment lines first, then the
    # options as "key: value" lines in sorted key order
    my $render_section = sub {
        my ($section) = @_;

        my $description = $section->{description} || '';
        my $text = join('', map {
            '#' . PVE::Tools::encode_text($_) . "\n"
        } split(/\n/, $description));

        for my $opt (sort keys %$section) {
            next if $opt eq 'digest' || $opt eq 'description' || $opt eq 'snapshots';
            $text .= "$opt: $section->{$opt}\n";
        }

        return $text;
    };

    my $raw = $render_section->($conf);
    for my $snapname (sort keys %{$conf->{snapshots}}) {
        $raw .= "\n[$snapname]\n" . $render_section->($conf->{snapshots}->{$snapname});
    }

    return $raw;
}
1e3baf05 1994
1858638f
DM
# Write $conf as the configuration of VM $vmid. This function does not
# acquire any lock itself. Unless $skiplock is true, check_lock() is run on
# $conf before anything is written.
#
# Returns whatever PVE::Cluster::cfs_write_file() returns.
sub update_config_nolock {
    my ($vmid, $conf, $skiplock) = @_;

    unless ($skiplock) {
        check_lock($conf);
    }

    return PVE::Cluster::cfs_write_file(cfs_config_path($vmid), $conf);
}
1e3baf05 2004
1858638f
DM
# Write $conf as the configuration of VM $vmid via lock_config().
#
# Parameters:
#   $vmid     - ID of the VM
#   $conf     - configuration hash to write
#   $skiplock - if true, the 'lock' setting inside $conf is not checked
#
# Returns whatever lock_config() returns.
sub update_config {
    my ($vmid, $conf, $skiplock) = @_;

    # The previous code passed '&update_config_nolock' here. In Perl that is
    # not a reference: '&name' without parentheses CALLS the sub immediately
    # with the current @_, so the config was written before lock_config() ran
    # and the call's return value was handed over instead of a callback.
    #
    # A closure is used so the three arguments are bound here and do not
    # depend on which extra parameters lock_config() forwards.
    # NOTE(review): assumes lock_config() invokes its second argument as a
    # code reference while holding the lock - confirm against lock_config().
    return lock_config($vmid, sub {
        return update_config_nolock($vmid, $conf, $skiplock);
    });
}
2010
# Build a hash with the default value of every configuration option.
#
# The static defaults come from the 'default' entries in $confdesc. The
# 'keyboard' default is then overridden by the value from 'datacenter.cfg'
# when that file sets one.
sub load_defaults {

    my $defaults = {};

    # we use static defaults from our JSON schema configuration
    for my $opt (keys %$confdesc) {
        my $value = $confdesc->{$opt}->{default};
        next if !defined($value);
        $defaults->{$opt} = $value;
    }

    my $dccfg = PVE::Cluster::cfs_read_file('datacenter.cfg');
    if (my $keyboard = $dccfg->{keyboard}) {
        $defaults->{keyboard} = $keyboard;
    }

    return $defaults;
}
2027
# List the qemu VMs that the cluster VM list assigns to $nodename.
#
# Returns a hash reference { $vmid => { exists => 1 }, ... }; it is empty
# when the VM list is missing or has no 'ids' entry.
sub config_list {
    my $found = {};

    my $vmlist = PVE::Cluster::get_vmlist();
    return $found if !$vmlist || !$vmlist->{ids};

    my $ids = $vmlist->{ids};

    for my $vmid (keys %$ids) {
        my $entry = $ids->{$vmid};

        # only guests located on this node ...
        next unless $entry->{node} && $entry->{node} eq $nodename;
        # ... and only those of type 'qemu'
        next unless $entry->{type} && $entry->{type} eq 'qemu';

        $found->{$vmid}->{exists} = 1;
    }

    return $found;
}
2042
64e13401
DM
2043# test if VM uses local resources (to prevent migration)
# Test whether a VM configuration references local resources.
#
# Local resources are the old-style 'hostusb' / 'hostpci' options and any
# usbN, hostpciN, serialN or parallelN option. Options starting with 'usb'
# whose value is exactly 'spice' are not counted.
#
# Parameters:
#   $conf  - VM configuration hash
#   $noerr - if true, only report the result instead of dying
#
# Returns 1 if local resources are used, 0 otherwise.
# Dies with "VM uses local resources\n" if they are used and $noerr is false.
sub check_local_resources {
    my ($conf, $noerr) = @_;

    # old syntax
    my $uses_local = ($conf->{hostusb} || $conf->{hostpci}) ? 1 : 0;

    my @local_keys = grep {
        !($_ =~ m/^usb/ && ($conf->{$_} eq 'spice'))
            && $_ =~ m/^(usb|hostpci|serial|parallel)\d+$/
    } keys %$conf;

    $uses_local = 1 if @local_keys;

    if ($uses_local && !$noerr) {
        die "VM uses local resources\n";
    }

    return $uses_local;
}
2061
719893a9 2062# check if used storages are available on all nodes (used by migrate)
47152e2e
DM
# Run PVE::Storage::storage_check_node() for the storage of every drive in
# $conf: once without a node argument and once for $node.
#
# Drives without a 'file' entry, and drives whose 'file' does not yield a
# storage ID from parse_volume_id(), are skipped.
sub check_storage_availability {
    my ($storecfg, $conf, $node) = @_;

    my $check_drive = sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($sid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        # check if storage is available on both nodes
        # NOTE(review): the call without a node argument presumably checks
        # the local node - confirm against storage_check_node()
        PVE::Storage::storage_check_node($storecfg, $sid);
        PVE::Storage::storage_check_node($storecfg, $sid, $node);
    };

    foreach_drive($conf, $check_drive);
}
2080
719893a9
DM
2081# list nodes where all VM images are available (used by has_feature API)
# Compute the set of cluster nodes that remain eligible after looking at the
# storage of every drive in $conf.
#
# Starts with all nodes from PVE::Cluster::get_nodelist() and narrows the set
# per drive storage:
#   - storage disabled           -> no node at all
#   - storage has a 'nodes' list -> only nodes contained in that list
#   - storage is not 'shared'    -> only the local node
#
# Returns a hash reference { $node => 1, ... }.
sub shared_nodes {
    my ($conf, $storecfg) = @_;

    my $nodehash = { map { $_ => 1 } @{ PVE::Cluster::get_nodelist() } };
    my $nodename = PVE::INotify::nodename();

    my $restrict_by_drive = sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($storeid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        my $scfg = PVE::Storage::storage_config($storecfg, $storeid);

        if ($scfg->{disable}) {
            $nodehash = {};
        } elsif (my $avail = $scfg->{nodes}) {
            delete @{$nodehash}{ grep { !$avail->{$_} } keys %$nodehash };
        } elsif (!$scfg->{shared}) {
            delete @{$nodehash}{ grep { $_ ne $nodename } keys %$nodehash };
        }
    };

    foreach_drive($conf, $restrict_by_drive);

    return $nodehash;
}
2114
1e3baf05
DM
# Die with "VM is locked (<lock>)\n" if the configuration has a true 'lock'
# setting; otherwise do nothing.
sub check_lock {
    my ($conf) = @_;

    if (my $lock = $conf->{lock}) {
        die "VM is locked ($lock)\n";
    }
}
2120
# Check whether process $pid is a kvm/qemu process that was started with the
# given pid file.
#
# Reads /proc/$pid/cmdline, requires the command name to end in 'kvm' or
# 'qemu-system-x86_64', and compares the argument following the first
# '-pidfile' / '--pidfile' option with $pidfile.
#
# Returns 1 on a match and a false value (undef) in every other case.
sub check_cmdline {
    my ($pidfile, $pid) = @_;

    my $fh = IO::File->new("/proc/$pid/cmdline", "r");
    return undef if !defined($fh);

    my $line = <$fh>;
    $fh->close;
    return undef if !$line;

    # arguments in /proc/<pid>/cmdline are separated by NUL bytes
    my @argv = split(/\0/, $line);

    my $cmd = $argv[0];
    return if !$cmd;
    return unless $cmd =~ m|kvm$| || $cmd =~ m|qemu-system-x86_64$|;

    for my $idx (0 .. $#argv) {
        my $arg = $argv[$idx];
        next if !$arg;
        next if $arg ne '-pidfile' && $arg ne '--pidfile';

        # only the first pidfile option is considered
        my $value = $argv[$idx + 1];
        return ($value && ($value eq $pidfile)) ? 1 : undef;
    }

    return undef;
}
2146
# Determine whether VM $vmid is running.
#
# Parameters:
#   $vmid    - ID of the VM
#   $nocheck - if true, do not require the VM configuration file to exist
#   $node    - passed on to config_file() to locate the configuration file
#
# Reads the PID from the VM's pid file and accepts it only if
# check_cmdline() confirms the process was started with that pid file and
# PVE::ProcFSTools::check_process_running() reports it as running.
#
# Returns the PID if the VM is running, undef otherwise.
# Dies if the configuration file does not exist (unless $nocheck is set).
sub check_running {
    my ($vmid, $nocheck, $node) = @_;

    my $filename = config_file($vmid, $node);

    die "unable to find configuration file for VM $vmid - no such machine\n"
        if !$nocheck && ! -f $filename;

    my $pidfile = pidfile_name($vmid);

    # explicit read mode, so the path can never be interpreted as an open mode
    my $fh = IO::File->new($pidfile, 'r');
    return undef if !$fh;

    my $st = stat($fh);
    my $line = <$fh>;
    close($fh);

    # the timestamp belongs to the pid file, so that is the file to name here;
    # a failed stat is tolerated and simply skips the check
    if ($st && $st->mtime > time()) {
        warn "file '$pidfile' modified in future\n";
    }

    # an empty pid file yields no line at all
    return undef if !defined($line);

    if ($line =~ m/^(\d+)$/) {
        my $pid = $1;
        if (check_cmdline($pidfile, $pid) &&
            PVE::ProcFSTools::check_process_running($pid)) {
            return $pid;
        }
    }

    return undef;
}
2179
# Return the result of config_list() with a 'pid' entry added for every
# listed VM that has a "<vmid>.pid" file in $var_run_tmpdir and for which
# check_running() returns a PID.
#
# If the directory cannot be opened, the plain config_list() result is
# returned.
sub vzlist {

    my $vzlist = config_list();

    my $dir = IO::Dir->new($var_run_tmpdir);
    return $vzlist if !$dir;

    while (defined(my $entry = $dir->read)) {
        if ($entry =~ m/^(\d+)\.pid$/) {
            my $vmid = $1;

            # ignore pid files of VMs that are not in the list
            next if !defined($vzlist->{$vmid});

            my $pid = check_running($vmid);
            $vzlist->{$vmid}->{pid} = $pid if $pid;
        }
    }

    return $vzlist;
}
2197
1e3baf05
DM
# Return the 'size' property of the VM's boot disk.
#
# $storecfg is accepted but not used by this function.
#
# Returns undef if no boot disk is configured, if its name is not a valid
# drive name, if the drive is not configured or cannot be parsed, if it is a
# cdrom, or if it has no 'file' entry.
sub disksize {
    my ($storecfg, $conf) = @_;

    my $bootdisk = $conf->{bootdisk};
    return undef if !$bootdisk
        || !valid_drivename($bootdisk)
        || !$conf->{$bootdisk};

    my $drive = parse_drive($bootdisk, $conf->{$bootdisk});
    return undef if !defined($drive) || drive_is_cdrom($drive);

    # a drive without a volume has no size to report
    return undef if !$drive->{file};

    return $drive->{size};
}
2217
2218my $last_proc_pid_stat;
2219
03a33f30
DM
2220# get VM status information
2221# This must be fast and should not block ($full == false)
2222# We only query KVM using QMP if $full == true (this can be slow)
# Collect status information for all VMs returned by vzlist(), or only for
# $opt_vmid when that is given.
#
# Parameters:
#   $opt_vmid - optional VM ID; restricts the result to that VM
#   $full     - if true, running VMs are additionally queried via QMP
#               (query-status, query-blockstats, query-balloon)
#
# Returns a hash reference keyed by VM ID. Each entry holds: pid, status,
# disk, maxdisk, cpus, name, maxmem, uptime, cpu, mem, netin, netout,
# diskread, diskwrite, template and - when ballooning is configured -
# balloon_min and shares. With $full, qmpstatus is set and the QMP replies
# may update maxmem, balloon, mem, freemem, diskread and diskwrite.
#
# CPU usage is derived from the difference to the sample kept in
# $last_proc_pid_stat by a previous call.
sub vmstatus {
    my ($opt_vmid, $full) = @_;

    my $res = {};

    my $storecfg = PVE::Storage::config();

    my $list = vzlist();
    my ($uptime) = PVE::ProcFSTools::read_proc_uptime(1);

    my $cpucount = $cpuinfo->{cpus} || 1;
    my $mib = 1024*1024;

    # pass 1: values taken from the VM configuration
    for my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);

        my $conf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid)) || {};
        my $pid = $list->{$vmid}->{pid};

        my $size = disksize($storecfg, $conf);

        # never report more virtual cpus than the host has
        my $vcpus = ($conf->{sockets} || 1) * ($conf->{cores} || 1);
        $vcpus = $cpucount if $vcpus > $cpucount;

        my $d = {
            pid => $pid,
            # fixme: better status?
            status => $pid ? 'running' : 'stopped',
            disk => 0, # no info available
            maxdisk => defined($size) ? $size : 0,
            cpus => $vcpus,
            name => $conf->{name} || "VM $vmid",
            maxmem => $conf->{memory} ? $conf->{memory}*$mib : 0,
        };

        if ($conf->{balloon}) {
            $d->{balloon_min} = $conf->{balloon}*$mib;
            $d->{shares} = defined($conf->{shares}) ? $conf->{shares} : 1000;
        }

        # counters start at zero and are filled in by the passes below
        $d->{$_} = 0 for qw(uptime cpu mem netout netin diskread diskwrite);

        $d->{template} = is_template($conf);

        $res->{$vmid} = $d;
    }

    # pass 2: network counters of the tap devices (tap<vmid>i...)
    # NOTE(review): 'receive' is added to netout and 'transmit' to netin -
    # presumably because the counters are seen from the host side of the tap
    # device; confirm.
    my $netdev = PVE::ProcFSTools::read_proc_net_dev();
    for my $dev (keys %$netdev) {
        my ($vmid) = $dev =~ m/^tap([1-9]\d*)i/ or next;
        my $d = $res->{$vmid} or next;

        $d->{netout} += $netdev->{$dev}->{receive};
        $d->{netin} += $netdev->{$dev}->{transmit};
    }

    # pass 3: uptime, memory and cpu usage from /proc/<pid>/stat
    my $ctime = gettimeofday();

    for my $vmid (keys %$list) {

        my $d = $res->{$vmid};
        my $pid = $d->{pid};
        next if !$pid;

        my $pstat = PVE::ProcFSTools::read_proc_pid_stat($pid);
        next if !$pstat; # not running

        my $used = $pstat->{utime} + $pstat->{stime};

        $d->{uptime} = int(($uptime - $pstat->{starttime})/$cpuinfo->{user_hz});

        if ($pstat->{vsize}) {
            $d->{mem} = int(($pstat->{rss}/$pstat->{vsize})*$d->{maxmem});
        }

        my $old = $last_proc_pid_stat->{$pid};
        if (!$old) {
            # first sample for this pid, no usage can be computed yet
            $last_proc_pid_stat->{$pid} = { time => $ctime, used => $used, cpu => 0 };
            next;
        }

        my $dtime = ($ctime - $old->{time}) * $cpucount * $cpuinfo->{user_hz};

        if ($dtime > 1000) {
            my $dutime = $used - $old->{used};

            $d->{cpu} = (($dutime/$dtime)* $cpucount) / $d->{cpus};
            $last_proc_pid_stat->{$pid} = {
                time => $ctime,
                used => $used,
                cpu => $d->{cpu},
            };
        } else {
            # interval too short, keep reporting the previous value
            $d->{cpu} = $old->{cpu};
        }
    }

    return $res if !$full;

    # pass 4 ($full only): ask the running VMs via QMP
    my $qmpclient = PVE::QMPClient->new();

    my $ballooncb = sub {
        my ($vmid, $resp) = @_;

        my $info = $resp->{'return'};
        return if !$info->{max_mem};

        my $d = $res->{$vmid};

        # use memory assigned to VM
        $d->{maxmem} = $info->{max_mem};
        $d->{balloon} = $info->{actual};

        if (defined($info->{total_mem}) && defined($info->{free_mem})) {
            $d->{mem} = $info->{total_mem} - $info->{free_mem};
            $d->{freemem} = $info->{free_mem};
        }
    };

    my $blockstatscb = sub {
        my ($vmid, $resp) = @_;

        my ($rd_total, $wr_total) = (0, 0);
        for my $blockstat (@{ $resp->{'return'} || [] }) {
            $rd_total += $blockstat->{stats}->{rd_bytes};
            $wr_total += $blockstat->{stats}->{wr_bytes};
        }

        $res->{$vmid}->{diskread} = $rd_total;
        $res->{$vmid}->{diskwrite} = $wr_total;
    };

    my $statuscb = sub {
        my ($vmid, $resp) = @_;

        $qmpclient->queue_cmd($vmid, $blockstatscb, 'query-blockstats');
        # this fails if the balloon driver is not loaded, so this must be
        # the last command (following commands are aborted if this fails).
        $qmpclient->queue_cmd($vmid, $ballooncb, 'query-balloon');

        my $status = $resp->{'return'}->{status};
        if (!defined($status)) {
            warn "unable to get VM status\n";
            return;
        }

        $res->{$vmid}->{qmpstatus} = $status;
    };

    for my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        next if !$res->{$vmid}->{pid}; # not running
        $qmpclient->queue_cmd($vmid, $statuscb, 'query-status');
    }

    $qmpclient->queue_execute(undef, 1);

    # fall back to the plain status when QMP gave no answer
    for my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        my $d = $res->{$vmid};
        $d->{qmpstatus} = $d->{status} if !$d->{qmpstatus};
    }

    return $res;
}
2406
# Call $func->($key, $drive) for every entry of $conf whose key is accepted
# by valid_drivename() and whose value parse_drive() turns into a true value.
# $drive is the result of parse_drive().
sub foreach_drive {
    my ($conf, $func) = @_;

    for my $key (keys %$conf) {
        valid_drivename($key) or next;

        my $drive = parse_drive($key, $conf->{$key}) or next;

        $func->($key, $drive);
    }
}
2419
d5769dc2
DM
# Call $func->($volid, $is_cdrom) once for every distinct volume referenced
# by the configuration: the drives of the main section, plus the 'vmstate'
# volume and the drives of every snapshot.
#
# $is_cdrom is the drive_is_cdrom() result (or 0 if that is false) of the
# last reference recorded for that volume; 'vmstate' volumes are recorded
# with 0.
sub foreach_volid {
    my ($conf, $func) = @_;

    my $seen = {};

    my $record = sub {
        my ($volid, $is_cdrom) = @_;

        return if !$volid;

        $seen->{$volid} = $is_cdrom || 0;
    };

    # callback shared by the main section and all snapshot sections
    my $record_drive = sub {
        my ($ds, $drive) = @_;
        $record->($drive->{file}, drive_is_cdrom($drive));
    };

    foreach_drive($conf, $record_drive);

    for my $snapname (keys %{$conf->{snapshots}}) {
        my $snap = $conf->{snapshots}->{$snapname};
        $record->($snap->{vmstate}, 0);
        foreach_drive($snap, $record_drive);
    }

    for my $volid (keys %$seen) {
        $func->($volid, $seen->{$volid});
    }
}
2451
86b8228b
DM
# Interpret the 'vga' setting with respect to qxl.
#
# Returns 0 if $vga is empty or is not 'qxl', 'qxl2', 'qxl3' or 'qxl4'.
# Otherwise returns the digit that follows 'qxl', or 1 for plain 'qxl'.
sub vga_conf_has_spice {
    my ($vga) = @_;

    return 0 unless $vga;

    if ($vga =~ m/^qxl([234])?$/) {
        my $count = $1;
        return $count || 1;
    }

    return 0;
}
2459
1e3baf05 2460sub config_to_command {
952958bc 2461 my ($storecfg, $vmid, $conf, $defaults, $forcemachine) = @_;
1e3baf05
DM
2462
2463 my $cmd = [];
8c559505
DM
2464 my $globalFlags = [];
2465 my $machineFlags = [];
2466 my $rtcFlags = [];
519ed28c 2467 my $cpuFlags = [];
5bdcf937 2468 my $devices = [];
b78ebef7 2469 my $pciaddr = '';
5bdcf937 2470 my $bridges = {};
1e3baf05
DM
2471 my $kvmver = kvm_user_version();
2472 my $vernum = 0; # unknown
a3c52213
DM
2473 if ($kvmver =~ m/^(\d+)\.(\d+)$/) {
2474 $vernum = $1*1000000+$2*1000;
2475 } elsif ($kvmver =~ m/^(\d+)\.(\d+)\.(\d+)$/) {
1e3baf05
DM
2476 $vernum = $1*1000000+$2*1000+$3;
2477 }
2478
a3c52213 2479 die "detected old qemu-kvm binary ($kvmver)\n" if $vernum < 15000;
1e3baf05
DM
2480
2481 my $have_ovz = -f '/proc/vz/vestat';
2482
db656e5f
DM
2483 my $q35 = machine_type_is_q35($conf);
2484
1e3baf05
DM
2485 push @$cmd, '/usr/bin/kvm';
2486
2487 push @$cmd, '-id', $vmid;
2488
2489 my $use_virtio = 0;
2490
c971c4f2
AD
2491 my $qmpsocket = qmp_socket($vmid);
2492 push @$cmd, '-chardev', "socket,id=qmp,path=$qmpsocket,server,nowait";
2493 push @$cmd, '-mon', "chardev=qmp,mode=control";
2494
7b7c6d1b 2495 my $socket = vnc_socket($vmid);
1e3baf05
DM
2496 push @$cmd, '-vnc', "unix:$socket,x509,password";
2497
6b64503e 2498 push @$cmd, '-pidfile' , pidfile_name($vmid);
19672434 2499
1e3baf05
DM
2500 push @$cmd, '-daemonize';
2501
2796e7d5
DM
2502 if ($conf->{smbios1}) {
2503 push @$cmd, '-smbios', "type=1,$conf->{smbios1}";
2504 }
2505
7183bd9a
AD
2506 push @$cmd, '-object', "iothread,id=iothread0" if $conf->{iothread};
2507
db656e5f 2508 if ($q35) {
b467f79a 2509 # the q35 chipset support native usb2, so we enable usb controller
db656e5f 2510 # by default for this machine type
f8e83f05 2511 push @$devices, '-readconfig', '/usr/share/qemu-server/pve-q35.cfg';
db656e5f 2512 } else {
f8e83f05
AD
2513 $pciaddr = print_pci_addr("piix3", $bridges);
2514 push @$devices, '-device', "piix3-usb-uhci,id=uhci$pciaddr.0x2";
24f0d39a 2515
f8e83f05 2516 my $use_usb2 = 0;
db656e5f
DM
2517 for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
2518 next if !$conf->{"usb$i"};
2519 $use_usb2 = 1;
2520 }
2521 # include usb device config
2522 push @$devices, '-readconfig', '/usr/share/qemu-server/pve-usb.cfg' if $use_usb2;
fcc573ab 2523 }
19672434 2524
5acbfe9e 2525 my $vga = $conf->{vga};
2fa3151e 2526
590e698c
DM
2527 my $qxlnum = vga_conf_has_spice($vga);
2528 $vga = 'qxl' if $qxlnum;
2fa3151e 2529
5acbfe9e 2530 if (!$vga) {
264e519f
DM
2531 if ($conf->{ostype} && ($conf->{ostype} eq 'win8' ||
2532 $conf->{ostype} eq 'win7' ||
5acbfe9e
DM
2533 $conf->{ostype} eq 'w2k8')) {
2534 $vga = 'std';
2535 } else {
2536 $vga = 'cirrus';
2537 }
2538 }
2539
1e3baf05 2540 # enable absolute mouse coordinates (needed by vnc)
5acbfe9e
DM
2541 my $tablet;
2542 if (defined($conf->{tablet})) {
2543 $tablet = $conf->{tablet};
2544 } else {
2545 $tablet = $defaults->{tablet};
590e698c 2546 $tablet = 0 if $qxlnum; # disable for spice because it is not needed
ef5e2be2 2547 $tablet = 0 if $vga =~ m/^serial\d+$/; # disable if we use serial terminal (no vga card)
5acbfe9e
DM
2548 }
2549
db656e5f 2550 push @$devices, '-device', print_tabletdevice_full($conf) if $tablet;
b467f79a 2551
1e3baf05 2552 # host pci devices
040b06b7 2553 for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
2e3b7e2a
AD
2554 my $d = parse_hostpci($conf->{"hostpci$i"});
2555 next if !$d;
2556
2557 my $pcie = $d->{pcie};
2558 if($pcie){
2559 die "q35 machine model is not enabled" if !$q35;
2560 $pciaddr = print_pcie_addr("hostpci$i");
2561 }else{
2562 $pciaddr = print_pci_addr("hostpci$i", $bridges);
2563 }
2564
2565 my $rombar = $d->{rombar} && $d->{rombar} eq 'off' ? ",rombar=0" : "";
2566 my $driver = $d->{driver} && $d->{driver} eq 'vfio' ? "vfio-pci" : "pci-assign";
2567 my $xvga = $d->{'x-vga'} && $d->{'x-vga'} eq 'on' ? ",x-vga=on" : "";
137483c0
AD
2568 if ($xvga && $xvga ne '') {
2569 push @$cpuFlags, 'kvm=off';
2570 $vga = 'none';
2571 }
2e3b7e2a 2572 $driver = "vfio-pci" if $xvga ne '';
4543ecf0
AD
2573 my $pcidevices = $d->{pciid};
2574 my $multifunction = 1 if @$pcidevices > 1;
2e3b7e2a 2575
4543ecf0
AD
2576 my $j=0;
2577 foreach my $pcidevice (@$pcidevices) {
2e3b7e2a 2578
4543ecf0
AD
2579 my $id = "hostpci$i";
2580 $id .= ".$j" if $multifunction;
2581 my $addr = $pciaddr;
2582 $addr .= ".$j" if $multifunction;
2583 my $devicestr = "$driver,host=$pcidevice->{id}.$pcidevice->{function},id=$id$addr";
2584
2585 if($j == 0){
2586 $devicestr .= "$rombar$xvga";
2587 $devicestr .= ",multifunction=on" if $multifunction;
2588 }
2589
2590 push @$devices, '-device', $devicestr;
2591 $j++;
2592 }
1e3baf05
DM
2593 }
2594
2595 # usb devices
2596 for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
2597 my $d = parse_usb_device($conf->{"usb$i"});
2598 next if !$d;
2599 if ($d->{vendorid} && $d->{productid}) {
5bdcf937 2600 push @$devices, '-device', "usb-host,vendorid=0x$d->{vendorid},productid=0x$d->{productid}";
1e3baf05 2601 } elsif (defined($d->{hostbus}) && defined($d->{hostport})) {
5bdcf937 2602 push @$devices, '-device', "usb-host,hostbus=$d->{hostbus},hostport=$d->{hostport}";
80401dd8
DM
2603 } elsif ($d->{spice}) {
2604 # usb redir support for spice
2605 push @$devices, '-chardev', "spicevmc,id=usbredirchardev$i,name=usbredir";
2606 push @$devices, '-device', "usb-redir,chardev=usbredirchardev$i,id=usbredirdev$i,bus=ehci.0";
1e3baf05
DM
2607 }
2608 }
2609
1e3baf05 2610 # serial devices
bae179aa 2611 for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
34978be3 2612 if (my $path = $conf->{"serial$i"}) {
9f9d2fb2
DM
2613 if ($path eq 'socket') {
2614 my $socket = "/var/run/qemu-server/${vmid}.serial$i";
2615 push @$devices, '-chardev', "socket,id=serial$i,path=$socket,server,nowait";
2616 push @$devices, '-device', "isa-serial,chardev=serial$i";
2617 } else {
2618 die "no such serial device\n" if ! -c $path;
2619 push @$devices, '-chardev', "tty,id=serial$i,path=$path";
2620 push @$devices, '-device', "isa-serial,chardev=serial$i";
2621 }
34978be3 2622 }
1e3baf05
DM
2623 }
2624
2625 # parallel devices
1989a89c 2626 for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
34978be3 2627 if (my $path = $conf->{"parallel$i"}) {
19672434 2628 die "no such parallel device\n" if ! -c $path;
32e69805 2629 my $devtype = $path =~ m!^/dev/usb/lp! ? 'tty' : 'parport';
4c5dbaf6 2630 push @$devices, '-chardev', "$devtype,id=parallel$i,path=$path";
5bdcf937 2631 push @$devices, '-device', "isa-parallel,chardev=parallel$i";
34978be3 2632 }
1e3baf05
DM
2633 }
2634
2635 my $vmname = $conf->{name} || "vm$vmid";
2636
2637 push @$cmd, '-name', $vmname;
19672434 2638
1e3baf05
DM
2639 my $sockets = 1;
2640 $sockets = $conf->{smp} if $conf->{smp}; # old style - no longer iused
2641 $sockets = $conf->{sockets} if $conf->{sockets};
2642
2643 my $cores = $conf->{cores} || 1;
3bd18e48
AD
2644 my $maxcpus = $conf->{maxcpus} if $conf->{maxcpus};
2645
76267728
WL
2646 my $total_cores = $sockets * $cores;
2647 my $allowed_cores = $cpuinfo->{cpus};
2648
f34ebd52 2649 die "MAX $allowed_cores cores allowed per VM on this node\n"
76267728
WL
2650 if ($allowed_cores < $total_cores);
2651
264e519f 2652 if ($maxcpus) {
3bd18e48 2653 push @$cmd, '-smp', "cpus=$cores,maxcpus=$maxcpus";
264e519f 2654 } else {
3bd18e48
AD
2655 push @$cmd, '-smp', "sockets=$sockets,cores=$cores";
2656 }
1e3baf05 2657
1e3baf05
DM
2658 push @$cmd, '-nodefaults';
2659
32baffb4 2660 my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};
3b408e82 2661
0888fdce
DM
2662 my $bootindex_hash = {};
2663 my $i = 1;
2664 foreach my $o (split(//, $bootorder)) {
2665 $bootindex_hash->{$o} = $i*100;
2666 $i++;
afdb31d5 2667 }
3b408e82
DM
2668
2669 push @$cmd, '-boot', "menu=on";
1e3baf05 2670
6b64503e 2671 push @$cmd, '-no-acpi' if defined($conf->{acpi}) && $conf->{acpi} == 0;
1e3baf05 2672
6b64503e 2673 push @$cmd, '-no-reboot' if defined($conf->{reboot}) && $conf->{reboot} == 0;
1e3baf05 2674
ef5e2be2 2675 push @$cmd, '-vga', $vga if $vga && $vga !~ m/^serial\d+$/; # for kvm 77 and later
1e3baf05
DM
2676
2677 # time drift fix
6b64503e 2678 my $tdf = defined($conf->{tdf}) ? $conf->{tdf} : $defaults->{tdf};
1e3baf05 2679
6b64503e 2680 my $nokvm = defined($conf->{kvm}) && $conf->{kvm} == 0 ? 1 : 0;
8c559505 2681 my $useLocaltime = $conf->{localtime};
1e3baf05
DM
2682
2683 if (my $ost = $conf->{ostype}) {
6b9d84cf 2684 # other, wxp, w2k, w2k3, w2k8, wvista, win7, win8, l24, l26, solaris
1e3baf05
DM
2685
2686 if ($ost =~ m/^w/) { # windows
8c559505 2687 $useLocaltime = 1 if !defined($conf->{localtime});
1e3baf05 2688
8c559505 2689 # use time drift fix when acpi is enabled
6b64503e 2690 if (!(defined($conf->{acpi}) && $conf->{acpi} == 0)) {
8c559505 2691 $tdf = 1 if !defined($conf->{tdf});
1e3baf05
DM
2692 }
2693 }
2694
be190583 2695 if ($ost eq 'win7' || $ost eq 'win8' || $ost eq 'w2k8' ||
a70ebde3 2696 $ost eq 'wvista') {
8c559505 2697 push @$globalFlags, 'kvm-pit.lost_tick_policy=discard';
b7e0c8bf 2698 push @$cmd, '-no-hpet';
462e8d19
AD
2699 #push @$cpuFlags , 'hv_vapic" if !$nokvm; #fixme, my win2008R2 hang at boot with this
2700 push @$cpuFlags , 'hv_spinlocks=0xffff' if !$nokvm;
2701 }
2702
2703 if ($ost eq 'win7' || $ost eq 'win8') {
2704 push @$cpuFlags , 'hv_relaxed' if !$nokvm;
b7e0c8bf 2705 }
1e3baf05
DM
2706 }
2707
8c559505
DM
2708 push @$rtcFlags, 'driftfix=slew' if $tdf;
2709
7f0b5beb 2710 if ($nokvm) {
8c559505 2711 push @$machineFlags, 'accel=tcg';
7f0b5beb
DM
2712 } else {
2713 die "No accelerator found!\n" if !$cpuinfo->{hvm};
2714 }
1e3baf05 2715
952958bc
DM
2716 my $machine_type = $forcemachine || $conf->{machine};
2717 if ($machine_type) {
2718 push @$machineFlags, "type=${machine_type}";
3bafc510
DM
2719 }
2720
8c559505
DM
2721 if ($conf->{startdate}) {
2722 push @$rtcFlags, "base=$conf->{startdate}";
2723 } elsif ($useLocaltime) {
2724 push @$rtcFlags, 'base=localtime';
2725 }
1e3baf05 2726
519ed28c
AD
2727 my $cpu = $nokvm ? "qemu64" : "kvm64";
2728 $cpu = $conf->{cpu} if $conf->{cpu};
2729
4dc339e7
AD
2730 push @$cpuFlags , '+lahf_lm' if $cpu eq 'kvm64';
2731
6b9d84cf
AD
2732 push @$cpuFlags , '+x2apic' if !$nokvm && $conf->{ostype} ne 'solaris';
2733
2734 push @$cpuFlags , '-x2apic' if $conf->{ostype} eq 'solaris';
519ed28c 2735
2e1a5389
AD
2736 push @$cpuFlags, '+sep' if $cpu eq 'kvm64' || $cpu eq 'kvm32';
2737
be190583 2738 $cpu .= "," . join(',', @$cpuFlags) if scalar(@$cpuFlags);
519ed28c 2739
c0efd8cd
DM
2740 # Note: enforce needs kernel 3.10, so we do not use it for now
2741 # push @$cmd, '-cpu', "$cpu,enforce";
2742 push @$cmd, '-cpu', $cpu;
519ed28c 2743
67fb9de6 2744 my $memory = $conf->{memory} || $defaults->{memory};
8a010eae
AD
2745 push @$cmd, '-m', $memory;
2746
67fb9de6 2747 if ($conf->{numa}) {
8a010eae 2748
2ed5d572
AD
2749 my $numa_totalmemory = undef;
2750 for (my $i = 0; $i < $MAX_NUMA; $i++) {
2751 next if !$conf->{"numa$i"};
2752 my $numa = parse_numa($conf->{"numa$i"});
2753 next if !$numa;
67fb9de6
DM
2754 # memory
2755 die "missing numa node$i memory value\n" if !$numa->{memory};
2ed5d572
AD
2756 my $numa_memory = $numa->{memory};
2757 $numa_totalmemory += $numa_memory;
2758 my $numa_object = "memory-backend-ram,id=ram-node$i,size=$numa_memory"."M";
2759
67fb9de6 2760 # cpus
2ed5d572 2761 my $cpus_start = $numa->{cpus}->{start};
67fb9de6 2762 die "missing numa node$i cpus\n" if !defined($cpus_start);
2ed5d572
AD
2763 my $cpus_end = $numa->{cpus}->{end} if defined($numa->{cpus}->{end});
2764 my $cpus = $cpus_start;
2765 if (defined($cpus_end)) {
2766 $cpus .= "-$cpus_end";
67fb9de6 2767 die "numa node$i : cpu range $cpus is incorrect\n" if $cpus_end <= $cpus_start;
2ed5d572 2768 }
8a010eae 2769
67fb9de6 2770 # hostnodes
2ed5d572
AD
2771 my $hostnodes_start = $numa->{hostnodes}->{start};
2772 if (defined($hostnodes_start)) {
2773 my $hostnodes_end = $numa->{hostnodes}->{end} if defined($numa->{hostnodes}->{end});
2774 my $hostnodes = $hostnodes_start;
2775 if (defined($hostnodes_end)) {
2776 $hostnodes .= "-$hostnodes_end";
67fb9de6 2777 die "host node $hostnodes range is incorrect\n" if $hostnodes_end <= $hostnodes_start;
2ed5d572 2778 }
8a010eae 2779
2ed5d572
AD
2780 my $hostnodes_end_range = defined($hostnodes_end) ? $hostnodes_end : $hostnodes_start;
2781 for (my $i = $hostnodes_start; $i <= $hostnodes_end_range; $i++ ) {
67fb9de6 2782 die "host numa node$i don't exist\n" if ! -d "/sys/devices/system/node/node$i/";
2ed5d572 2783 }
8a010eae 2784
67fb9de6 2785 # policy
2ed5d572 2786 my $policy = $numa->{policy};
67fb9de6
DM
2787 die "you need to define a policy for hostnode $hostnodes\n" if !$policy;
2788 $numa_object .= ",host-nodes=$hostnodes,policy=$policy";
2ed5d572
AD
2789 }
2790
2791 push @$cmd, '-object', $numa_object;
8a010eae
AD
2792 push @$cmd, '-numa', "node,nodeid=$i,cpus=$cpus,memdev=ram-node$i";
2793 }
67fb9de6
DM
2794
2795 die "total memory for NUMA nodes must be equal to vm memory\n"
2796 if $numa_totalmemory && $numa_totalmemory != $memory;
2ed5d572
AD
2797
2798 #if no custom tology, we split memory and cores across numa nodes
2799 if(!$numa_totalmemory) {
2800
67fb9de6 2801 my $numa_memory = ($memory / $sockets) . "M";
2ed5d572
AD
2802
2803 for (my $i = 0; $i < $sockets; $i++) {
2804
2805 my $cpustart = ($cores * $i);
2806 my $cpuend = ($cpustart + $cores - 1) if $cores && $cores > 1;
2807 my $cpus = $cpustart;
2808 $cpus .= "-$cpuend" if $cpuend;
2809
2810 push @$cmd, '-object', "memory-backend-ram,size=$numa_memory,id=ram-node$i";
2811 push @$cmd, '-numa', "node,nodeid=$i,cpus=$cpus,memdev=ram-node$i";
2812 }
2813 }
8a010eae
AD
2814 }
2815
1e3baf05
DM
2816 push @$cmd, '-S' if $conf->{freeze};
2817
2818 # set keyboard layout
2819 my $kb = $conf->{keyboard} || $defaults->{keyboard};
2820 push @$cmd, '-k', $kb if $kb;
2821
2822 # enable sound
2823 #my $soundhw = $conf->{soundhw} || $defaults->{soundhw};
2824 #push @$cmd, '-soundhw', 'es1370';
2825 #push @$cmd, '-soundhw', $soundhw if $soundhw;
ab6a046f 2826
bc84dcca 2827 if($conf->{agent}) {
7a6c2150 2828 my $qgasocket = qmp_socket($vmid, 1);
ab6a046f
AD
2829 my $pciaddr = print_pci_addr("qga0", $bridges);
2830 push @$devices, '-chardev', "socket,path=$qgasocket,server,nowait,id=qga0";
2831 push @$devices, '-device', "virtio-serial,id=qga0$pciaddr";
2832 push @$devices, '-device', 'virtserialport,chardev=qga0,name=org.qemu.guest_agent.0';
2833 }
2834
1d794448 2835 my $spice_port;
2fa3151e 2836
590e698c
DM
2837 if ($qxlnum) {
2838 if ($qxlnum > 1) {
2839 if ($conf->{ostype} && $conf->{ostype} =~ m/^w/){
2840 for(my $i = 1; $i < $qxlnum; $i++){
2841 my $pciaddr = print_pci_addr("vga$i", $bridges);
2842 push @$cmd, '-device', "qxl,id=vga$i,ram_size=67108864,vram_size=33554432$pciaddr";
2843 }
2844 } else {
2845 # assume other OS works like Linux
2846 push @$cmd, '-global', 'qxl-vga.ram_size=134217728';
2847 push @$cmd, '-global', 'qxl-vga.vram_size=67108864';
2fa3151e
AD
2848 }
2849 }
2850
1011b570 2851 my $pciaddr = print_pci_addr("spice", $bridges);
95a4b4a9 2852
cd339d1f 2853 $spice_port = PVE::Tools::next_spice_port();
943340a6 2854
d2da6d9b 2855 push @$devices, '-spice', "tls-port=${spice_port},addr=127.0.0.1,tls-ciphers=DES-CBC3-SHA,seamless-migration=on";
1011b570 2856
d2da6d9b
AD
2857 push @$devices, '-device', "virtio-serial,id=spice$pciaddr";
2858 push @$devices, '-chardev', "spicevmc,id=vdagent,name=vdagent";
2859 push @$devices, '-device', "virtserialport,chardev=vdagent,name=com.redhat.spice.0";
1011b570
DM
2860 }
2861
8d9ae0d2
DM
2862 # enable balloon by default, unless explicitly disabled
2863 if (!defined($conf->{balloon}) || $conf->{balloon}) {
2864 $pciaddr = print_pci_addr("balloon0", $bridges);
2865 push @$devices, '-device', "virtio-balloon-pci,id=balloon0$pciaddr";
2866 }
1e3baf05 2867
0ea9541d
DM
2868 if ($conf->{watchdog}) {
2869 my $wdopts = parse_watchdog($conf->{watchdog});
5bdcf937 2870 $pciaddr = print_pci_addr("watchdog", $bridges);
0a40e8ea 2871 my $watchdog = $wdopts->{model} || 'i6300esb';
5bdcf937
AD
2872 push @$devices, '-device', "$watchdog$pciaddr";
2873 push @$devices, '-watchdog-action', $wdopts->{action} if $wdopts->{action};
0ea9541d
DM
2874 }
2875
1e3baf05 2876 my $vollist = [];
941e0c42 2877 my $scsicontroller = {};
26ee04b6 2878 my $ahcicontroller = {};
cdd20088 2879 my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : $defaults->{scsihw};
1e3baf05 2880
5881b913
DM
2881 # Add iscsi initiator name if available
2882 if (my $initiator = get_initiator_name()) {
2883 push @$devices, '-iscsi', "initiator-name=$initiator";
2884 }
2885
1e3baf05
DM
2886 foreach_drive($conf, sub {
2887 my ($ds, $drive) = @_;
2888
ff1a2432 2889 if (PVE::Storage::parse_volume_id($drive->{file}, 1)) {
1e3baf05 2890 push @$vollist, $drive->{file};
ff1a2432 2891 }
afdb31d5 2892
1e3baf05 2893 $use_virtio = 1 if $ds =~ m/^virtio/;
3b408e82
DM
2894
2895 if (drive_is_cdrom ($drive)) {
2896 if ($bootindex_hash->{d}) {
2897 $drive->{bootindex} = $bootindex_hash->{d};
2898 $bootindex_hash->{d} += 1;
2899 }
2900 } else {
2901 if ($bootindex_hash->{c}) {
2902 $drive->{bootindex} = $bootindex_hash->{c} if $conf->{bootdisk} && ($conf->{bootdisk} eq $ds);
2903 $bootindex_hash->{c} += 1;
2904 }
2905 }
2906
941e0c42 2907 if ($drive->{interface} eq 'scsi') {
cdd20088 2908
5b952ff5 2909 my $maxdev = ($scsihw !~ m/^lsi/) ? 256 : 7;
cdd20088 2910 my $controller = int($drive->{index} / $maxdev);
5bdcf937
AD
2911 $pciaddr = print_pci_addr("scsihw$controller", $bridges);
2912 push @$devices, '-device', "$scsihw,id=scsihw$controller$pciaddr" if !$scsicontroller->{$controller};
cdd20088 2913 $scsicontroller->{$controller}=1;
941e0c42 2914 }
3b408e82 2915
26ee04b6
DA
2916 if ($drive->{interface} eq 'sata') {
2917 my $controller = int($drive->{index} / $MAX_SATA_DISKS);
5bdcf937
AD
2918 $pciaddr = print_pci_addr("ahci$controller", $bridges);
2919 push @$devices, '-device', "ahci,id=ahci$controller,multifunction=on$pciaddr" if !$ahcicontroller->{$controller};
26ee04b6
DA
2920 $ahcicontroller->{$controller}=1;
2921 }
46f58b5f 2922
15b21acc
MR
2923 my $drive_cmd = print_drive_full($storecfg, $vmid, $drive);
2924 push @$devices, '-drive',$drive_cmd;
46f58b5f 2925 push @$devices, '-device', print_drivedevice_full($storecfg, $conf, $vmid, $drive, $bridges);
1e3baf05
DM
2926 });
2927
cc4d6182 2928 for (my $i = 0; $i < $MAX_NETS; $i++) {
5f0c4c32 2929 next if !$conf->{"net$i"};
cc4d6182
DA
2930 my $d = parse_net($conf->{"net$i"});
2931 next if !$d;
1e3baf05 2932
cc4d6182 2933 $use_virtio = 1 if $d->{model} eq 'virtio';
1e3baf05 2934
cc4d6182
DA
2935 if ($bootindex_hash->{n}) {
2936 $d->{bootindex} = $bootindex_hash->{n};
2937 $bootindex_hash->{n} += 1;
2938 }
1e3baf05 2939
cc4d6182 2940 my $netdevfull = print_netdev_full($vmid,$conf,$d,"net$i");
5bdcf937
AD
2941 push @$devices, '-netdev', $netdevfull;
2942
2943 my $netdevicefull = print_netdevice_full($vmid,$conf,$d,"net$i",$bridges);
2944 push @$devices, '-device', $netdevicefull;
2945 }
1e3baf05 2946
db656e5f
DM
2947 if (!$q35) {
2948 # add pci bridges
f8e83f05
AD
2949 while (my ($k, $v) = each %$bridges) {
2950 $pciaddr = print_pci_addr("pci.$k");
2951 unshift @$devices, '-device', "pci-bridge,id=pci.$k,chassis_nr=$k$pciaddr" if $k > 0;
2952 }
19672434
DM
2953 }
2954
1e3baf05
DM
2955 # hack: virtio with fairsched is unreliable, so we do not use fairsched
2956 # when the VM uses virtio devices.
19672434
DM
2957 if (!$use_virtio && $have_ovz) {
2958
6b64503e 2959 my $cpuunits = defined($conf->{cpuunits}) ?
1e3baf05
DM
2960 $conf->{cpuunits} : $defaults->{cpuunits};
2961
2962 push @$cmd, '-cpuunits', $cpuunits if $cpuunits;
2963
2964 # fixme: cpulimit is currently ignored
2965 #push @$cmd, '-cpulimit', $conf->{cpulimit} if $conf->{cpulimit};
2966 }
2967
2968 # add custom args
2969 if ($conf->{args}) {
3ada46c9 2970 my $aa = PVE::Tools::split_args($conf->{args});
1e3baf05
DM
2971 push @$cmd, @$aa;
2972 }
2973
5bdcf937 2974 push @$cmd, @$devices;
be190583 2975 push @$cmd, '-rtc', join(',', @$rtcFlags)
8c559505 2976 if scalar(@$rtcFlags);
be190583 2977 push @$cmd, '-machine', join(',', @$machineFlags)
8c559505
DM
2978 if scalar(@$machineFlags);
2979 push @$cmd, '-global', join(',', @$globalFlags)
2980 if scalar(@$globalFlags);
2981
1d794448 2982 return wantarray ? ($cmd, $vollist, $spice_port) : $cmd;
1e3baf05 2983}
19672434 2984
1e3baf05
DM
# Return the path of the VNC socket file of VM $vmid, i.e.
# "$var_run_tmpdir/<vmid>.vnc".
sub vnc_socket {
    my ($vmid) = @_;
    return "${var_run_tmpdir}/$vmid.vnc";
}
2989
# Ask the running VM (monitor command 'query-spice') for its SPICE port.
#
# Returns the 'tls-port' entry of the reply if it is set, otherwise the
# 'port' entry. Dies with "no spice port\n" when neither is set.
sub spice_port {
    my ($vmid) = @_;

    my $res = vm_mon_cmd($vmid, 'query-spice');

    return $res->{'tls-port'} || $res->{'port'} || die "no spice port\n";
}
2997
# Return the path of a monitor socket of VM $vmid.
#
# With a true $qga the file extension is 'qga', otherwise 'qmp'.
sub qmp_socket {
    my ($vmid, $qga) = @_;
    my $sockettype = $qga ? 'qga' : 'qmp';
    return "${var_run_tmpdir}/$vmid.$sockettype";
}
3003
1e3baf05
DM
# Return the path of the pid file of VM $vmid, i.e.
# "$var_run_tmpdir/<vmid>.pid".
sub pidfile_name {
    my ($vmid) = @_;
    return "${var_run_tmpdir}/$vmid.pid";
}
3008
86fdcfb2
DA
# Build the set of device ids currently known to the running VM $vmid.
#
# Returns a hash reference { <id> => 1, ... } containing
#  - every 'qdev_id' reported by the 'query-pci' monitor command, and
#  - for every 'query-block' entry whose device name is "drive-<id>",
#    the <id> part.
sub vm_devices_list {
    my ($vmid) = @_;

    my $res = vm_mon_cmd($vmid, 'query-pci');

    my $devices = {};
    foreach my $pcibus (@$res) {
        foreach my $device (@{$pcibus->{devices}}) {
            # entries without a qdev id cannot be addressed by us
            next if !$device->{'qdev_id'};
            $devices->{$device->{'qdev_id'}} = 1;
        }
    }

    my $resblock = vm_mon_cmd($vmid, 'query-block');
    foreach my $block (@$resblock) {
        # skip entries without a device name instead of matching on undef
        next if !defined($block->{device});
        if ($block->{device} =~ m/^drive-(\S+)/) {
            $devices->{$1} = 1;
        }
    }

    return $devices;
}
3031
# Hot-plug the device $deviceid into VM $vmid.
#
# Parameters:
#   $storecfg - storage configuration, passed on to the drive helpers
#   $conf     - VM configuration hash
#   $vmid     - VM id
#   $deviceid - id of the device to add: 'tablet', 'virtio<N>',
#               'scsihw<N>', 'scsi<N>', 'net<N>' or 'pci.<N>'
#   $device   - parsed drive/net description (not needed for
#               'tablet', 'scsihw<N>' and 'pci.<N>')
#
# Returns 1 on success and also when there is nothing to do (VM not
# running, hotplug disabled in $conf, device already present). Returns
# undef when a helper reports failure. Exceptions raised by monitor
# commands propagate to the caller.
sub vm_deviceplug {
    my ($storecfg, $conf, $vmid, $deviceid, $device) = @_;

    return 1 if !check_running($vmid);

    my $q35 = machine_type_is_q35($conf);

    # the tablet is added regardless of the 'hotplug' setting
    if ($deviceid eq 'tablet') {
        qemu_deviceadd($vmid, print_tabletdevice_full($conf));
        return 1;
    }

    return 1 if !$conf->{hotplug};

    my $devices_list = vm_devices_list($vmid);
    return 1 if defined($devices_list->{$deviceid});

    qemu_bridgeadd($storecfg, $conf, $vmid, $deviceid); # add bridge if we need it for the device

    # qemu_deviceadd() never returns false - it either returns 1 or dies.
    # So run it inside eval, undo the already added backend when it dies
    # and re-raise the original error.
    my $deviceadd_or_rollback = sub {
        my ($devicefull, $rollback) = @_;

        eval { qemu_deviceadd($vmid, $devicefull); };
        if (my $err = $@) {
            eval { $rollback->(); };
            warn $@ if $@;
            die $err;
        }
    };

    if ($deviceid =~ m/^(virtio)(\d+)$/) {
        return undef if !qemu_driveadd($storecfg, $vmid, $device);
        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);
        $deviceadd_or_rollback->($devicefull, sub { qemu_drivedel($vmid, $deviceid); });
        if (!qemu_deviceaddverify($vmid, $deviceid)) {
            qemu_drivedel($vmid, $deviceid);
            return undef;
        }
    }

    if ($deviceid =~ m/^(scsihw)(\d+)$/) {
        my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : "lsi";
        my $pciaddr = print_pci_addr($deviceid);
        my $devicefull = "$scsihw,id=$deviceid$pciaddr";
        qemu_deviceadd($vmid, $devicefull);
        return undef if !qemu_deviceaddverify($vmid, $deviceid);
    }

    if ($deviceid =~ m/^(scsi)(\d+)$/) {
        return undef if !qemu_findorcreatescsihw($storecfg, $conf, $vmid, $device);
        return undef if !qemu_driveadd($storecfg, $vmid, $device);
        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);
        $deviceadd_or_rollback->($devicefull, sub { qemu_drivedel($vmid, $deviceid); });
    }

    if ($deviceid =~ m/^(net)(\d+)$/) {
        return undef if !qemu_netdevadd($vmid, $conf, $device, $deviceid);
        my $netdevicefull = print_netdevice_full($vmid, $conf, $device, $deviceid);
        $deviceadd_or_rollback->($netdevicefull, sub { qemu_netdevdel($vmid, $deviceid); });
        if (!qemu_deviceaddverify($vmid, $deviceid)) {
            qemu_netdevdel($vmid, $deviceid);
            return undef;
        }
    }

    # pci bridges are only added here for non-q35 machines
    if (!$q35 && $deviceid =~ m/^(pci\.)(\d+)$/) {
        my $bridgeid = $2;
        my $pciaddr = print_pci_addr($deviceid);
        my $devicefull = "pci-bridge,id=pci.$bridgeid,chassis_nr=$bridgeid$pciaddr";
        qemu_deviceadd($vmid, $devicefull);
        return undef if !qemu_deviceaddverify($vmid, $deviceid);
    }

    return 1;
}
3100
# Hot-unplug the device $deviceid from VM $vmid.
#
# Returns 1 on success and also when there is nothing to do (VM not
# running, hotplug disabled in $conf, device not present). Returns
# undef when a helper reports failure. Dies when $deviceid is the
# configured boot disk.
sub vm_deviceunplug {
    my ($vmid, $conf, $deviceid) = @_;

    return 1 if !check_running ($vmid);

    # the tablet is removed regardless of the 'hotplug' setting
    if ($deviceid eq 'tablet') {
        qemu_devicedel($vmid, $deviceid);
        return 1;
    }

    return 1 if !$conf->{hotplug};

    my $devices_list = vm_devices_list($vmid);
    return 1 if !defined($devices_list->{$deviceid});

    die "can't unplug bootdisk" if $conf->{bootdisk} && $conf->{bootdisk} eq $deviceid;

    if ($deviceid =~ m/^(virtio)(\d+)$/) {
        qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_devicedelverify($vmid, $deviceid);
        return undef if !qemu_drivedel($vmid, $deviceid);
    }

    # SCSI controllers are plugged with the id "scsihw<N>" (see
    # vm_deviceplug); the "lsi<N>" form is still accepted as well.
    if ($deviceid =~ m/^(lsi|scsihw)(\d+)$/) {
        return undef if !qemu_devicedel($vmid, $deviceid);
    }

    if ($deviceid =~ m/^(scsi)(\d+)$/) {
        return undef if !qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_drivedel($vmid, $deviceid);
    }

    if ($deviceid =~ m/^(net)(\d+)$/) {
        qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_devicedelverify($vmid, $deviceid);
        return undef if !qemu_netdevdel($vmid, $deviceid);
    }

    return 1;
}
3141
# Send a 'device_add' monitor command to VM $vmid.
#
# $devicefull is a device description of the form
# "<driver>,key=value,key=value,...". It is turned into the argument
# hash { driver => <driver>, key => value, ... }.
#
# Always returns 1; errors from vm_mon_cmd propagate as exceptions.
sub qemu_deviceadd {
    my ($vmid, $devicefull) = @_;

    $devicefull = "driver=".$devicefull;

    # Split into comma separated options first and then each option on
    # its first '=' only, so that a value containing '=' stays intact.
    my %options;
    foreach my $opt (split(/,/, $devicefull)) {
        next if $opt eq '';
        my ($key, $value) = split(/=/, $opt, 2);
        $options{$key} = $value;
    }

    vm_mon_cmd($vmid, "device_add" , %options);
    return 1;
}
afdb31d5 3151
5e5dcb73
DA
# Send a 'device_del' monitor command for device $deviceid to VM $vmid.
#
# Always returns 1; errors from vm_mon_cmd propagate as exceptions.
sub qemu_devicedel {
    my ($vmid, $deviceid) = @_;

    vm_mon_cmd($vmid, "device_del", id => $deviceid);
    return 1;
}
3157
# Add the drive described by $device to the running VM $vmid using the
# human monitor command "drive_add auto <drive>".
#
# Returns 1 when the monitor reply contains "OK"; otherwise logs the
# reply to syslog and returns undef.
sub qemu_driveadd {
    my ($storecfg, $vmid, $device) = @_;

    my $drive = print_drive_full($storecfg, $vmid, $device);
    my $ret = vm_human_monitor_command($vmid, "drive_add auto $drive");
    $ret = '' if !defined($ret); # treat a missing reply like an empty one

    # If the command succeeds qemu prints: "OK"
    if ($ret !~ m/OK/s) {
        syslog("err", "adding drive failed: $ret");
        return undef;
    }
    return 1;
}
afdb31d5 3170
5e5dcb73
DA
# Remove the drive "drive-<deviceid>" from the running VM $vmid using
# the human monitor command "drive_del".
#
# Returns 1 when the monitor reply is empty or reports that the device
# was not found; otherwise logs the reply to syslog and returns undef.
sub qemu_drivedel {
    my ($vmid, $deviceid) = @_;

    my $ret = vm_human_monitor_command($vmid, "drive_del drive-$deviceid");
    $ret = '' if !defined($ret); # treat a missing reply like an empty one
    $ret =~ s/^\s+//;

    # NB: device not found errors mean the drive was auto-deleted and we ignore the error
    return 1 if $ret =~ m/Device \'.*?\' not found/s;

    if ($ret ne "") {
        syslog("err", "deleting drive $deviceid failed : $ret");
        return undef;
    }
    return 1;
}
f19d1c47 3185
5e5dcb73
DA
# Wait until device $deviceid shows up in vm_devices_list($vmid).
#
# The list is checked up to six times, one second apart. Returns 1 as
# soon as the device is listed; otherwise logs an error to syslog and
# returns undef.
sub qemu_deviceaddverify {
    my ($vmid, $deviceid) = @_;

    my $max_tries = 6;
    for (my $try = 1; $try <= $max_tries; $try++) {
        my $devices_list = vm_devices_list($vmid);
        return 1 if defined($devices_list->{$deviceid});
        sleep 1 if $try < $max_tries; # no point in waiting after the last check
    }

    syslog("err", "error on hotplug device $deviceid");
    return undef;
}
afdb31d5 3197
5e5dcb73
DA
3198
# Wait until device $deviceid is gone from vm_devices_list($vmid).
#
# The list is checked up to six times, one second apart. Returns 1 as
# soon as the device is no longer listed; otherwise logs an error to
# syslog and returns undef.
sub qemu_devicedelverify {
    my ($vmid, $deviceid) = @_;

    # need to verify the device is correctly removed, as device_del is
    # async and an empty return is not reliable
    my $max_tries = 6;
    for (my $try = 1; $try <= $max_tries; $try++) {
        my $devices_list = vm_devices_list($vmid);
        return 1 if !defined($devices_list->{$deviceid});
        sleep 1 if $try < $max_tries; # no point in waiting after the last check
    }

    syslog("err", "error on hot-unplugging device $deviceid");
    return undef;
}
3211
# Make sure the SCSI controller needed by drive $device exists in the
# running VM $vmid, hot-plugging it when it is missing.
#
# The controller number is int(index / maxdev), where maxdev is 256
# when $conf->{scsihw} is set and does not start with "lsi", and 7
# otherwise. The controller id is "scsihw<number>".
#
# Returns 1 on success, undef when plugging the controller failed.
sub qemu_findorcreatescsihw {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $maxdev = ($conf->{scsihw} && ($conf->{scsihw} !~ m/^lsi/)) ? 256 : 7;
    my $controller = int($device->{index} / $maxdev);
    my $scsihwid = "scsihw$controller";
    my $devices_list = vm_devices_list($vmid);

    if (!defined($devices_list->{$scsihwid})) {
        return undef if !vm_deviceplug($storecfg, $conf, $vmid, $scsihwid);
    }
    return 1;
}
3225
40f28a9f
AD
# Hot-plug the PCI bridge that device $device sits on, if it needs one
# and the bridge is not yet present in the running VM $vmid.
#
# print_pci_addr() is called only for its side effect of recording the
# required bridge id(s) as keys of %$bridges.
#
# Returns 1 when the bridge exists or was plugged, undef when plugging
# failed, and nothing (empty list / undef) when no bridge with an id
# >= 1 is required.
sub qemu_bridgeadd {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $bridges = {};
    my $bridgeid = undef;
    print_pci_addr($device, $bridges);

    # keep the last key returned by the hash iteration
    foreach my $k (keys %$bridges) {
        $bridgeid = $k;
    }
    return if !$bridgeid || $bridgeid < 1;

    my $bridge = "pci.$bridgeid";
    my $devices_list = vm_devices_list($vmid);

    if (!defined($devices_list->{$bridge})) {
        return undef if !vm_deviceplug($storecfg, $conf, $vmid, $bridge);
    }
    return 1;
}
3245
2630d2a9
DA
# Send a 'netdev_add' monitor command to VM $vmid.
#
# The "key=value,key=value,..." string produced by print_netdev_full()
# is turned into the argument hash of the command.
#
# Always returns 1; errors from vm_mon_cmd propagate as exceptions.
sub qemu_netdevadd {
    my ($vmid, $conf, $device, $deviceid) = @_;

    my $netdev = print_netdev_full($vmid, $conf, $device, $deviceid);

    # Split into comma separated options first and then each option on
    # its first '=' only, so that a value containing '=' stays intact.
    my %options;
    foreach my $opt (split(/,/, $netdev)) {
        next if $opt eq '';
        my ($key, $value) = split(/=/, $opt, 2);
        $options{$key} = $value;
    }

    vm_mon_cmd($vmid, "netdev_add", %options);
    return 1;
}
3255
# Send a 'netdev_del' monitor command for $deviceid to VM $vmid.
#
# Always returns 1; errors from vm_mon_cmd propagate as exceptions.
sub qemu_netdevdel {
    my ($vmid, $deviceid) = @_;

    vm_mon_cmd($vmid, "netdev_del", id => $deviceid);
    return 1;
}
3262
838776ab
AD
# Hot-add CPUs to VM $vmid until it has $cores cores.
#
# Dies when $cores is not set, exceeds $conf->{maxcpus}, or when
# $conf->{cores} or $conf->{maxcpus} are missing. Raises a parameter
# exception when $cores is lower than the configured core count or
# when the number of running CPUs differs from the configuration.
# Returns without doing anything when the VM is not running.
sub qemu_cpu_hotplug {
    my ($vmid, $conf, $cores) = @_;

    die "new cores config is not defined" if !$cores;
    die "you can't add more cores than maxcpus"
        if $conf->{maxcpus} && ($cores > $conf->{maxcpus});
    return if !check_running($vmid);

    # plain assignment: "my $x = ... if COND" has undefined behaviour
    my $currentcores = $conf->{cores};
    die "current cores is not defined" if !$currentcores;
    die "maxcpus is not defined" if !$conf->{maxcpus};
    raise_param_exc({ 'cores' => "online cpu unplug is not yet possible" })
        if ($cores < $currentcores);

    my $currentrunningcores = vm_mon_cmd($vmid, "query-cpus");
    raise_param_exc({ 'cores' => "cores number if running vm is different than configuration" })
        if scalar (@{$currentrunningcores}) != $currentcores;

    # cpu ids are zero based, so the first new cpu has id $currentcores
    for (my $i = $currentcores; $i < $cores; $i++) {
        vm_mon_cmd($vmid, "cpu-add", id => int($i));
    }
}
3285
affd2f88
AD
# Apply I/O throttle limits to block device $deviceid of VM $vmid via
# the 'block_set_io_throttle' monitor command.
#
# All six limits are sent as integers; an undefined or empty limit is
# sent as 0. Does nothing when the VM is not running.
sub qemu_block_set_io_throttle {
    my ($vmid, $deviceid, $bps, $bps_rd, $bps_wr, $iops, $iops_rd, $iops_wr) = @_;

    return if !check_running($vmid);

    vm_mon_cmd($vmid, "block_set_io_throttle",
        device => $deviceid,
        bps => int($bps || 0),
        bps_rd => int($bps_rd || 0),
        bps_wr => int($bps_wr || 0),
        iops => int($iops || 0),
        iops_rd => int($iops_rd || 0),
        iops_wr => int($iops_wr || 0));
}
3294
# old code, only used to shutdown old VM after update
#
# Read from $fh until the monitor prompt "(qemu) " terminates the data
# read so far, or until end of file.
#
# Returns everything read before the prompt (all data on end of file).
# Dies with "monitor read timeout\n" when $fh does not become readable
# within $timeout seconds, and with the system error message when
# sysread fails.
sub __read_avail {
    my ($fh, $timeout) = @_;

    my $sel = IO::Select->new();
    $sel->add($fh);

    my $res = '';
    my $buf;

    my @ready;
    while (scalar (@ready = $sel->can_read($timeout))) {
        my $count;
        if ($count = $fh->sysread($buf, 8192)) {
            $res .= $buf;
            # Match on the accumulated data, not on the last chunk only:
            # the prompt may arrive split across two reads.
            if ($res =~ /^(.*)\(qemu\) $/s) {
                $res = $1;
                last;
            }
        } else {
            if (!defined($count)) {
                die "$!\n";
            }
            last; # end of file
        }
    }

    die "monitor read timeout\n" if !scalar(@ready);

    return $res;
}
3327
# old code, only used to shutdown old VM after update
#
# Send $cmdstr to the human monitor socket "$var_run_tmpdir/<vmid>.mon"
# of VM $vmid and return the reply text.
#
# The echoed command line is removed from the reply unless the reply
# starts with "unknown command". For the commands 'q' and 'quit' no
# reply is read and undef is returned.
#
# Any error is logged to syslog and re-raised.
sub vm_monitor_command {
    my ($vmid, $cmdstr, $nocheck) = @_;

    my $res;

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);

        my $sname = "${var_run_tmpdir}/$vmid.mon";

        my $sock = IO::Socket::UNIX->new( Peer => $sname ) ||
            die "unable to connect to VM $vmid socket - $!\n";

        my $timeout = 3;

        # hack: migrate sometime blocks the monitor (when migrate_downtime
        # is set)
        if ($cmdstr =~ m/^(info\s+migrate|migrate\s)/) {
            $timeout = 60*60; # 1 hour
        }

        # read banner;
        my $data = __read_avail($sock, $timeout);

        if ($data !~ m/^QEMU\s+(\S+)\s+monitor\s/) {
            die "got unexpected qemu monitor banner\n";
        }

        my $sel = IO::Select->new();
        $sel->add($sock);

        if (!scalar(my @ready = $sel->can_write($timeout))) {
            die "monitor write error - timeout";
        }

        my $fullcmd = "$cmdstr\r";

        # syslog('info', "VM $vmid monitor command: $cmdstr");

        my $written;
        if (!($written = $sock->syswrite($fullcmd)) || ($written != length($fullcmd))) {
            die "monitor write error - $!";
        }

        # this only leaves the eval block; $res stays undefined
        return if ($cmdstr eq 'q') || ($cmdstr eq 'quit');

        $timeout = 20;

        if ($cmdstr =~ m/^(info\s+migrate|migrate\s)/) {
            $timeout = 60*60; # 1 hour
        } elsif ($cmdstr =~ m/^(eject|change)/) {
            $timeout = 60; # note: cdrom mount command is slow
        }
        if ($res = __read_avail($sock, $timeout)) {

            my @lines = split("\r?\n", $res);

            # skip echo
            shift @lines if @lines && $lines[0] !~ m/^unknown command/;

            $res = join("\n", @lines);
            $res .= "\n";
        }
    };

    my $err = $@;

    if ($err) {
        syslog("err", "VM $vmid monitor command failed - $err");
        die $err;
    }

    return $res;
}
3402
c1175c92
AD
# Resize volume $volid to $size.
#
# The storage layer is asked first (PVE::Storage::volume_resize); when
# it returns false nothing else happens. If the VM is running, the
# 'block_resize' monitor command is then sent for $deviceid.
sub qemu_block_resize {
    my ($vmid, $deviceid, $storecfg, $volid, $size) = @_;

    my $running = check_running($vmid);

    return if !PVE::Storage::volume_resize($storecfg, $volid, $size, $running);

    return if !$running;

    vm_mon_cmd($vmid, "block_resize", device => $deviceid, size => int($size));
}
3415
1ab0057c
AD
# Create snapshot $snap of volume $volid.
#
# The storage layer is asked first (PVE::Storage::volume_snapshot); when
# it returns false nothing else happens. If the VM is running, the
# 'snapshot-drive' monitor command is then sent for $deviceid.
sub qemu_volume_snapshot {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $running = check_running($vmid);

    return if !PVE::Storage::volume_snapshot($storecfg, $volid, $snap, $running);

    return if !$running;

    vm_mon_cmd($vmid, "snapshot-drive", device => $deviceid, name => $snap);
}
3428
fc46aff9
AD
# Delete snapshot $snap of volume $volid.
#
# The storage layer is asked first
# (PVE::Storage::volume_snapshot_delete); when it returns false nothing
# else happens. If the VM is running, the 'delete-drive-snapshot'
# monitor command is then sent for $deviceid.
sub qemu_volume_snapshot_delete {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $running = check_running($vmid);

    return if !PVE::Storage::volume_snapshot_delete($storecfg, $volid, $snap, $running);

    return if !$running;

    vm_mon_cmd($vmid, "delete-drive-snapshot", device => $deviceid, name => $snap);
}
3440
264e519f
DM
# Set the migration capabilities of VM $vmid.
#
# Every capability reported by 'query-migrate-capabilities' is sent
# back with 'migrate-set-capabilities': switched on when it is marked
# with 1 in %$enabled_cap below, switched off otherwise (including
# capabilities not listed there).
sub set_migration_caps {
    my ($vmid) = @_;

    my $cap_ref = [];

    my $enabled_cap = {
        "auto-converge" => 1,
        "xbzrle" => 0,
        "x-rdma-pin-all" => 0,
        "zero-blocks" => 0,
    };

    my $supported_capabilities = vm_mon_cmd_nocheck($vmid, "query-migrate-capabilities");

    for my $supported_capability (@$supported_capabilities) {
        push @$cap_ref, {
            capability => $supported_capability->{capability},
            state => $enabled_cap->{$supported_capability->{capability}} ? JSON::true : JSON::false,
        };
    }

    vm_mon_cmd_nocheck($vmid, "migrate-set-capabilities", capabilities => $cap_ref);
}
a89fded1 3464
# Start VM $vmid while holding the config lock.
#
# Parameters:
#   $storecfg     - storage configuration
#   $vmid         - VM id
#   $statefile    - 'tcp' to wait for an incoming migration, any other
#                   true value is passed to '-loadstate'
#   $skiplock     - skip the config lock check
#   $migratedfrom - passed to load_config/check_running; also exported
#                   as environment variable PVE_MIGRATED_FROM
#   $paused       - start with '-S' (only looked at without $statefile)
#   $forcemachine - passed on to config_to_command
#   $spice_ticket - SPICE password to set when started for a migration
#
# Dies when the VM is a template, is locked (unless $skiplock), is
# already running, when a host PCI device cannot be prepared, or when
# the start command fails.
sub vm_start {
    my ($storecfg, $vmid, $statefile, $skiplock, $migratedfrom, $paused, $forcemachine, $spice_ticket) = @_;

    lock_config($vmid, sub {
        my $conf = load_config($vmid, $migratedfrom);

        die "you can't start a vm if it's a template\n" if is_template($conf);

        check_lock($conf) if !$skiplock;

        die "VM $vmid already running\n" if check_running($vmid, undef, $migratedfrom);

        my $defaults = load_defaults();

        # set environment variable useful inside network script
        $ENV{PVE_MIGRATED_FROM} = $migratedfrom if $migratedfrom;

        my ($cmd, $vollist, $spice_port) = config_to_command($storecfg, $vmid, $conf, $defaults, $forcemachine);

        my $migrate_port = 0;
        my $migrate_uri;
        if ($statefile) {
            if ($statefile eq 'tcp') {
                # listen on localhost unless unsecure migration is
                # enabled in datacenter.cfg
                my $localip = "localhost";
                my $datacenterconf = PVE::Cluster::cfs_read_file('datacenter.cfg');
                if ($datacenterconf->{migration_unsecure}) {
                    my $nodename = PVE::INotify::nodename();
                    $localip = PVE::Cluster::remote_node_ip($nodename, 1);
                }
                $migrate_port = PVE::Tools::next_migrate_port();
                $migrate_uri = "tcp:${localip}:${migrate_port}";
                push @$cmd, '-incoming', $migrate_uri;
                push @$cmd, '-S';
            } else {
                push @$cmd, '-loadstate', $statefile;
            }
        } elsif ($paused) {
            push @$cmd, '-S';
        }

        # host pci devices
        for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
            my $d = parse_hostpci($conf->{"hostpci$i"});
            next if !$d;
            my $pcidevices = $d->{pciid};
            foreach my $pcidevice (@$pcidevices) {
                my $pciid = $pcidevice->{id}.".".$pcidevice->{function};

                my $info = pci_device_info("0000:$pciid");
                die "IOMMU not present\n" if !check_iommu_support();
                die "no pci device info for device '$pciid'\n" if !$info;

                if ($d->{driver} && $d->{driver} eq "vfio") {
                    die "can't unbind/bind pci group to vfio '$pciid'\n" if !pci_dev_group_bind_to_vfio($pciid);
                } else {
                    die "can't unbind/bind to stub pci device '$pciid'\n" if !pci_dev_bind_to_stub($info);
                }

                die "can't reset pci device '$pciid'\n" if $info->{has_fl_reset} and !pci_dev_reset($info);
            }
        }

        PVE::Storage::activate_volumes($storecfg, $vollist);

        # no timeout when a state file / incoming migration is used
        eval { run_command($cmd, timeout => $statefile ? undef : 30,
                           umask => 0077); };
        my $err = $@;
        die "start failed: $err" if $err;

        print "migration listens on $migrate_uri\n" if $migrate_uri;

        # a VM restored from a state file is continued right away;
        # failures are only reported as warning
        if ($statefile && $statefile ne 'tcp') {
            eval { vm_mon_cmd_nocheck($vmid, "cont"); };
            warn $@ if $@;
        }

        if ($migratedfrom) {

            eval {
                PVE::QemuServer::set_migration_caps($vmid);
            };
            warn $@ if $@;

            if ($spice_port) {
                print "spice listens on port $spice_port\n";
                if ($spice_ticket) {
                    PVE::QemuServer::vm_mon_cmd_nocheck($vmid, "set_password", protocol => 'spice', password => $spice_ticket);
                    PVE::QemuServer::vm_mon_cmd_nocheck($vmid, "expire_password", protocol => 'spice', time => "+30");
                }
            }

        } else {

            # balloon is enabled by default, unless explicitly set to 0
            if (!$statefile && (!defined($conf->{balloon}) || $conf->{balloon})) {
                vm_mon_cmd_nocheck($vmid, "balloon", value => $conf->{balloon}*1024*1024)
                    if $conf->{balloon};
                vm_mon_cmd_nocheck($vmid, 'qom-set',
                                   path => "machine/peripheral/balloon0",
                                   property => "guest-stats-polling-interval",
                                   value => 2);
            }
        }
    });
}
3569
0eedc444
AD
# Run monitor command $execute with the named arguments %params on VM
# $vmid and return the result of vm_qmp_command().
sub vm_mon_cmd {
    my ($vmid, $execute, %params) = @_;

    my $cmd = { execute => $execute, arguments => \%params };
    vm_qmp_command($vmid, $cmd);
}
3576
# Same as vm_mon_cmd(), but calls vm_qmp_command() with the $nocheck
# flag set to 1.
sub vm_mon_cmd_nocheck {
    my ($vmid, $execute, %params) = @_;

    my $cmd = { execute => $execute, arguments => \%params };
    vm_qmp_command($vmid, $cmd, 1);
}
3583
# Execute the command $cmd ({ execute => ..., arguments => {...} }) on
# VM $vmid.
#
# An entry 'timeout' inside the arguments is removed from the command
# and used as timeout for the QMP client instead.
#
# If the QMP socket file exists, the command is sent with
# PVE::QMPClient and its result is returned. If only the old
# "<vmid>.mon" socket exists, commands without arguments are passed to
# vm_monitor_command() (its reply is not returned); commands with
# arguments are refused.
#
# Any error is logged to syslog and re-raised.
sub vm_qmp_command {
    my ($vmid, $cmd, $nocheck) = @_;

    my $res;

    my $timeout;
    if ($cmd->{arguments} && $cmd->{arguments}->{timeout}) {
        $timeout = $cmd->{arguments}->{timeout};
        delete $cmd->{arguments}->{timeout};
    }

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);
        my $sname = qmp_socket($vmid);
        if (-e $sname) { # test if VM is reasonably new and supports qmp/qga
            my $qmpclient = PVE::QMPClient->new();

            $res = $qmpclient->cmd($vmid, $cmd, $timeout);
        } elsif (-e "${var_run_tmpdir}/$vmid.mon") {
            # 'arguments' may be missing altogether; dereferencing undef
            # would die under strict refs
            die "can't execute complex command on old monitor - stop/start your vm to fix the problem\n"
                if $cmd->{arguments} && scalar(%{$cmd->{arguments}});
            vm_monitor_command($vmid, $cmd->{execute}, $nocheck);
        } else {
            die "unable to open monitor socket\n";
        }
    };
    if (my $err = $@) {
        syslog("err", "VM $vmid qmp command failed - $err");
        die $err;
    }

    return $res;
}
3617
9df5cbcc
DM
# Run the human monitor command line $cmdline on VM $vmid by wrapping
# it into the QMP command 'human-monitor-command'. Returns the result
# of vm_qmp_command().
sub vm_human_monitor_command {
    my ($vmid, $cmdline) = @_;

    my $cmd = {
        execute => 'human-monitor-command',
        arguments => { 'command-line' => $cmdline},
    };

    return vm_qmp_command($vmid, $cmd);
}
3630
1e3baf05
DM
# Return the command line built by config_to_command() for VM $vmid as
# a single string, with the arguments joined by one space (no quoting
# is applied).
sub vm_commandline {
    my ($storecfg, $vmid) = @_;

    my $conf = load_config($vmid);

    my $defaults = load_defaults();

    # scalar context: config_to_command returns only the command array
    my $cmd = config_to_command($storecfg, $vmid, $conf, $defaults);

    return join(' ', @$cmd);
}
3642
# Reset VM $vmid (monitor command 'system_reset') while holding the
# config lock. The config lock setting is checked unless $skiplock is
# set.
sub vm_reset {
    my ($vmid, $skiplock) = @_;

    lock_config($vmid, sub {

        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        vm_mon_cmd($vmid, "system_reset");
    });
}
3655
# Return an array reference with the volume ids used in $conf.
#
# Volumes starting with '/' (absolute paths) and ids for which
# PVE::Storage::parse_volume_id() returns no storage id are left out.
sub get_vm_volumes {
    my ($conf) = @_;

    my $vollist = [];
    foreach_volid($conf, sub {
        my ($volid) = @_;

        return if $volid =~ m|^/|;

        # second argument 1: do not die on unparsable ids
        my ($sid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        push @$vollist, $volid;
    });

    return $vollist;
}
3673
# Clean up after VM $vmid was stopped: remove the fairsched group,
# deactivate the volumes of $conf (unless $keepActive is set) and
# remove the mon/qmp/pid/vnc/qga files below /var/run/qemu-server.
#
# Errors are only reported as warning.
sub vm_stop_cleanup {
    my ($storecfg, $vmid, $conf, $keepActive) = @_;

    eval {
        fairsched_rmnod($vmid); # try to destroy group

        if (!$keepActive) {
            my $vollist = get_vm_volumes($conf);
            PVE::Storage::deactivate_volumes($storecfg, $vollist);
        }

        foreach my $ext (qw(mon qmp pid vnc qga)) {
            unlink "/var/run/qemu-server/${vmid}.$ext";
        }
    };
    warn $@ if $@; # avoid errors - just warn
}
3691
# Stop or shut down VM $vmid.
#
# Note: use $nocheck to skip the tests whether the VM configuration
# file exists. We need that when migrating VMs to other nodes (files
# already moved).
# Note: we set $keepActive in vzdump stop mode - volumes need to stay active
#
# Parameters:
#   $timeout  - seconds to wait for the VM to stop; defaults to the
#               'down' value of the startup option (shutdown only),
#               else 60
#   $shutdown - request a guest shutdown/powerdown instead of 'quit'
#   $force    - send SIGTERM when the VM does not stop in time;
#               defaults to 1 when $shutdown is not set
#
# With $migratedfrom the process is simply sent SIGTERM and cleaned up,
# without taking the config lock.
sub vm_stop {
    my ($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive, $migratedfrom) = @_;

    $force = 1 if !defined($force) && !$shutdown;

    if ($migratedfrom){
        my $pid = check_running($vmid, $nocheck, $migratedfrom);
        kill 15, $pid if $pid;
        my $conf = load_config($vmid, $migratedfrom);
        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive);
        return;
    }

    lock_config($vmid, sub {

        my $pid = check_running($vmid, $nocheck);
        return if !$pid;

        # $conf stays undefined with $nocheck - no cleanup is done then
        my $conf;
        if (!$nocheck) {
            $conf = load_config($vmid);
            check_lock($conf) if !$skiplock;
            if (!defined($timeout) && $shutdown && $conf->{startup}) {
                my $opts = parse_startup($conf->{startup});
                $timeout = $opts->{down} if $opts->{down};
            }
        }

        $timeout = 60 if !defined($timeout);

        eval {
            if ($shutdown) {
                if (!$nocheck && $conf->{agent}) {
                    vm_qmp_command($vmid, { execute => "guest-shutdown" }, $nocheck);
                } else {
                    vm_qmp_command($vmid, { execute => "system_powerdown" }, $nocheck);
                }
            } else {
                vm_qmp_command($vmid, { execute => "quit" }, $nocheck);
            }
        };
        my $err = $@;

        if (!$err) {
            my $count = 0;
            while (($count < $timeout) && check_running($vmid, $nocheck)) {
                $count++;
                sleep 1;
            }

            if ($count >= $timeout) {
                if ($force) {
                    warn "VM still running - terminating now with SIGTERM\n";
                    kill 15, $pid;
                } else {
                    die "VM quit/powerdown failed - got timeout\n";
                }
            } else {
                vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
                return;
            }
        } else {
            if ($force) {
                warn "VM quit/powerdown failed - terminating now with SIGTERM\n";
                kill 15, $pid;
            } else {
                die "VM quit/powerdown failed\n";
            }
        }

        # wait again
        $timeout = 10;

        my $count = 0;
        while (($count < $timeout) && check_running($vmid, $nocheck)) {
            $count++;
            sleep 1;
        }

        if ($count >= $timeout) {
            warn "VM still running - terminating now with SIGKILL\n";
            kill 9, $pid;
            sleep 1;
        }

        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
    });
}
3783
# Suspend VM $vmid (monitor command 'stop') while holding the config
# lock. The config lock setting is checked unless $skiplock is set or
# the lock is 'backup'.
sub vm_suspend {
    my ($vmid, $skiplock) = @_;

    lock_config($vmid, sub {

        my $conf = load_config($vmid);

        check_lock($conf) if !($skiplock || ($conf->{lock} && $conf->{lock} eq 'backup'));

        vm_mon_cmd($vmid, "stop");
    });
}
3796
# Resume VM $vmid (monitor command 'cont') while holding the config
# lock. The config lock setting is checked unless $skiplock is set or
# the lock is 'backup'.
sub vm_resume {
    my ($vmid, $skiplock) = @_;

    lock_config($vmid, sub {

        my $conf = load_config($vmid);

        check_lock($conf) if !($skiplock || ($conf->{lock} && $conf->{lock} eq 'backup'));

        vm_mon_cmd($vmid, "cont");
    });
}
3809
5fdbe4f0
DM
# Send key $key to VM $vmid while holding the config lock.
#
# $skiplock is accepted but not used; the configuration is loaded, but
# its lock setting is not checked.
sub vm_sendkey {
    my ($vmid, $skiplock, $key) = @_;

    lock_config($vmid, sub {

        my $conf = load_config($vmid);

        # there is no qmp command, so we use the human monitor command
        vm_human_monitor_command($vmid, "sendkey $key");
    });
}
3821
# Destroy VM $vmid while holding the config lock.
#
# The config lock setting is checked unless $skiplock is set. Dies when
# the VM is still running.
sub vm_destroy {
    my ($storecfg, $vmid, $skiplock) = @_;

    lock_config($vmid, sub {

        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        if (!check_running($vmid)) {
            fairsched_rmnod($vmid); # try to destroy group
            destroy_vm($storecfg, $vmid);
        } else {
            die "VM $vmid is running - destroy failed\n";
        }
    });
}
3839
1e3baf05
DM
3840# pci helpers
3841
# Write $buf to the file $filename (opened with mode "w").
#
# Returns a true value on success. Returns undef when the file cannot
# be opened or closing it fails, and the false result of print when
# printing fails.
sub file_write {
    my ($filename, $buf) = @_;

    my $fh = IO::File->new($filename, "w");
    return undef if !$fh;

    my $res = print {$fh} $buf;

    # The data is buffered and only handed to the kernel when the handle
    # is flushed, so a rejected write shows up as a failing close.
    $res = undef if !$fh->close();

    return $res;
}
3854
# Collect information about the PCI device $name, given in the form
# "dddd:bb:ss.f" (lower case hex digits), from "$pcisysfs/devices".
#
# Returns a hash reference with the keys name, vendor, product (both
# without the leading "0x"), domain, bus, slot, func, irq and
# has_fl_reset (true when a 'reset' file exists for the device).
# Returns undef when $name is malformed or the irq, vendor or device
# file cannot be read or has unexpected content.
sub pci_device_info {
    my ($name) = @_;

    my $res;

    return undef if $name !~ m/^([a-f0-9]{4}):([a-f0-9]{2}):([a-f0-9]{2})\.([a-f0-9])$/;
    my ($domain, $bus, $slot, $func) = ($1, $2, $3, $4);

    my $irq = file_read_firstline("$pcisysfs/devices/$name/irq");
    return undef if !defined($irq) || $irq !~ m/^\d+$/;

    # the substitutions strip the "0x" prefix and fail when it is missing
    my $vendor = file_read_firstline("$pcisysfs/devices/$name/vendor");
    return undef if !defined($vendor) || $vendor !~ s/^0x//;

    my $product = file_read_firstline("$pcisysfs/devices/$name/device");
    return undef if !defined($product) || $product !~ s/^0x//;

    $res = {
        name => $name,
        vendor => $vendor,
        product => $product,
        domain => $domain,
        bus => $bus,
        slot => $slot,
        func => $func,
        irq => $irq,
        has_fl_reset => -f "$pcisysfs/devices/$name/reset" || 0,
    };

    return $res;
}
3886
# Trigger a reset of the PCI device described by $dev (a hash reference with
# at least a 'name' entry) by writing "1" to its sysfs 'reset' file.
#
# Returns whatever file_write() returns.
sub pci_dev_reset {
    my ($dev) = @_;

    return file_write("$pcisysfs/devices/$dev->{name}/reset", "1");
}
3896
# Bind the PCI device described by $dev (hash reference with name, vendor
# and product) to the pci-stub driver through sysfs.
#
# Returns 1 when the device is already bound, undef when one of the required
# sysfs writes fails, otherwise the result of the final "is it bound now"
# directory test.
sub pci_dev_bind_to_stub {
    my ($dev) = @_;

    my $name = $dev->{name};

    my $stubdir = "$pcisysfs/drivers/pci-stub";
    my $bound = "$stubdir/$name";
    return 1 if -d $bound;

    # register the vendor/product pair with pci-stub
    file_write("$stubdir/new_id", "$dev->{vendor} $dev->{product}")
        or return undef;

    # detach from the current driver; a failed write only counts as an error
    # when the unbind file actually exists
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    # bind explicitly unless the device is already bound by now
    return undef if !-d $bound && !file_write("$stubdir/bind", $name);

    return -d $bound;
}
3920
000fc0a2
SP
# Bind the PCI device described by $dev (hash reference with name, vendor
# and product) to the vfio-pci driver through sysfs.
#
# Runs modprobe for vfio-pci when the driver directory is missing and dies
# if it is still missing afterwards. Returns 1 when the device is already
# bound, undef when one of the required sysfs writes fails, otherwise the
# result of the final "is it bound now" directory test.
sub pci_dev_bind_to_vfio {
    my ($dev) = @_;

    my $name = $dev->{name};

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null") unless -d $vfio_basedir;
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    my $bound = "$vfio_basedir/$name";
    return 1 if -d $bound;

    # register the vendor/product pair with vfio-pci
    file_write("$vfio_basedir/new_id", "$dev->{vendor} $dev->{product}")
        or return undef;

    # detach from the current driver; a failed write only counts as an error
    # when the unbind file actually exists
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    # bind explicitly unless the device is already bound by now
    return undef if !-d $bound && !file_write("$vfio_basedir/bind", $name);

    return -d $bound;
}
3951
# Bind every device that shares an IOMMU group with PCI device $pciid
# ("bb:ss.f", domain 0000 is assumed) to the vfio-pci driver.
#
# Runs modprobe for vfio-pci when the driver directory is missing. Dies when
# the driver is unavailable, the iommu_group directory cannot be opened, a
# group member has an invalid name, its sysfs info cannot be read, or the
# bind fails. Returns 1 on success.
sub pci_dev_group_bind_to_vfio {
    my ($pciid) = @_;

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    if (!-d $vfio_basedir) {
        system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null");
    }
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    # get IOMMU group devices
    opendir(my $D, "$pcisysfs/devices/0000:$pciid/iommu_group/devices/") || die "Cannot open iommu_group: $!\n";
    my @devs = grep /^0000:/, readdir($D);
    closedir($D);

    foreach my $member (@devs) {
        $member =~ m/^([:\.\da-f]+)$/ or die "PCI ID $member not valid!\n";
        my $info = pci_device_info($1);

        # Without this check an undef $info would make pci_dev_bind_to_vfio
        # test the driver directory itself and report success without
        # binding anything.
        die "Cannot get PCI device info for $member\n" if !$info;

        pci_dev_bind_to_vfio($info) || die "Cannot bind $member to vfio\n";
    }

    return 1;
}
3975
# Return the ",bus=pci.<bus>,addr=0x<hex>" suffix for the well-known device
# id $id, or '' when $id has no fixed slot in the table below.
#
# When $bridges (a hash reference) is passed, the bus number used by $id is
# recorded in it as a key with value 1.
sub print_pci_addr {
    my ($id, $bridges) = @_;

    my $devices = {
        piix3 => { bus => 0, addr => 1 },
        #addr2 : first videocard
        balloon0 => { bus => 0, addr => 3 },
        watchdog => { bus => 0, addr => 4 },
        scsihw0 => { bus => 0, addr => 5 },
        scsihw1 => { bus => 0, addr => 6 },
        ahci0 => { bus => 0, addr => 7 },
        qga0 => { bus => 0, addr => 8 },
        spice => { bus => 0, addr => 9 },
        virtio0 => { bus => 0, addr => 10 },
        virtio1 => { bus => 0, addr => 11 },
        virtio2 => { bus => 0, addr => 12 },
        virtio3 => { bus => 0, addr => 13 },
        virtio4 => { bus => 0, addr => 14 },
        virtio5 => { bus => 0, addr => 15 },
        hostpci0 => { bus => 0, addr => 16 },
        hostpci1 => { bus => 0, addr => 17 },
        net0 => { bus => 0, addr => 18 },
        net1 => { bus => 0, addr => 19 },
        net2 => { bus => 0, addr => 20 },
        net3 => { bus => 0, addr => 21 },
        net4 => { bus => 0, addr => 22 },
        net5 => { bus => 0, addr => 23 },
        vga1 => { bus => 0, addr => 24 },
        vga2 => { bus => 0, addr => 25 },
        vga3 => { bus => 0, addr => 26 },
        hostpci2 => { bus => 0, addr => 27 },
        hostpci3 => { bus => 0, addr => 28 },
        #addr29 : usb-host (pve-usb.cfg)
        'pci.1' => { bus => 0, addr => 30 },
        'pci.2' => { bus => 0, addr => 31 },
        # net6 .. net31 use addr 1 .. 26 on bus 1
        (map { ("net$_" => { bus => 1, addr => $_ - 5 }) } 6 .. 31),
        # virtio6 .. virtio15 use addr 1 .. 10 on bus 2
        (map { ("virtio$_" => { bus => 2, addr => $_ - 5 }) } 6 .. 15),
    };

    my $slot = $devices->{$id};
    return '' unless $slot && defined($slot->{bus}) && defined($slot->{addr});

    my ($bus, $addr) = @$slot{qw(bus addr)};
    $bridges->{$bus} = 1 if $bridges;

    return sprintf(",bus=pci.%s,addr=0x%x", $bus, $addr);
}
4059
2e3b7e2a
AD
# Return the ",bus=<port>,addr=0x<hex>" suffix that places the passthrough
# device $id (hostpci0 .. hostpci3) on its own ich9 PCIe port, or '' when
# $id is not in the table.
sub print_pcie_addr {
    my ($id) = @_;

    my $devices = {
        hostpci0 => { bus => "ich9-pcie-port-1", addr => 0 },
        hostpci1 => { bus => "ich9-pcie-port-2", addr => 0 },
        hostpci2 => { bus => "ich9-pcie-port-3", addr => 0 },
        hostpci3 => { bus => "ich9-pcie-port-4", addr => 0 },
    };

    my $slot = $devices->{$id};
    return '' unless $slot && defined($slot->{bus}) && defined($slot->{addr});

    return sprintf(",bus=%s,addr=0x%x", $slot->{bus}, $slot->{addr});
}
4079
3e16d5fc
DM
4080# vzdump restore implementation
4081
# Return the name of the first member of the tar archive $archive (as listed
# by "tar tf"), without the trailing newline.
#
# Dies when $archive is not a regular file, when tar cannot be started, or
# when the listing is empty.
sub tar_archive_read_firstfile {
    my $archive = shift;

    die "ERROR: file '$archive' does not exist\n" if ! -f $archive;

    # try to detect archive type first
    # List-form pipe open: tar is executed directly, without a shell, so
    # quotes or other shell metacharacters in $archive cannot break (or
    # inject into) the command line.
    my $pid = open(my $tarfh, '-|', 'tar', 'tf', $archive) ||
        die "unable to open file '$archive'\n";
    my $firstfile = <$tarfh>;

    # only the first line is needed - stop tar instead of reading the rest
    kill 15, $pid;
    close $tarfh;

    die "ERROR: archive contaions no data\n" if !$firstfile;
    chomp $firstfile;

    return $firstfile;
}
4099
ed221350
DM
# Remove the volumes recorded in the restore stat file $statfile after a
# failed tar restore.
#
# Each line of the form "vzdump:<dev>:<volid>" names one volume: absolute
# paths are unlinked, everything else is released with
# PVE::Storage::vdisk_free() using $storecfg. Progress and failures are
# reported on STDERR; a failure for one volume does not stop the cleanup of
# the others. A missing/unreadable stat file is silently ignored.
sub tar_restore_cleanup {
    my ($storecfg, $statfile) = @_;

    print STDERR "starting cleanup\n";

    if (my $fd = IO::File->new($statfile, "r")) {
        while (defined(my $line = <$fd>)) {
            if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                my $volid = $2;
                eval {
                    if ($volid =~ m|^/|) {
                        # parenthesized so that '||' tests the result of
                        # unlink and not the (always true) file name
                        unlink($volid) || die "unlink failed\n";
                    } else {
                        PVE::Storage::vdisk_free($storecfg, $volid);
                    }
                    print STDERR "temporary volume '$volid' sucessfuly removed\n";
                };
                print STDERR "unable to cleanup '$volid' - $@" if $@;
            } else {
                print STDERR "unable to parse line in statfile - $line";
            }
        }
        $fd->close();
    }
}
4125
# Restore VM $vmid from the backup $archive on behalf of $user.
#
# The archive format ('tar' or 'vma') is taken from $opts->{format} when set,
# otherwise derived from the file name suffix (default: 'vma'). The
# compression ('gzip' or 'lzop') is always derived from the suffix. 'tar'
# archives are handed to restore_tar_archive(), everything else to
# restore_vma_archive() together with the detected compression.
sub restore_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    my $format = $opts->{format};
    my $comp;

    if ($archive =~ m/\.tgz$/ || $archive =~ m/\.tar\.gz$/) {
        $format = 'tar' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.tar$/) {
        $format = 'tar' if !$format;
    } elsif ($archive =~ m/\.tar\.lzo$/) {
        # dots are escaped like in the sibling patterns; an unescaped '.'
        # would match any character
        $format = 'tar' if !$format;
        $comp = 'lzop';
    } elsif ($archive =~ m/\.vma$/) {
        $format = 'vma' if !$format;
    } elsif ($archive =~ m/\.vma\.gz$/) {
        $format = 'vma' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.vma\.lzo$/) {
        $format = 'vma' if !$format;
        $comp = 'lzop';
    } else {
        $format = 'vma' if !$format; # default
    }

    # try to detect archive format
    if ($format eq 'tar') {
        return restore_tar_archive($archive, $vmid, $user, $opts);
    } else {
        return restore_vma_archive($archive, $vmid, $user, $opts, $comp);
    }
}
4159
# Rewrite one line of a backed-up VM config and print the result to $outfd.
#
#   $cookie - hash reference carrying state between calls ('netcount' is the
#             index used for the next converted legacy network entry)
#   $map    - hash reference: drive name => newly allocated volume id
#   $unique - when true, MAC addresses are regenerated
#
# Backup meta lines (#qmdump#, #vzdump#) and the lock/unusedN/parent/template
# settings are dropped. Legacy "vlanN:" lines are converted to "netN:" lines,
# drives flagged backup=no are commented out, drives present in $map are
# pointed at their new volume, and every other line is copied unchanged.
sub restore_update_config_line {
    my ($outfd, $cookie, $vmid, $map, $line, $unique) = @_;

    # settings that are never carried over (a restored VM is never a template)
    return if $line =~ m/^(?:\#qmdump\#|\#vzdump\#|lock:|unused\d+:|parent:|template:)/;

    if ($line =~ m/^(vlan(\d+)):\s*(\S+)\s*$/) {
        # try to convert old 1.X settings
        my ($ind, $ethcfg) = ($2, $3);
        foreach my $devconfig (PVE::Tools::split_list($ethcfg)) {
            my ($model, $macaddr) = split(/\=/, $devconfig);
            $macaddr = PVE::Tools::random_ether_addr() if !$macaddr || $unique;
            my $netstr = print_net({
                model => $model,
                bridge => "vmbr$ind",
                macaddr => $macaddr,
            });

            print $outfd "net$cookie->{netcount}: $netstr\n";
            $cookie->{netcount}++;
        }
        return;
    }

    if ($unique && $line =~ m/^(net\d+):\s*(\S+)\s*$/) {
        my ($id, $netstr) = ($1, $2);
        my $net = parse_net($netstr);
        $net->{macaddr} = PVE::Tools::random_ether_addr() if $net->{macaddr};
        $netstr = print_net($net);
        print $outfd "$id: $netstr\n";
        return;
    }

    if ($line =~ m/^((ide|scsi|virtio|sata)\d+):\s*(\S+)\s*$/) {
        my ($virtdev, $value) = ($1, $3);
        if ($line =~ m/backup=no/) {
            print $outfd "#$line";
            return;
        }
        if ($virtdev && $map->{$virtdev}) {
            my $di = parse_drive($virtdev, $value);
            delete $di->{format}; # format can change on restore
            $di->{file} = $map->{$virtdev};
            $value = print_drive($vmid, $di);
            print $outfd "$virtdev: $value\n";
            return;
        }
    }

    print $outfd $line;
}
4210
# List the volumes known to the storage layer (PVE::Storage::vdisk_list with
# storage config $cfg, filtered by $vmid when defined).
#
# Returns a hash reference: volume id => volume info entry. Each entry gets
# an additional 'path' key set from PVE::Storage::path(). Entries without a
# volid or with a false size are left out.
sub scan_volids {
    my ($cfg, $vmid) = @_;

    my $volumes = PVE::Storage::vdisk_list($cfg, undef, $vmid);

    my $volid_hash = {};
    foreach my $storeid (keys %$volumes) {
        foreach my $item (@{$volumes->{$storeid}}) {
            my $volid = $item->{volid};
            next unless $volid && $item->{size};

            $item->{path} = PVE::Storage::path($cfg, $volid);
            $volid_hash->{$volid} = $item;
        }
    }

    return $volid_hash;
}
4227
a8e2f942
DM
# Collect the file system paths of all (non-cdrom) drives referenced by the
# VM config $conf.
#
#   $scan_snapshots - when true, the configs stored under $conf->{snapshots}
#                     are scanned as well (paths resolved per snapshot name)
#   $skip_drive     - optional drive name to ignore; it is only ignored in
#                     the current config, never in snapshots
#
# Returns a hash reference: path => number of references found. Drives on
# unparsable volume ids or unknown storages are skipped.
sub get_used_paths {
    my ($vmid, $storecfg, $conf, $scan_snapshots, $skip_drive) = @_;

    my $used_path = {};

    my $scan_config = sub {
        my ($cref, $snapname, $skip) = @_;

        foreach my $key (keys %$cref) {
            next unless valid_drivename($key);
            next if $skip && $key eq $skip;

            my $drive = parse_drive($key, $cref->{$key});
            next if !$drive || !$drive->{file} || drive_is_cdrom($drive);

            my $file = $drive->{file};
            if ($file =~ m!^/!) {
                # absolute path - used as is
                $used_path->{$file}++;
                next;
            }

            my ($storeid, $volname) = PVE::Storage::parse_volume_id($file, 1);
            next if !$storeid;
            my $scfg = PVE::Storage::storage_config($storecfg, $storeid, 1);
            next if !$scfg;

            my $path = PVE::Storage::path($storecfg, $file, $snapname);
            $used_path->{$path}++;
        }
    };

    $scan_config->($conf, undef, $skip_drive);

    if ($scan_snapshots) {
        my $snapshots = $conf->{snapshots};
        foreach my $snapname (keys %{$snapshots}) {
            $scan_config->($snapshots->{$snapname}, $snapname);
        }
    }

    return $used_path;
}
4268
91bd6c90
DM
# Synchronize the drive entries of the VM config $conf (modified in place)
# with the volumes found on storage.
#
#   $volid_hash - hash reference: volume id => info with 'size' and 'path'
#                 (as built by scan_volids)
#
# Three passes are made:
#   1. the size of every configured, non-cdrom drive is refreshed,
#   2. 'unusedN' entries whose volume (or an alias with the same path) is in
#      use by a drive are removed,
#   3. volumes that are not referenced at all are added as unused volumes
#      (VM state volumes "vm-$vmid-state-*" are ignored).
#
# Returns 1 when $conf was changed, undef otherwise.
sub update_disksize {
    my ($vmid, $conf, $volid_hash) = @_;

    my $changes;

    my $used = {};

    # Note: it is allowed to define multiple storages with same path (alias), so
    # we need to check both 'volid' and real 'path' (two different volid can point
    # to the same path).

    my $usedpath = {};

    # update size info
    foreach my $opt (keys %$conf) {
        if (valid_drivename($opt)) {
            my $drive = parse_drive($opt, $conf->{$opt});
            my $volid = $drive->{file};
            next if !$volid;

            $used->{$volid} = 1;
            if ($volid_hash->{$volid} &&
                (my $path = $volid_hash->{$volid}->{path})) {
                $usedpath->{$path} = 1;
            }

            next if drive_is_cdrom($drive);
            next if !$volid_hash->{$volid};

            $drive->{size} = $volid_hash->{$volid}->{size};
            my $new = print_drive($vmid, $drive);
            if ($new ne $conf->{$opt}) {
                $changes = 1;
                $conf->{$opt} = $new;
            }
        }
    }

    # remove 'unusedX' entry if volume is used
    foreach my $opt (keys %$conf) {
        next if $opt !~ m/^unused\d+$/;
        my $volid = $conf->{$opt};

        # Explicit ternary instead of "my $path = ... if COND": a 'my' with a
        # statement modifier leaves the variable with undefined (possibly
        # stale) contents whenever COND is false.
        my $path = $volid_hash->{$volid} ? $volid_hash->{$volid}->{path} : undef;

        if ($used->{$volid} || ($path && $usedpath->{$path})) {
            $changes = 1;
            delete $conf->{$opt};
        }
    }

    foreach my $volid (sort keys %$volid_hash) {
        next if $volid =~ m/vm-$vmid-state-/;
        next if $used->{$volid};
        my $path = $volid_hash->{$volid}->{path};
        next if !$path; # just to be sure
        next if $usedpath->{$path};
        $changes = 1;
        add_unused_volume($conf, $volid);
        $usedpath->{$path} = 1; # avoid to add more than once (aliases)
    }

    return $changes;
}
4331
# Re-read the volume list from storage and update the disk information
# (sizes, unused volumes) in the VM configuration(s).
#
#   $vmid   - VM to update; when undef, every VM returned by config_list()
#             is processed
#   $nolock - when true, the config is updated without taking the per-VM
#             config lock (the caller is presumably holding it - confirm)
#
# For each VM only the volumes whose 'vmid' info matches are considered, and
# the config is written back only when update_disksize() reports a change.
sub rescan {
    my ($vmid, $nolock) = @_;

    my $cfg = PVE::Cluster::cfs_read_file("storage.cfg");

    my $volid_hash = scan_volids($cfg, $vmid);

    my $updatefn = sub {
        my ($vmid) = @_;

        my $conf = load_config($vmid);

        check_lock($conf);

        # restrict the scan result to volumes owned by this VM
        my $vm_volids = {};
        foreach my $volid (keys %$volid_hash) {
            my $info = $volid_hash->{$volid};
            next unless $info->{vmid} && $info->{vmid} == $vmid;
            $vm_volids->{$volid} = $info;
        }

        my $changes = update_disksize($vmid, $conf, $vm_volids);

        update_config_nolock($vmid, $conf, 1) if $changes;
    };

    my $process = sub {
        my ($id) = @_;
        return $nolock ? $updatefn->($id) : lock_config($id, $updatefn, $id);
    };

    return $process->($vmid) if defined($vmid);

    my $vmlist = config_list();
    foreach my $id (keys %$vmlist) {
        $process->($id);
    }
}
4374
# Restore VM $vmid from the VMA backup $archive ('-' means STDIN).
#
#   $user - user the restore is done for; unless it is 'root@pam' the
#           'Datastore.AllocateSpace' permission is checked on every target
#           storage
#   $opts - hash reference; 'storage' overrides the target storage and
#           'unique' requests new MAC addresses
#   $comp - optional compression of the archive: 'gzip' or 'lzop'
#
# "vma extract" is started with a fifo as its "-r" argument. Once its output
# shows that the embedded config was extracted (the "CTIME:" line), the
# target volumes are allocated and a "<write_zeros>:<devname>=<path>" line
# per device, followed by "done", is written to that fifo. A rewritten
# config is assembled in a temp file and renamed over the VM config at the
# end.
#
# On failure the temp dir, the temp config and all volumes allocated so far
# are removed and the original error is re-thrown.
sub restore_vma_archive {
    my ($archive, $vmid, $user, $opts, $comp) = @_;

    my $input = $archive eq '-' ? "<&STDIN" : undef;

    # $cmd below is a shell command line, so the archive path must be quoted
    my $readfrom = $archive eq '-' ? '-' : PVE::Tools::shellquote($archive);

    my $uncomp = '';
    if ($comp) {
        $readfrom = '-';
        my $qarchive = PVE::Tools::shellquote($archive);
        if ($comp eq 'gzip') {
            $uncomp = "zcat $qarchive|";
        } elsif ($comp eq 'lzop') {
            $uncomp = "lzop -d -c $qarchive|";
        } else {
            die "unknown compression method '$comp'\n";
        }
    }

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    rmtree $tmpdir;

    # disable interrupts (always do cleanups)
    # Every handler is localized on its own: a chained
    # "local $SIG{INT} = $SIG{TERM} = ..." would localize INT only and leave
    # the other handlers modified after this function returns.
    my $ignore_signal = sub {
        warn "got interrupt - ignored\n";
    };
    local $SIG{INT} = $ignore_signal;
    local $SIG{TERM} = $ignore_signal;
    local $SIG{QUIT} = $ignore_signal;
    local $SIG{HUP} = $ignore_signal;

    my $mapfifo = "/var/tmp/vzdumptmp$$.fifo";
    POSIX::mkfifo($mapfifo, 0600);
    my $fifofh;

    my $openfifo = sub {
        open($fifofh, '>', $mapfifo) || die $!;
    };

    my $cmd = "${uncomp}vma extract -v -r $mapfifo $readfrom $tmpdir";

    my $oldtimeout;
    my $timeout = 5;

    # devname => { size, dev_id, ... } as announced by "vma extract"
    my $devinfo = {};

    my $rpcenv = PVE::RPCEnvironment::get();

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # Note: $oldconf is undef if VM does not exists
    my $oldconf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid));

    my $print_devmap = sub {
        my $virtdev_hash = {};

        my $cfgfn = "$tmpdir/qemu-server.conf";

        # we can read the config - that is already extracted
        my $fh = IO::File->new($cfgfn, "r") ||
            die "unable to read qemu-server.conf - $!\n";

        while (defined(my $line = <$fh>)) {
            if ($line =~ m/^\#qmdump\#map:(\S+):(\S+):(\S*):(\S*):$/) {
                my ($virtdev, $devname, $storeid, $format) = ($1, $2, $3, $4);
                die "archive does not contain data for drive '$virtdev'\n"
                    if !$devinfo->{$devname};
                if (defined($opts->{storage})) {
                    $storeid = $opts->{storage} || 'local';
                } elsif (!$storeid) {
                    $storeid = 'local';
                }
                $format = 'raw' if !$format;
                $devinfo->{$devname}->{devname} = $devname;
                $devinfo->{$devname}->{virtdev} = $virtdev;
                $devinfo->{$devname}->{format} = $format;
                $devinfo->{$devname}->{storeid} = $storeid;

                # check permission on storage
                # todo: do we need to consider $opts->{pool} here?
                if ($user ne 'root@pam') {
                    $rpcenv->check($user, "/storage/$storeid", ['Datastore.AllocateSpace']);
                }

                $virtdev_hash->{$virtdev} = $devinfo->{$devname};
            }
        }

        foreach my $devname (keys %$devinfo) {
            die "found no device mapping information for device '$devname'\n"
                if !$devinfo->{$devname}->{virtdev};
        }

        my $cfg = cfs_read_file('storage.cfg');

        # create empty/temp config
        if ($oldconf) {
            PVE::Tools::file_set_contents($conffile, "memory: 128\n");
            foreach_drive($oldconf, sub {
                my ($ds, $drive) = @_;

                return if drive_is_cdrom($drive);

                my $volid = $drive->{file};

                return if !$volid || $volid =~ m|^/|;

                my ($path, $owner) = PVE::Storage::path($cfg, $volid);
                return if !$path || !$owner || ($owner != $vmid);

                # Note: only delete disk we want to restore
                # other volumes will become unused
                if ($virtdev_hash->{$ds}) {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
            });
        }

        my $map = {};
        foreach my $virtdev (sort keys %$virtdev_hash) {
            my $d = $virtdev_hash->{$virtdev};
            my $alloc_size = int(($d->{size} + 1024 - 1)/1024);
            my $scfg = PVE::Storage::storage_config($cfg, $d->{storeid});

            # test if requested format is supported
            my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($cfg, $d->{storeid});
            my $supported = grep { $_ eq $d->{format} } @$validFormats;
            $d->{format} = $defFormat if !$supported;

            my $volid = PVE::Storage::vdisk_alloc($cfg, $d->{storeid}, $vmid,
                                                  $d->{format}, undef, $alloc_size);
            print STDERR "new volume ID is '$volid'\n";
            $d->{volid} = $volid;
            my $path = PVE::Storage::path($cfg, $volid);

            my $write_zeros = 1;
            # fixme: what other storages types initialize volumes with zero?
            if ($scfg->{type} eq 'dir' || $scfg->{type} eq 'nfs' || $scfg->{type} eq 'glusterfs' ||
                $scfg->{type} eq 'sheepdog' || $scfg->{type} eq 'rbd') {
                $write_zeros = 0;
            }

            print $fifofh "${write_zeros}:$d->{devname}=$path\n";

            print "map '$d->{devname}' to '$path' (write zeros = ${write_zeros})\n";
            $map->{$virtdev} = $volid;
        }

        # second pass over the extracted config: write the adapted copy
        $fh->seek(0, 0) || die "seek failed - $!\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined(my $line = <$fh>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $fh->close();
        $outfd->close();
    };

    eval {
        # enable interrupts
        # (localized individually, so the 'ignore' handlers installed above
        # are active again for the cleanup code that follows the eval)
        my $interrupted = sub {
            die "interrupted by signal\n";
        };
        local $SIG{INT} = $interrupted;
        local $SIG{TERM} = $interrupted;
        local $SIG{QUIT} = $interrupted;
        local $SIG{HUP} = $interrupted;
        local $SIG{PIPE} = $interrupted;
        local $SIG{ALRM} = sub { die "got timeout\n"; };

        $oldtimeout = alarm($timeout);

        my $parser = sub {
            my $line = shift;

            print "$line\n";

            if ($line =~ m/^DEV:\sdev_id=(\d+)\ssize:\s(\d+)\sdevname:\s(\S+)$/) {
                my ($dev_id, $size, $devname) = ($1, $2, $3);
                $devinfo->{$devname} = { size => $size, dev_id => $dev_id };
            } elsif ($line =~ m/^CTIME: /) {
                # we correctly received the vma config, so we can disable
                # the timeout now for disk allocation (set to 10 minutes, so
                # that we always timeout if something goes wrong)
                alarm(600);
                &$print_devmap();
                print $fifofh "done\n";
                my $tmp = $oldtimeout || 0;
                $oldtimeout = undef;
                alarm($tmp);
                close($fifofh);
            }
        };

        print "restore vma archive: $cmd\n";
        run_command($cmd, input => $input, outfunc => $parser, afterfork => $openfifo);
    };
    my $err = $@;

    alarm($oldtimeout) if $oldtimeout;

    unlink $mapfifo;

    if ($err) {
        rmtree $tmpdir;
        unlink $tmpfn;

        my $cfg = cfs_read_file('storage.cfg');
        foreach my $devname (keys %$devinfo) {
            my $volid = $devinfo->{$devname}->{volid};
            next if !$volid;
            eval {
                if ($volid =~ m|^/|) {
                    # parenthesized so that '||' tests the result of unlink
                    unlink($volid) || die "unlink failed\n";
                } else {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
                print STDERR "temporary volume '$volid' sucessfuly removed\n";
            };
            print STDERR "unable to cleanup '$volid' - $@" if $@;
        }
        die $err;
    }

    rmtree $tmpdir;

    rename($tmpfn, $conffile) ||
        die "unable to commit configuration file '$conffile'\n";

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
4606
# Restore VM $vmid from the tar based vzdump backup $archive ('-' means
# STDIN) on behalf of $user.
#
#   $opts - hash reference; 'storage', 'pool', 'prealloc' and 'info' are
#           passed on to the qmextract helper, 'unique' requests new MAC
#           addresses
#
# An existing VM with that id is destroyed first (destroy_vm). The archive is
# then unpacked with tar, piping every member through
# /usr/lib/qemu-server/qmextract, which records the allocated volumes in
# "$tmpdir/qmrestore.stat". A rewritten config is assembled in a temp file
# and renamed over the VM config at the end.
#
# On failure the temp config is removed, the volumes listed in the stat file
# are cleaned up (unless 'info' is set) and the original error is re-thrown.
sub restore_tar_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    if ($archive ne '-') {
        my $firstfile = tar_archive_read_firstfile($archive);
        die "ERROR: file '$archive' dos not lock like a QemuServer vzdump backup\n"
            if $firstfile ne 'qemu-server.conf';
    }

    my $storecfg = cfs_read_file('storage.cfg');

    # destroy existing data - keep empty config
    my $vmcfgfn = PVE::QemuServer::config_file($vmid);
    destroy_vm($storecfg, $vmid, 1) if -f $vmcfgfn;

    my $tocmd = "/usr/lib/qemu-server/qmextract";

    $tocmd .= " --storage " . PVE::Tools::shellquote($opts->{storage}) if $opts->{storage};
    $tocmd .= " --pool " . PVE::Tools::shellquote($opts->{pool}) if $opts->{pool};
    $tocmd .= ' --prealloc' if $opts->{prealloc};
    $tocmd .= ' --info' if $opts->{info};

    # tar option "xf" does not autodetect compression when read from STDIN,
    # so we pipe to zcat
    my $cmd = "zcat -f|tar xf " . PVE::Tools::shellquote($archive) . " " .
        PVE::Tools::shellquote("--to-command=$tocmd");

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    mkpath $tmpdir;

    local $ENV{VZDUMP_TMPDIR} = $tmpdir;
    local $ENV{VZDUMP_VMID} = $vmid;
    local $ENV{VZDUMP_USER} = $user;

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # disable interrupts (always do cleanups)
    # Every handler is localized on its own: a chained
    # "local $SIG{INT} = $SIG{TERM} = ..." would localize INT only and leave
    # the other handlers modified after this function returns.
    my $ignore_signal = sub {
        print STDERR "got interrupt - ignored\n";
    };
    local $SIG{INT} = $ignore_signal;
    local $SIG{TERM} = $ignore_signal;
    local $SIG{QUIT} = $ignore_signal;
    local $SIG{HUP} = $ignore_signal;

    eval {
        # enable interrupts
        # (localized individually, so the 'ignore' handlers installed above
        # are active again for the cleanup code that follows the eval)
        my $interrupted = sub {
            die "interrupted by signal\n";
        };
        local $SIG{INT} = $interrupted;
        local $SIG{TERM} = $interrupted;
        local $SIG{QUIT} = $interrupted;
        local $SIG{HUP} = $interrupted;
        local $SIG{PIPE} = $interrupted;

        if ($archive eq '-') {
            print "extracting archive from STDIN\n";
            run_command($cmd, input => "<&STDIN");
        } else {
            print "extracting archive '$archive'\n";
            run_command($cmd);
        }

        return if $opts->{info};

        # read new mapping
        my $map = {};
        my $statfile = "$tmpdir/qmrestore.stat";
        if (my $fd = IO::File->new($statfile, "r")) {
            while (defined (my $line = <$fd>)) {
                if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                    $map->{$1} = $2 if $1;
                } else {
                    print STDERR "unable to parse line in statfile - $line\n";
                }
            }
            $fd->close();
        }

        my $confsrc = "$tmpdir/qemu-server.conf";

        my $srcfd = IO::File->new($confsrc, "r") ||
            die "unable to open file '$confsrc'\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined (my $line = <$srcfd>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $srcfd->close();
        $outfd->close();
    };
    my $err = $@;

    if ($err) {

        unlink $tmpfn;

        tar_restore_cleanup($storecfg, "$tmpdir/qmrestore.stat") if !$opts->{info};

        die $err;
    }

    rmtree $tmpdir;

    # Parenthesized so that '||' tests the result of rename; without the
    # parentheses it binds to $conffile and a failed rename goes unnoticed.
    # In 'info' mode no temp config is written, so there is nothing to commit.
    if (!$opts->{info}) {
        rename($tmpfn, $conffile) ||
            die "unable to commit configuration file '$conffile'\n";
    }

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
4716
0d18dcfc
DM
4717
4718# Internal snapshots
4719
4720# NOTE: Snapshot create/delete involves several non-atomic
4721# actions, and can take a long time.
4722# So we try to avoid locking the file and use 'lock' variable
4723# inside the config file instead.
4724
ef59d1ca
DM
# Copy the settings of config hash $source into $dest, leaving out
# everything that is snapshot bookkeeping or tied to the current state of
# the VM: snapshots, snapstate, snaptime, vmstate, lock, digest, description
# and all unusedN entries.
my $snapshot_copy_config = sub {
    my ($source, $dest) = @_;

    my %skip = map { $_ => 1 }
        qw(snapshots snapstate snaptime vmstate lock digest description);

    foreach my $key (keys %$source) {
        next if $skip{$key} || $key =~ m/^unused\d+$/;

        $dest->{$key} = $source->{$key};
    }
};
4741
# Build the config that results from applying snapshot $snap to the current
# config $conf.
#
# The snapshot list, the description and the unusedN entries are taken from
# $conf; every other setting comes from $snap (filtered through
# $snapshot_copy_config). Returns the new config hash reference; the
# 'snapshots' value is shared with $conf, not copied.
my $snapshot_apply_config = sub {
    my ($conf, $snap) = @_;

    # copy snapshot list
    my $newconf = { snapshots => $conf->{snapshots} };

    # keep description and list of unused disks
    foreach my $key (keys %$conf) {
        next unless $key eq 'description' || $key =~ m/^unused\d+$/;
        $newconf->{$key} = $conf->{$key};
    }

    $snapshot_copy_config->($snap, $newconf);

    return $newconf;
};
4760
18bfb361
DM
# Call $func->($storeid) once for every storage that holds a non-cdrom drive
# of the VM config $conf, in sorted storage id order.
#
# Drives that do not parse, and drives whose volume id yields no storage id
# (PVE::Storage::parse_volume_id called with its second argument set to 1),
# are skipped.
sub foreach_writable_storage {
    my ($conf, $func) = @_;

    my $sidhash = {};

    foreach my $ds (keys %$conf) {
        next unless valid_drivename($ds);

        my $drive = parse_drive($ds, $conf->{$ds});
        next if !$drive || drive_is_cdrom($drive);

        my ($sid, $volname) = PVE::Storage::parse_volume_id($drive->{file}, 1);
        $sidhash->{$sid} = $sid if $sid;
    }

    $func->($_) foreach sort keys %$sidhash;
}
4783
# Allocate the volume that will hold the saved VM state of snapshot
# $snapname and return its volume id.
#
# Target storage selection (among the storages used by the VM's drives):
# shared storages are tried first, then non-shared ones; within each group a
# storage with a 'path' setting (file based) wins over one without. Falls
# back to 'local' when the VM has no usable storage.
my $alloc_vmstate_volid = sub {
    my ($storecfg, $vmid, $conf, $snapname) = @_;

    # Note: we try to be smart when selecting a $target storage

    my $target;

    # search shared storage first, now search local storage
    foreach my $want_shared (1, 0) {
        last if $target;

        foreach_writable_storage($conf, sub {
            my ($sid) = @_;
            my $scfg = PVE::Storage::storage_config($storecfg, $sid);
            return if $want_shared ? !$scfg->{shared} : $scfg->{shared};

            $target = $sid if !$target || $scfg->{path}; # prefer file based storage
        });
    }

    $target ||= 'local';

    # Fixed allowance for the driver state, in the same unit as
    # $conf->{memory} (presumably MB - confirm).
    # we abort live save after $conf->{memory}, so we need at max twice that space
    # NOTE(review): an unset $conf->{memory} contributes nothing here.
    my $driver_state_size = 500;
    my $size = $conf->{memory}*2 + $driver_state_size;

    my $scfg = PVE::Storage::storage_config($storecfg, $target);
    my $name = "vm-$vmid-state-$snapname";
    $name .= ".raw" if $scfg->{path}; # add filename extension for file base storage

    return PVE::Storage::vdisk_alloc($storecfg, $target, $vmid, 'raw', $name, $size*1024);
};
4824
# First phase of taking snapshot $snapname of VM $vmid: under the config
# lock, set the 'snapshot' lock in the config and register a new snapshot
# entry in state "prepare".
#
#   $save_vmstate - when true and the VM is running, a state volume is
#                   allocated and recorded as 'vmstate'
#   $comment      - optional description stored with the snapshot
#
# Dies when the VM is a template, when check_lock() refuses, when the name is
# already used, or when has_feature('snapshot', ...) is false. Returns the
# new snapshot entry (hash reference).
my $snapshot_prepare = sub {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap;

    my $prepare = sub {
        my $conf = load_config($vmid);

        die "you can't take a snapshot if it's a template\n"
            if is_template($conf);

        check_lock($conf);

        $conf->{lock} = 'snapshot';

        die "snapshot name '$snapname' already used\n"
            if defined($conf->{snapshots}->{$snapname});

        my $storecfg = PVE::Storage::config();
        die "snapshot feature is not available" if !has_feature('snapshot', $conf, $storecfg);

        $snap = {};
        $conf->{snapshots}->{$snapname} = $snap;

        if ($save_vmstate && check_running($vmid)) {
            $snap->{vmstate} = $alloc_vmstate_volid->($storecfg, $vmid, $conf, $snapname);
        }

        $snapshot_copy_config->($conf, $snap);

        $snap->{snapstate} = "prepare";
        $snap->{snaptime} = time();
        $snap->{description} = $comment if $comment;

        # always overwrite machine if we save vmstate. This makes sure we
        # can restore it later using correct machine type
        $snap->{machine} = get_current_qemu_machine($vmid) if $snap->{vmstate};

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $prepare);

    return $snap;
};
4870
# Final phase of taking snapshot $snapname of VM $vmid: under the config
# lock, clear the snapshot's "prepare" state and the 'snapshot' lock, and
# write a config rebuilt from the snapshot with 'parent' set to $snapname.
#
# A 'machine' setting is kept only when the config had one before the
# commit.
#
# Dies when the config is not locked with 'snapshot', when the snapshot does
# not exist, or when it is not in state "prepare".
my $snapshot_commit = sub {
    my ($vmid, $snapname) = @_;

    my $commit = sub {
        my $conf = load_config($vmid);

        die "missing snapshot lock\n"
            unless $conf->{lock} && $conf->{lock} eq 'snapshot';

        my $has_machine_config = defined($conf->{machine});

        my $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        die "wrong snapshot state\n"
            unless $snap->{snapstate} && $snap->{snapstate} eq "prepare";

        delete $snap->{snapstate};
        delete $conf->{lock};

        my $newconf = $snapshot_apply_config->($conf, $snap);

        delete $newconf->{machine} if !$has_machine_config;

        $newconf->{parent} = $snapname;

        update_config_nolock($vmid, $newconf, 1);
    };

    lock_config($vmid, $commit);
};
4904
22c377f0
DM
# Roll a VM back to snapshot $snapname.
#
# The config update closure runs twice under lock_config():
#   1. prepare phase: stop the VM and set the 'rollback' lock,
#   2. after all volumes were rolled back: verify and drop the lock, apply
#      the snapshot config and, if the snapshot has a 'vmstate', start the
#      VM from that state file.
#
# Dies if the VM is a template, the snapshot is missing or incomplete, the
# VM is still running, or the 'rollback' lock is not found in phase two.
sub snapshot_rollback {
    my ($vmid, $snapname) = @_;

    my $storecfg = PVE::Storage::config();

    my $snap;           # set by every run of $updatefn
    my $prepare = 1;    # phase selector, flipped before the second run

    my $updatefn = sub {
        my $conf = load_config($vmid);

        if (is_template($conf)) {
            die "you can't rollback if vm is a template\n";
        }

        $snap = $conf->{snapshots}->{$snapname};

        if (!defined($snap)) {
            die "snapshot '$snapname' does not exist\n";
        }

        if ($snap->{snapstate}) {
            die "unable to rollback to incomplete snapshot (snapstate = $snap->{snapstate})\n";
        }

        if ($prepare) {
            check_lock($conf);
            vm_stop($storecfg, $vmid, undef, undef, 5, undef, undef);
        }

        if (check_running($vmid)) {
            die "unable to rollback vm $vmid: vm is running\n";
        }

        my $forcemachine;

        if ($prepare) {
            $conf->{lock} = 'rollback';
        } else {
            my $lock = $conf->{lock};
            die "got wrong lock\n" if !$lock || $lock ne 'rollback';
            delete $conf->{lock};

            my $machine_was_set = defined($conf->{machine});

            # copy snapshot config to current config
            $conf = $snapshot_apply_config->($conf, $snap);
            $conf->{parent} = $snapname;

            # Note: old code did not store 'machine', so we try to be smart
            # and guess the snapshot was generated with kvm 1.4 (pc-i440fx-1.4).
            $forcemachine = $conf->{machine} || 'pc-i440fx-1.4';

            # we remove the 'machine' configuration if not explicitly
            # specified in the original config.
            if ($snap->{vmstate} && !$machine_was_set) {
                delete $conf->{machine};
            }
        }

        update_config_nolock($vmid, $conf, 1);

        if (!$prepare && $snap->{vmstate}) {
            my $statefile = PVE::Storage::path($storecfg, $snap->{vmstate});
            vm_start($storecfg, $vmid, $statefile, undef, undef, undef, $forcemachine);
        }
    };

    lock_config($vmid, $updatefn);

    # roll back every non-cdrom volume referenced by the snapshot
    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        PVE::Storage::volume_snapshot_rollback($storecfg, $drive->{file}, $snapname);
    });

    $prepare = 0;
    lock_config($vmid, $updatefn);
}
4983
9dcf4909
DM
# Poll the 'query-savevm' monitor command once per second until it reports
# status 'completed'.
#
# Dies when no status is reported ("savevm not active") or when the status
# is anything other than 'active' or 'completed'.
my $savevm_wait = sub {
    my ($vmid) = @_;

    while (1) {
        my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");

        die "savevm not active\n" if !$stat->{status};

        last if $stat->{status} eq 'completed';

        die "query-savevm returned status '$stat->{status}'\n"
            if $stat->{status} ne 'active';

        # still active - try again in a second
        sleep(1);
    }
};
5001
# Create snapshot $snapname of VM $vmid.
#
# Steps: prepare the config entry, optionally freeze the guest filesystems
# through the agent, start savevm (with a state file when RAM is saved),
# snapshot every non-cdrom drive, end savevm / thaw, then commit the
# snapshot. If any step inside the main eval fails, the drives that were
# already snapshotted are cleaned up via snapshot_delete() and the original
# error is re-thrown.
#
# Parameters: $vmid, $snapname, $save_vmstate (boolean), $comment (optional).
sub snapshot_create {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap = $snapshot_prepare->($vmid, $snapname, $save_vmstate, $comment);

    my $config = load_config($vmid);
    my $running = check_running($vmid);

    # freeze only for a running VM with 'agent' configured ...
    my $freezefs = $running && $config->{agent};
    # ... and not needed if we save RAM
    $freezefs = 0 if $snap->{vmstate};

    # drives that already got their snapshot, needed for cleanup on error
    my $drivehash = {};

    if ($freezefs) {
        eval { vm_mon_cmd($vmid, "guest-fsfreeze-freeze"); };
        warn "guest-fsfreeze-freeze problems - $@" if $@;
    }

    eval {
        # create internal snapshots of all drives
        my $storecfg = PVE::Storage::config();

        if ($running && $snap->{vmstate}) {
            my $path = PVE::Storage::path($storecfg, $snap->{vmstate});
            vm_mon_cmd($vmid, "savevm-start", statefile => $path);
            $savevm_wait->($vmid);
        } elsif ($running) {
            vm_mon_cmd($vmid, "savevm-start");
        }

        foreach_drive($snap, sub {
            my ($ds, $drive) = @_;

            return if drive_is_cdrom($drive);

            qemu_volume_snapshot($vmid, "drive-$ds", $storecfg, $drive->{file}, $snapname);
            $drivehash->{$ds} = 1;
        });
    };
    my $err = $@;

    if ($running) {
        eval { vm_mon_cmd($vmid, "savevm-end") };
        warn $@ if $@;

        if ($freezefs) {
            eval { vm_mon_cmd($vmid, "guest-fsfreeze-thaw"); };
            warn "guest-fsfreeze-thaw problems - $@" if $@;
        }

        # savevm-end is async, we need to wait
        while (1) {
            my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");
            last if !$stat->{bytes};

            print "savevm not yet finished\n";
            sleep(1);
        }
    }

    if ($err) {
        warn "snapshot create failed: starting cleanup\n";
        eval { snapshot_delete($vmid, $snapname, 0, $drivehash); };
        warn $@ if $@;
        die $err;
    }

    $snapshot_commit->($vmid, $snapname);
}
5083
# Delete snapshot $snapname of VM $vmid.
#
# Note: $drivehash is only set when called from snapshot_create. In that
# case the lock/template checks are skipped, only the drives listed in the
# hash get their volume snapshot removed, and the config lock is dropped at
# the end.
#
# With $force set, errors while freeing the vmstate volume or deleting a
# volume snapshot are only warned about, and the intermediate config
# updates are skipped.
sub snapshot_delete {
    my ($vmid, $snapname, $force, $drivehash) = @_;

    my $prepare = 1;    # phase flag read by $updatefn
    my $snap;           # re-read from the config on every $updatefn run
    my $unused = [];    # volids to register as unused in the final update

    # replace (or remove) a 'parent' reference that points to $snapname
    my $unlink_parent = sub {
        my ($confref, $new_parent) = @_;

        return if !($confref->{parent} && $confref->{parent} eq $snapname);

        if ($new_parent) {
            $confref->{parent} = $new_parent;
        } else {
            delete $confref->{parent};
        }
    };

    my $updatefn = sub {
        my ($remove_drive) = @_;

        my $conf = load_config($vmid);

        if (!$drivehash) {
            check_lock($conf);
            die "you can't delete a snapshot if vm is a template\n"
                if is_template($conf);
        }

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        # remove parent refs
        if (!$prepare) {
            $unlink_parent->($conf, $snap->{parent});
            for my $other (keys %{$conf->{snapshots}}) {
                next if $other eq $snapname;
                $unlink_parent->($conf->{snapshots}->{$other}, $snap->{parent});
            }
        }

        if ($remove_drive) {
            if ($remove_drive eq 'vmstate') {
                delete $snap->{$remove_drive};
            } else {
                my $parsed = parse_drive($remove_drive, $snap->{$remove_drive});
                my $old_volid = $parsed->{file};
                delete $snap->{$remove_drive};
                add_unused_volume($conf, $old_volid);
            }
        }

        if ($prepare) {
            $snap->{snapstate} = 'delete';
        } else {
            delete $conf->{snapshots}->{$snapname};
            delete $conf->{lock} if $drivehash;
            add_unused_volume($conf, $_) for @$unused;
        }

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $updatefn);

    # now remove vmstate file

    my $storecfg = PVE::Storage::config();

    if ($snap->{vmstate}) {
        eval { PVE::Storage::vdisk_free($storecfg, $snap->{vmstate}); };
        if (my $err = $@) {
            die $err if !$force;
            warn $err;
        }
        # save changes (remove vmstate from snapshot)
        lock_config($vmid, $updatefn, 'vmstate') if !$force;
    }

    # now remove all internal snapshots
    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};

        if (!$drivehash || $drivehash->{$ds}) {
            eval { qemu_volume_snapshot_delete($vmid, "drive-$ds", $storecfg, $volid, $snapname); };
            if (my $err = $@) {
                die $err if !$force;
                warn $err;
            }
        }

        # save changes (remove drive from snapshot)
        lock_config($vmid, $updatefn, $ds) if !$force;
        push @$unused, $volid;
    });

    # now cleanup config
    $prepare = 0;
    lock_config($vmid, $updatefn);
}
5195
# Check whether every non-cdrom drive of $conf supports $feature.
#
# $snapname and $running are passed through unchanged to
# PVE::Storage::volume_has_feature(). All drives are visited even after a
# first negative answer.
#
# Returns 1 if no drive lacks the feature, else 0.
sub has_feature {
    my ($feature, $conf, $storecfg, $snapname, $running) = @_;

    my $supported = 1;

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $ok = PVE::Storage::volume_has_feature(
            $storecfg, $feature, $drive->{file}, $snapname, $running);
        $supported = 0 if !$ok;
    });

    return $supported;
}
04a69bb4
AD
5210
# Convert the volumes of a VM into base (template) volumes.
#
# For each non-cdrom drive (or only drive $disk when given) whose storage
# reports the 'template' feature, a base volume is created with
# PVE::Storage::vdisk_create_base(), the drive entry in $conf is rewritten
# to point to it and the config is written back after every drive.
sub template_create {
    my ($vmid, $conf, $disk) = @_;

    my $storecfg = PVE::Storage::config();

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive) || ($disk && $ds ne $disk);

        my $volid = $drive->{file};
        return if !PVE::Storage::volume_has_feature($storecfg, 'template', $volid);

        $drive->{file} = PVE::Storage::vdisk_create_base($storecfg, $volid);
        $conf->{$ds} = print_drive($vmid, $drive);
        update_config_nolock($vmid, $conf, 1);
    });
}
5231
624361b3
AD
# Tell whether a VM configuration describes a template.
#
# Parameter: $conf - VM configuration hash reference.
# Returns 1 if $conf->{template} is defined and numerically equal to 1,
# otherwise 0 (explicit, instead of the implicit value of the last
# evaluated expression).
sub is_template {
    my ($conf) = @_;

    return 1 if defined $conf->{template} && $conf->{template} == 1;

    return 0;
}
5237
5133de42
AD
# Copy volume $src_volid (optionally at snapshot $snapname) onto the already
# existing volume $dst_volid using 'qemu-img convert'.
#
# $size is only used for the progress lines printed while qemu-img runs.
# Nothing is done unless both volume ids resolve to a storage id.
# Dies with "copy failed: ..." when the command fails.
sub qemu_img_convert {
    my ($src_volid, $dst_volid, $size, $snapname) = @_;

    my $storecfg = PVE::Storage::config();
    my ($src_storeid, $src_volname) = PVE::Storage::parse_volume_id($src_volid, 1);
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid, 1);

    if ($src_storeid && $dst_storeid) {
        my $src_scfg = PVE::Storage::storage_config($storecfg, $src_storeid);
        my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

        my $src_format = qemu_img_format($src_scfg, $src_volname);
        my $dst_format = qemu_img_format($dst_scfg, $dst_volname);

        my $src_path = PVE::Storage::path($storecfg, $src_volid, $snapname);
        my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

        my @snapshot_opt;
        if ($snapname && $src_format eq "qcow2") {
            @snapshot_opt = ('-s', $snapname);
        }

        my $cmd = [
            '/usr/bin/qemu-img', 'convert', '-t', 'writeback', '-p', '-n',
            @snapshot_opt,
            '-f', $src_format, '-O', $dst_format, $src_path, $dst_path,
        ];

        # turn qemu-img's "(NN/100%)" progress output into byte counts
        my $report_progress = sub {
            my ($line) = @_;

            return if $line !~ m/\((\S+)\/100\%\)/;

            my $percent = $1;
            my $transferred = int($size * $percent / 100);
            my $remaining = $size - $transferred;

            print "transferred: $transferred bytes remaining: $remaining bytes total: $size bytes progression: $percent %\n";
        };

        eval { run_command($cmd, timeout => undef, outfunc => $report_progress); };
        my $err = $@;
        die "copy failed: $err" if $err;
    }
}
5277
# Determine the qemu-img format name for a volume.
#
# Parameters:
#   $scfg    - storage configuration hash ('path' and 'type' are read)
#   $volname - volume name
#
# Returns the file extension (raw, qcow2, qed or vmdk) when the storage has
# a 'path' and the volume name ends in one of them, "host_device" for
# storages of type 'iscsi', and "raw" in every other case.
sub qemu_img_format {
    my ($scfg, $volname) = @_;

    if ($scfg->{path}) {
        my ($extension) = $volname =~ m/\.(raw|qcow2|qed|vmdk)$/;
        return $extension if defined $extension;
    }

    return $scfg->{type} eq 'iscsi' ? "host_device" : "raw";
}
5289
# Mirror the running VM's drive $drive onto the existing volume $dst_volid
# using the QMP 'drive-mirror' block job, and wait for it to converge.
#
# Parameters:
#   $vmid      - id of the running source VM
#   $drive     - drive name (the QMP device is "drive-$drive")
#   $dst_volid - volume id of the mirror target
#   $vmiddst   - id of the VM that will own the target; when it equals
#                $vmid the VM is switched to the new volume with
#                'block-job-complete', otherwise the job is cancelled once
#                the mirror is in sync
#
# Dies with "mirroring error: ..." on failure. In that case the block job
# is cancelled (best effort) and, if the guest had been suspended to let
# the mirror converge, the guest is resumed so it is not left paused.
sub qemu_drive_mirror {
    my ($vmid, $drive, $dst_volid, $vmiddst) = @_;

    my $count = 0;
    my $frozen = undef;
    my $maxwait = 120;

    my $storecfg = PVE::Storage::config();
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid);

    # value is not used below; the lookup itself is kept as in the original
    my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

    my $format;
    if ($dst_volname =~ m/\.(raw|qcow2)$/){
        $format = $1;
    }

    my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

    my $opts = { timeout => 10, device => "drive-$drive", mode => "existing", sync => "full", target => $dst_path };
    $opts->{format} = $format if $format;

    #fixme : sometime drive-mirror timeout, but works fine after.
    # (I have see the problem with big volume > 200GB), so we need to eval
    eval { vm_mon_cmd($vmid, "drive-mirror", %$opts); };
    # ignore errors here

    eval {
        while (1) {
            my $stats = vm_mon_cmd($vmid, "query-block-jobs");
            my $stat = $stats->[0];
            die "mirroring job seem to have die. Maybe do you have bad sectors?" if !$stat;
            die "error job is not mirroring" if $stat->{type} ne "mirror";

            my $busy = $stat->{busy};

            if (my $total = $stat->{len}) {
                my $transferred = $stat->{offset} || 0;
                my $remaining = $total - $transferred;
                my $percent = sprintf "%.2f", ($transferred * 100 / $total);

                print "transferred: $transferred bytes remaining: $remaining bytes total: $total bytes progression: $percent % busy: $busy\n";
            }

            if ($stat->{len} == $stat->{offset}) {
                if ($busy eq 'false') {

                    last if $vmiddst != $vmid;

                    # try to switch the disk if source and destination are on the same guest
                    eval { vm_mon_cmd($vmid, "block-job-complete", device => "drive-$drive") };
                    last if !$@;
                    die $@ if $@ !~ m/cannot be completed/;
                }

                if ($count > $maxwait) {
                    # if too much writes to disk occurs at the end of migration
                    # the disk needs to be freezed to be able to complete the migration
                    vm_suspend($vmid, 1);
                    $frozen = 1;
                }
                $count++;
            }
            sleep 1;
        }

        vm_resume($vmid, 1) if $frozen;

    };
    my $err = $@;

    # cancel the block job and wait until it is gone from query-block-jobs
    my $cancel_job = sub {
        vm_mon_cmd($vmid, "block-job-cancel", device => "drive-$drive");
        while (1) {
            my $stats = vm_mon_cmd($vmid, "query-block-jobs");
            my $stat = $stats->[0];
            last if !$stat;
            sleep 1;
        }
    };

    if ($err) {
        # the loop above may have died after suspending the guest, in which
        # case the vm_resume() at the end of the eval was never reached
        if ($frozen) {
            eval { vm_resume($vmid, 1); };
            warn $@ if $@;
        }
        eval { $cancel_job->(); };
        die "mirroring error: $err";
    }

    if ($vmiddst != $vmid) {
        # if we clone a disk for a new target vm, we don't switch the disk
        $cancel_job->(); # so we call block-job-cancel
    }
}
5383
# Clone one drive of a VM for VM $newvmid.
#
# Without $full a linked clone is created with PVE::Storage::vdisk_clone().
# With $full a new volume is allocated (on $storage if given, else on the
# source storage) and filled either offline with qemu_img_convert() - when
# the VM is not running or a snapshot is cloned - or online with
# qemu_drive_mirror(). Every new volume id is pushed onto @$newvollist.
#
# Returns the drive hash updated for the new volume. Note that this is the
# very hash passed in as $drive: its 'file', 'size' and 'format' entries
# are modified in place.
sub clone_disk {
    my ($storecfg, $vmid, $running, $drivename, $drive, $snapname,
        $newvmid, $storage, $format, $full, $newvollist) = @_;

    my $newvolid;

    if ($full) {
        my ($storeid, $volname) = PVE::Storage::parse_volume_id($drive->{file});
        $storeid = $storage if $storage;

        my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($storecfg, $storeid);
        $format = $drive->{format} || $defFormat if !$format;

        # test if requested format is supported - else use default
        unless (grep { $_ eq $format } @$validFormats) {
            $format = $defFormat;
        }

        my ($src_size) = PVE::Storage::volume_size_info($storecfg, $drive->{file}, 3);

        print "create full clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_alloc($storecfg, $storeid, $newvmid, $format, undef, ($src_size/1024));
        push @$newvollist, $newvolid;

        if ($running && !$snapname) {
            qemu_drive_mirror($vmid, $drivename, $newvolid, $newvmid);
        } else {
            qemu_img_convert($drive->{file}, $newvolid, $src_size, $snapname);
        }
    } else {
        print "create linked clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_clone($storecfg, $drive->{file}, $newvmid, $snapname);
        push @$newvollist, $newvolid;
    }

    my ($size) = PVE::Storage::volume_size_info($storecfg, $newvolid, 3);

    # the caller's hash is reused, not copied
    $drive->{format} = undef;
    $drive->{file} = $newvolid;
    $drive->{size} = $size;

    return $drive;
}
5429
ff556cf2
DM
# Query the machine type of a VM via the QMP 'query-machines' command.
# this only works if VM is running
#
# Returns the name of the entry flagged 'is-current'; if there is none, the
# name of the entry flagged 'is-default'; if neither exists, 'pc'.
sub get_current_qemu_machine {
    my ($vmid) = @_;

    my $machines = PVE::QemuServer::vm_qmp_command(
        $vmid, { execute => 'query-machines', arguments => {} });

    my %name_of;
    for my $entry (@$machines) {
        $name_of{default} = $entry->{name} if $entry->{'is-default'};
        $name_of{current} = $entry->{name} if $entry->{'is-current'};
    }

    # fallback to the default machine if current is not supported by qemu
    return $name_of{current} || $name_of{default} || 'pc';
}
5446
4543ecf0
AD
# List the PCI devices found below "$pcisysfs/devices".
#
# Returns a hash reference keyed by "bus:slot" id (two hex digit pairs);
# each value is an array of { id => ..., function => ... } hashes, one per
# matching directory entry.
sub lspci {

    my %functions_of;

    dir_glob_foreach("$pcisysfs/devices", '[a-f0-9]{4}:([a-f0-9]{2}:[a-f0-9]{2})\.([0-9])', sub {
        my (undef, $id, $function) = @_;
        push @{$functions_of{$id}}, { id => $id, function => $function };
    });

    return \%functions_of;
}
5459
1e3baf05 54601;