]> git.proxmox.com Git - qemu-server.git/blame - PVE/QemuServer.pm
vga=none if x-vga passthrough is enabled
[qemu-server.git] / PVE / QemuServer.pm
CommitLineData
1e3baf05
DM
1package PVE::QemuServer;
2
3use strict;
990fc5e2 4use warnings;
1e3baf05
DM
5use POSIX;
6use IO::Handle;
7use IO::Select;
8use IO::File;
9use IO::Dir;
10use IO::Socket::UNIX;
11use File::Basename;
12use File::Path;
13use File::stat;
14use Getopt::Long;
fc1ddcdc 15use Digest::SHA;
1e3baf05
DM
16use Fcntl ':flock';
17use Cwd 'abs_path';
18use IPC::Open3;
c971c4f2 19use JSON;
1e3baf05
DM
20use Fcntl;
21use PVE::SafeSyslog;
22use Storable qw(dclone);
23use PVE::Exception qw(raise raise_param_exc);
24use PVE::Storage;
4543ecf0 25use PVE::Tools qw(run_command lock_file lock_file_full file_read_firstline dir_glob_foreach);
b7ba6b79 26use PVE::JSONSchema qw(get_standard_option);
1e3baf05
DM
27use PVE::Cluster qw(cfs_register_file cfs_read_file cfs_write_file cfs_lock_file);
28use PVE::INotify;
29use PVE::ProcFSTools;
26f11676 30use PVE::QMPClient;
91bd6c90 31use PVE::RPCEnvironment;
6b64503e 32use Time::HiRes qw(gettimeofday);
1e3baf05 33
7f0b5beb 34my $cpuinfo = PVE::ProcFSTools::read_cpuinfo();
1e3baf05 35
# Note about locking: we use flock on the config file to protect
# against concurrent actions.
# Additionally, we have a 'lock' setting in the config file. This
# can be set to 'migrate', 'backup', 'snapshot' or 'rollback'. Most actions are not
# allowed when such a lock is set. But you can ignore this kind of
# lock with the --skiplock flag.
42
# Register the parser/writer pair for files below '/qemu-server/'.
cfs_register_file('/qemu-server/',
                  \&parse_vm_config,
                  \&write_vm_config);

# Standard option: boolean flag to ignore the config 'lock' setting.
PVE::JSONSchema::register_standard_option('skiplock', {
    description => "Ignore locks - only root is allowed to use this option.",
    type => 'boolean',
    optional => 1,
});

# Standard option: location used to save/restore VM state.
PVE::JSONSchema::register_standard_option('pve-qm-stateuri', {
    description => "Some commands save/restore state from this location.",
    type => 'string',
    maxLength => 128,
    optional => 1,
});

# Standard option: snapshot name (at most 40 characters, 'pve-configid' format).
PVE::JSONSchema::register_standard_option('pve-snapshot-name', {
    description => "The name of the snapshot.",
    type => 'string', format => 'pve-configid',
    maxLength => 40,
});
65
1e3baf05
DM
66#no warnings 'redefine';
67
# One-time setup of the fairsched/setluid/setublimit syscall numbers and of
# the KVM_GET_API_VERSION ioctl request code.  The _VZSYSCALLS_H_ marker sub
# prevents the setup from running twice.  Each number is only defined when
# no sub of that name exists yet.  Dies on architectures other than x86_64
# and i386.
unless (defined(&_VZSYSCALLS_H_)) {
    eval 'sub _VZSYSCALLS_H_ () {1;}' unless defined(&_VZSYSCALLS_H_);
    require 'sys/syscall.ph';
    if (defined(&__x86_64__)) {
        eval 'sub __NR_fairsched_vcpus () {499;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_fairsched_mknod () {504;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {505;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {506;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {507;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {508;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_setluid () {501;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {502;}' unless defined(&__NR_setublimit);
    }
    elsif (defined(&__i386__)) {
        eval 'sub __NR_fairsched_mknod () {500;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {501;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {502;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {503;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {504;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_fairsched_vcpus () {505;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_setluid () {511;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {512;}' unless defined(&__NR_setublimit);
    } else {
        die("no fairsched syscall for this arch");
    }
    require 'asm/ioctl.ph';
    # Request number 0 within ioctl type 0xAE; written as 0x00 so the hex
    # literal is not left without digits.
    eval 'sub KVM_GET_API_VERSION () { &_IO(0xAE, 0x00);}' unless defined(&KVM_GET_API_VERSION);
}
96
# Invoke the fairsched_mknod syscall.  All three arguments are truncated to
# integers first; the raw syscall() result is returned unchanged.
sub fairsched_mknod {
    my ($parent, $weight, $desired) = @_;

    my $parent_id = int($parent);
    my $node_weight = int($weight);
    my $desired_id = int($desired);

    return syscall(&__NR_fairsched_mknod, $parent_id, $node_weight, $desired_id);
}
102
# Invoke the fairsched_rmnod syscall for the given id (truncated to an
# integer) and return the raw syscall() result.
sub fairsched_rmnod {
    my ($id) = @_;

    my $node_id = int($id);

    return syscall(&__NR_fairsched_rmnod, $node_id);
}
108
# Invoke the fairsched_mvpr syscall with the given pid and id (both truncated
# to integers) and return the raw syscall() result.
sub fairsched_mvpr {
    my ($pid, $newid) = @_;

    my $process_id = int($pid);
    my $target_id = int($newid);

    return syscall(&__NR_fairsched_mvpr, $process_id, $target_id);
}
114
# Invoke the fairsched_vcpus syscall with the given id and vcpu count (both
# truncated to integers) and return the raw syscall() result.
sub fairsched_vcpus {
    my ($id, $vcpus) = @_;

    my $node_id = int($id);
    my $vcpu_count = int($vcpus);

    return syscall(&__NR_fairsched_vcpus, $node_id, $vcpu_count);
}
120
# Invoke the fairsched_rate syscall.  $op is one of the FAIRSCHED_*_RATE
# constants; all arguments are truncated to integers before the call.
# Returns the raw syscall() result.
sub fairsched_rate {
    my ($id, $op, $rate) = @_;

    my $node_id = int($id);
    my $operation = int($op);
    my $rate_value = int($rate);

    return syscall(&__NR_fairsched_rate, $node_id, $operation, $rate_value);
}
126
# Operation codes passed as $op to fairsched_rate().
use constant {
    FAIRSCHED_SET_RATE => 0,
    FAIRSCHED_DROP_RATE => 1,
    FAIRSCHED_GET_RATE => 2,
};

# Apply a CPU limit given in percent to fairsched node $id.
# The percentage is rescaled to units of 1/1024 and truncated; a resulting
# value of zero drops the rate limit instead of setting one.
# Returns whatever fairsched_rate() returns.
sub fairsched_cpulimit {
    my ($id, $limit) = @_;

    my $scaled_limit = int($limit * 1024 / 100);

    if ($scaled_limit) {
        return fairsched_rate($id, FAIRSCHED_SET_RATE, $scaled_limit);
    }

    return fairsched_rate($id, FAIRSCHED_DROP_RATE, $scaled_limit);
}
139
# Directories used by this module.  They are created at load time on a
# best-effort basis: the mkdir results are deliberately not checked.
my $nodename = PVE::INotify::nodename();

my $confdir = "/etc/pve/nodes/$nodename/qemu-server";
my $var_run_tmpdir = "/var/run/qemu-server";
my $lock_dir = "/var/lock/qemu-server";

# The node directory has to be created before the config directory below it.
foreach my $dir ("/etc/pve/nodes/$nodename", $confdir, $var_run_tmpdir, $lock_dir) {
    mkdir $dir;
}

my $pcisysfs = "/sys/bus/pci";
153
1e3baf05
DM
# Schema of the VM configuration options.  Each key is an option name and
# each value a JSON-schema style description (type, default, limits, help
# text).  Indexed options (netN, ideN, ...) are added to this hash further
# down in the file.
my $confdesc = {
    onboot => {
        optional => 1,
        type => 'boolean',
        description => "Specifies whether a VM will be started during system bootup.",
        default => 0,
    },
    autostart => {
        optional => 1,
        type => 'boolean',
        description => "Automatic restart after crash (currently ignored).",
        default => 0,
    },
    hotplug => {
        optional => 1,
        type => 'boolean',
        description => "Allow hotplug for disk and network device",
        default => 0,
    },
    reboot => {
        optional => 1,
        type => 'boolean',
        description => "Allow reboot. If set to '0' the VM exits on reboot.",
        default => 1,
    },
    lock => {
        optional => 1,
        type => 'string',
        description => "Lock/unlock the VM.",
        enum => [qw(migrate backup snapshot rollback)],
    },
    cpulimit => {
        optional => 1,
        type => 'integer',
        description => "Limit of CPU usage in per cent. Note if the computer has 2 CPUs, it has total of 200% CPU time. Value '0' indicates no CPU limit.\n\nNOTE: This option is currently ignored.",
        minimum => 0,
        default => 0,
    },
    cpuunits => {
        optional => 1,
        type => 'integer',
        description => "CPU weight for a VM. Argument is used in the kernel fair scheduler. The larger the number is, the more CPU time this VM gets. Number is relative to weights of all the other running VMs.\n\nNOTE: You can disable fair-scheduler configuration by setting this to 0.",
        minimum => 0,
        maximum => 500000,
        default => 1000,
    },
    memory => {
        optional => 1,
        type => 'integer',
        description => "Amount of RAM for the VM in MB. This is the maximum available memory when you use the balloon device.",
        minimum => 16,
        default => 512,
    },
    balloon => {
        optional => 1,
        type => 'integer',
        description => "Amount of target RAM for the VM in MB. Using zero disables the balloon driver.",
        minimum => 0,
    },
    shares => {
        optional => 1,
        type => 'integer',
        description => "Amount of memory shares for auto-ballooning. The larger the number is, the more memory this VM gets. Number is relative to weights of all other running VMs. Using zero disables auto-ballooning",
        minimum => 0,
        maximum => 50000,
        default => 1000,
    },
    keyboard => {
        optional => 1,
        type => 'string',
        description => "Keyboard layout for vnc server. Default is read from the datacenter configuration file.",
        enum => PVE::Tools::kvmkeymaplist(),
        default => 'en-us',
    },
    name => {
        optional => 1,
        type => 'string', format => 'dns-name',
        description => "Set a name for the VM. Only used on the configuration web interface.",
    },
    scsihw => {
        optional => 1,
        type => 'string',
        description => "scsi controller model",
        enum => [qw(lsi lsi53c810 virtio-scsi-pci megasas pvscsi)],
        default => 'lsi',
    },
    description => {
        optional => 1,
        type => 'string',
        description => "Description for the VM. Only used on the configuration web interface. This is saved as comment inside the configuration file.",
    },
    ostype => {
        optional => 1,
        type => 'string',
        enum => [qw(other wxp w2k w2k3 w2k8 wvista win7 win8 l24 l26 solaris)],
        description => <<EODESC,
Used to enable special optimization/features for specific
operating systems:

other => unspecified OS
wxp => Microsoft Windows XP
w2k => Microsoft Windows 2000
w2k3 => Microsoft Windows 2003
w2k8 => Microsoft Windows 2008
wvista => Microsoft Windows Vista
win7 => Microsoft Windows 7
win8 => Microsoft Windows 8/2012
l24 => Linux 2.4 Kernel
l26 => Linux 2.6/3.X Kernel
solaris => solaris/opensolaris/openindiana kernel

other|l24|l26|solaris ... no special behaviour
wxp|w2k|w2k3|w2k8|wvista|win7|win8 ... use --localtime switch
EODESC
    },
    boot => {
        optional => 1,
        type => 'string',
        description => "Boot on floppy (a), hard disk (c), CD-ROM (d), or network (n).",
        pattern => '[acdn]{1,4}',
        default => 'cdn',
    },
    bootdisk => {
        optional => 1,
        type => 'string', format => 'pve-qm-bootdisk',
        description => "Enable booting from specified disk.",
        pattern => '(ide|sata|scsi|virtio)\d+',
    },
    smp => {
        optional => 1,
        type => 'integer',
        description => "The number of CPUs. Please use option -sockets instead.",
        minimum => 1,
        default => 1,
    },
    sockets => {
        optional => 1,
        type => 'integer',
        description => "The number of CPU sockets.",
        minimum => 1,
        default => 1,
    },
    cores => {
        optional => 1,
        type => 'integer',
        description => "The number of cores per socket.",
        minimum => 1,
        default => 1,
    },
    maxcpus => {
        optional => 1,
        type => 'integer',
        description => "Maximum cpus for hotplug.",
        minimum => 1,
        default => 1,
    },
    acpi => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable ACPI.",
        default => 1,
    },
    agent => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable Qemu GuestAgent.",
        default => 0,
    },
    kvm => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable KVM hardware virtualization.",
        default => 1,
    },
    tdf => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable time drift fix.",
        default => 0,
    },
    localtime => {
        optional => 1,
        type => 'boolean',
        description => "Set the real time clock to local time. This is enabled by default if ostype indicates a Microsoft OS.",
    },
    freeze => {
        optional => 1,
        type => 'boolean',
        description => "Freeze CPU at startup (use 'c' monitor command to start execution).",
    },
    vga => {
        optional => 1,
        type => 'string',
        description => "Select VGA type. If you want to use high resolution modes (>= 1280x1024x16) then you should use option 'std' or 'vmware'. Default is 'std' for win8/win7/w2k8, and 'cirrus' for other OS types. Option 'qxl' enables the SPICE display server. You can also run without any graphic card using a serial device as terminal.",
        enum => [qw(std cirrus vmware qxl serial0 serial1 serial2 serial3 qxl2 qxl3 qxl4)],
    },
    watchdog => {
        optional => 1,
        type => 'string', format => 'pve-qm-watchdog',
        typetext => '[[model=]i6300esb|ib700] [,[action=]reset|shutdown|poweroff|pause|debug|none]',
        description => "Create a virtual hardware watchdog device. Once enabled (by a guest action), the watchdog must be periodically polled by an agent inside the guest or else the guest will be restarted (or execute the action specified)",
    },
    startdate => {
        optional => 1,
        type => 'string',
        typetext => "(now | YYYY-MM-DD | YYYY-MM-DDTHH:MM:SS)",
        description => "Set the initial date of the real time clock. Valid formats for date are: 'now' or '2006-06-17T16:01:21' or '2006-06-17'.",
        pattern => '(now|\d{4}-\d{1,2}-\d{1,2}(T\d{1,2}:\d{1,2}:\d{1,2})?)',
        default => 'now',
    },
    startup => {
        optional => 1,
        type => 'string', format => 'pve-qm-startup',
        typetext => '[[order=]\d+] [,up=\d+] [,down=\d+] ',
        description => "Startup and shutdown behavior. Order is a non-negative number defining the general startup order. Shutdown is done with reverse ordering. Additionally you can set the 'up' or 'down' delay in seconds, which specifies a delay to wait before the next VM is started or stopped.",
    },
    template => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable Template.",
        default => 0,
    },
    args => {
        optional => 1,
        type => 'string',
        description => <<EODESCR,
Note: this option is for experts only. It allows you to pass arbitrary arguments to kvm, for example:

args: -no-reboot -no-hpet
EODESCR
    },
    tablet => {
        optional => 1,
        type => 'boolean',
        default => 1,
        description => "Enable/disable the usb tablet device. This device is usually needed to allow absolute mouse positioning with VNC. Else the mouse runs out of sync with normal VNC clients. If you're running lots of console-only guests on one host, you may consider disabling this to save some context switches. This is turned off by default if you use spice (vga=qxl).",
    },
    migrate_speed => {
        optional => 1,
        type => 'integer',
        description => "Set maximum speed (in MB/s) for migrations. Value 0 is no limit.",
        minimum => 0,
        default => 0,
    },
    migrate_downtime => {
        optional => 1,
        type => 'number',
        description => "Set maximum tolerated downtime (in seconds) for migrations.",
        minimum => 0,
        default => 0.1,
    },
    cdrom => {
        optional => 1,
        type => 'string', format => 'pve-qm-drive',
        typetext => 'volume',
        description => "This is an alias for option -ide2",
    },
    cpu => {
        optional => 1,
        description => "Emulated CPU type.",
        type => 'string',
        enum => [ qw(486 athlon pentium pentium2 pentium3 coreduo core2duo kvm32 kvm64 qemu32 qemu64 phenom Conroe Penryn Nehalem Westmere SandyBridge Haswell Opteron_G1 Opteron_G2 Opteron_G3 Opteron_G4 Opteron_G5 host) ],
        default => 'kvm64',
    },
    parent => get_standard_option('pve-snapshot-name', {
        optional => 1,
        description => "Parent snapshot name. This is used internally, and should not be modified.",
    }),
    snaptime => {
        optional => 1,
        description => "Timestamp for snapshots.",
        type => 'integer',
        minimum => 0,
    },
    vmstate => {
        optional => 1,
        type => 'string', format => 'pve-volume-id',
        description => "Reference to a volume which stores the VM state. This is used internally for snapshots.",
    },
    machine => {
        description => "Specify the Qemu machine type.",
        type => 'string',
        pattern => '(pc|pc(-i440fx)?-\d+\.\d+|q35|pc-q35-\d+\.\d+)',
        maxLength => 40,
        optional => 1,
    },
    smbios1 => {
        description => "Specify SMBIOS type 1 fields.",
        type => 'string', format => 'pve-qm-smbios1',
        typetext => "[manufacturer=str][,product=str][,version=str][,serial=str] [,uuid=uuid][,sku=str][,family=str]",
        maxLength => 256,
        optional => 1,
    },
};
448
449# what about other qemu settings ?
450#cpu => 'string',
451#machine => 'string',
452#fda => 'file',
453#fdb => 'file',
454#mtdblock => 'file',
455#sd => 'file',
456#pflash => 'file',
457#snapshot => 'bool',
458#bootp => 'file',
459##tftp => 'dir',
460##smb => 'dir',
461#kernel => 'file',
462#append => 'string',
463#initrd => 'file',
464##soundhw => 'string',
465
# Publish every entry of $confdesc as a standard option named 'pve-qm-<key>'.
foreach my $opt_name (keys %$confdesc) {
    PVE::JSONSchema::register_standard_option("pve-qm-$opt_name", $confdesc->{$opt_name});
}
469
# Upper bounds (exclusive) for the numeric suffix of indexed options.
my $MAX_IDE_DISKS = 4;
my $MAX_SCSI_DISKS = 14;
my $MAX_VIRTIO_DISKS = 16;
my $MAX_SATA_DISKS = 6;
my $MAX_USB_DEVICES = 5;
my $MAX_NETS = 32;
my $MAX_UNUSED_DISKS = 8;
my $MAX_HOSTPCI_DEVICES = 2;
my $MAX_SERIAL_PORTS = 4;
my $MAX_PARALLEL_PORTS = 3;

# Supported network card models, plus a sorted, space separated rendering
# of the same list for use in help texts.
my $nic_model_list = [
    qw(rtl8139 ne2k_pci e1000 pcnet virtio ne2k_isa i82551 i82557b i82559er vmxnet3)
];
my $nic_model_list_txt = join(' ', sort @$nic_model_list);
1e3baf05 484
1e3baf05
DM
# Schema shared by all netN options.  The description interpolates the
# sorted list of supported NIC models.
my $netdesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-net',
    typetext => "MODEL=XX:XX:XX:XX:XX:XX [,bridge=<dev>][,queues=<nbqueues>][,rate=<mbps>][,tag=<vlanid>][,firewall=0|1]",
    description => <<EODESCR,
Specify network devices.

MODEL is one of: $nic_model_list_txt

XX:XX:XX:XX:XX:XX should be a unique MAC address. This is
automatically generated if not specified.

The bridge parameter can be used to automatically add the interface to a bridge device. The Proxmox VE standard bridge is called 'vmbr0'.

Option 'rate' is used to limit traffic bandwidth from and to this interface. It is specified as floating point number, unit is 'Megabytes per second'.

If you specify no bridge, we create a kvm 'user' (NATed) network device, which provides DHCP and DNS services. The following addresses are used:

10.0.2.2 Gateway
10.0.2.3 DNS Server
10.0.2.4 SMB Server

The DHCP server assigns addresses to the guest starting from 10.0.2.15.

EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-net", $netdesc);

# Make net0 .. net($MAX_NETS - 1) valid configuration keys.
for (my $i = 0; $i < $MAX_NETS; $i++) {
    $confdesc->{"net$i"} = $netdesc;
}
516
# Set of valid drive option names; filled by the per-bus loops further down.
my $drivename_hash;

# Option syntax shared by all disk bus types.  Kept in one place so the four
# descriptors below cannot drift apart.
my $drive_typetext = '[volume=]volume [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]';

# Schema for ideN options.
my $idedesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as IDE hard disk or CD-ROM (n is 0 to " . ($MAX_IDE_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-ide", $idedesc);

# Schema for scsiN options.
my $scsidesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as SCSI hard disk or CD-ROM (n is 0 to " . ($MAX_SCSI_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-scsi", $scsidesc);

# Schema for sataN options.
my $satadesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as SATA hard disk or CD-ROM (n is 0 to " . ($MAX_SATA_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-sata", $satadesc);

# Schema for virtioN options.
my $virtiodesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as VIRTIO hard disk (n is 0 to " . ($MAX_VIRTIO_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-virtio", $virtiodesc);
550
# Schema for usbN options.  The index range in the help text is derived from
# $MAX_USB_DEVICES so it cannot go stale when the limit changes.
my $usbdesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-usb-device',
    typetext => 'host=HOSTUSBDEVICE|spice',
    description => <<EODESCR,
Configure a USB device (n is 0 to @{[ $MAX_USB_DEVICES - 1 ]}). This can be used to
pass-through usb devices to the guest. HOSTUSBDEVICE syntax is:

'bus-port(.port)*' (decimal numbers) or
'vendor_id:product_id' (hexadecimal numbers)

You can use the 'lsusb -t' command to list existing usb devices.

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

The value 'spice' can be used to add a usb redirection device for spice.

EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-usb", $usbdesc);
571
040b06b7
DA
# Schema for hostpciN options (host PCI device pass-through).
my $hostpcidesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-hostpci',
    typetext => "[host=]HOSTPCIDEVICE [,driver=kvm|vfio] [,rombar=on|off] [,pcie=0|1] [,x-vga=on|off]",
    description => <<EODESCR,
Map host pci devices. HOSTPCIDEVICE syntax is:

'bus:dev.func' (hexadecimal numbers)

You can use the 'lspci' command to list existing pci devices.

The 'rombar' option determines whether or not the device's ROM will be visible in the guest's memory map (default is 'on').

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-hostpci", $hostpcidesc);
591
bae179aa
DA
# Schema for serialN options.  The index range in the help text is derived
# from $MAX_SERIAL_PORTS instead of being hard-coded.
my $serialdesc = {
    optional => 1,
    type => 'string',
    pattern => '(/dev/ttyS\d+|socket)',
    description => <<EODESCR,
Create a serial device inside the VM (n is 0 to @{[ $MAX_SERIAL_PORTS - 1 ]}), and pass through a host serial device, or create a unix socket on the host side (use 'qm terminal' to open a terminal connection).

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};
bae179aa 604
1989a89c
DA
# Schema for parallelN options.  The index range in the help text is derived
# from $MAX_PARALLEL_PORTS instead of being hard-coded.
my $paralleldesc = {
    optional => 1,
    type => 'string',
    pattern => '/dev/parport\d+|/dev/usb/lp\d+',
    description => <<EODESCR,
Map host parallel devices (n is 0 to @{[ $MAX_PARALLEL_PORTS - 1 ]}).

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};
1989a89c
DA
617
# Add the indexed variants (<name>0 .. <name>MAX-1) of each device option to
# $confdesc.  Disk buses additionally record their names in $drivename_hash.
foreach my $idx (0 .. $MAX_PARALLEL_PORTS - 1) {
    $confdesc->{"parallel$idx"} = $paralleldesc;
}

foreach my $idx (0 .. $MAX_SERIAL_PORTS - 1) {
    $confdesc->{"serial$idx"} = $serialdesc;
}

foreach my $idx (0 .. $MAX_HOSTPCI_DEVICES - 1) {
    $confdesc->{"hostpci$idx"} = $hostpcidesc;
}

foreach my $idx (0 .. $MAX_IDE_DISKS - 1) {
    my $drive = "ide$idx";
    $drivename_hash->{$drive} = 1;
    $confdesc->{$drive} = $idedesc;
}

foreach my $idx (0 .. $MAX_SATA_DISKS - 1) {
    my $drive = "sata$idx";
    $drivename_hash->{$drive} = 1;
    $confdesc->{$drive} = $satadesc;
}

foreach my $idx (0 .. $MAX_SCSI_DISKS - 1) {
    my $drive = "scsi$idx";
    $drivename_hash->{$drive} = 1;
    $confdesc->{$drive} = $scsidesc;
}

foreach my $idx (0 .. $MAX_VIRTIO_DISKS - 1) {
    my $drive = "virtio$idx";
    $drivename_hash->{$drive} = 1;
    $confdesc->{$drive} = $virtiodesc;
}

foreach my $idx (0 .. $MAX_USB_DEVICES - 1) {
    $confdesc->{"usb$idx"} = $usbdesc;
}

# Schema for unusedN options (volumes not attached to any drive option).
my $unuseddesc = {
    optional => 1,
    type => 'string', format => 'pve-volume-id',
    description => "Reference to unused volumes.",
};

foreach my $idx (0 .. $MAX_UNUSED_DISKS - 1) {
    $confdesc->{"unused$idx"} = $unuseddesc;
}
663
# Cached result of kvm_version(); 0 means "not determined yet".
my $kvm_api_version = 0;

# Return the KVM API version obtained via the KVM_GET_API_VERSION ioctl on
# /dev/kvm.  Returns 0 when /dev/kvm cannot be opened.  A non-zero result is
# cached, so the device is queried at most once after a success.
sub kvm_version {

    if ($kvm_api_version) {
        return $kvm_api_version;
    }

    my $fh = IO::File->new("</dev/kvm");
    return 0 if !$fh;

    my $version = $fh->ioctl(KVM_GET_API_VERSION(), 0);
    $kvm_api_version = $version if $version;

    $fh->close();

    return $kvm_api_version;
}
681
# Cached result of kvm_user_version().
my $kvm_user_version;

# Return the version string printed by 'kvm -help', or 'unknown' when the
# output does not start with the expected banner.  The result is cached.
sub kvm_user_version {

    return $kvm_user_version if $kvm_user_version;

    my $help_text = `kvm -help 2>/dev/null`;

    my $version = 'unknown';
    if ($help_text =~ m/^QEMU( PC)? emulator version (\d+\.\d+(\.\d+)?)[,\s]/) {
        $version = $2;
    }

    $kvm_user_version = $version;

    return $kvm_user_version;
}
699
# True when /dev/vhost-net exists as a character device (checked at load time).
my $kernel_has_vhost_net = (-c '/dev/vhost-net');
701
# Return the list of all valid drive option names, grouped by bus.
sub disknames {
    my @ide = map { "ide$_" } (0 .. ($MAX_IDE_DISKS - 1));
    my @scsi = map { "scsi$_" } (0 .. ($MAX_SCSI_DISKS - 1));
    my @virtio = map { "virtio$_" } (0 .. ($MAX_VIRTIO_DISKS - 1));
    my @sata = map { "sata$_" } (0 .. ($MAX_SATA_DISKS - 1));

    # order is important - used to autoselect boot disk
    return (@ide, @scsi, @virtio, @sata);
}
709
# Return true when $dev is one of the drive names recorded in $drivename_hash.
sub valid_drivename {
    my ($dev) = @_;

    my $is_known = defined($drivename_hash->{$dev});

    return $is_known;
}
715
# Return true when $key is a configuration option described in $confdesc.
sub option_exists {
    my ($key) = @_;

    my $is_known = defined($confdesc->{$key});

    return $is_known;
}
1e3baf05
DM
720
# Return the array reference holding the supported NIC model names.
# Note: this is the module's own list, not a copy.
sub nic_models {
    my $models = $nic_model_list;

    return $models;
}
724
# Return a hash reference mapping ostype identifiers to display names.
# NOTE(review): the 'ostype' option enum also accepts 'solaris', which has no
# entry here - confirm whether that omission is intended.
sub os_list_description {

    return {
        other => 'Other',
        wxp => 'Windows XP',
        w2k => 'Windows 2000',
        w2k3 => 'Windows 2003',
        w2k8 => 'Windows 2008',
        wvista => 'Windows Vista',
        win7 => 'Windows 7',
        win8 => 'Windows 8/2012',
        l24 => 'Linux 2.4',
        l26 => 'Linux 2.6',
    };
}
740
1e3baf05
DM
# Cached result of get_cdrom_path().
my $cdrom_path;

# Return the first of /dev/cdrom, /dev/cdrom1, /dev/cdrom2 that exists as a
# symbolic link, caching the answer.  Returns undef explicitly when none of
# them exists, rather than leaking the value of the last file test.
sub get_cdrom_path {

    return $cdrom_path if $cdrom_path;

    foreach my $candidate ("/dev/cdrom", "/dev/cdrom1", "/dev/cdrom2") {
        return $cdrom_path = $candidate if -l $candidate;
    }

    return undef;
}
751
# Resolve the 'file' value of a CD-ROM drive to a path:
#   'cdrom' -> result of get_cdrom_path()
#   'none'  -> empty string
#   values starting with '/' -> returned unchanged
#   anything else -> resolved through PVE::Storage::path()
# $vmid is accepted but not used.
sub get_iso_path {
    my ($storecfg, $vmid, $cdrom) = @_;

    return get_cdrom_path() if $cdrom eq 'cdrom';
    return '' if $cdrom eq 'none';
    return $cdrom if $cdrom =~ m|^/|;

    return PVE::Storage::path($storecfg, $cdrom);
}
765
# try to convert old style file names to volume IDs
#
# 'none', 'cdrom', /dev/... paths and values of the form 'a:b' are returned
# unchanged.  Any other value containing a '/' yields undef.  A bare file
# name becomes "local:iso/<file>" for cdrom media and "local:<vmid>/<file>"
# otherwise.
sub filename_to_volume_id {
    my ($vmid, $file, $media) = @_;

    my $keep_as_is = $file eq 'none' || $file eq 'cdrom' ||
        $file =~ m|^/dev/.+| || $file =~ m/^([^:]+):(.+)$/;
    return $file if $keep_as_is;

    return undef if $file =~ m|/|;

    my $is_cdrom = $media && $media eq 'cdrom';

    return $is_cdrom ? "local:iso/$file" : "local:$vmid/$file";
}
784
# Check that volume type $vtype matches drive media $media ('disk' expects
# 'images', 'cdrom' expects 'iso').  Returns nothing when $media is false or
# the types agree, dies with "internal error" for any other media value, and
# raises a parameter exception keyed by $opt on a mismatch.
sub verify_media_type {
    my ($opt, $vtype, $media) = @_;

    return if !$media;

    my %expected_vtype = (
        disk => 'images',
        cdrom => 'iso',
    );

    my $etype = $expected_vtype{$media};
    die "internal error" if !defined($etype);

    return if ($vtype eq $etype);

    raise_param_exc({ $opt => "unexpected media type ($vtype != $etype)" });
}
803
# Normalize $drive in place.  A 'file' value that is not 'cdrom'/'none', not
# a /dev/ path, not of the form 'a:b' and not purely numeric is treated as a
# filesystem path and converted to a volume ID; a parameter exception keyed
# by $opt is raised when no storage matches.  The media defaults to 'cdrom'
# for iso volumes and for the special files 'cdrom' and 'none'.
sub cleanup_drive_path {
    my ($opt, $storecfg, $drive) = @_;

    my $path = $drive->{file};

    my $needs_no_lookup = $path =~ m/^(cdrom|none)$/ ||
        $path =~ m|^/dev/.+| ||
        $path =~ m/^([^:]+):(.+)$/ ||
        $path =~ m/^\d+$/;

    # try to convert filesystem paths to volume IDs
    if (!$needs_no_lookup) {
        my ($vtype, $volid) = PVE::Storage::path_to_volume_id($storecfg, $drive->{file});
        raise_param_exc({ $opt => "unable to associate path '$drive->{file}' to any storage"}) if !$vtype;
        if (!$drive->{media} && $vtype eq 'iso') {
            $drive->{media} = 'cdrom';
        }
        verify_media_type($opt, $vtype, $drive->{media});
        $drive->{file} = $volid;
    }

    $drive->{media} = 'cdrom' if !$drive->{media} && $drive->{file} =~ m/^(cdrom|none)$/;
}
822
# Write a fresh configuration file for $vmid from $settings without taking
# any lock.  Dies when the file already exists.  Missing 'name' and 'memory'
# entries are filled in ($settings is modified in place).  Only options known
# to $confdesc that have a true value are written, one "key: value" per line.
sub create_conf_nolock {
    my ($vmid, $settings) = @_;

    my $filename = config_file($vmid);

    if (-f $filename) {
        die "configuration file '$filename' already exists\n";
    }

    my $defaults = load_defaults();

    $settings->{name} ||= "vm$vmid";
    $settings->{memory} ||= $defaults->{memory};

    # false values (0, '', undef) are dropped just like unknown options
    my @written_opts = grep { $confdesc->{$_} && $settings->{$_} } keys %$settings;

    my $data = join('', map { "$_: $settings->{$_}\n" } @written_opts);

    PVE::Tools::file_set_contents($filename, $data);
}
847
f36ed4f4
DM
# Parse a size such as "512", "1.5M" or "4G" into an integer number of bytes.
# The optional suffix K, M or G scales by powers of 1024; the result is
# truncated to an integer.  Returns undef for anything else.
my $parse_size = sub {
    my ($value) = @_;

    return undef if $value !~ m/^(\d+(\.\d+)?)([KMG])?$/;
    my ($number, $suffix) = ($1, $3);

    my %multiplier = (
        K => 1024,
        M => 1024 * 1024,
        G => 1024 * 1024 * 1024,
    );

    my $bytes = $suffix ? $number * $multiplier{$suffix} : $number;

    return int($bytes);
};
864
# Render a byte count with the largest suffix (K, M, G) that divides it
# evenly by powers of 1024.  Values not divisible by 1024 are returned as a
# plain integer.  Note that 0 is divisible at every step and yields "0G".
my $format_size = sub {
    my ($size) = @_;

    my $amount = int($size);
    my $suffix = '';

    foreach my $next_suffix (qw(K M G)) {
        my $scaled = int($amount / 1024);
        last if $scaled * 1024 != $amount;
        ($amount, $suffix) = ($scaled, $next_suffix);
    }

    return $suffix eq '' ? $amount : "${amount}${suffix}";
};
881
1e3baf05
DM
882# ideX = [volume=]volume-id[,media=d][,cyls=c,heads=h,secs=s[,trans=t]]
883# [,snapshot=on|off][,cache=on|off][,format=f][,backup=yes|no]
036e0e2b 884# [,rerror=ignore|report|stop][,werror=enospc|ignore|report|stop]
8d87f8aa 885# [,aio=native|threads][,discard=ignore|on]
1e3baf05
DM
886
# Parse a drive property string ("[volume=]volume-id[,opt=value]...") into
# a hash reference.
#
# $key  - config key such as 'ide0' or 'virtio1'; it is split into the
#         'interface' and 'index' fields. May be undef when only the option
#         string itself has to be verified.
# $data - comma separated option list.
#
# Returns the parsed hash reference, or undef if the key or any option is
# invalid. Limits given as bps/bps_rd/bps_wr are converted and stored as
# mbps/mbps_rd/mbps_wr; 'size' is stored as a number of bytes.
sub parse_drive {
    my ($key, $data) = @_;

    my $res = {};

    # $key may be undefined - used to verify JSON parameters
    if (!defined($key)) {
        $res->{interface} = 'unknown'; # should not harm when used to verify parameters
        $res->{index} = 0;
    } elsif ($key =~ m/^([^\d]+)(\d+)$/) {
        $res->{interface} = $1;
        $res->{index} = $2;
    } else {
        return undef;
    }

    foreach my $p (split (/,/, $data)) {
        next if $p =~ m/^\s*$/;

        if ($p =~ m/^(file|volume|cyls|heads|secs|trans|media|snapshot|cache|format|rerror|werror|backup|aio|bps|mbps|mbps_max|bps_rd|mbps_rd|mbps_rd_max|bps_wr|mbps_wr|mbps_wr_max|iops|iops_max|iops_rd|iops_rd_max|iops_wr|iops_wr_max|size|discard)=(.+)$/) {
            my ($k, $v) = ($1, $2);

            $k = 'file' if $k eq 'volume';

            return undef if defined $res->{$k};

            if ($k eq 'bps' || $k eq 'bps_rd' || $k eq 'bps_wr') {
                # the whole value must be numeric, not just its prefix
                return undef if !$v || $v !~ m/^\d+(\.\d+)?$/;
                $k = "m$k";
                # do not silently overwrite an explicit mbps* setting
                return undef if defined $res->{$k};
                $v = sprintf("%.3f", $v / (1024*1024));
            }
            $res->{$k} = $v;
        } else {
            # a single bare word (no '=') is accepted as the volume/file
            if (!$res->{file} && $p !~ m/=/) {
                $res->{file} = $p;
            } else {
                return undef;
            }
        }
    }

    return undef if !$res->{file};

    # a known image extension determines the format
    if ($res->{file} =~ m/\.(raw|cow|qcow|qcow2|vmdk|cloop)$/) {
        $res->{format} = $1;
    }

    # allowed values per option; options that are unset/false are skipped
    my $decimal_re = qr/^\d+(\.\d+)?$/;
    my $integer_re = qr/^\d+$/;
    my %valid_value_re = (
        cache => qr/^(off|none|writethrough|writeback|unsafe|directsync)$/,
        snapshot => qr/^(on|off)$/,
        cyls => $integer_re,
        heads => $integer_re,
        secs => $integer_re,
        media => qr/^(disk|cdrom)$/,
        trans => qr/^(none|lba|auto)$/,
        format => qr/^(raw|cow|qcow|qcow2|vmdk|cloop)$/,
        rerror => qr/^(ignore|report|stop)$/,
        werror => qr/^(enospc|ignore|report|stop)$/,
        backup => qr/^(yes|no)$/,
        aio => qr/^(native|threads)$/,
        discard => qr/^(ignore|on)$/,
        mbps => $decimal_re,
        mbps_max => $decimal_re,
        mbps_rd => $decimal_re,
        mbps_rd_max => $decimal_re,
        mbps_wr => $decimal_re,
        mbps_wr_max => $decimal_re,
        iops => $integer_re,
        iops_max => $integer_re,
        iops_rd => $integer_re,
        iops_rd_max => $integer_re,
        iops_wr => $integer_re,
        iops_wr_max => $integer_re,
    );

    foreach my $opt (keys %valid_value_re) {
        my $v = $res->{$opt};
        return undef if $v && $v !~ $valid_value_re{$opt};
    }

    # a total limit cannot be combined with separate read/write limits
    return undef if $res->{mbps_rd} && $res->{mbps};
    return undef if $res->{mbps_wr} && $res->{mbps};
    return undef if $res->{iops_rd} && $res->{iops};
    return undef if $res->{iops_wr} && $res->{iops};

    if ($res->{size}) {
        return undef if !defined($res->{size} = $parse_size->($res->{size}));
    }

    if ($res->{media} && ($res->{media} eq 'cdrom')) {
        return undef if $res->{snapshot} || $res->{trans} || $res->{format};
        return undef if $res->{heads} || $res->{secs} || $res->{cyls};
        return undef if $res->{interface} eq 'virtio';
    }

    # rerror does not work with scsi drives
    if ($res->{rerror}) {
        return undef if $res->{interface} eq 'scsi';
    }

    return $res;
}
988
74edd76b 989my @qemu_drive_options = qw(heads secs cyls trans media format cache snapshot rerror werror aio discard iops iops_rd iops_wr iops_max iops_rd_max iops_wr_max);
1e3baf05
DM
990
# Serialize a parsed drive hash back into its config file representation:
# the volume/file followed by ",option=value" for every option that is set.
sub print_drive {
    my ($vmid, $drive) = @_;

    my @option_names = (
        @qemu_drive_options,
        qw(mbps mbps_rd mbps_wr mbps_max mbps_rd_max mbps_wr_max backup),
    );

    my @parts = map { ",$_=$drive->{$_}" } grep { $drive->{$_} } @option_names;

    # size is kept in bytes and printed with a unit suffix
    push @parts, ",size=" . $format_size->($drive->{size}) if $drive->{size};

    return join('', $drive->{file}, @parts);
}
1005
28ef82d3
DM
# Send a SCSI INQUIRY to the device behind $fh using the SG_IO ioctl.
#
# $fh    - open file handle of the device
# $noerr - if true, return undef on failure instead of dying
#
# Returns a hash reference with the keys vendor, product, revision,
# removable (0/1) and type, decoded from the 36 byte response.
sub scsi_inquiry {
    my($fh, $noerr) = @_;

    my $SG_IO = 0x2285;
    my $SG_GET_VERSION_NUM = 0x2282;

    my $versionbuf = "\x00" x 8;
    my $ret = ioctl($fh, $SG_GET_VERSION_NUM, $versionbuf);
    if (!$ret) {
        die "scsi ioctl SG_GET_VERSION_NUM failed - $!\n" if !$noerr;
        return undef;
    }
    my $version = unpack("I", $versionbuf);
    if ($version < 30000) {
        die "scsi generic interface too old\n"  if !$noerr;
        return undef;
    }

    my $buf = "\x00" x 36;
    my $sensebuf = "\x00" x 8;
    # command block: opcode 0x12 with an allocation length of 36 bytes
    my $cmd = pack("C x3 C x1", 0x12, 36);

    # see /usr/include/scsi/sg.h
    my $sg_io_hdr_t = "i i C C s I P P P I I i P C C C C S S i I I";

    # only the leading header fields are supplied here
    my $packet = pack($sg_io_hdr_t, ord('S'), -3, length($cmd),
                      length($sensebuf), 0, length($buf), $buf,
                      $cmd, $sensebuf, 6000);

    $ret = ioctl($fh, $SG_IO, $packet);
    if (!$ret) {
        die "scsi ioctl SG_IO failed - $!\n" if !$noerr;
        return undef;
    }

    my @res = unpack($sg_io_hdr_t, $packet);
    # elements 17 and 18 are the two 'S' fields of the header template
    # (presumably host_status / driver_status - see sg.h)
    if ($res[17] || $res[18]) {
        die "scsi ioctl SG_IO status error - $!\n" if !$noerr;
        return undef;
    }

    my $res = {};
    (my $byte0, my $byte1, $res->{vendor},
     $res->{product}, $res->{revision}) = unpack("C C x6 A8 A16 A4", $buf);

    # bit 7 of byte 1 is the removable flag, the low 5 bits of byte 0
    # hold the device type
    $res->{removable} = $byte1 & 128 ? 1 : 0;
    $res->{type} = $byte0 & 31;

    return $res;
}
1056
# Check whether $path is a SCSI device by sending it an INQUIRY.
#
# Returns the hash reference produced by scsi_inquiry(), or undef if the
# path cannot be opened read/write or the inquiry fails.
sub path_is_scsi {
    my ($path) = @_;

    # pass the mode separately so that special characters or surrounding
    # whitespace in $path cannot be interpreted as part of the open mode
    my $fh = IO::File->new($path, '+<') || return undef;
    my $res = scsi_inquiry($fh, 1);
    close($fh);

    return $res;
}
1066
db656e5f
DM
# Return 1 if the configured machine type contains 'q35', otherwise 0.
sub machine_type_is_q35 {
    my ($conf) = @_;

    my $machine = $conf->{machine};
    return 0 if !$machine;

    return ($machine =~ m/q35/) ? 1 : 0;
}
1072
# Build the qemu device string for the USB tablet.
sub print_tabletdevice_full {
    my ($conf) = @_;

    # we use uhci for old VMs because tablet driver was buggy in older qemu
    my $usbbus = machine_type_is_q35($conf) ? 'ehci' : 'uhci';

    return "usb-tablet,id=tablet,bus=${usbbus}.0,port=1";
}
1083
# Build the qemu '-device' string for a parsed drive.
#
# The device model and bus address depend on the drive interface
# (virtio, scsi, ide, sata). Dies for 'usb' (not implemented) and for
# unknown interfaces.
sub print_drivedevice_full {
    my ($storecfg, $conf, $vmid, $drive, $bridges) = @_;

    my $iface = $drive->{interface};
    my $index = $drive->{index};
    my $drive_id = "$iface$index";

    my $device = '';

    if ($iface eq 'virtio') {
        my $pciaddr = print_pci_addr($drive_id, $bridges);
        $device = "virtio-blk-pci,drive=drive-$drive_id,id=$drive_id$pciaddr";
    } elsif ($iface eq 'scsi') {
        # lsi controllers (the default) take 7 devices each, others 256
        my $is_lsi = !$conf->{scsihw} || ($conf->{scsihw} =~ m/^lsi/);
        my $maxdev = $is_lsi ? 7 : 256;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;

        my $devicetype = 'hd';
        if (drive_is_cdrom($drive)) {
            $devicetype = 'cd';
        } else {
            my $path = '';
            if ($drive->{file} =~ m|^/|) {
                $path = $drive->{file};
            } else {
                $path = PVE::Storage::path($storecfg, $drive->{file});
            }

            if ($path =~ m/^iscsi\:\/\//) {
                $devicetype = 'generic';
            } elsif (my $info = path_is_scsi($path)) {
                if ($info->{type} == 0) {
                    $devicetype = 'block';
                } elsif ($info->{type} == 1) { # tape
                    $devicetype = 'generic';
                }
            }
        }

        my $prefix = "scsi-$devicetype,bus=scsihw$controller.0";
        if ($is_lsi) {
            $device = "$prefix,scsi-id=$unit,drive=drive-$drive_id,id=$drive_id";
        } else {
            $device = "$prefix,channel=0,scsi-id=0,lun=$index,drive=drive-$drive_id,id=$drive_id";
        }
    } elsif ($iface eq 'ide') {
        my $maxdev = 2;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;
        my $devicetype = ($drive->{media} && $drive->{media} eq 'cdrom') ? "cd" : "hd";

        $device = "ide-$devicetype,bus=ide.$controller,unit=$unit,drive=drive-$drive_id,id=$drive_id";
    } elsif ($iface eq 'sata') {
        my $controller = int($index / $MAX_SATA_DISKS);
        my $unit = $index % $MAX_SATA_DISKS;
        $device = "ide-drive,bus=ahci$controller.$unit,drive=drive-$drive_id,id=$drive_id";
    } elsif ($iface eq 'usb') {
        die "implement me";
        # -device ide-drive,bus=ide.1,unit=0,drive=drive-ide0-1-0,id=ide0-1-0
    } else {
        die "unsupported interface type";
    }

    $device .= ",bootindex=$drive->{bootindex}" if $drive->{bootindex};

    return $device;
}
1149
# Read the iSCSI initiator name from /etc/iscsi/initiatorname.iscsi.
# Returns undef if the file cannot be opened or has no InitiatorName line.
sub get_initiator_name {
    my $fh = IO::File->new('/etc/iscsi/initiatorname.iscsi') || return undef;

    my $initiator;
    while (defined(my $line = <$fh>)) {
        if ($line =~ m/^\s*InitiatorName\s*=\s*([\.\-:\w]+)/) {
            $initiator = $1;
            last; # only the first entry counts
        }
    }
    $fh->close();

    return $initiator;
}
1163
1e3baf05
DM
# Build the qemu '-drive' string for a parsed drive: the resolved path,
# "if=none", the drive id and all qemu drive options that are set.
sub print_drive_full {
    my ($storecfg, $vmid, $drive) = @_;

    my @opts;
    foreach my $name (grep { $_ ne 'bootindex' } @qemu_drive_options) {
        push @opts, "$name=$drive->{$name}" if $drive->{$name};
    }

    # throughput limits are stored in MB/s but passed to qemu in bytes/s
    foreach my $name (qw(bps bps_rd bps_wr)) {
        my $mbytes = $drive->{"m$name"};
        push @opts, "$name=" . int($mbytes*1024*1024) if $mbytes;
    }

    # use linux-aio by default (qemu default is threads)
    push @opts, "aio=native" if !$drive->{aio};

    my $is_cdrom = drive_is_cdrom($drive);
    my $volid = $drive->{file};

    my $path;
    if ($is_cdrom) {
        $path = get_iso_path($storecfg, $vmid, $volid);
    } elsif ($volid =~ m|^/|) {
        $path = $volid;
    } else {
        $path = PVE::Storage::path($storecfg, $volid);
    }

    push @opts, "cache=none" if !$drive->{cache} && !$is_cdrom;

    my $pathinfo = $path ? "file=$path," : '';
    my $opts = join('', map { ",$_" } @opts);

    return "${pathinfo}if=none,id=drive-$drive->{interface}$drive->{index}$opts";
}
1199
# Build the qemu '-device' string for a network card.
sub print_netdevice_full {
    my ($vmid, $conf, $net, $netid, $bridges) = @_;

    my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};

    my $is_virtio = $net->{model} eq 'virtio';
    my $device = $is_virtio ? 'virtio-net-pci' : $net->{model};

    # qemu > 0.15 always try to boot from network - we disable that by
    # not loading the pxe rom file
    my $extra = ($bootorder !~ m/n/) ? "romfile=," : '';
    my $pciaddr = print_pci_addr("$netid", $bridges);

    my @parts = ("$device,${extra}mac=$net->{macaddr},netdev=$netid$pciaddr,id=$netid");

    if ($net->{queues} && $net->{queues} > 1 && $is_virtio) {
        # Consider we have N queues, the number of vectors needed is 2*N + 2
        # (plus one config interrupt and control vq)
        my $vectors = $net->{queues} * 2 + 2;
        push @parts, ",vectors=$vectors,mq=on";
    }

    push @parts, ",bootindex=$net->{bootindex}" if $net->{bootindex};

    return join('', @parts);
}
1223
# Build the qemu '-netdev' string for a network card.
#
# $netid must have the form 'netN' with N below $MAX_NETS. Bridged cards
# get a tap device named "tap<vmid>i<N>"; cards without a bridge use
# user mode networking.
#
# Dies if $netid is malformed or out of range, or if the resulting
# interface name is too long.
sub print_netdev_full {
    my ($vmid, $conf, $net, $netid) = @_;

    # reject malformed ids explicitly; an empty index would otherwise
    # pass the range check below and yield an interface named "tap<vmid>i"
    die "got strange net id '$netid'\n" if $netid !~ m/^net(\d+)$/;
    my $i = int($1);

    die "got strange net id '$netid'\n" if $i >= ${MAX_NETS};

    my $ifname = "tap${vmid}i$i";

    # kvm uses TUNSETIFF ioctl, and that limits ifname length
    die "interface name '$ifname' is too long (max 15 character)\n"
        if length($ifname) >= 16;

    my $vhostparam = '';
    $vhostparam = ',vhost=on' if $kernel_has_vhost_net && $net->{model} eq 'virtio';

    my $vmname = $conf->{name} || "vm$vmid";

    my $netdev = "";

    if ($net->{bridge}) {
        $netdev = "type=tap,id=$netid,ifname=${ifname},script=/var/lib/qemu-server/pve-bridge,downscript=/var/lib/qemu-server/pve-bridgedown$vhostparam";
    } else {
        $netdev = "type=user,id=$netid,hostname=$vmname";
    }

    # the queues option is only emitted for virtio cards
    $netdev .= ",queues=$net->{queues}" if ($net->{queues} && $net->{model} eq 'virtio');

    return $netdev;
}
1e3baf05
DM
1257
# True if the parsed drive has media type 'cdrom'. A false/missing
# $drive or media value is passed through unchanged as the false result.
sub drive_is_cdrom {
    my ($drive) = @_;

    return $drive if !$drive;

    my $media = $drive->{media};
    return $media if !$media;

    return $media eq 'cdrom';
}
1264
040b06b7
DA
# Parse a hostpci property string
# ("[host=]bus:dev[.fn][,driver=...][,rombar=...][,x-vga=...][,pcie=...]").
#
# Returns a hash reference, or undef if the value is empty or contains no
# PCI address. Unknown settings only produce a warning.
sub parse_hostpci {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};
    my $found;

    foreach my $kv (split(/,/, $value)) {
        if ($kv =~ m/^(host=)?([a-f0-9]{2}:[a-f0-9]{2})(\.([a-f0-9]))?$/) {
            my ($id, $function) = ($2, $4);
            $found = 1;
            if (defined($function)) {
                push @{$res->{pciid}}, { id => $id , function => $function };
            } else {
                # no function given - take what lspci() reports for the id
                my $pcidevices = lspci($id);
                $res->{pciid} = $pcidevices->{$id};
            }
        } elsif ($kv =~ m/^driver=(kvm|vfio)$/) {
            $res->{driver} = $1;
        } elsif ($kv =~ m/^rombar=(on|off)$/) {
            $res->{rombar} = $1;
        } elsif ($kv =~ m/^x-vga=(on|off)$/) {
            $res->{'x-vga'} = $1;
        } elsif ($kv =~ m/^pcie=(\d+)$/) {
            $res->{pcie} = 1 if $1 == 1;
        } else {
            warn "unknown hostpci setting '$kv'\n";
        }
    }

    return undef if !$found;

    return $res;
}
1303
1e3baf05
DM
1304# netX: e1000=XX:XX:XX:XX:XX:XX,bridge=vmbr0,rate=<mbps>
# Parse a network property string
# ("<model>[=<mac>][,bridge=..][,queues=..][,rate=..][,tag=..][,firewall=..]").
#
# A random MAC address is generated when none is given. Returns a hash
# reference, or undef on an unknown setting or a missing model.
sub parse_net {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        if ($kvp =~ m/^(ne2k_pci|e1000|rtl8139|pcnet|virtio|ne2k_isa|i82551|i82557b|i82559er|vmxnet3)(=([0-9a-f]{2}(:[0-9a-f]{2}){5}))?$/i) {
            my ($model, $mac) = ($1, $3);
            $res->{model} = lc($model);
            $res->{macaddr} = defined($mac) ? uc($mac) : PVE::Tools::random_ether_addr();
            next;
        }

        if ($kvp =~ m/^bridge=(\S+)$/) {
            $res->{bridge} = $1;
        } elsif ($kvp =~ m/^queues=(\d+)$/) {
            $res->{queues} = $1;
        } elsif ($kvp =~ m/^rate=(\d+(\.\d+)?)$/) {
            $res->{rate} = $1;
        } elsif ($kvp =~ m/^tag=(\d+)$/) {
            $res->{tag} = $1;
        } elsif ($kvp =~ m/^firewall=(\d+)$/) {
            $res->{firewall} = $1;
        } else {
            return undef;
        }
    }

    return undef if !$res->{model};

    return $res;
}
1337
# Serialize a parsed network hash (see parse_net) back into its config
# file representation. Every setting that parse_net accepts is written,
# so a parse/print round trip does not lose information.
sub print_net {
    my $net = shift;

    my $res = "$net->{model}";
    $res .= "=$net->{macaddr}" if $net->{macaddr};
    $res .= ",bridge=$net->{bridge}" if $net->{bridge};
    $res .= ",rate=$net->{rate}" if $net->{rate};
    $res .= ",tag=$net->{tag}" if $net->{tag};
    $res .= ",firewall=$net->{firewall}" if $net->{firewall};
    # parse_net() accepts 'queues', so it has to be written back as well
    $res .= ",queues=$net->{queues}" if $net->{queues};

    return $res;
}
1350
# Normalize every parsable 'netN' entry in $settings by parsing and
# re-printing it; parse_net() fills in a random MAC where none is given.
sub add_random_macs {
    my ($settings) = @_;

    foreach my $opt (grep { m/^net(\d+)$/ } keys %$settings) {
        my $net = parse_net($settings->{$opt});
        $settings->{$opt} = print_net($net) if $net;
    }
}
1361
# Record $volid in the lowest free 'unusedN' slot of $config.
#
# Returns the key used, or nothing if the volume is already listed as
# unused. Dies if all slots are taken.
sub add_unused_volume {
    my ($config, $volid) = @_;

    my $key;
    # scan from the highest slot down, so $key ends up as the lowest free one
    foreach my $ind (reverse(0 .. $MAX_UNUSED_DISKS - 1)) {
        my $slot = "unused$ind";
        my $vid = $config->{$slot};
        if (!$vid) {
            $key = $slot;
            next;
        }
        return if $vid eq $volid; # do not add duplicates
    }

    die "To many unused volume - please delete them first.\n" if !$key;

    $config->{$key} = $volid;

    return $key;
}
1381
2796e7d5
DM
# Allowed smbios type 1 options, each with the pattern its value must
# match completely.
my $valid_smbios1_options = {
    manufacturer => '\S+',
    product => '\S+',
    version => '\S+',
    serial => '\S+',
    uuid => '[a-fA-F0-9]{8}(?:-[a-fA-F0-9]{4}){3}-[a-fA-F0-9]{12}',
    sku => '\S+',
    family => '\S+',
};

# smbios: [manufacturer=str][,product=str][,version=str][,serial=str][,uuid=uuid][,sku=str][,family=str]
#
# Parse the comma separated smbios option string into a hash reference.
# Returns undef on an unknown option or a value that does not match its
# pattern.
sub parse_smbios1 {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        return undef if $kvp !~ m/^(\S+)=(.+)$/;
        # split at the first '=' only, so the whole remainder is validated
        # instead of being truncated at a second '='
        my ($k, $v) = split(/=/, $kvp, 2);
        return undef if !defined($k) || !defined($v);
        my $pattern = $valid_smbios1_options->{$k};
        return undef if !$pattern;
        return undef if $v !~ m/^(?:$pattern)$/;
        $res->{$k} = $v;
    }

    return $res;
}
1409
1410PVE::JSONSchema::register_format('pve-qm-smbios1', \&verify_smbios1);
# Format check for 'pve-qm-smbios1': returns $value if it parses; otherwise
# returns undef when $noerr is set, or dies.
sub verify_smbios1 {
    my ($value, $noerr) = @_;

    if (!parse_smbios1($value)) {
        die "unable to parse smbios (type 1) options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1420
1e3baf05
DM
1421PVE::JSONSchema::register_format('pve-qm-bootdisk', \&verify_bootdisk);
# Format check for 'pve-qm-bootdisk': returns $value if it is a valid drive
# name; otherwise returns undef when $noerr is set, or dies.
sub verify_bootdisk {
    my ($value, $noerr) = @_;

    if (!valid_drivename($value)) {
        die "invalid boot disk '$value'\n" if !$noerr;
        return undef;
    }

    return $value;
}
1431
1432PVE::JSONSchema::register_format('pve-qm-net', \&verify_net);
# Format check for 'pve-qm-net': returns $value if parse_net() accepts it;
# otherwise returns undef when $noerr is set, or dies.
sub verify_net {
    my ($value, $noerr) = @_;

    if (!parse_net($value)) {
        die "unable to parse network options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1442
1443PVE::JSONSchema::register_format('pve-qm-drive', \&verify_drive);
# Format check for 'pve-qm-drive': returns $value if parse_drive() accepts
# it (without a config key); otherwise returns undef when $noerr is set,
# or dies.
sub verify_drive {
    my ($value, $noerr) = @_;

    if (!parse_drive(undef, $value)) {
        die "unable to parse drive options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1453
1454PVE::JSONSchema::register_format('pve-qm-hostpci', \&verify_hostpci);
# Format check for 'pve-qm-hostpci': returns $value if parse_hostpci()
# accepts it; otherwise returns undef when $noerr is set, or dies.
sub verify_hostpci {
    my ($value, $noerr) = @_;

    if (!parse_hostpci($value)) {
        die "unable to parse pci id\n" if !$noerr;
        return undef;
    }

    return $value;
}
1464
0ea9541d
DM
1465PVE::JSONSchema::register_format('pve-qm-watchdog', \&verify_watchdog);
# Format check for 'pve-qm-watchdog': returns $value if parse_watchdog()
# accepts it; otherwise returns undef when $noerr is set, or dies.
sub verify_watchdog {
    my ($value, $noerr) = @_;

    if (!parse_watchdog($value)) {
        die "unable to parse watchdog options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1475
# Parse a watchdog property string ("[model=]<model>[,[action=]<action>]").
# Returns a hash reference with 'model' and/or 'action', or undef if the
# value is empty or contains an unknown element.
sub parse_watchdog {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};

    foreach my $p (grep { $_ !~ m/^\s*$/ } split(/,/, $value)) {
        if ($p =~ m/^(model=)?(i6300esb|ib700)$/) {
            $res->{model} = $2;
            next;
        }
        if ($p =~ m/^(action=)?(reset|shutdown|poweroff|pause|debug|none)$/) {
            $res->{action} = $2;
            next;
        }
        return undef;
    }

    return $res;
}
1497
59411c4e
DM
1498PVE::JSONSchema::register_format('pve-qm-startup', \&verify_startup);
# Format check for 'pve-qm-startup': returns $value if parse_startup()
# accepts it; otherwise returns undef when $noerr is set, or dies.
sub verify_startup {
    my ($value, $noerr) = @_;

    if (!parse_startup($value)) {
        die "unable to parse startup options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1508
# Parse a startup property string ("[order=]N[,up=N][,down=N]").
# Returns a hash reference with 'order', 'up' and/or 'down', or undef if
# the value is empty or contains an unknown element.
sub parse_startup {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};

    foreach my $p (grep { $_ !~ m/^\s*$/ } split(/,/, $value)) {
        if ($p =~ m/^(order=)?(\d+)$/) {
            $res->{order} = $2;
            next;
        }
        if ($p =~ m/^up=(\d+)$/) {
            $res->{up} = $1;
            next;
        }
        if ($p =~ m/^down=(\d+)$/) {
            $res->{down} = $1;
            next;
        }
        return undef;
    }

    return $res;
}
1532
1e3baf05
DM
# Parse a usb property string. Accepted elements are
# "host=<vendorid>:<productid>" (hex, optional 0x prefix),
# "host=<bus>-<port>[.<port>...]" and "spice".
# Returns a hash reference, or undef if the value is empty or contains an
# unknown element.
sub parse_usb_device {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};
    my $found;

    foreach my $v (split(/,/, $value)) {
        if ($v =~ m/^host=(0x)?([0-9A-Fa-f]{4}):(0x)?([0-9A-Fa-f]{4})$/) {
            @$res{qw(vendorid productid)} = ($2, $4);
        } elsif ($v =~ m/^host=(\d+)\-(\d+(\.\d+)*)$/) {
            @$res{qw(hostbus hostport)} = ($1, $2);
        } elsif ($v =~ m/^spice$/) {
            $res->{spice} = 1;
        } else {
            return undef;
        }
        $found = 1;
    }

    return undef if !$found;

    return $res;
}
19672434 1562
1e3baf05
DM
1563PVE::JSONSchema::register_format('pve-qm-usb-device', \&verify_usb_device);
# Format check for 'pve-qm-usb-device': returns $value if
# parse_usb_device() accepts it; otherwise returns undef when $noerr is
# set, or dies.
sub verify_usb_device {
    my ($value, $noerr) = @_;

    if (!parse_usb_device($value)) {
        die "unable to parse usb device\n" if !$noerr;
        return undef;
    }

    return $value;
}
1573
1e3baf05
DM
1574# add JSON properties for create and set function
# Copy all entries of $confdesc into $prop, except 'parent', 'snaptime'
# and 'vmstate'. Returns $prop.
sub json_config_properties {
    my $prop = shift;

    my %skipped = map { $_ => 1 } qw(parent snaptime vmstate);

    foreach my $opt (grep { !$skipped{$_} } keys %$confdesc) {
        $prop->{$opt} = $confdesc->{$opt};
    }

    return $prop;
}
1585
# Validate $value against the type (and, for strings, the format) that
# $confdesc declares for $key, and return the normalized value:
# booleans become 1/0, integers are numified, and unformatted strings
# lose a pair of enclosing double quotes.
# Dies on unknown keys, undefined values, embedded line feeds and type or
# format mismatches.
sub check_type {
    my ($key, $value) = @_;

    my $desc = $confdesc->{$key};
    die "unknown setting '$key'\n" if !$desc;

    my $type = $desc->{type};

    die "got undefined value\n" if !defined($value);
    die "property contains a line feed\n" if $value =~ m/[\n\r]/;

    if ($type eq 'boolean') {
        return 1 if ($value eq '1') || ($value =~ m/^(on|yes|true)$/i);
        return 0 if ($value eq '0') || ($value =~ m/^(off|no|false)$/i);
        die "type check ('boolean') failed - got '$value'\n";
    }

    if ($type eq 'integer') {
        return int($1) if $value =~ m/^(\d+)$/;
        die "type check ('integer') failed - got '$value'\n";
    }

    if ($type eq 'number') {
        return $value if $value =~ m/^(\d+)(\.\d+)?$/;
        die "type check ('number') failed - got '$value'\n";
    }

    die "internal error" if $type ne 'string';

    my $fmt = $desc->{format};
    if (!$fmt) {
        # plain strings may be enclosed in double quotes
        $value =~ s/^\"(.*)\"$/$1/;
        return $value;
    }

    if ($fmt eq 'pve-qm-drive') {
        # special case - we need to pass $key to parse_drive()
        return $value if parse_drive($key, $value);
        die "unable to parse drive options\n";
    }

    PVE::JSONSchema::check_format($fmt, $value);
    return $value;
}
1628
191435c6
DM
# Run $code->(@param) via lock_file() on the lock file of VM $vmid, using
# the given $timeout. Re-throws any error left in $@ and returns the
# result of lock_file().
sub lock_config_full {
    my ($vmid, $timeout, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);
    my $res = lock_file($lockfile, $timeout, $code, @param);
    die $@ if $@;

    return $res;
}
1640
4e4f83fe
DM
# Like lock_config_full(), but goes through lock_file_full() and passes
# the $shared flag on to it.
sub lock_config_mode {
    my ($vmid, $timeout, $shared, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);
    my $res = lock_file_full($lockfile, $timeout, $shared, $code, @param);
    die $@ if $@;

    return $res;
}
1652
191435c6
DM
# Shortcut for lock_config_full() with a timeout value of 10.
sub lock_config {
    my ($vmid, $code, @param) = @_;

    my $timeout = 10;

    return lock_config_full($vmid, $timeout, $code, @param);
}
1658
# Return the path of the VM config file relative to the cluster file
# system root. $node defaults to $nodename.
sub cfs_config_path {
    my ($vmid, $node) = @_;

    my $owner = $node ? $node : $nodename;

    return join('/', 'nodes', $owner, 'qemu-server', "$vmid.conf");
}
1665
040b06b7
DA
# Placeholder: no real detection is done yet, support is always reported.
sub check_iommu_support {
    #fixme : need to check IOMMU support
    #http://www.linux-kvm.org/page/How_to_assign_devices_with_VT-d_in_KVM

    return 1;
}
1674
# Return the path of the VM config file below /etc/pve.
sub config_file {
    my ($vmid, $node) = @_;

    return '/etc/pve/' . cfs_config_path($vmid, $node);
}
1681
# Return the path of the lock file used to serialize changes to the
# configuration of VM $vmid.
sub config_file_lock {
    my ($vmid) = @_;

    return $lock_dir . "/lock-$vmid.conf";
}
1687
# Set access and modification time of the VM config file to the current
# time.
sub touch_config {
    my ($vmid) = @_;

    my $path = config_file($vmid);
    utime undef, undef, $path;
}
1694
# Remove VM $vmid: free the disks it owns, remove its config file (or
# replace it with a minimal one if $keep_empty_config is set), then free
# any volume the storage layer still lists for this VM.
# Dies if the config cannot be loaded or the VM is locked; errors during
# the final cleanup are only reported as warnings.
sub destroy_vm {
    my ($storecfg, $vmid, $keep_empty_config) = @_;

    my $conffile = config_file($vmid);
    my $conf = load_config($vmid);

    check_lock($conf);

    # only remove disks owned by this VM
    my $free_owned_disk = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};
        # absolute paths are not managed by the storage layer
        return if !$volid || $volid =~ m|^/|;

        my ($path, $owner) = PVE::Storage::path($storecfg, $volid);
        return if !$path || !$owner || ($owner != $vmid);

        PVE::Storage::vdisk_free($storecfg, $volid);
    };
    foreach_drive($conf, $free_owned_disk);

    if (!$keep_empty_config) {
        unlink $conffile;
    } else {
        PVE::Tools::file_set_contents($conffile, "memory: 128\n");
    }

    # also remove unused disk
    eval {
        my $dl = PVE::Storage::vdisk_list($storecfg, undef, $vmid);

        eval {
            PVE::Storage::foreach_volid($dl, sub {
                my ($volid) = @_;
                PVE::Storage::vdisk_free($storecfg, $volid);
            });
        };
        warn $@ if $@;

    };
    warn $@ if $@;
}
1741
# Read the configuration of VM $vmid (optionally from another $node)
# through the cluster file system. Dies if no config is returned.
sub load_config {
    my ($vmid, $node) = @_;

    my $conf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid, $node));

    defined($conf) || die "no such VM ('$vmid')\n";

    return $conf;
}
1e3baf05
DM
1753
# Parse the raw text of a VM configuration file.
#
# $filename - path of the config file; must end in
#             "/qemu-server/<vmid>.conf"
# $raw      - file content; undef yields undef
#
# Returns a hash reference holding the settings of the current config, a
# 'digest' (SHA1 hex of $raw) and a 'snapshots' hash with one sub-config
# per "[name]" section. Lines starting with '#' and 'description:' lines
# are collected into the 'description' of the section they belong to.
# Values that fail validation are skipped with a warning.
sub parse_vm_config {
    my ($filename, $raw) = @_;

    return undef if !defined($raw);

    my $res = {
        digest => Digest::SHA::sha1_hex($raw),
        snapshots => {},
    };

    $filename =~ m|/qemu-server/(\d+)\.conf$|
        || die "got strange filename '$filename'";

    my $vmid = $1;

    # $conf points to the section currently being filled
    my $conf = $res;
    my $descr = '';

    my @lines = split(/\n/, $raw);
    foreach my $line (@lines) {
        next if $line =~ m/^\s*$/;

        if ($line =~ m/^\[([a-z][a-z0-9_\-]+)\]\s*$/i) {
            # new snapshot section - finish the description of the old one
            my $snapname = $1;
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{snapshots}->{$snapname} = {};
            next;
        }

        if ($line =~ m/^\#(.*)\s*$/) {
            $descr .= PVE::Tools::decode_text($1) . "\n";
            next;
        }

        if ($line =~ m/^(description):\s*(.*\S)\s*$/) {
            $descr .= PVE::Tools::decode_text($2);
        } elsif ($line =~ m/^snapstate:\s*(prepare|delete)\s*$/) {
            # anchored at line start, so other settings (e.g. 'args')
            # containing this text are not mistaken for a snapstate
            $conf->{snapstate} = $1;
        } elsif ($line =~ m/^(args):\s*(.*\S)\s*$/) {
            my $key = $1;
            my $value = $2;
            $conf->{$key} = $value;
        } elsif ($line =~ m/^([a-z][a-z_]*\d*):\s*(\S+)\s*$/) {
            my $key = $1;
            my $value = $2;
            eval { $value = check_type($key, $value); };
            if ($@) {
                warn "vm $vmid - unable to parse value of '$key' - $@";
            } else {
                my $fmt = $confdesc->{$key}->{format};
                if ($fmt && $fmt eq 'pve-qm-drive') {
                    # normalize the drive: file name -> volume id
                    my $v = parse_drive($key, $value);
                    if (my $volid = filename_to_volume_id($vmid, $v->{file}, $v->{media})) {
                        $v->{file} = $volid;
                        $value = print_drive($vmid, $v);
                    } else {
                        warn "vm $vmid - unable to parse value of '$key'\n";
                        next;
                    }
                }

                # 'cdrom' is stored as 'ide2'
                if ($key eq 'cdrom') {
                    $conf->{ide2} = $value;
                } else {
                    $conf->{$key} = $value;
                }
            }
        }
    }

    $conf->{description} = $descr if $descr;

    delete $res->{snapstate}; # just to be sure

    return $res;
}
1831
1858638f
DM
# Serialize a VM configuration hash into the raw config file text.
#
# Before writing, legacy settings are normalized ('cdrom' -> 'ide2',
# 'smp' -> 'sockets'), all values (including those of snapshots) are
# validated with check_type(), and 'unusedN' entries whose volume is
# referenced by a drive of the current config are dropped.
# Dies if 'cdrom' and 'ide2' are both set or if a value fails validation.
# Note that $conf is modified in place.
sub write_vm_config {
    my ($filename, $conf) = @_;

    delete $conf->{snapstate}; # just to be sure

    if ($conf->{cdrom}) {
        die "option ide2 conflicts with cdrom\n" if $conf->{ide2};
        $conf->{ide2} = delete $conf->{cdrom};
    }

    # we do not use 'smp' any longer
    if ($conf->{sockets}) {
        delete $conf->{smp};
    } elsif ($conf->{smp}) {
        $conf->{sockets} = $conf->{smp};
        delete $conf->{cores};
        delete $conf->{smp};
    }

    delete $conf->{sockets} if $conf->{maxcpus} && $conf->{sockets};

    my $used_volids = {};

    # keys that are not regular settings and must not be type checked
    my %meta_key = map { $_ => 1 } qw(digest description snapshots snapstate);

    # validate and normalize all settings of one section; drives of the
    # current config (no $snapname) are recorded in $used_volids
    my $check_section = sub {
        my ($cref, $snapname) = @_;

        foreach my $key (grep { !$meta_key{$_} } keys %$cref) {
            my $value = $cref->{$key};
            eval { $value = check_type($key, $value); };
            die "unable to parse value of '$key' - $@" if $@;

            $cref->{$key} = $value;

            next if $snapname || !valid_drivename($key);

            my $drive = parse_drive($key, $value);
            $used_volids->{$drive->{file}} = 1 if $drive && $drive->{file};
        }
    };

    $check_section->($conf);
    foreach my $snapname (keys %{$conf->{snapshots}}) {
        $check_section->($conf->{snapshots}->{$snapname}, $snapname);
    }

    # remove 'unusedX' settings if we re-add a volume
    foreach my $key (grep { m/^unused/ } keys %$conf) {
        delete $conf->{$key} if $used_volids->{$conf->{$key}};
    }

    # render one section: description as comment lines, then the sorted
    # "key: value" settings
    my $render_section = sub {
        my ($section) = @_;

        my $text = '';

        # add description as comment to top of file
        my $descr = $section->{description} || '';
        foreach my $cl (split(/\n/, $descr)) {
            $text .= '#' .  PVE::Tools::encode_text($cl) . "\n";
        }

        foreach my $key (sort keys %$section) {
            next if $key eq 'digest' || $key eq 'description' || $key eq 'snapshots';
            $text .= "$key: $section->{$key}\n";
        }

        return $text;
    };

    my $raw = $render_section->($conf);
    foreach my $snapname (sort keys %{$conf->{snapshots}}) {
        $raw .= "\n[$snapname]\n";
        $raw .= $render_section->($conf->{snapshots}->{$snapname});
    }

    return $raw;
}
1e3baf05 1916
1858638f
DM
# Write $conf as the configuration of VM $vmid without taking the config
# lock. Unless $skiplock is set, check_lock() is run on $conf first.
sub update_config_nolock {
    my ($vmid, $conf, $skiplock) = @_;

    check_lock($conf) unless $skiplock;

    PVE::Cluster::cfs_write_file(cfs_config_path($vmid), $conf);
}
1e3baf05 1926
1858638f
DM
# Write $conf as the configuration of VM $vmid while holding the config lock.
#
# Parameters:
#   $vmid     - VM identifier
#   $conf     - configuration hash to store
#   $skiplock - if true, the 'lock' setting inside $conf is not checked
#
# The callback must be passed as a code reference. A bare
# '&update_config_nolock' (no parentheses) would call the sub right away
# with the current @_, i.e. outside the lock, and hand its return value
# to lock_config instead of the sub itself.
sub update_config {
    my ($vmid, $conf, $skiplock) = @_;

    # NOTE(review): assumes lock_config($vmid, $code, @param) forwards
    # @param unchanged to $code - confirm against lock_config. That is why
    # $vmid is repeated as the first callback argument.
    lock_config($vmid, \&update_config_nolock, $vmid, $conf, $skiplock);
}
1932
# Build a hash of default settings: every option in $confdesc that defines
# a 'default' value, with 'keyboard' overridden by datacenter.cfg when set.
sub load_defaults {

    my $defaults = {};

    # static defaults come from our JSON schema configuration
    for my $opt (keys %$confdesc) {
        my $value = $confdesc->{$opt}->{default};
        next if !defined($value);
        $defaults->{$opt} = $value;
    }

    my $dccfg = PVE::Cluster::cfs_read_file('datacenter.cfg');
    if ($dccfg->{keyboard}) {
        $defaults->{keyboard} = $dccfg->{keyboard};
    }

    return $defaults;
}
1949
# Return a hash { $vmid => { exists => 1 } } for every entry of the cluster
# VM list whose node equals $nodename and whose type is 'qemu'.
sub config_list {
    my $vmlist = PVE::Cluster::get_vmlist();
    my $found = {};
    return $found if !($vmlist && $vmlist->{ids});

    my $ids = $vmlist->{ids};

    for my $vmid (keys %$ids) {
        my $entry = $ids->{$vmid};
        my $on_this_node = $entry->{node} && $entry->{node} eq $nodename;
        next if !$on_this_node;
        my $is_qemu = $entry->{type} && $entry->{type} eq 'qemu';
        next if !$is_qemu;
        $found->{$vmid}->{exists} = 1;
    }

    return $found;
}
1964
64e13401
DM
# Test whether a VM uses local resources (to prevent migration).
#
# Returns 1 if $conf contains a usbN, hostpciN, serialN or parallelN entry
# (usb* entries whose value is 'spice' are ignored) or one of the old-style
# 'hostusb'/'hostpci' settings, else 0. Dies with "VM uses local resources"
# instead of returning 1 unless $noerr is true.
sub check_local_resources {
    my ($conf, $noerr) = @_;

    # old syntax
    my $loc_res = ($conf->{hostusb} || $conf->{hostpci}) ? 1 : 0;

    for my $opt (keys %$conf) {
        next if $opt =~ m/^usb/ && ($conf->{$opt} eq 'spice');
        if ($opt =~ m/^(usb|hostpci|serial|parallel)\d+$/) {
            $loc_res = 1;
        }
    }

    if ($loc_res && !$noerr) {
        die "VM uses local resources\n";
    }

    return $loc_res;
}
1983
# Check if used storages are available on all nodes (used by migrate).
#
# For every drive in $conf whose volume id parses to a storage id,
# PVE::Storage::storage_check_node() is called once without a node
# argument and once for $node.
sub check_storage_availability {
    my ($storecfg, $conf, $node) = @_;

    my $check_drive = sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($sid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        # check if storage is available on both nodes
        my $local_scfg = PVE::Storage::storage_check_node($storecfg, $sid);
        PVE::Storage::storage_check_node($storecfg, $sid, $node);
    };

    foreach_drive($conf, $check_drive);
}
2002
719893a9
DM
# List nodes where all VM images are available (used by has_feature API).
#
# Starts with every cluster node and narrows the set per drive storage:
# a disabled storage empties it, a storage with a 'nodes' restriction
# keeps only those nodes, and a non-shared storage keeps only the local
# node. Returns a hash reference { $node => 1 }.
sub shared_nodes {
    my ($conf, $storecfg) = @_;

    my $nodelist = PVE::Cluster::get_nodelist();
    my $nodehash = {};
    $nodehash->{$_} = 1 for @$nodelist;
    my $localnode = PVE::INotify::nodename();

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($storeid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
        if ($scfg->{disable}) {
            $nodehash = {};
        } elsif (my $avail = $scfg->{nodes}) {
            my @gone = grep { !$avail->{$_} } keys %$nodehash;
            delete @{$nodehash}{@gone};
        } elsif (!$scfg->{shared}) {
            my @gone = grep { $_ ne $localnode } keys %$nodehash;
            delete @{$nodehash}{@gone};
        }
    });

    return $nodehash;
}
2036
1e3baf05
DM
# Die with "VM is locked (<lock>)" if $conf carries a true 'lock' setting.
sub check_lock {
    my ($conf) = @_;

    if ($conf->{lock}) {
        die "VM is locked ($conf->{lock})\n";
    }
}
2042
# Check whether process $pid was started with '-pidfile $pidfile'.
#
# Reads /proc/$pid/cmdline; the first word must end in 'kvm' or
# 'qemu-system-x86_64'. Returns 1 if the argument following the first
# '-pidfile'/'--pidfile' option equals $pidfile, otherwise a false value.
sub check_cmdline {
    my ($pidfile, $pid) = @_;

    my $fh = IO::File->new("/proc/$pid/cmdline", "r");
    return undef if !defined($fh);

    my $line = <$fh>;
    $fh->close;
    return undef if !$line;

    my @argv = split(/\0/, $line);

    my $binary = $argv[0];
    return if !$binary || ($binary !~ m|kvm$| && $binary !~ m|qemu-system-x86_64$|);

    for my $idx (0 .. $#argv) {
        my $arg = $argv[$idx];
        next if !$arg;
        next if ($arg ne '-pidfile') && ($arg ne '--pidfile');

        # only the first pidfile option is considered
        my $value = $argv[$idx + 1];
        return 1 if $value && ($value eq $pidfile);
        return undef;
    }

    return undef;
}
2068
# Return the pid of the running kvm process of VM $vmid, or undef.
#
# Parameters:
#   $vmid    - VM identifier
#   $nocheck - if true, do not require the configuration file to exist
#   $node    - passed through to config_file() to locate the config
#
# Dies if the configuration file is missing (unless $nocheck). The VM is
# considered running when its pid file holds a pid whose command line
# passes check_cmdline() and which
# PVE::ProcFSTools::check_process_running() confirms.
sub check_running {
    my ($vmid, $nocheck, $node) = @_;

    my $filename = config_file($vmid, $node);

    die "unable to find configuration file for VM $vmid - no such machine\n"
        if !$nocheck && ! -f $filename;

    my $pidfile = pidfile_name($vmid);

    # explicit mode argument instead of the "<$pidfile" form, so the file
    # name can never be interpreted as part of the open mode
    my $fd = IO::File->new($pidfile, 'r');
    return undef if !$fd;

    my $st = stat($fd);
    my $line = <$fd>;
    close($fd);

    # the timestamp belongs to the pid file, so name that file in the warning
    if ($st && $st->mtime > time()) {
        warn "file '$pidfile' modified in future\n";
    }

    # an empty pid file yields undef here
    if (defined($line) && $line =~ m/^(\d+)$/) {
        my $pid = $1;
        if (check_cmdline($pidfile, $pid)) {
            if (my $pinfo = PVE::ProcFSTools::check_process_running($pid)) {
                return $pid;
            }
        }
    }

    return undef;
}
2101
# Return the config_list() hash, with {pid} added for every listed VM
# that has a '<vmid>.pid' file in $var_run_tmpdir and for which
# check_running() returns a pid.
sub vzlist {

    my $vzlist = config_list();

    my $dir = IO::Dir->new($var_run_tmpdir) || return $vzlist;

    while (defined(my $entry = $dir->read)) {
        next unless $entry =~ m/^(\d+)\.pid$/;
        my $vmid = $1;
        next unless defined($vzlist->{$vmid});

        my $pid = check_running($vmid);
        $vzlist->{$vmid}->{pid} = $pid if $pid;
    }

    return $vzlist;
}
2119
1e3baf05
DM
# Return the 'size' property of the boot disk drive, or undef when there
# is no usable boot disk (no/invalid 'bootdisk', missing or unparsable
# drive entry, cdrom drive, or drive without a volume).
sub disksize {
    my ($storecfg, $conf) = @_;

    my $bootdisk = $conf->{bootdisk};
    return undef if !$bootdisk
        || !valid_drivename($bootdisk)
        || !$conf->{$bootdisk};

    my $drive = parse_drive($bootdisk, $conf->{$bootdisk});
    return undef if !defined($drive)
        || drive_is_cdrom($drive)
        || !$drive->{file};

    return $drive->{size};
}
2139
2140my $last_proc_pid_stat;
2141
03a33f30
DM
# Get VM status information.
# This must be fast and should not block ($full == false).
# We only query KVM using QMP if $full == true (this can be slow).
#
# Returns a hash { $vmid => { status, pid, cpu, mem, ... } } for all VMs
# returned by vzlist(), or only for $opt_vmid when that is given.
sub vmstatus {
    my ($opt_vmid, $full) = @_;

    my $res = {};

    my $storecfg = PVE::Storage::config();

    my $list = vzlist();
    my ($uptime) = PVE::ProcFSTools::read_proc_uptime(1);

    my $cpucount = $cpuinfo->{cpus} || 1;

    # static part: values taken from the configuration
    for my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);

        my $cfspath = cfs_config_path($vmid);
        my $conf = PVE::Cluster::cfs_read_file($cfspath) || {};

        my $pid = $list->{$vmid}->{pid};
        my $size = disksize($storecfg, $conf);

        my $vcpus = ($conf->{sockets} || 1) * ($conf->{cores} || 1);
        $vcpus = $cpucount if $vcpus > $cpucount;

        my $d = {
            pid => $pid,
            # fixme: better status?
            status => $pid ? 'running' : 'stopped',
            disk => 0, # no info available
            maxdisk => defined($size) ? $size : 0,
            cpus => $vcpus,
            name => $conf->{name} || "VM $vmid",
            maxmem => $conf->{memory} ? $conf->{memory}*(1024*1024) : 0,
            uptime => 0,
            cpu => 0,
            mem => 0,
            netout => 0,
            netin => 0,
            diskread => 0,
            diskwrite => 0,
        };

        if ($conf->{balloon}) {
            $d->{balloon_min} = $conf->{balloon}*(1024*1024);
            $d->{shares} = defined($conf->{shares}) ? $conf->{shares} : 1000;
        }

        $d->{template} = is_template($conf);

        $res->{$vmid} = $d;
    }

    # network counters of the tap<vmid>i<N> devices; note that 'receive'
    # is accounted as netout and 'transmit' as netin
    my $netdev = PVE::ProcFSTools::read_proc_net_dev();
    for my $dev (keys %$netdev) {
        next if $dev !~ m/^tap([1-9]\d*)i/;
        my $d = $res->{$1};
        next if !$d;

        $d->{netout} += $netdev->{$dev}->{receive};
        $d->{netin} += $netdev->{$dev}->{transmit};
    }

    my $ctime = gettimeofday;

    # uptime, memory and cpu usage from /proc/<pid>/stat
    for my $vmid (keys %$list) {

        my $d = $res->{$vmid};
        my $pid = $d->{pid};
        next if !$pid;

        my $pstat = PVE::ProcFSTools::read_proc_pid_stat($pid);
        next if !$pstat; # not running

        my $used = $pstat->{utime} + $pstat->{stime};

        $d->{uptime} = int(($uptime - $pstat->{starttime})/$cpuinfo->{user_hz});

        if ($pstat->{vsize}) {
            $d->{mem} = int(($pstat->{rss}/$pstat->{vsize})*$d->{maxmem});
        }

        my $sample = { time => $ctime, used => $used, cpu => 0 };

        my $old = $last_proc_pid_stat->{$pid};
        if (!$old) {
            # first sample for this pid, no usage can be computed yet
            $last_proc_pid_stat->{$pid} = $sample;
            next;
        }

        my $dtime = ($ctime - $old->{time}) * $cpucount * $cpuinfo->{user_hz};

        if ($dtime > 1000) {
            my $dutime = $used - $old->{used};

            $d->{cpu} = (($dutime/$dtime)* $cpucount) / $d->{cpus};
            $sample->{cpu} = $d->{cpu};
            $last_proc_pid_stat->{$pid} = $sample;
        } else {
            # interval too short, reuse the previous value
            $d->{cpu} = $old->{cpu};
        }
    }

    return $res if !$full;

    my $qmpclient = PVE::QMPClient->new();

    my $ballooncb = sub {
        my ($vmid, $resp) = @_;

        my $info = $resp->{'return'};
        return if !$info->{max_mem};

        my $d = $res->{$vmid};

        # use memory assigned to VM
        $d->{maxmem} = $info->{max_mem};
        $d->{balloon} = $info->{actual};

        if (defined($info->{total_mem}) && defined($info->{free_mem})) {
            $d->{mem} = $info->{total_mem} - $info->{free_mem};
            $d->{freemem} = $info->{free_mem};
        }
    };

    my $blockstatscb = sub {
        my ($vmid, $resp) = @_;

        my $data = $resp->{'return'} || [];
        my ($rdbytes, $wrbytes) = (0, 0);
        for my $blockstat (@$data) {
            $rdbytes += $blockstat->{stats}->{rd_bytes};
            $wrbytes += $blockstat->{stats}->{wr_bytes};
        }
        $res->{$vmid}->{diskread} = $rdbytes;
        $res->{$vmid}->{diskwrite} = $wrbytes;
    };

    my $statuscb = sub {
        my ($vmid, $resp) = @_;

        $qmpclient->queue_cmd($vmid, $blockstatscb, 'query-blockstats');
        # this fails if the balloon driver is not loaded, so this must be
        # the last command (following commands are aborted if this fails).
        $qmpclient->queue_cmd($vmid, $ballooncb, 'query-balloon');

        my $status = $resp->{'return'}->{status};
        if (!defined($status)) {
            warn "unable to get VM status\n";
            return;
        }

        $res->{$vmid}->{qmpstatus} = $resp->{'return'}->{status};
    };

    for my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        next if !$res->{$vmid}->{pid}; # not running
        $qmpclient->queue_cmd($vmid, $statuscb, 'query-status');
    }

    $qmpclient->queue_execute();

    # fall back to the process based status when QMP gave no answer
    for my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        $res->{$vmid}->{qmpstatus} ||= $res->{$vmid}->{status};
    }

    return $res;
}
2328
# Call $func->($ds, $drive) for every key $ds of $conf that is a valid
# drive name and whose value parse_drive() can parse.
sub foreach_drive {
    my ($conf, $func) = @_;

    for my $ds (grep { valid_drivename($_) } keys %$conf) {
        my $drive = parse_drive($ds, $conf->{$ds});
        next unless $drive;

        $func->($ds, $drive);
    }
}
2341
d5769dc2
DM
# Call $func->($volid, $is_cdrom) once for every distinct volume
# referenced by the drives of $conf and of its snapshots, including the
# snapshots' 'vmstate' volumes. $is_cdrom is the drive_is_cdrom() result
# of the last reference seen (0 for vmstate volumes).
sub foreach_volid {
    my ($conf, $func) = @_;

    my %is_cdrom_of;

    my $remember = sub {
        my ($volid, $is_cdrom) = @_;

        return if !$volid;

        $is_cdrom_of{$volid} = $is_cdrom || 0;
    };

    my $remember_drive = sub {
        my ($ds, $drive) = @_;
        $remember->($drive->{file}, drive_is_cdrom($drive));
    };

    foreach_drive($conf, $remember_drive);

    for my $snapname (keys %{$conf->{snapshots}}) {
        my $snap = $conf->{snapshots}->{$snapname};
        $remember->($snap->{vmstate}, 0);
        foreach_drive($snap, $remember_drive);
    }

    for my $volid (keys %is_cdrom_of) {
        $func->($volid, $is_cdrom_of{$volid});
    }
}
2373
86b8228b
DM
# Return the number encoded in a 'qxl', 'qxl2', 'qxl3' or 'qxl4' vga
# setting (1 for plain 'qxl'), or 0 for any other value.
sub vga_conf_has_spice {
    my ($vga) = @_;

    if ($vga && $vga =~ m/^qxl([234])?$/) {
        return $1 || 1;
    }

    return 0;
}
2381
# Translate a VM configuration into the kvm command line.
#
# Parameters:
#   $storecfg     - storage configuration, passed on to the drive helpers
#   $vmid         - VM identifier
#   $conf         - VM configuration hash
#   $defaults     - default values used for options missing in $conf
#   $forcemachine - optional machine type overriding $conf->{machine}
#
# Returns ($cmd, $vollist, $spice_port) in list context and $cmd in
# scalar context, where $cmd is an array reference with the command and
# its arguments, $vollist lists the volume ids of all drives whose file
# parses as a volume id, and $spice_port is only set for qxl displays.
#
# Dies if the detected kvm version is too old, if a configured
# serial/parallel device does not exist, if a pcie hostpci device is
# used without q35, or if kvm is enabled but the CPU lacks hvm support.
sub config_to_command {
    my ($storecfg, $vmid, $conf, $defaults, $forcemachine) = @_;

    my $cmd = [];
    my $globalFlags = [];
    my $machineFlags = [];
    my $rtcFlags = [];
    my $cpuFlags = [];
    my $devices = [];
    my $pciaddr = '';
    my $bridges = {};
    my $kvmver = kvm_user_version();
    my $vernum = 0; # unknown
    if ($kvmver =~ m/^(\d+)\.(\d+)$/) {
        $vernum = $1*1000000+$2*1000;
    } elsif ($kvmver =~ m/^(\d+)\.(\d+)\.(\d+)$/) {
        $vernum = $1*1000000+$2*1000+$3;
    }

    die "detected old qemu-kvm binary ($kvmver)\n" if $vernum < 15000;

    my $have_ovz = -f '/proc/vz/vestat';

    my $q35 = machine_type_is_q35($conf);

    push @$cmd, '/usr/bin/kvm';

    push @$cmd, '-id', $vmid;

    my $use_virtio = 0;

    my $qmpsocket = qmp_socket($vmid);
    push @$cmd, '-chardev', "socket,id=qmp,path=$qmpsocket,server,nowait";
    push @$cmd, '-mon', "chardev=qmp,mode=control";

    my $socket = vnc_socket($vmid);
    push @$cmd, '-vnc', "unix:$socket,x509,password";

    push @$cmd, '-pidfile' , pidfile_name($vmid);

    push @$cmd, '-daemonize';

    if ($conf->{smbios1}) {
        push @$cmd, '-smbios', "type=1,$conf->{smbios1}";
    }

    if ($q35) {
        # the q35 chipset support native usb2, so we enable usb controller
        # by default for this machine type
        push @$devices, '-readconfig', '/usr/share/qemu-server/pve-q35.cfg';
    } else {
        $pciaddr = print_pci_addr("piix3", $bridges);
        push @$devices, '-device', "piix3-usb-uhci,id=uhci$pciaddr.0x2";

        my $use_usb2 = 0;
        for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
            next if !$conf->{"usb$i"};
            $use_usb2 = 1;
        }
        # include usb device config
        push @$devices, '-readconfig', '/usr/share/qemu-server/pve-usb.cfg' if $use_usb2;
    }

    my $vga = $conf->{vga};

    my $qxlnum = vga_conf_has_spice($vga);
    $vga = 'qxl' if $qxlnum;

    if (!$vga) {
        if ($conf->{ostype} && ($conf->{ostype} eq 'win8' ||
                                $conf->{ostype} eq 'win7' ||
                                $conf->{ostype} eq 'w2k8')) {
            $vga = 'std';
        } else {
            $vga = 'cirrus';
        }
    }

    # enable absolute mouse coordinates (needed by vnc)
    my $tablet;
    if (defined($conf->{tablet})) {
        $tablet = $conf->{tablet};
    } else {
        $tablet = $defaults->{tablet};
        $tablet = 0 if $qxlnum; # disable for spice because it is not needed
        $tablet = 0 if $vga =~ m/^serial\d+$/; # disable if we use serial terminal (no vga card)
    }

    push @$devices, '-device', print_tabletdevice_full($conf) if $tablet;

    # host pci devices
    for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
        my $d = parse_hostpci($conf->{"hostpci$i"});
        next if !$d;

        my $pcie = $d->{pcie};
        if($pcie){
            die "q35 machine model is not enabled" if !$q35;
            $pciaddr = print_pcie_addr("hostpci$i");
        }else{
            $pciaddr = print_pci_addr("hostpci$i", $bridges);
        }

        my $rombar = $d->{rombar} && $d->{rombar} eq 'off' ? ",rombar=0" : "";
        my $driver = $d->{driver} && $d->{driver} eq 'vfio' ? "vfio-pci" : "pci-assign";
        my $xvga = $d->{'x-vga'} && $d->{'x-vga'} eq 'on' ? ",x-vga=on" : "";
        if ($xvga && $xvga ne '') {
            # x-vga passthrough: hide kvm from the guest and drop the emulated vga
            push @$cpuFlags, 'kvm=off';
            $vga = 'none';
        }
        $driver = "vfio-pci" if $xvga ne '';
        my $pcidevices = $d->{pciid};
        # plain assignment: 'my $x = ... if COND' has undefined behaviour
        my $multifunction = @$pcidevices > 1;

        my $j=0;
        foreach my $pcidevice (@$pcidevices) {

            my $id = "hostpci$i";
            $id .= ".$j" if $multifunction;
            my $addr = $pciaddr;
            $addr .= ".$j" if $multifunction;
            my $devicestr = "$driver,host=$pcidevice->{id}.$pcidevice->{function},id=$id$addr";

            # rombar/x-vga/multifunction are only set on the first function
            if($j == 0){
                $devicestr .= "$rombar$xvga";
                $devicestr .= ",multifunction=on" if $multifunction;
            }

            push @$devices, '-device', $devicestr;
            $j++;
        }
    }

    # usb devices
    for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
        my $d = parse_usb_device($conf->{"usb$i"});
        next if !$d;
        if ($d->{vendorid} && $d->{productid}) {
            push @$devices, '-device', "usb-host,vendorid=0x$d->{vendorid},productid=0x$d->{productid}";
        } elsif (defined($d->{hostbus}) && defined($d->{hostport})) {
            push @$devices, '-device', "usb-host,hostbus=$d->{hostbus},hostport=$d->{hostport}";
        } elsif ($d->{spice}) {
            # usb redir support for spice
            push @$devices, '-chardev', "spicevmc,id=usbredirchardev$i,name=usbredir";
            push @$devices, '-device', "usb-redir,chardev=usbredirchardev$i,id=usbredirdev$i,bus=ehci.0";
        }
    }

    # serial devices
    for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
        if (my $path = $conf->{"serial$i"}) {
            if ($path eq 'socket') {
                my $socket = "/var/run/qemu-server/${vmid}.serial$i";
                push @$devices, '-chardev', "socket,id=serial$i,path=$socket,server,nowait";
                push @$devices, '-device', "isa-serial,chardev=serial$i";
            } else {
                die "no such serial device\n" if ! -c $path;
                push @$devices, '-chardev', "tty,id=serial$i,path=$path";
                push @$devices, '-device', "isa-serial,chardev=serial$i";
            }
        }
    }

    # parallel devices
    for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
        if (my $path = $conf->{"parallel$i"}) {
            die "no such parallel device\n" if ! -c $path;
            my $devtype = $path =~ m!^/dev/usb/lp! ? 'tty' : 'parport';
            push @$devices, '-chardev', "$devtype,id=parallel$i,path=$path";
            push @$devices, '-device', "isa-parallel,chardev=parallel$i";
        }
    }

    my $vmname = $conf->{name} || "vm$vmid";

    push @$cmd, '-name', $vmname;

    my $sockets = 1;
    $sockets = $conf->{smp} if $conf->{smp}; # old style - no longer used
    $sockets = $conf->{sockets} if $conf->{sockets};

    my $cores = $conf->{cores} || 1;
    # plain assignment: 'my $x = ... if COND' has undefined behaviour
    my $maxcpus = $conf->{maxcpus};

    if ($maxcpus) {
        push @$cmd, '-smp', "cpus=$cores,maxcpus=$maxcpus";
    } else {
        push @$cmd, '-smp', "sockets=$sockets,cores=$cores";
    }

    push @$cmd, '-nodefaults';

    my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};

    # each boot order letter gets its own bootindex range (100, 200, ...)
    my $bootindex_hash = {};
    my $i = 1;
    foreach my $o (split(//, $bootorder)) {
        $bootindex_hash->{$o} = $i*100;
        $i++;
    }

    push @$cmd, '-boot', "menu=on";

    push @$cmd, '-no-acpi' if defined($conf->{acpi}) && $conf->{acpi} == 0;

    push @$cmd, '-no-reboot' if defined($conf->{reboot}) && $conf->{reboot} == 0;

    push @$cmd, '-vga', $vga if $vga && $vga !~ m/^serial\d+$/; # for kvm 77 and later

    # time drift fix
    my $tdf = defined($conf->{tdf}) ? $conf->{tdf} : $defaults->{tdf};

    my $nokvm = defined($conf->{kvm}) && $conf->{kvm} == 0 ? 1 : 0;
    my $useLocaltime = $conf->{localtime};

    if (my $ost = $conf->{ostype}) {
        # other, wxp, w2k, w2k3, w2k8, wvista, win7, win8, l24, l26, solaris

        if ($ost =~ m/^w/) { # windows
            $useLocaltime = 1 if !defined($conf->{localtime});

            # use time drift fix when acpi is enabled
            if (!(defined($conf->{acpi}) && $conf->{acpi} == 0)) {
                $tdf = 1 if !defined($conf->{tdf});
            }
        }

        if ($ost eq 'win7' || $ost eq 'win8' || $ost eq 'w2k8' ||
            $ost eq 'wvista') {
            push @$globalFlags, 'kvm-pit.lost_tick_policy=discard';
            push @$cmd, '-no-hpet';
            #push @$cpuFlags , 'hv_vapic" if !$nokvm; #fixme, my win2008R2 hang at boot with this
            push @$cpuFlags , 'hv_spinlocks=0xffff' if !$nokvm;
        }

        if ($ost eq 'win7' || $ost eq 'win8') {
            push @$cpuFlags , 'hv_relaxed' if !$nokvm;
        }
    }

    push @$rtcFlags, 'driftfix=slew' if $tdf;

    if ($nokvm) {
        push @$machineFlags, 'accel=tcg';
    } else {
        die "No accelerator found!\n" if !$cpuinfo->{hvm};
    }

    my $machine_type = $forcemachine || $conf->{machine};
    if ($machine_type) {
        push @$machineFlags, "type=${machine_type}";
    }

    if ($conf->{startdate}) {
        push @$rtcFlags, "base=$conf->{startdate}";
    } elsif ($useLocaltime) {
        push @$rtcFlags, 'base=localtime';
    }

    my $cpu = $nokvm ? "qemu64" : "kvm64";
    $cpu = $conf->{cpu} if $conf->{cpu};

    push @$cpuFlags , '+lahf_lm' if $cpu eq 'kvm64';

    # ostype is optional, so guard the comparison against undef
    my $is_solaris = defined($conf->{ostype}) && $conf->{ostype} eq 'solaris';

    push @$cpuFlags , '+x2apic' if !$nokvm && !$is_solaris;

    push @$cpuFlags , '-x2apic' if $is_solaris;

    push @$cpuFlags, '+sep' if $cpu eq 'kvm64' || $cpu eq 'kvm32';

    $cpu .= "," . join(',', @$cpuFlags) if scalar(@$cpuFlags);

    # Note: enforce needs kernel 3.10, so we do not use it for now
    # push @$cmd, '-cpu', "$cpu,enforce";
    push @$cmd, '-cpu', $cpu;

    push @$cmd, '-S' if $conf->{freeze};

    # set keyboard layout
    my $kb = $conf->{keyboard} || $defaults->{keyboard};
    push @$cmd, '-k', $kb if $kb;

    # enable sound
    #my $soundhw = $conf->{soundhw} || $defaults->{soundhw};
    #push @$cmd, '-soundhw', 'es1370';
    #push @$cmd, '-soundhw', $soundhw if $soundhw;

    if($conf->{agent}) {
        my $qgasocket = qga_socket($vmid);
        my $pciaddr = print_pci_addr("qga0", $bridges);
        push @$devices, '-chardev', "socket,path=$qgasocket,server,nowait,id=qga0";
        push @$devices, '-device', "virtio-serial,id=qga0$pciaddr";
        push @$devices, '-device', 'virtserialport,chardev=qga0,name=org.qemu.guest_agent.0';
    }

    my $spice_port;

    if ($qxlnum) {
        if ($qxlnum > 1) {
            if ($conf->{ostype} && $conf->{ostype} =~ m/^w/){
                # windows: one additional qxl device per extra display
                for(my $i = 1; $i < $qxlnum; $i++){
                    my $pciaddr = print_pci_addr("vga$i", $bridges);
                    push @$cmd, '-device', "qxl,id=vga$i,ram_size=67108864,vram_size=33554432$pciaddr";
                }
            } else {
                # assume other OS works like Linux
                push @$cmd, '-global', 'qxl-vga.ram_size=134217728';
                push @$cmd, '-global', 'qxl-vga.vram_size=67108864';
            }
        }

        my $pciaddr = print_pci_addr("spice", $bridges);

        $spice_port = PVE::Tools::next_spice_port();

        push @$cmd, '-spice', "tls-port=${spice_port},addr=127.0.0.1,tls-ciphers=DES-CBC3-SHA,seamless-migration=on";

        push @$cmd, '-device', "virtio-serial,id=spice$pciaddr";
        push @$cmd, '-chardev', "spicevmc,id=vdagent,name=vdagent";
        push @$cmd, '-device', "virtserialport,chardev=vdagent,name=com.redhat.spice.0";
    }

    # enable balloon by default, unless explicitly disabled
    if (!defined($conf->{balloon}) || $conf->{balloon}) {
        $pciaddr = print_pci_addr("balloon0", $bridges);
        push @$devices, '-device', "virtio-balloon-pci,id=balloon0$pciaddr";
    }

    if ($conf->{watchdog}) {
        my $wdopts = parse_watchdog($conf->{watchdog});
        $pciaddr = print_pci_addr("watchdog", $bridges);
        my $watchdog = $wdopts->{model} || 'i6300esb';
        push @$devices, '-device', "$watchdog$pciaddr";
        push @$devices, '-watchdog-action', $wdopts->{action} if $wdopts->{action};
    }

    my $vollist = [];
    my $scsicontroller = {};
    my $ahcicontroller = {};
    my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : $defaults->{scsihw};

    # Add iscsi initiator name if available
    if (my $initiator = get_initiator_name()) {
        push @$devices, '-iscsi', "initiator-name=$initiator";
    }

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        if (PVE::Storage::parse_volume_id($drive->{file}, 1)) {
            push @$vollist, $drive->{file};
        }

        $use_virtio = 1 if $ds =~ m/^virtio/;

        if (drive_is_cdrom ($drive)) {
            if ($bootindex_hash->{d}) {
                $drive->{bootindex} = $bootindex_hash->{d};
                $bootindex_hash->{d} += 1;
            }
        } else {
            if ($bootindex_hash->{c}) {
                $drive->{bootindex} = $bootindex_hash->{c} if $conf->{bootdisk} && ($conf->{bootdisk} eq $ds);
                $bootindex_hash->{c} += 1;
            }
        }

        if ($drive->{interface} eq 'scsi') {

            # add the scsi controller only once per controller index
            my $maxdev = ($scsihw !~ m/^lsi/) ? 256 : 7;
            my $controller = int($drive->{index} / $maxdev);
            $pciaddr = print_pci_addr("scsihw$controller", $bridges);
            push @$devices, '-device', "$scsihw,id=scsihw$controller$pciaddr" if !$scsicontroller->{$controller};
            $scsicontroller->{$controller}=1;
        }

        if ($drive->{interface} eq 'sata') {
            # add the ahci controller only once per controller index
            my $controller = int($drive->{index} / $MAX_SATA_DISKS);
            $pciaddr = print_pci_addr("ahci$controller", $bridges);
            push @$devices, '-device', "ahci,id=ahci$controller,multifunction=on$pciaddr" if !$ahcicontroller->{$controller};
            $ahcicontroller->{$controller}=1;
        }

        my $drive_cmd = print_drive_full($storecfg, $vmid, $drive);
        push @$devices, '-drive',$drive_cmd;
        push @$devices, '-device', print_drivedevice_full($storecfg, $conf, $vmid, $drive, $bridges);
    });

    push @$cmd, '-m', $conf->{memory} || $defaults->{memory};

    for (my $i = 0; $i < $MAX_NETS; $i++) {
        next if !$conf->{"net$i"};
        my $d = parse_net($conf->{"net$i"});
        next if !$d;

        $use_virtio = 1 if $d->{model} eq 'virtio';

        if ($bootindex_hash->{n}) {
            $d->{bootindex} = $bootindex_hash->{n};
            $bootindex_hash->{n} += 1;
        }

        my $netdevfull = print_netdev_full($vmid,$conf,$d,"net$i");
        push @$devices, '-netdev', $netdevfull;

        my $netdevicefull = print_netdevice_full($vmid,$conf,$d,"net$i",$bridges);
        push @$devices, '-device', $netdevicefull;
    }

    if (!$q35) {
        # add pci bridges; they are put in front of all other devices
        while (my ($k, $v) = each %$bridges) {
            $pciaddr = print_pci_addr("pci.$k");
            unshift @$devices, '-device', "pci-bridge,id=pci.$k,chassis_nr=$k$pciaddr" if $k > 0;
        }
    }

    # hack: virtio with fairsched is unreliable, so we do not use fairsched
    # when the VM uses virtio devices.
    if (!$use_virtio && $have_ovz) {

        my $cpuunits = defined($conf->{cpuunits}) ?
            $conf->{cpuunits} : $defaults->{cpuunits};

        push @$cmd, '-cpuunits', $cpuunits if $cpuunits;

        # fixme: cpulimit is currently ignored
        #push @$cmd, '-cpulimit', $conf->{cpulimit} if $conf->{cpulimit};
    }

    # add custom args
    if ($conf->{args}) {
        my $aa = PVE::Tools::split_args($conf->{args});
        push @$cmd, @$aa;
    }

    push @$cmd, @$devices;
    push @$cmd, '-rtc', join(',', @$rtcFlags)
        if scalar(@$rtcFlags);
    push @$cmd, '-machine', join(',', @$machineFlags)
        if scalar(@$machineFlags);
    push @$cmd, '-global', join(',', @$globalFlags)
        if scalar(@$globalFlags);

    return wantarray ? ($cmd, $vollist, $spice_port) : $cmd;
}
19672434 2828
1e3baf05
DM
# Path of the VNC unix socket of VM $vmid below $var_run_tmpdir.
sub vnc_socket {
    my $vmid = shift;

    return join('/', $var_run_tmpdir, "$vmid.vnc");
}
2833
# Ask the running VM (QMP 'query-spice') for its spice port. The TLS port
# is preferred over the plain port; dies with "no spice port" if neither
# is set.
sub spice_port {
    my ($vmid) = @_;

    my $info = vm_mon_cmd($vmid, 'query-spice');

    for my $key ('tls-port', 'port') {
        return $info->{$key} if $info->{$key};
    }

    die "no spice port\n";
}
2841
c971c4f2
AD
# Path of the QMP unix socket of VM $vmid below $var_run_tmpdir.
sub qmp_socket {
    my $vmid = shift;

    return join('/', $var_run_tmpdir, "$vmid.qmp");
}
2846
ab6a046f
AD
# Path of the guest agent unix socket of VM $vmid below $var_run_tmpdir.
sub qga_socket {
    my $vmid = shift;

    return join('/', $var_run_tmpdir, "$vmid.qga");
}
2851
1e3baf05
DM
# Path of the pid file of VM $vmid below $var_run_tmpdir.
sub pidfile_name {
    my $vmid = shift;

    return join('/', $var_run_tmpdir, "$vmid.pid");
}
2856
86fdcfb2
DA
# Return a hash reference mapping qdev_id => device entry for all devices
# reported by the QMP 'query-pci' command of VM $vmid. Devices without a
# qdev_id are left out.
sub vm_devices_list {
    my ($vmid) = @_;

    my $buses = vm_mon_cmd($vmid, 'query-pci');

    my %device_of;
    for my $bus (@$buses) {
        for my $dev (@{$bus->{devices}}) {
            my $id = $dev->{'qdev_id'};
            next unless $id;
            $device_of{$id} = $dev;
        }
    }

    return \%device_of;
}
2872
# Hot-plug device $deviceid into a running VM.
#
# Parameters:
#   $storecfg - storage configuration (passed through to the drive helpers)
#   $conf     - VM configuration hash
#   $vmid     - VM id
#   $deviceid - device name: 'tablet', virtioN, scsihwN, scsiN, netN or pci.N
#   $device   - parsed device description (drive or net); unused for
#               controllers and bridges
#
# Returns 1 when nothing had to be done (VM not running, hotplug disabled,
# device already present) or when the device was added; returns undef when
# one of the plug steps failed.
sub vm_deviceplug {
    my ($storecfg, $conf, $vmid, $deviceid, $device) = @_;

    return 1 if !check_running($vmid);

    my $q35 = machine_type_is_q35($conf);

    # the tablet is handled even when the 'hotplug' option is off
    if ($deviceid eq 'tablet') {
        qemu_deviceadd($vmid, print_tabletdevice_full($conf));
        return 1;
    }

    return 1 if !$conf->{hotplug};

    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$deviceid});

    # add bridge if we need it for the device
    qemu_bridgeadd($storecfg, $conf, $vmid, $deviceid);

    # the device id patterns below are mutually exclusive
    if ($deviceid =~ m/^(virtio)(\d+)$/) {

        return undef if !qemu_driveadd($storecfg, $vmid, $device);
        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);
        qemu_deviceadd($vmid, $devicefull);
        if (!qemu_deviceaddverify($vmid, $deviceid)) {
            # roll back the drive when the device did not show up
            qemu_drivedel($vmid, $deviceid);
            return undef;
        }

    } elsif ($deviceid =~ m/^(scsihw)(\d+)$/) {

        my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : "lsi";
        my $pciaddr = print_pci_addr($deviceid);
        my $devicefull = "$scsihw,id=$deviceid$pciaddr";
        qemu_deviceadd($vmid, $devicefull);
        return undef if !qemu_deviceaddverify($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        # virtio-scsi not yet support hotplug
        return 1 if ($conf->{scsihw} && ($conf->{scsihw} !~ m/^lsi/));
        return undef if !qemu_findorcreatescsihw($storecfg, $conf, $vmid, $device);
        return undef if !qemu_driveadd($storecfg, $vmid, $device);
        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);
        if (!qemu_deviceadd($vmid, $devicefull)) {
            qemu_drivedel($vmid, $deviceid);
            return undef;
        }

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        return undef if !qemu_netdevadd($vmid, $conf, $device, $deviceid);
        my $netdevicefull = print_netdevice_full($vmid, $conf, $device, $deviceid);
        qemu_deviceadd($vmid, $netdevicefull);
        if (!qemu_deviceaddverify($vmid, $deviceid)) {
            # roll back the netdev backend when the NIC did not show up
            qemu_netdevdel($vmid, $deviceid);
            return undef;
        }

    } elsif (!$q35 && $deviceid =~ m/^(pci\.)(\d+)$/) {

        my $bridgeid = $2;
        my $pciaddr = print_pci_addr($deviceid);
        my $devicefull = "pci-bridge,id=pci.$bridgeid,chassis_nr=$bridgeid$pciaddr";
        qemu_deviceadd($vmid, $devicefull);
        return undef if !qemu_deviceaddverify($vmid, $deviceid);

    }

    return 1;
}
2942
# Hot-unplug device $deviceid from a running VM.
#
# Returns 1 when nothing had to be done (VM not running, hotplug disabled,
# device not present) or when the device was removed; returns undef when a
# removal step failed. Dies when $deviceid is the configured boot disk.
sub vm_deviceunplug {
    my ($vmid, $conf, $deviceid) = @_;

    return 1 if !check_running($vmid);

    # the tablet is handled even when the 'hotplug' option is off
    if ($deviceid eq 'tablet') {
        qemu_devicedel($vmid, $deviceid);
        return 1;
    }

    return 1 if !$conf->{hotplug};

    my $present = vm_devices_list($vmid);
    return 1 if !defined($present->{$deviceid});

    die "can't unplug bootdisk" if $conf->{bootdisk} && $conf->{bootdisk} eq $deviceid;

    # the device id patterns below are mutually exclusive
    if ($deviceid =~ m/^(virtio)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_devicedelverify($vmid, $deviceid);
        return undef if !qemu_drivedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(lsi)(\d+)$/) {

        # NOTE(review): vm_deviceplug names controllers 'scsihwN', but this
        # branch only matches 'lsiN' - confirm whether that is intended.
        return undef if !qemu_devicedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        return undef if !qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_drivedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_devicedelverify($vmid, $deviceid);
        return undef if !qemu_netdevdel($vmid, $deviceid);

    }

    return 1;
}
2983
# Add a device to a running VM using the QMP command 'device_add'.
#
# $devicefull is a qemu '-device' style string: the driver name followed
# by comma separated key=value options, e.g. "driver,id=foo,bus=pci.0".
#
# The string is split on ',' first and each item then on its FIRST '='
# only, so a value that itself contains '=' stays intact and a bare flag
# can not shift all following keys/values out of alignment.
#
# Always returns 1; vm_mon_cmd dies on errors.
sub qemu_deviceadd {
    my ($vmid, $devicefull) = @_;

    my %options;
    # the leading token of the device string is the driver name
    for my $item (split(/,/, "driver=$devicefull")) {
        next if $item eq '';
        my ($key, $value) = split(/=/, $item, 2);
        # NOTE(review): a bare flag is passed as 'on', following qemu's
        # command line option convention - confirm QMP accepts it.
        $options{$key} = defined($value) ? $value : 'on';
    }

    vm_mon_cmd($vmid, "device_add", %options);

    return 1;
}
afdb31d5 2993
5e5dcb73
DA
# Request removal of device $deviceid using the QMP command 'device_del'.
# Always returns 1; vm_mon_cmd dies on errors. Use qemu_devicedelverify
# to check that the device has actually gone away.
sub qemu_devicedel {
    my ($vmid, $deviceid) = @_;

    vm_mon_cmd($vmid, "device_del", id => $deviceid);

    return 1;
}
2999
# Add the drive backend for $device using the human monitor command
# 'drive_add'. Returns 1 on success; logs to syslog and returns undef
# when the monitor reply does not contain "OK".
sub qemu_driveadd {
    my ($storecfg, $vmid, $device) = @_;

    my $drive_spec = print_drive_full($storecfg, $vmid, $device);
    my $reply = vm_human_monitor_command($vmid, "drive_add auto $drive_spec");

    # If the command succeeds qemu prints: "OK"
    return 1 if $reply =~ m/OK/s;

    syslog("err", "adding drive failed: $reply");
    return undef;
}
afdb31d5 3012
5e5dcb73
DA
# Remove the drive backend "drive-$deviceid" using the human monitor
# command 'drive_del'. Returns 1 on success; logs to syslog and returns
# undef when the monitor printed an unexpected message.
sub qemu_drivedel {
    my ($vmid, $deviceid) = @_;

    my $reply = vm_human_monitor_command($vmid, "drive_del drive-$deviceid");
    $reply =~ s/^\s+//;

    # NB: device not found errors mean the drive was auto-deleted and we
    # ignore the error
    return 1 if $reply =~ m/Device \'.*?\' not found/s;

    # an empty reply means success
    return 1 if $reply eq "";

    syslog("err", "deleting drive $deviceid failed : $reply");
    return undef;
}
f19d1c47 3027
5e5dcb73
DA
# Wait until device $deviceid shows up in the VM's PCI device list.
# Polls up to six times with one second between polls. Returns 1 as soon
# as the device is present; logs to syslog and returns undef otherwise.
sub qemu_deviceaddverify {
    my ($vmid, $deviceid) = @_;

    for my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if defined($present->{$deviceid});
        sleep 1;
    }

    syslog("err", "error on hotplug device $deviceid");
    return undef;
}
afdb31d5 3039
5e5dcb73
DA
3040
# Wait until device $deviceid has disappeared from the VM's PCI device
# list. Polls up to six times with one second between polls. Returns 1 as
# soon as the device is gone; logs to syslog and returns undef otherwise.
sub qemu_devicedelverify {
    my ($vmid, $deviceid) = @_;

    # need to verify the device is correctly removed, as device_del is
    # async and an empty return is not reliable
    for my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if !defined($present->{$deviceid});
        sleep 1;
    }

    syslog("err", "error on hot-unplugging device $deviceid");
    return undef;
}
3053
# Make sure the SCSI controller needed by drive $device exists in the VM,
# hot-plugging it when it is missing.
#
# The controller number is the drive index divided by the number of
# drives per controller (7 when 'scsihw' is unset or starts with "lsi",
# 256 otherwise). Returns 1 on success, undef if plugging failed.
sub qemu_findorcreatescsihw {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $is_lsi = !$conf->{scsihw} || ($conf->{scsihw} =~ m/^lsi/);
    my $drives_per_controller = $is_lsi ? 7 : 256;

    my $controller = int($device->{index} / $drives_per_controller);
    my $scsihwid = "scsihw$controller";

    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$scsihwid});

    return undef if !vm_deviceplug($storecfg, $conf, $vmid, $scsihwid);

    return 1;
}
3067
40f28a9f
AD
# Make sure the PCI bridge that device id $device sits on exists in the
# VM, hot-plugging it when it is missing.
#
# Returns nothing when the device needs no bridge (unknown device or
# bus 0), 1 when the bridge is present or was added, undef when plugging
# the bridge failed.
sub qemu_bridgeadd {
    my ($storecfg, $conf, $vmid, $device) = @_;

    # print_pci_addr records the bus number of $device as a key here
    my $bridges = {};
    print_pci_addr($device, $bridges);

    my $bridgeid = undef;
    for my $bus (keys %$bridges) {
        $bridgeid = $bus;
    }

    return if !$bridgeid || $bridgeid < 1;

    my $bridge = "pci.$bridgeid";

    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$bridge});

    return undef if !vm_deviceplug($storecfg, $conf, $vmid, $bridge);

    return 1;
}
3087
2630d2a9
DA
# Add the network backend for $deviceid using the QMP command
# 'netdev_add'.
#
# The option string built by print_netdev_full is split on ',' first and
# each item then on its FIRST '=' only, so a value that itself contains
# '=' stays intact and a bare flag can not shift all following
# keys/values out of alignment.
#
# Always returns 1; vm_mon_cmd dies on errors.
sub qemu_netdevadd {
    my ($vmid, $conf, $device, $deviceid) = @_;

    my $netdev = print_netdev_full($vmid, $conf, $device, $deviceid);

    my %options;
    for my $item (split(/,/, $netdev)) {
        next if $item eq '';
        my ($key, $value) = split(/=/, $item, 2);
        # NOTE(review): a bare flag is passed as 'on', following qemu's
        # command line option convention - confirm QMP accepts it.
        $options{$key} = defined($value) ? $value : 'on';
    }

    vm_mon_cmd($vmid, "netdev_add", %options);

    return 1;
}
3097
# Remove the network backend $deviceid using the QMP command
# 'netdev_del'. Always returns 1; vm_mon_cmd dies on errors.
sub qemu_netdevdel {
    my ($vmid, $deviceid) = @_;

    my %args = (id => $deviceid);
    vm_mon_cmd($vmid, "netdev_del", %args);

    return 1;
}
3104
838776ab
AD
# Hot-add CPU cores to a running VM until it has $cores cores.
#
# Parameters:
#   $vmid  - VM id
#   $conf  - VM configuration hash (reads 'cores' and 'maxcpus')
#   $cores - requested number of cores
#
# Dies when $cores is missing, exceeds 'maxcpus', or when 'cores' or
# 'maxcpus' are not configured. Raises a parameter exception when cores
# would have to be removed or when the running VM's CPU count differs
# from the configuration. Does nothing when the VM is not running.
sub qemu_cpu_hotplug {
    my ($vmid, $conf, $cores) = @_;

    die "new cores config is not defined" if !$cores;
    die "you can't add more cores than maxcpus"
        if $conf->{maxcpus} && ($cores > $conf->{maxcpus});
    return if !check_running($vmid);

    # Plain assignment: 'my $x = ... if COND' has undefined behaviour in
    # Perl, and the check below already covers the unset case.
    my $currentcores = $conf->{cores};
    die "current cores is not defined" if !$currentcores;
    die "maxcpus is not defined" if !$conf->{maxcpus};
    raise_param_exc({ 'cores' => "online cpu unplug is not yet possible" })
        if ($cores < $currentcores);

    my $currentrunningcores = vm_mon_cmd($vmid, "query-cpus");
    raise_param_exc({ 'cores' => "cores number if running vm is different than configuration" })
        if scalar(@{$currentrunningcores}) != $currentcores;

    # cpu ids are zero based, so the first new id equals the current count
    for (my $i = $currentcores; $i < $cores; $i++) {
        vm_mon_cmd($vmid, "cpu-add", id => int($i));
    }
}
3127
affd2f88
AD
# Apply I/O throttle limits to block device $deviceid of a running VM
# using the QMP command 'block_set_io_throttle'. All limits are sent as
# integers. Does nothing when the VM is not running.
sub qemu_block_set_io_throttle {
    my ($vmid, $deviceid, $bps, $bps_rd, $bps_wr, $iops, $iops_rd, $iops_wr) = @_;

    return if !check_running($vmid);

    my %limits = (
        bps     => int($bps),
        bps_rd  => int($bps_rd),
        bps_wr  => int($bps_wr),
        iops    => int($iops),
        iops_rd => int($iops_rd),
        iops_wr => int($iops_wr),
    );

    vm_mon_cmd($vmid, "block_set_io_throttle", device => $deviceid, %limits);
}
3136
# old code, only used to shutdown old VM after update
#
# Read from monitor handle $fh until a chunk ends with the "(qemu) "
# prompt or the handle reports end of file, waiting at most $timeout
# seconds for each chunk. Returns the collected text without the prompt.
# Dies on read errors and with "monitor read timeout" when no data
# arrived in time.
sub __read_avail {
    my ($fh, $timeout) = @_;

    my $select = IO::Select->new();
    $select->add($fh);

    my $output = '';
    my $chunk;

    my @ready;
    while (scalar(@ready = $select->can_read($timeout))) {
        my $nread = $fh->sysread($chunk, 8192);

        die "$!\n" if !defined($nread); # read error
        last if !$nread;                # end of file

        if ($chunk =~ /^(.*)\(qemu\) $/s) {
            # prompt seen - the reply is complete
            $output .= $1;
            last;
        }

        $output .= $chunk;
    }

    # the loop ended because can_read returned nothing
    die "monitor read timeout\n" if !scalar(@ready);

    return $output;
}
3169
# old code, only used to shutdown old VM after update
#
# Send $cmdstr to the human monitor socket of VM $vmid and return the
# reply text (the echoed command line is stripped). Returns undef for
# the 'q'/'quit' commands, which are sent without waiting for a reply.
# Errors are logged to syslog and re-thrown.
sub vm_monitor_command {
    my ($vmid, $cmdstr, $nocheck) = @_;

    my $res;

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);

        my $sname = "${var_run_tmpdir}/$vmid.mon";

        my $sock = IO::Socket::UNIX->new( Peer => $sname ) ||
            die "unable to connect to VM $vmid socket - $!\n";

        # hack: migrate sometime blocks the monitor (when migrate_downtime
        # is set)
        my $is_migrate = ($cmdstr =~ m/^(info\s+migrate|migrate\s)/) ? 1 : 0;

        my $timeout = $is_migrate ? 60*60 : 3; # 1 hour for migrate

        # read banner;
        my $banner = __read_avail($sock, $timeout);
        die "got unexpected qemu monitor banner\n"
            if $banner !~ m/^QEMU\s+(\S+)\s+monitor\s/;

        my $sel = IO::Select->new();
        $sel->add($sock);

        my @writable = $sel->can_write($timeout);
        die "monitor write error - timeout" if !scalar(@writable);

        my $fullcmd = "$cmdstr\r";

        # syslog('info', "VM $vmid monitor command: $cmdstr");

        my $written = $sock->syswrite($fullcmd);
        die "monitor write error - $!"
            if !$written || ($written != length($fullcmd));

        # leaves the eval only - the monitor will not answer a quit
        return if ($cmdstr eq 'q') || ($cmdstr eq 'quit');

        if ($is_migrate) {
            $timeout = 60*60; # 1 hour
        } elsif ($cmdstr =~ m/^(eject|change)/) {
            $timeout = 60; # note: cdrom mount command is slow
        } else {
            $timeout = 20;
        }

        $res = __read_avail($sock, $timeout);
        if ($res) {
            my @lines = split(/\r?\n/, $res);

            shift @lines if $lines[0] !~ m/^unknown command/; # skip echo

            $res = join("\n", @lines) . "\n";
        }
    };

    if (my $err = $@) {
        syslog("err", "VM $vmid monitor command failed - $err");
        die $err;
    }

    return $res;
}
3244
c1175c92
AD
# Resize volume $volid to $size via the storage layer and, when the VM
# is running, tell QEMU about the new size of block device $deviceid
# (QMP 'block_resize'). Does not talk to QEMU when the storage resize
# returned false or the VM is not running.
sub qemu_block_resize {
    my ($vmid, $deviceid, $storecfg, $volid, $size) = @_;

    my $running = check_running($vmid);

    my $resized = PVE::Storage::volume_resize($storecfg, $volid, $size, $running);
    return if !$resized;

    return if !$running;

    vm_mon_cmd($vmid, "block_resize", device => $deviceid, size => int($size));
}
3257
1ab0057c
AD
# Create snapshot $snap of volume $volid via the storage layer. When the
# storage call returned true and the VM is running, also issue the QMP
# command 'snapshot-drive' for block device $deviceid.
sub qemu_volume_snapshot {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $running = check_running($vmid);

    my $storage_ok = PVE::Storage::volume_snapshot($storecfg, $volid, $snap, $running);
    return if !$storage_ok;

    return if !$running;

    vm_mon_cmd($vmid, "snapshot-drive", device => $deviceid, name => $snap);
}
3270
fc46aff9
AD
# Delete snapshot $snap of volume $volid via the storage layer. When the
# storage call returned true and the VM is running, also issue the QMP
# command 'delete-drive-snapshot' for block device $deviceid.
sub qemu_volume_snapshot_delete {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $running = check_running($vmid);

    my $storage_ok = PVE::Storage::volume_snapshot_delete($storecfg, $volid, $snap, $running);
    return if !$storage_ok;

    return if !$running;

    vm_mon_cmd($vmid, "delete-drive-snapshot", device => $deviceid, name => $snap);
}
3282
3d5149c9
AD
# Placeholder for freezing the guest file systems through the guest
# agent. Currently does nothing.
sub qga_freezefs {
    my ($vmid) = @_;

    # TODO: need to implement the call to qemu-ga
}
3288
e8f3f18e
AD
# Placeholder for thawing the guest file systems through the guest
# agent. Currently does nothing.
sub qga_unfreezefs {
    my ($vmid) = @_;

    # TODO: need to implement the call to qemu-ga
}
3294
264e519f
DM
# Set the migration capabilities of VM $vmid.
#
# Every capability reported by 'query-migrate-capabilities' is sent back
# through 'migrate-set-capabilities' with an explicit state: enabled if
# it is switched on in the table below, disabled otherwise (including
# capabilities the table does not mention).
sub set_migration_caps {
    my ($vmid) = @_;

    my %want_enabled = (
        "auto-converge"  => 1,
        "xbzrle"         => 0,
        "x-rdma-pin-all" => 0,
        "zero-blocks"    => 0,
    );

    my $supported = vm_mon_cmd_nocheck($vmid, "query-migrate-capabilities");

    my @caps;
    for my $entry (@$supported) {
        my $name = $entry->{capability};
        my $state = $want_enabled{$name} ? JSON::true : JSON::false;
        push @caps, { capability => $name, state => $state };
    }

    vm_mon_cmd_nocheck($vmid, "migrate-set-capabilities", capabilities => \@caps);
}
a89fded1 3318
# Start VM $vmid while holding the config lock.
#
# Parameters:
#   $storecfg     - storage configuration
#   $vmid         - VM id
#   $statefile    - 'tcp' to wait for an incoming migration, any other
#                   true value is passed to kvm as '-loadstate'
#   $skiplock     - skip the config 'lock' check
#   $migratedfrom - source node name when started by a migration
#   $paused       - start with '-S' (only looked at without $statefile)
#   $forcemachine - passed through to config_to_command
#   $spice_ticket - SPICE password to set after a migration start
#
# Dies when the VM is a template, is locked, is already running, when a
# host PCI device can not be prepared or when the kvm command fails.
sub vm_start {
    my ($storecfg, $vmid, $statefile, $skiplock, $migratedfrom, $paused, $forcemachine, $spice_ticket) = @_;

    lock_config($vmid, sub {
        my $conf = load_config($vmid, $migratedfrom);

        die "you can't start a vm if it's a template\n" if is_template($conf);

        check_lock($conf) if !$skiplock;

        die "VM $vmid already running\n" if check_running($vmid, undef, $migratedfrom);

        my $defaults = load_defaults();

        # set environment variable useful inside network script
        $ENV{PVE_MIGRATED_FROM} = $migratedfrom if $migratedfrom;

        my ($cmd, $vollist, $spice_port) =
            config_to_command($storecfg, $vmid, $conf, $defaults, $forcemachine);

        my $migrate_uri;
        if ($statefile && $statefile eq 'tcp') {
            # incoming migration: listen on a tcp port and start paused
            my $listen_ip = "localhost";
            my $dc_conf = PVE::Cluster::cfs_read_file('datacenter.cfg');
            if ($dc_conf->{migration_unsecure}) {
                my $nodename = PVE::INotify::nodename();
                $listen_ip = PVE::Cluster::remote_node_ip($nodename, 1);
            }
            my $migrate_port = PVE::Tools::next_migrate_port();
            $migrate_uri = "tcp:${listen_ip}:${migrate_port}";
            push @$cmd, '-incoming', $migrate_uri, '-S';
        } elsif ($statefile) {
            push @$cmd, '-loadstate', $statefile;
        } elsif ($paused) {
            push @$cmd, '-S';
        }

        # host pci devices
        for my $i (0 .. $MAX_HOSTPCI_DEVICES - 1) {
            my $hostpci = parse_hostpci($conf->{"hostpci$i"});
            next if !$hostpci;

            my $pcidevices = $hostpci->{pciid};
            for my $pcidevice (@$pcidevices) {
                my $pciid = $pcidevice->{id} . "." . $pcidevice->{function};

                my $info = pci_device_info("0000:$pciid");
                die "IOMMU not present\n" if !check_iommu_support();
                die "no pci device info for device '$pciid'\n" if !$info;

                my $use_vfio = $hostpci->{driver} && $hostpci->{driver} eq "vfio";
                if ($use_vfio) {
                    die "can't unbind/bind pci group to vfio '$pciid'\n"
                        if !pci_dev_group_bind_to_vfio($pciid);
                } else {
                    die "can't unbind/bind to stub pci device '$pciid'\n"
                        if !pci_dev_bind_to_stub($info);
                }

                die "can't reset pci device '$pciid'\n"
                    if $info->{has_fl_reset} && !pci_dev_reset($info);
            }
        }

        PVE::Storage::activate_volumes($storecfg, $vollist);

        # no start timeout when a state has to be loaded or received
        my $start_timeout = $statefile ? undef : 30;
        eval { run_command($cmd, timeout => $start_timeout, umask => 0077); };
        if (my $err = $@) {
            die "start failed: $err";
        }

        print "migration listens on $migrate_uri\n" if $migrate_uri;

        # the VM was started from a state file - let it continue
        if ($statefile && $statefile ne 'tcp') {
            eval { vm_mon_cmd_nocheck($vmid, "cont"); };
            warn $@ if $@;
        }

        if ($migratedfrom) {

            eval { PVE::QemuServer::set_migration_caps($vmid); };
            warn $@ if $@;

            if ($spice_port) {
                print "spice listens on port $spice_port\n";
                if ($spice_ticket) {
                    PVE::QemuServer::vm_mon_cmd_nocheck($vmid, "set_password",
                        protocol => 'spice', password => $spice_ticket);
                    PVE::QemuServer::vm_mon_cmd_nocheck($vmid, "expire_password",
                        protocol => 'spice', time => "+30");
                }
            }

        } else {

            # ballooning is active unless 'balloon' is explicitly set to 0
            my $balloon_active = !defined($conf->{balloon}) || $conf->{balloon};
            if (!$statefile && $balloon_active) {
                vm_mon_cmd_nocheck($vmid, "balloon", value => $conf->{balloon}*1024*1024)
                    if $conf->{balloon};
                vm_mon_cmd_nocheck($vmid, 'qom-set',
                    path => "machine/peripheral/balloon0",
                    property => "guest-stats-polling-interval",
                    value => 2);
            }
        }
    });
}
3423
0eedc444
AD
# Run QMP command $execute with the named arguments %params on VM $vmid
# and return the result of vm_qmp_command.
sub vm_mon_cmd {
    my ($vmid, $execute, %params) = @_;

    my %request = (
        execute   => $execute,
        arguments => \%params,
    );

    vm_qmp_command($vmid, \%request);
}
3430
# Same as vm_mon_cmd, but passes a true $nocheck flag on to
# vm_qmp_command.
sub vm_mon_cmd_nocheck {
    my ($vmid, $execute, %params) = @_;

    my %request = (
        execute   => $execute,
        arguments => \%params,
    );

    vm_qmp_command($vmid, \%request, 1);
}
3437
# Execute QMP command $cmd ({ execute => ..., arguments => {...} }) on
# VM $vmid and return its result.
#
# A true 'timeout' entry in the arguments is removed from $cmd and used
# as the client timeout instead of being sent to QEMU. VMs that only
# have the old human monitor socket are handled through
# vm_monitor_command, which only works for commands without arguments;
# nothing is returned in that case. Errors are logged to syslog and
# re-thrown.
sub vm_qmp_command {
    my ($vmid, $cmd, $nocheck) = @_;

    my $res;

    my $timeout;
    my $args = $cmd->{arguments};
    if ($args && $args->{timeout}) {
        $timeout = delete $args->{timeout};
    }

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);

        my $qmp_path = qmp_socket($vmid);
        my $legacy_path = "${var_run_tmpdir}/$vmid.mon";

        if (-e $qmp_path) {
            my $qmpclient = PVE::QMPClient->new();

            $res = $qmpclient->cmd($vmid, $cmd, $timeout);
        } elsif (-e $legacy_path) {
            die "can't execute complex command on old monitor - stop/start your vm to fix the problem\n"
                if scalar(%{$cmd->{arguments}});
            vm_monitor_command($vmid, $cmd->{execute}, $nocheck);
        } else {
            die "unable to open monitor socket\n";
        }
    };
    my $err = $@;

    if ($err) {
        syslog("err", "VM $vmid qmp command failed - $err");
        die $err;
    }

    return $res;
}
3471
9df5cbcc
DM
# Run human monitor command line $cmdline on VM $vmid through the QMP
# command 'human-monitor-command' and return the result.
sub vm_human_monitor_command {
    my ($vmid, $cmdline) = @_;

    my %request = (
        execute   => 'human-monitor-command',
        arguments => { 'command-line' => $cmdline },
    );

    return vm_qmp_command($vmid, \%request);
}
3484
1e3baf05
DM
# Return the command line that would be used to start VM $vmid, as a
# single string with the arguments joined by spaces.
sub vm_commandline {
    my ($storecfg, $vmid) = @_;

    my $conf = load_config($vmid);
    my $defaults = load_defaults();

    # scalar context: config_to_command returns just the command array ref
    my $cmd = config_to_command($storecfg, $vmid, $conf, $defaults);

    my $cmdline = join(' ', @$cmd);

    return $cmdline;
}
3496
# Reset VM $vmid (QMP 'system_reset') while holding the config lock.
# The config 'lock' setting is checked unless $skiplock is set.
sub vm_reset {
    my ($vmid, $skiplock) = @_;

    my $do_reset = sub {
        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        vm_mon_cmd($vmid, "system_reset");
    };

    lock_config($vmid, $do_reset);
}
3509
# Collect the storage volume ids referenced by VM configuration $conf.
# Absolute paths and ids that do not parse as a storage volume id are
# left out. Returns an array reference.
sub get_vm_volumes {
    my ($conf) = @_;

    my @volids;

    foreach_volid($conf, sub {
        my ($volid, $is_cdrom) = @_;

        # absolute paths are not managed by the storage layer
        return if $volid =~ m|^/|;

        my ($sid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        push @volids, $volid;
    });

    return \@volids;
}
3527
# Clean up after VM $vmid has stopped: remove its fairsched group,
# deactivate its volumes (unless $keepActive is set) and delete its
# runtime files. Errors are only reported as warnings.
sub vm_stop_cleanup {
    my ($storecfg, $vmid, $conf, $keepActive) = @_;

    eval {
        fairsched_rmnod($vmid); # try to destroy group

        if (!$keepActive) {
            my $volumes = get_vm_volumes($conf);
            PVE::Storage::deactivate_volumes($storecfg, $volumes);
        }

        # remove monitor/qmp/vnc/qga sockets and the pid file
        my @suffixes = qw(mon qmp pid vnc qga);
        for my $ext (@suffixes) {
            unlink "/var/run/qemu-server/${vmid}.$ext";
        }
    };
    if (my $err = $@) {
        warn $err; # avoid errors - just warn
    }
}
3545
# Stop or shut down VM $vmid.
#
# Note: use $nocheck to skip the tests that need the VM configuration
# file. We need that when migrating VMs to other nodes (files already
# moved).
# Note: we set $keepActive in vzdump stop mode - volumes need to stay
# active.
#
# With $shutdown the guest gets 'system_powerdown', otherwise 'quit'.
# $timeout defaults to the 'down' value of the startup option (shutdown
# only) or 60 seconds. When the VM does not stop in time it is killed
# with SIGTERM and, after another 10 seconds, with SIGKILL - but only if
# $force is set ($force defaults to true when not shutting down);
# without $force the function dies instead.
#
# With $migratedfrom the process is simply terminated and cleaned up
# without taking the config lock.
sub vm_stop {
    my ($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive, $migratedfrom) = @_;

    $force = 1 if !defined($force) && !$shutdown;

    if ($migratedfrom) {
        my $pid = check_running($vmid, $nocheck, $migratedfrom);
        kill 15, $pid if $pid;
        my $conf = load_config($vmid, $migratedfrom);
        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive);
        return;
    }

    # Wait up to $limit seconds for the VM to exit; true means timed out.
    my $wait_timed_out = sub {
        my ($limit) = @_;

        my $elapsed = 0;
        while (($elapsed < $limit) && check_running($vmid, $nocheck)) {
            $elapsed++;
            sleep 1;
        }

        return $elapsed >= $limit;
    };

    lock_config($vmid, sub {

        my $pid = check_running($vmid, $nocheck);
        return if !$pid;

        my $conf;
        if (!$nocheck) {
            $conf = load_config($vmid);
            check_lock($conf) if !$skiplock;
            if (!defined($timeout) && $shutdown && $conf->{startup}) {
                my $opts = parse_startup($conf->{startup});
                $timeout = $opts->{down} if $opts->{down};
            }
        }

        $timeout = 60 if !defined($timeout);

        my $qmp_cmd = $shutdown ? "system_powerdown" : "quit";
        eval {
            if ($nocheck) {
                vm_mon_cmd_nocheck($vmid, $qmp_cmd);
            } else {
                vm_mon_cmd($vmid, $qmp_cmd);
            }
        };
        my $err = $@;

        if ($err) {
            die "VM quit/powerdown failed\n" if !$force;
            warn "VM quit/powerdown failed - terminating now with SIGTERM\n";
        } elsif ($wait_timed_out->($timeout)) {
            die "VM quit/powerdown failed - got timeout\n" if !$force;
            warn "VM still running - terminating now with SIGTERM\n";
        } else {
            # the VM stopped by itself in time
            vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
            return;
        }

        kill 15, $pid;

        # wait again
        if ($wait_timed_out->(10)) {
            warn "VM still running - terminating now with SIGKILL\n";
            kill 9, $pid;
            sleep 1;
        }

        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
    });
}
3634
# Pause VM $vmid (QMP 'stop') while holding the config lock. The config
# 'lock' setting is checked unless $skiplock is set or the lock is
# 'backup'.
sub vm_suspend {
    my ($vmid, $skiplock) = @_;

    lock_config($vmid, sub {
        my $conf = load_config($vmid);

        my $backup_locked = $conf->{lock} && $conf->{lock} eq 'backup';
        check_lock($conf) if !($skiplock || $backup_locked);

        vm_mon_cmd($vmid, "stop");
    });
}
3647
# Resume VM $vmid (QMP 'cont') while holding the config lock. The config
# 'lock' setting is checked unless $skiplock is set or the lock is
# 'backup'.
sub vm_resume {
    my ($vmid, $skiplock) = @_;

    lock_config($vmid, sub {
        my $conf = load_config($vmid);

        my $backup_locked = $conf->{lock} && $conf->{lock} eq 'backup';
        check_lock($conf) if !($skiplock || $backup_locked);

        vm_mon_cmd($vmid, "cont");
    });
}
3660
5fdbe4f0
DM
# Send key (combination) $key to VM $vmid while holding the config lock.
# The configuration is loaded, but $skiplock is not looked at and no
# lock check is done.
sub vm_sendkey {
    my ($vmid, $skiplock, $key) = @_;

    my $send = sub {
        my $conf = load_config($vmid);

        # there is no qmp command, so we use the human monitor command
        vm_human_monitor_command($vmid, "sendkey $key");
    };

    lock_config($vmid, $send);
}
3672
# Destroy VM $vmid while holding the config lock. The config 'lock'
# setting is checked unless $skiplock is set. Dies when the VM is still
# running.
sub vm_destroy {
    my ($storecfg, $vmid, $skiplock) = @_;

    lock_config($vmid, sub {
        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        die "VM $vmid is running - destroy failed\n" if check_running($vmid);

        fairsched_rmnod($vmid); # try to destroy group
        destroy_vm($storecfg, $vmid);
    });
}
3690
1e3baf05
DM
3691# pci helpers
3692
# Write $buf to file $filename (opened in mode "w").
#
# Returns 1 on success and undef when the file can not be opened or the
# data can not be written.
#
# The result of close() is part of the verdict: print only fills the
# I/O buffer, so an error raised when the data reaches the file (for
# example a rejected sysfs write or a full device) shows up on close.
sub file_write {
    my ($filename, $buf) = @_;

    my $fh = IO::File->new($filename, "w");
    return undef if !$fh;

    my $printed = print $fh $buf;
    my $closed = $fh->close();

    return ($printed && $closed) ? 1 : undef;
}
3705
# Read basic information about PCI device $name from sysfs.
#
# $name has the form "dddd:bb:ss.f" (lower case hex). Returns a hash
# reference with the keys name, vendor, product (both without the "0x"
# prefix), domain, bus, slot, func, irq and has_fl_reset (true when the
# device has a 'reset' file). Returns undef when the name is malformed
# or the irq, vendor or device file can not be read as expected.
sub pci_device_info {
    my ($name) = @_;

    my ($domain, $bus, $slot, $func) =
        $name =~ m/^([a-f0-9]{4}):([a-f0-9]{2}):([a-f0-9]{2})\.([a-f0-9])$/
        or return undef;

    my $sysdir = "$pcisysfs/devices/$name";

    my $irq = file_read_firstline("$sysdir/irq");
    return undef if !defined($irq) || $irq !~ m/^\d+$/;

    # vendor and device ids must start with "0x", which is stripped
    my $vendor = file_read_firstline("$sysdir/vendor");
    return undef if !defined($vendor) || $vendor !~ s/^0x//;

    my $product = file_read_firstline("$sysdir/device");
    return undef if !defined($product) || $product !~ s/^0x//;

    my %info = (
        name => $name,
        vendor => $vendor,
        product => $product,
        domain => $domain,
        bus => $bus,
        slot => $slot,
        func => $func,
        irq => $irq,
        has_fl_reset => (-f "$sysdir/reset") || 0,
    );

    return \%info;
}
3737
# Reset PCI device $dev (as returned by pci_device_info) by writing "1"
# to its sysfs 'reset' file. Returns the result of file_write.
sub pci_dev_reset {
    my ($dev) = @_;

    my $reset_file = "$pcisysfs/devices/$dev->{name}/reset";

    return file_write($reset_file, "1");
}
3747
# Bind PCI device $dev (as returned by pci_device_info) to the pci-stub
# driver. Returns true when the device is bound to pci-stub afterwards
# (or already was), a false value otherwise.
sub pci_dev_bind_to_stub {
    my ($dev) = @_;

    my $name = $dev->{name};

    my $stub_dir = "$pcisysfs/drivers/pci-stub";
    my $bound_dir = "$stub_dir/$name"; # exists while bound to pci-stub

    return 1 if -d $bound_dir;

    # register the vendor/device id with the stub driver
    my $id = "$dev->{vendor} $dev->{product}";
    return undef if !file_write("$stub_dir/new_id", $id);

    # detach from the current driver; a failure only counts when the
    # unbind file exists, i.e. when a driver is attached
    my $unbind_file = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind_file, $name) && -f $unbind_file;

    if (! -d $bound_dir) {
        return undef if !file_write("$stub_dir/bind", $name);
    }

    return -d $bound_dir;
}
3771
000fc0a2
SP
# Bind PCI device $dev (as returned by pci_device_info) to the vfio-pci
# driver, loading the module with modprobe when its sysfs directory is
# missing. Dies when the driver directory still does not exist after
# that. Returns true when the device is bound to vfio-pci afterwards (or
# already was), a false value otherwise.
sub pci_dev_bind_to_vfio {
    my ($dev) = @_;

    my $name = $dev->{name};

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null") if !-d $vfio_basedir;
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    my $bound_dir = "$vfio_basedir/$name"; # exists while bound to vfio-pci
    return 1 if -d $bound_dir;

    # register the vendor/device id with the vfio driver
    my $id = "$dev->{vendor} $dev->{product}";
    return undef if !file_write("$vfio_basedir/new_id", $id);

    # detach from the current driver; a failure only counts when the
    # unbind file exists, i.e. when a driver is attached
    my $unbind_file = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind_file, $name) && -f $unbind_file;

    if (! -d $bound_dir) {
        return undef if !file_write("$vfio_basedir/bind", $name);
    }

    return -d $bound_dir;
}
3802
# Bind every device in the IOMMU group of PCI device $pciid ("bb:ss.f",
# without the domain) to the vfio-pci driver.
#
# Loads the vfio-pci module with modprobe when its sysfs directory is
# missing. Returns 1 on success. Dies when the driver directory or the
# IOMMU group can not be found, when a group member has an invalid id,
# when no device info can be read for a member, or when binding a member
# fails.
sub pci_dev_group_bind_to_vfio {
    my ($pciid) = @_;

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    if (!-d $vfio_basedir) {
        system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null");
    }
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    # get IOMMU group devices
    opendir(my $D, "$pcisysfs/devices/0000:$pciid/iommu_group/devices/") || die "Cannot open iommu_group: $!\n";
    my @devs = grep /^0000:/, readdir($D);
    closedir($D);

    foreach my $member (@devs) {
        $member =~ m/^([:\.\da-f]+)$/ or die "PCI ID $member not valid!\n";
        my $info = pci_device_info($1);

        # Without this check an undef $info reaches pci_dev_bind_to_vfio,
        # where the "already bound" test passes on the driver directory
        # itself and the device is wrongly reported as bound.
        die "no pci device info for device '$member'\n" if !$info;

        pci_dev_bind_to_vfio($info) || die "Cannot bind $member to vfio\n";
    }

    return 1;
}
3826
# Return the ",bus=pci.N,addr=0xNN" option suffix for the fixed PCI slot
# of device id $id, or an empty string when $id has no fixed slot.
#
# When the optional hash reference $bridges is given, the bus number of
# a known device is recorded in it as a key (value 1), so the caller can
# tell which PCI bridges are needed.
sub print_pci_addr {
    my ($id, $bridges) = @_;

    my %slot_of = (
        piix3 => { bus => 0, addr => 1 },
        #addr2 : first videocard
        balloon0 => { bus => 0, addr => 3 },
        watchdog => { bus => 0, addr => 4 },
        scsihw0 => { bus => 0, addr => 5 },
        scsihw1 => { bus => 0, addr => 6 },
        ahci0 => { bus => 0, addr => 7 },
        qga0 => { bus => 0, addr => 8 },
        spice => { bus => 0, addr => 9 },
        virtio0 => { bus => 0, addr => 10 },
        virtio1 => { bus => 0, addr => 11 },
        virtio2 => { bus => 0, addr => 12 },
        virtio3 => { bus => 0, addr => 13 },
        virtio4 => { bus => 0, addr => 14 },
        virtio5 => { bus => 0, addr => 15 },
        hostpci0 => { bus => 0, addr => 16 },
        hostpci1 => { bus => 0, addr => 17 },
        net0 => { bus => 0, addr => 18 },
        net1 => { bus => 0, addr => 19 },
        net2 => { bus => 0, addr => 20 },
        net3 => { bus => 0, addr => 21 },
        net4 => { bus => 0, addr => 22 },
        net5 => { bus => 0, addr => 23 },
        vga1 => { bus => 0, addr => 24 },
        vga2 => { bus => 0, addr => 25 },
        vga3 => { bus => 0, addr => 26 },
        #addr29 : usb-host (pve-usb.cfg)
        'pci.1' => { bus => 0, addr => 30 },
        'pci.2' => { bus => 0, addr => 31 },
    );

    # net6 .. net31 sit on bridge pci.1, addr 1 .. 26
    for my $n (6 .. 31) {
        $slot_of{"net$n"} = { bus => 1, addr => $n - 5 };
    }

    # virtio6 .. virtio15 sit on bridge pci.2, addr 1 .. 10
    for my $n (6 .. 15) {
        $slot_of{"virtio$n"} = { bus => 2, addr => $n - 5 };
    }

    my $slot = $slot_of{$id};
    return '' if !$slot;

    my $bus = $slot->{bus};
    my $addr = sprintf("0x%x", $slot->{addr});

    $bridges->{$bus} = 1 if $bridges;

    return ",bus=pci.$bus,addr=$addr";
}
3908
2e3b7e2a
AD
# Build the ",bus=...,addr=0x.." device-option suffix for a PCIe passthrough
# device. Returns the empty string when $id has no entry in the slot table.
sub print_pcie_addr {
    my ($id) = @_;

    # fixed placement: each known hostpciN sits at address 0 of its own port
    my $slot_for = {
        hostpci0 => { bus => "ich9-pcie-port-1", addr => 0 },
        hostpci1 => { bus => "ich9-pcie-port-2", addr => 0 },
        hostpci2 => { bus => "ich9-pcie-port-3", addr => 0 },
        hostpci3 => { bus => "ich9-pcie-port-4", addr => 0 },
    };

    my $slot = $slot_for->{$id};
    return '' if !$slot;
    return '' if !defined($slot->{bus}) || !defined($slot->{addr});

    return sprintf(",bus=%s,addr=0x%x", $slot->{bus}, $slot->{addr});
}
3928
3e16d5fc
DM
3929# vzdump restore implementation
3930
# Return the name of the first member listed by 'tar tf' for $archive.
#
# Dies if $archive is not a regular file, if tar cannot be started, or if
# tar lists nothing.
sub tar_archive_read_firstfile {
    my $archive = shift;

    die "ERROR: file '$archive' does not exist\n" if ! -f $archive;

    # try to detect archive type first
    # List-form pipe open runs tar without a shell, so quotes or other shell
    # metacharacters in the archive name can neither break nor extend the command.
    my $pid = open(my $tarfh, '-|', 'tar', 'tf', $archive) ||
        die "unable to open file '$archive'\n";
    my $firstfile = <$tarfh>;
    # only the first entry is needed - stop tar instead of reading the whole listing
    kill 15, $pid;
    close $tarfh;

    die "ERROR: archive contaions no data\n" if !$firstfile;
    chomp $firstfile;

    return $firstfile;
}
3948
ed221350
DM
# Remove the volumes recorded in a restore stat file after a failed tar restore.
#
# $storecfg - storage configuration, handed to PVE::Storage::vdisk_free
# $statfile - file with lines of the form "vzdump:<name>:<volid>"
#
# Volumes whose id is an absolute path are unlinked directly, everything else
# is released through the storage layer. Each volume is handled inside its own
# eval, so one failure is reported on STDERR and does not stop the cleanup.
# A stat file that cannot be opened is silently ignored.
sub tar_restore_cleanup {
    my ($storecfg, $statfile) = @_;

    print STDERR "starting cleanup\n";

    if (my $fd = IO::File->new($statfile, "r")) {
        while (defined(my $line = <$fd>)) {
            if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                my $volid = $2;
                eval {
                    if ($volid =~ m|^/|) {
                        # parentheses are required: 'unlink $volid || die' would
                        # bind '||' to $volid and never look at unlink's result
                        unlink($volid) || die "unlink failed - $!\n";
                    } else {
                        PVE::Storage::vdisk_free($storecfg, $volid);
                    }
                    print STDERR "temporary volume '$volid' sucessfuly removed\n";
                };
                print STDERR "unable to cleanup '$volid' - $@" if $@;
            } else {
                print STDERR "unable to parse line in statfile - $line";
            }
        }
        $fd->close();
    }
}
3974
# Restore VM $vmid from a vzdump archive, dispatching on the archive format.
#
# $archive - archive file name
# $vmid    - id of the VM to restore
# $user    - user performing the restore (passed through to the backend)
# $opts    - option hash; $opts->{format} overrides the format guessed from
#            the file name
#
# The file name suffix selects the format (tar or vma, vma being the default)
# and, for compressed archives, the compression tool. Returns whatever the
# selected backend (restore_tar_archive / restore_vma_archive) returns.
sub restore_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    my $format = $opts->{format};
    my $comp;

    if ($archive =~ m/\.tgz$/ || $archive =~ m/\.tar\.gz$/) {
        $format = 'tar' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.tar$/) {
        $format = 'tar' if !$format;
    } elsif ($archive =~ m/\.tar\.lzo$/) {
        # dots are escaped like in all sibling patterns; an unescaped '.'
        # would also accept names such as 'xtar-lzo'
        $format = 'tar' if !$format;
        $comp = 'lzop';
    } elsif ($archive =~ m/\.vma$/) {
        $format = 'vma' if !$format;
    } elsif ($archive =~ m/\.vma\.gz$/) {
        $format = 'vma' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.vma\.lzo$/) {
        $format = 'vma' if !$format;
        $comp = 'lzop';
    } else {
        $format = 'vma' if !$format; # default
    }

    # $comp is only consumed by the vma backend
    if ($format eq 'tar') {
        return restore_tar_archive($archive, $vmid, $user, $opts);
    } else {
        return restore_vma_archive($archive, $vmid, $user, $opts, $comp);
    }
}
4008
# Filter/rewrite one line of an archived VM config and print the result to $outfd.
#
# $outfd  - output file handle for the new config
# $cookie - state shared across calls; {netcount} numbers converted vlan entries
# $vmid   - id of the restored VM (used when re-printing drives)
# $map    - drive name => newly allocated volume id
# $line   - the config line, including its line terminator
# $unique - if true, network devices get fresh random MAC addresses
sub restore_update_config_line {
    my ($outfd, $cookie, $vmid, $map, $line, $unique) = @_;

    # entries that are never carried over into the restored config
    # (a restored VM is, for instance, never a template)
    foreach my $dropped (qr/^\#qmdump\#/, qr/^\#vzdump\#/, qr/^lock:/,
                         qr/^unused\d+:/, qr/^parent:/, qr/^template:/) {
        return if $line =~ $dropped;
    }

    if ($line =~ m/^(vlan(\d+)):\s*(\S+)\s*$/) {
        # old 1.X style setting: emit one netN entry per listed device
        my ($ind, $ethcfg) = ($2, $3);
        foreach my $devconfig (PVE::Tools::split_list($ethcfg)) {
            my ($model, $macaddr) = split(/\=/, $devconfig);
            $macaddr = PVE::Tools::random_ether_addr() if !$macaddr || $unique;
            my $netstr = print_net({
                model => $model,
                bridge => "vmbr$ind",
                macaddr => $macaddr,
            });

            print $outfd "net$cookie->{netcount}: $netstr\n";
            $cookie->{netcount}++;
        }
        return;
    }

    if ($unique && $line =~ m/^(net\d+):\s*(\S+)\s*$/) {
        my ($id, $netstr) = ($1, $2);
        my $net = parse_net($netstr);
        # only replace an address that was actually configured
        $net->{macaddr} = PVE::Tools::random_ether_addr() if $net->{macaddr};
        $netstr = print_net($net);
        print $outfd "$id: $netstr\n";
        return;
    }

    if ($line =~ m/^((ide|scsi|virtio|sata)\d+):\s*(\S+)\s*$/) {
        my ($virtdev, $value) = ($1, $3);

        if ($line =~ m/backup=no/) {
            # comment the drive out instead of dropping it
            print $outfd "#$line";
            return;
        }

        if ($virtdev && $map->{$virtdev}) {
            my $di = parse_drive($virtdev, $value);
            delete $di->{format}; # format can change on restore
            $di->{file} = $map->{$virtdev};
            $value = print_drive($vmid, $di);
            print $outfd "$virtdev: $value\n";
            return;
        }
    }

    # everything else is copied verbatim
    print $outfd $line;
}
4059
# List the volumes PVE::Storage::vdisk_list reports for $vmid on all storages.
#
# Returns a hash reference keyed by volume id. Each value is the list entry
# itself, extended with a 'path' key taken from PVE::Storage::path. Entries
# lacking a volid or a (non-zero) size are left out.
sub scan_volids {
    my ($cfg, $vmid) = @_;

    my $listing = PVE::Storage::vdisk_list($cfg, undef, $vmid);

    my %by_volid;
    for my $volumes (values %$listing) {
        for my $vol (@$volumes) {
            next unless $vol->{volid} && $vol->{size};
            $vol->{path} = PVE::Storage::path($cfg, $vol->{volid});
            $by_volid{$vol->{volid}} = $vol;
        }
    }

    return \%by_volid;
}
4076
a8e2f942
DM
# Collect the file system paths referenced by the (non-cdrom) drives of a VM.
#
# $vmid           - VM id (not used inside this function)
# $storecfg       - storage configuration
# $conf           - VM configuration hash
# $scan_snapshots - if true, also scan every entry of $conf->{snapshots}
# $skip_drive     - optional drive name to ignore in the current config only
#
# Returns a hash reference mapping each path to the number of references seen.
sub get_used_paths {
    my ($vmid, $storecfg, $conf, $scan_snapshots, $skip_drive) = @_;

    my %refcount;

    my $collect = sub {
        my ($cref, $snapname) = @_;

        for my $key (keys %$cref) {
            next if !valid_drivename($key);
            next if $skip_drive && $key eq $skip_drive;

            my $drive = parse_drive($key, $cref->{$key});
            next if !$drive || !$drive->{file} || drive_is_cdrom($drive);

            my $file = $drive->{file};
            if ($file =~ m!^/!) {
                # absolute path, used as is
                $refcount{$file}++;
                next;
            }

            # volume id: resolve through the storage layer, silently skipping
            # ids that do not parse or whose storage is not configured
            my ($storeid, $volname) = PVE::Storage::parse_volume_id($file, 1);
            next if !$storeid;
            next if !PVE::Storage::storage_config($storecfg, $storeid, 1);

            my $path = PVE::Storage::path($storecfg, $file, $snapname);
            $refcount{$path}++;
        }
    };

    $collect->($conf);

    # the skip only applies to the current config, not to snapshots
    undef $skip_drive;

    if ($scan_snapshots) {
        for my $snapname (keys %{$conf->{snapshots}}) {
            $collect->($conf->{snapshots}->{$snapname}, $snapname);
        }
    }

    return \%refcount;
}
4117
91bd6c90
DM
# Synchronize the drive entries of $conf with the volumes found on storage.
#
# $vmid       - VM id
# $conf       - VM configuration hash, modified in place
# $volid_hash - volume id => volume info (with 'size' and 'path'), as
#               produced by scan_volids
#
# Three passes:
#  1. refresh the size of every configured non-cdrom drive,
#  2. drop 'unusedN' entries whose volume (or an alias path) is in use,
#  3. add volumes that are referenced nowhere as new unused entries.
#
# Returns a true value if $conf was changed, undef otherwise.
sub update_disksize {
    my ($vmid, $conf, $volid_hash) = @_;

    my $changes;

    my $used = {};

    # Note: it is allowed to define multiple storages with same path (alias), so
    # we need to check both 'volid' and real 'path' (two different volid can point
    # to the same path).

    my $usedpath = {};

    # update size info
    foreach my $opt (keys %$conf) {
        if (valid_drivename($opt)) {
            my $drive = parse_drive($opt, $conf->{$opt});
            my $volid = $drive->{file};
            next if !$volid;

            $used->{$volid} = 1;
            if ($volid_hash->{$volid} &&
                (my $path = $volid_hash->{$volid}->{path})) {
                $usedpath->{$path} = 1;
            }

            next if drive_is_cdrom($drive);
            next if !$volid_hash->{$volid};

            $drive->{size} = $volid_hash->{$volid}->{size};
            my $new = print_drive($vmid, $drive);
            if ($new ne $conf->{$opt}) {
                $changes = 1;
                $conf->{$opt} = $new;
            }
        }
    }

    # remove 'unusedX' entry if volume is used
    foreach my $opt (keys %$conf) {
        next if $opt !~ m/^unused\d+$/;
        my $volid = $conf->{$opt};
        # declare first, assign conditionally: 'my $x = ... if COND' has
        # undefined behaviour and may keep the value of a previous iteration
        my $path;
        $path = $volid_hash->{$volid}->{path} if $volid_hash->{$volid};
        if ($used->{$volid} || ($path && $usedpath->{$path})) {
            $changes = 1;
            delete $conf->{$opt};
        }
    }

    foreach my $volid (sort keys %$volid_hash) {
        # vmstate volumes are never added as unused disks
        next if $volid =~ m/vm-$vmid-state-/;
        next if $used->{$volid};
        my $path = $volid_hash->{$volid}->{path};
        next if !$path; # just to be sure
        next if $usedpath->{$path};
        $changes = 1;
        add_unused_volume($conf, $volid);
        $usedpath->{$path} = 1; # avoid to add more than once (aliases)
    }

    return $changes;
}
4180
# Rescan storages and update disk sizes / unused volumes in VM configs.
#
# $vmid   - VM to process; if undefined, every VM from config_list() is processed
# $nolock - if true, update the config directly instead of going through
#           lock_config
sub rescan {
    my ($vmid, $nolock) = @_;

    my $storecfg = PVE::Cluster::cfs_read_file("storage.cfg");

    # scanned once up front, then filtered per VM below
    my $all_volids = scan_volids($storecfg, $vmid);

    my $update_one = sub {
        my ($id) = @_;

        my $conf = load_config($id);

        check_lock($conf);

        # only volumes owned by this VM are considered
        my $own_volids = {};
        for my $volid (keys %$all_volids) {
            my $info = $all_volids->{$volid};
            next unless $info->{vmid} && $info->{vmid} == $id;
            $own_volids->{$volid} = $info;
        }

        my $changed = update_disksize($id, $conf, $own_volids);

        update_config_nolock($id, $conf, 1) if $changed;
    };

    my @targets = defined($vmid) ? ($vmid) : keys %{ config_list() };

    for my $id (@targets) {
        if ($nolock) {
            $update_one->($id);
        } else {
            lock_config($id, $update_one, $id);
        }
    }
}
4223
# Restore VM $vmid from a vma archive.
#
# $archive - archive file name, or '-' to read the archive from STDIN
# $vmid    - id of the VM to restore
# $user    - user performing the restore; for anyone but root@pam the
#            'Datastore.AllocateSpace' privilege is checked on each target storage
# $opts    - option hash; 'storage' and 'unique' are read here
# $comp    - undef, 'gzip' or 'lzop'
#
# 'vma extract' is run with a fifo: once it has printed the device list and
# the CTIME line, the target volumes are allocated and the mapping
# "devname=path" is written to the fifo, followed by "done". On any error the
# volumes allocated so far are removed again and the error is re-thrown.
# On success the new config replaces the VM config and the VM is rescanned.
sub restore_vma_archive {
    my ($archive, $vmid, $user, $opts, $comp) = @_;

    my $input = $archive eq '-' ? "<&STDIN" : undef;
    # the command below is run through a shell, so the archive name has to be
    # quoted here just like in the decompression pipeline
    my $readfrom = PVE::Tools::shellquote($archive);

    my $uncomp = '';
    if ($comp) {
        $readfrom = '-';
        my $qarchive = PVE::Tools::shellquote($archive);
        if ($comp eq 'gzip') {
            $uncomp = "zcat $qarchive|";
        } elsif ($comp eq 'lzop') {
            $uncomp = "lzop -d -c $qarchive|";
        } else {
            die "unknown compression method '$comp'\n";
        }

    }

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    rmtree $tmpdir;

    # disable interrupts (always do cleanups)
    # NOTE(review): 'local' only applies to $SIG{INT} here; the other handlers
    # are plain assignments and are presumably not restored on exit - confirm.
    local $SIG{INT} = $SIG{TERM} = $SIG{QUIT} = $SIG{HUP} = sub {
        warn "got interrupt - ignored\n";
    };

    my $mapfifo = "/var/tmp/vzdumptmp$$.fifo";
    POSIX::mkfifo($mapfifo, 0600);
    my $fifofh;

    # passed to run_command as 'afterfork' callback
    my $openfifo = sub {
        open($fifofh, '>', $mapfifo) || die $!;
    };

    my $cmd = "${uncomp}vma extract -v -r $mapfifo $readfrom $tmpdir";

    my $oldtimeout;
    my $timeout = 5;

    # devname => { size, dev_id, ... }, filled from the 'DEV:' output lines
    my $devinfo = {};

    my $rpcenv = PVE::RPCEnvironment::get();

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # Note: $oldconf is undef if VM does not exists
    my $oldconf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid));

    my $print_devmap = sub {
        my $virtdev_hash = {};

        my $cfgfn = "$tmpdir/qemu-server.conf";

        # we can read the config - that is already extracted
        # (without 'die' a failed open would leave the error text in $fh)
        my $fh = IO::File->new($cfgfn, "r") ||
            die "unable to read qemu-server.conf - $!\n";

        while (defined(my $line = <$fh>)) {
            if ($line =~ m/^\#qmdump\#map:(\S+):(\S+):(\S*):(\S*):$/) {
                my ($virtdev, $devname, $storeid, $format) = ($1, $2, $3, $4);
                die "archive does not contain data for drive '$virtdev'\n"
                    if !$devinfo->{$devname};
                if (defined($opts->{storage})) {
                    $storeid = $opts->{storage} || 'local';
                } elsif (!$storeid) {
                    $storeid = 'local';
                }
                $format = 'raw' if !$format;
                $devinfo->{$devname}->{devname} = $devname;
                $devinfo->{$devname}->{virtdev} = $virtdev;
                $devinfo->{$devname}->{format} = $format;
                $devinfo->{$devname}->{storeid} = $storeid;

                # check permission on storage
                my $pool = $opts->{pool}; # todo: do we need that?
                if ($user ne 'root@pam') {
                    $rpcenv->check($user, "/storage/$storeid", ['Datastore.AllocateSpace']);
                }

                $virtdev_hash->{$virtdev} = $devinfo->{$devname};
            }
        }

        foreach my $devname (keys %$devinfo) {
            die "found no device mapping information for device '$devname'\n"
                if !$devinfo->{$devname}->{virtdev};
        }

        my $cfg = cfs_read_file('storage.cfg');

        # create empty/temp config
        if ($oldconf) {
            PVE::Tools::file_set_contents($conffile, "memory: 128\n");
            foreach_drive($oldconf, sub {
                my ($ds, $drive) = @_;

                return if drive_is_cdrom($drive);

                my $volid = $drive->{file};

                return if !$volid || $volid =~ m|^/|;

                my ($path, $owner) = PVE::Storage::path($cfg, $volid);
                return if !$path || !$owner || ($owner != $vmid);

                # Note: only delete disk we want to restore
                # other volumes will become unused
                if ($virtdev_hash->{$ds}) {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
            });
        }

        my $map = {};
        foreach my $virtdev (sort keys %$virtdev_hash) {
            my $d = $virtdev_hash->{$virtdev};
            # round the size from the archive up to a multiple of 1024
            my $alloc_size = int(($d->{size} + 1024 - 1)/1024);
            my $scfg = PVE::Storage::storage_config($cfg, $d->{storeid});

            # test if requested format is supported
            my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($cfg, $d->{storeid});
            my $supported = grep { $_ eq $d->{format} } @$validFormats;
            $d->{format} = $defFormat if !$supported;

            my $volid = PVE::Storage::vdisk_alloc($cfg, $d->{storeid}, $vmid,
                                                  $d->{format}, undef, $alloc_size);
            print STDERR "new volume ID is '$volid'\n";
            # remembered so that the error path below can remove the volume
            $d->{volid} = $volid;
            my $path = PVE::Storage::path($cfg, $volid);

            my $write_zeros = 1;
            # fixme: what other storages types initialize volumes with zero?
            if ($scfg->{type} eq 'dir' || $scfg->{type} eq 'nfs' || $scfg->{type} eq 'glusterfs' ||
                $scfg->{type} eq 'sheepdog' || $scfg->{type} eq 'rbd') {
                $write_zeros = 0;
            }

            print $fifofh "${write_zeros}:$d->{devname}=$path\n";

            print "map '$d->{devname}' to '$path' (write zeros = ${write_zeros})\n";
            $map->{$virtdev} = $volid;
        }

        # second pass over the archived config: write the new VM config
        $fh->seek(0, 0) || die "seek failed - $!\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined(my $line = <$fh>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $fh->close();
        $outfd->close();
    };

    eval {
        # enable interrupts
        local $SIG{INT} = $SIG{TERM} = $SIG{QUIT} = $SIG{HUP} = $SIG{PIPE} = sub {
            die "interrupted by signal\n";
        };
        local $SIG{ALRM} = sub { die "got timeout\n"; };

        $oldtimeout = alarm($timeout);

        my $parser = sub {
            my $line = shift;

            print "$line\n";

            if ($line =~ m/^DEV:\sdev_id=(\d+)\ssize:\s(\d+)\sdevname:\s(\S+)$/) {
                my ($dev_id, $size, $devname) = ($1, $2, $3);
                $devinfo->{$devname} = { size => $size, dev_id => $dev_id };
            } elsif ($line =~ m/^CTIME: /) {
                # we correctly received the vma config, so we can disable
                # the timeout now for disk allocation (set to 10 minutes, so
                # that we always timeout if something goes wrong)
                alarm(600);
                &$print_devmap();
                print $fifofh "done\n";
                my $tmp = $oldtimeout || 0;
                $oldtimeout = undef;
                alarm($tmp);
                close($fifofh);
            }
        };

        print "restore vma archive: $cmd\n";
        run_command($cmd, input => $input, outfunc => $parser, afterfork => $openfifo);
    };
    my $err = $@;

    alarm($oldtimeout) if $oldtimeout;

    unlink $mapfifo;

    if ($err) {
        rmtree $tmpdir;
        unlink $tmpfn;

        my $cfg = cfs_read_file('storage.cfg');
        foreach my $devname (keys %$devinfo) {
            my $volid = $devinfo->{$devname}->{volid};
            next if !$volid;
            eval {
                if ($volid =~ m|^/|) {
                    # parentheses are required: 'unlink $volid || die' would
                    # bind '||' to $volid and never look at unlink's result
                    unlink($volid) || die "unlink failed - $!\n";
                } else {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
                print STDERR "temporary volume '$volid' sucessfuly removed\n";
            };
            print STDERR "unable to cleanup '$volid' - $@" if $@;
        }
        die $err;
    }

    rmtree $tmpdir;

    rename($tmpfn, $conffile) ||
        die "unable to commit configuration file '$conffile'\n";

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
4455
# Restore VM $vmid from a (possibly gzip compressed) tar archive.
#
# $archive - archive file name, or '-' to read the archive from STDIN
# $vmid    - id of the VM to restore
# $user    - user performing the restore (exported as VZDUMP_USER)
# $opts    - option hash; 'storage', 'pool', 'prealloc', 'info' and 'unique'
#            are read here
#
# Every archive member is piped to the qmextract helper. The helper's stat
# file is then used to map drives to the new volumes while the archived
# config is rewritten. An existing VM with the same id is destroyed first.
# On error the volumes listed in the stat file are cleaned up and the error
# is re-thrown.
sub restore_tar_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    if ($archive ne '-') {
        my $firstfile = tar_archive_read_firstfile($archive);
        die "ERROR: file '$archive' dos not lock like a QemuServer vzdump backup\n"
            if $firstfile ne 'qemu-server.conf';
    }

    my $storecfg = cfs_read_file('storage.cfg');

    # destroy existing data - keep empty config
    my $vmcfgfn = PVE::QemuServer::config_file($vmid);
    destroy_vm($storecfg, $vmid, 1) if -f $vmcfgfn;

    my $tocmd = "/usr/lib/qemu-server/qmextract";

    $tocmd .= " --storage " . PVE::Tools::shellquote($opts->{storage}) if $opts->{storage};
    $tocmd .= " --pool " . PVE::Tools::shellquote($opts->{pool}) if $opts->{pool};
    $tocmd .= ' --prealloc' if $opts->{prealloc};
    $tocmd .= ' --info' if $opts->{info};

    # tar option "xf" does not autodetect compression when read from STDIN,
    # so we pipe to zcat
    my $cmd = "zcat -f|tar xf " . PVE::Tools::shellquote($archive) . " " .
        PVE::Tools::shellquote("--to-command=$tocmd");

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    mkpath $tmpdir;

    # environment read by the qmextract helper
    local $ENV{VZDUMP_TMPDIR} = $tmpdir;
    local $ENV{VZDUMP_VMID} = $vmid;
    local $ENV{VZDUMP_USER} = $user;

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # disable interrupts (always do cleanups)
    local $SIG{INT} = $SIG{TERM} = $SIG{QUIT} = $SIG{HUP} = sub {
        print STDERR "got interrupt - ignored\n";
    };

    eval {
        # enable interrupts
        local $SIG{INT} = $SIG{TERM} = $SIG{QUIT} = $SIG{HUP} = $SIG{PIPE} = sub {
            die "interrupted by signal\n";
        };

        if ($archive eq '-') {
            print "extracting archive from STDIN\n";
            run_command($cmd, input => "<&STDIN");
        } else {
            print "extracting archive '$archive'\n";
            run_command($cmd);
        }

        # in info mode nothing is written, so there is no config to build
        return if $opts->{info};

        # read new mapping
        my $map = {};
        my $statfile = "$tmpdir/qmrestore.stat";
        if (my $fd = IO::File->new($statfile, "r")) {
            while (defined (my $line = <$fd>)) {
                if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                    $map->{$1} = $2 if $1;
                } else {
                    print STDERR "unable to parse line in statfile - $line\n";
                }
            }
            $fd->close();
        }

        my $confsrc = "$tmpdir/qemu-server.conf";

        my $srcfd = IO::File->new($confsrc, "r") ||
            die "unable to open file '$confsrc'\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined (my $line = <$srcfd>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $srcfd->close();
        $outfd->close();
    };
    my $err = $@;

    if ($err) {

        unlink $tmpfn;

        tar_restore_cleanup($storecfg, "$tmpdir/qmrestore.stat") if !$opts->{info};

        die $err;
    }

    rmtree $tmpdir;

    # parentheses are required: 'rename $a, $b || die' binds '||' to $b, so a
    # failed rename would go unnoticed
    rename($tmpfn, $conffile) ||
        die "unable to commit configuration file '$conffile'\n";

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
4565
0d18dcfc
DM
4566
4567# Internal snapshots
4568
4569# NOTE: Snapshot create/delete involves several non-atomic
4570# actions, and can take a long time.
4571# So we try to avoid locking the file and use 'lock' variable
4572# inside the config file instead.
4573
ef59d1ca
DM
# Copy all plain VM settings from $source into $dest (both hash references).
# Snapshot bookkeeping, lock, digest, description and unusedN entries are
# not copied; existing keys of $dest are overwritten, others are kept.
my $snapshot_copy_config = sub {
    my ($source, $dest) = @_;

    my %excluded = map { $_ => 1 }
        qw(snapshots snapstate snaptime vmstate lock digest description);

    foreach my $key (keys %$source) {
        next if $excluded{$key} || $key =~ m/^unused\d+$/;

        $dest->{$key} = $source->{$key};
    }
};
4590
# Build the config that results from applying snapshot $snap to $conf.
# The snapshot list, the description and all unusedN entries come from
# $conf, every other setting is taken from $snap. Returns a new hash
# reference; $conf itself is not modified.
my $snapshot_apply_config = sub {
    my ($conf, $snap) = @_;

    # copy snapshot list
    my $merged = { snapshots => $conf->{snapshots} };

    # keep description and list of unused disks
    my @kept = grep { $_ eq 'description' || m/^unused\d+$/ } keys %$conf;
    $merged->{$_} = $conf->{$_} for @kept;

    $snapshot_copy_config->($snap, $merged);

    return $merged;
};
4609
18bfb361
DM
# Call $func->($storeid) once for every storage that holds a non-cdrom drive
# of $conf. Storage ids are visited in sorted order; drives whose file does
# not parse as a volume id contribute nothing.
sub foreach_writable_storage {
    my ($conf, $func) = @_;

    my %storages;

    for my $ds (keys %$conf) {
        next unless valid_drivename($ds);

        my $drive = parse_drive($ds, $conf->{$ds});
        next if !$drive;
        next if drive_is_cdrom($drive);

        my ($sid, $volname) = PVE::Storage::parse_volume_id($drive->{file}, 1);
        $storages{$sid} = 1 if $sid;
    }

    for my $sid (sort keys %storages) {
        $func->($sid);
    }
}
4632
# Allocate a raw volume that receives the saved VM state of snapshot $snapname
# and return its volume id.
#
# Storage selection: among the storages used by the VM's drives a shared one
# is preferred over a local one, and within each group one with a 'path'
# property (file based) is preferred. If none is found, 'local' is used.
my $alloc_vmstate_volid = sub {
    my ($storecfg, $vmid, $conf, $snapname) = @_;

    # pick a storage from the shared (true) or non-shared (false) group
    my $select = sub {
        my ($want_shared) = @_;

        my $choice;
        foreach_writable_storage($conf, sub {
            my ($sid) = @_;
            my $scfg = PVE::Storage::storage_config($storecfg, $sid);
            return if ($scfg->{shared} xor $want_shared);

            $choice = $sid if !$choice || $scfg->{path}; # prefer file based storage
        });
        return $choice;
    };

    my $target = $select->(1) || $select->(0) || 'local';

    # Fixed allowance for driver state on top of guest memory. The previous
    # comment spoke of 32MB while the value is 500 - presumably MB, like
    # $conf->{memory}; TODO confirm.
    my $driver_state_size = 500;
    # we abort live save after $conf->{memory}, so we need at max twice that space
    my $size = $conf->{memory}*2 + $driver_state_size;

    my $scfg = PVE::Storage::storage_config($storecfg, $target);
    my $name = "vm-$vmid-state-$snapname";
    $name .= ".raw" if $scfg->{path}; # add filename extension for file base storage

    return PVE::Storage::vdisk_alloc($storecfg, $target, $vmid, 'raw', $name, $size*1024);
};
4673
# First phase of snapshot creation, run under the config lock.
#
# $vmid         - VM id
# $snapname     - name of the new snapshot
# $save_vmstate - if true and the VM is running, allocate a vmstate volume
# $comment      - optional description stored with the snapshot
#
# Sets the 'snapshot' lock on the VM config and adds a snapshot entry in
# state 'prepare' holding a copy of the current settings. Dies if the VM is
# a template, is locked, already has a snapshot of that name, or does not
# support snapshots. Returns the new snapshot entry (hash reference).
my $snapshot_prepare = sub {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap;

    my $updatefn = sub {

        my $conf = load_config($vmid);

        die "you can't take a snapshot if it's a template\n"
            if is_template($conf);

        check_lock($conf);

        $conf->{lock} = 'snapshot';

        die "snapshot name '$snapname' already used\n"
            if defined($conf->{snapshots}->{$snapname});

        my $storecfg = PVE::Storage::config();
        # trailing newline keeps file/line info out of the message, like for
        # all other errors raised here
        die "snapshot feature is not available\n" if !has_feature('snapshot', $conf, $storecfg);

        $snap = $conf->{snapshots}->{$snapname} = {};

        if ($save_vmstate && check_running($vmid)) {
            $snap->{vmstate} = &$alloc_vmstate_volid($storecfg, $vmid, $conf, $snapname);
        }

        &$snapshot_copy_config($conf, $snap);

        $snap->{snapstate} = "prepare";
        $snap->{snaptime} = time();
        $snap->{description} = $comment if $comment;

        # always overwrite machine if we save vmstate. This makes sure we
        # can restore it later using correct machine type
        $snap->{machine} = get_current_qemu_machine($vmid) if $snap->{vmstate};

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $updatefn);

    return $snap;
};
4719
# Final phase of snapshot creation, run under the config lock.
#
# Requires the 'snapshot' lock and a snapshot entry in state 'prepare'.
# Clears both, rebuilds the current config from the snapshot and records
# $snapname as its parent.
my $snapshot_commit = sub {
    my ($vmid, $snapname) = @_;

    my $commit = sub {

        my $conf = load_config($vmid);

        my $lock = $conf->{lock};
        die "missing snapshot lock\n"
            unless $lock && $lock eq 'snapshot';

        my $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" unless defined($snap);

        my $state = $snap->{snapstate};
        die "wrong snapshot state\n"
            unless $state && $state eq "prepare";

        delete $snap->{snapstate};
        delete $conf->{lock};

        my $newconf = $snapshot_apply_config->($conf, $snap);

        $newconf->{parent} = $snapname;

        update_config_nolock($vmid, $newconf, 1);
    };

    lock_config($vmid, $commit);
};
4749
22c377f0
DM
# Roll VM $vmid back to snapshot $snapname.
#
# The same locked update routine runs twice. The first (prepare) pass stops
# the VM and sets the 'rollback' lock. Then every non-cdrom drive of the
# snapshot is rolled back on storage. The second pass verifies and removes
# the lock, replaces the current config with the snapshot's settings and,
# if the snapshot has a vmstate, starts the VM from that state.
sub snapshot_rollback {
    my ($vmid, $snapname) = @_;

    my $snap;

    # true during the first pass, cleared before the second one
    my $prepare = 1;

    my $storecfg = PVE::Storage::config();

    my $phase = sub {

        my $conf = load_config($vmid);

        die "you can't rollback if vm is a template\n" if is_template($conf);

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        die "unable to rollback to incomplete snapshot (snapstate = $snap->{snapstate})\n"
            if $snap->{snapstate};

        if ($prepare) {
            check_lock($conf);
            vm_stop($storecfg, $vmid, undef, undef, 5, undef, undef);
        }

        die "unable to rollback vm $vmid: vm is running\n"
            if check_running($vmid);

        my $forcemachine;

        if ($prepare) {
            $conf->{lock} = 'rollback';
        } else {
            die "got wrong lock\n" if !($conf->{lock} && $conf->{lock} eq 'rollback');
            delete $conf->{lock};

            my $has_machine_config = defined($conf->{machine});

            # copy snapshot config to current config
            $conf = $snapshot_apply_config->($conf, $snap);
            $conf->{parent} = $snapname;

            # Note: old code did not store 'machine', so we try to be smart
            # and guess the snapshot was generated with kvm 1.4 (pc-i440fx-1.4).
            $forcemachine = $conf->{machine} || 'pc-i440fx-1.4';
            # we remove the 'machine' configuration if not explicitly specified
            # in the original config.
            delete $conf->{machine} if $snap->{vmstate} && !$has_machine_config;
        }

        update_config_nolock($vmid, $conf, 1);

        if (!$prepare && $snap->{vmstate}) {
            my $statefile = PVE::Storage::path($storecfg, $snap->{vmstate});
            vm_start($storecfg, $vmid, $statefile, undef, undef, undef, $forcemachine);
        }
    };

    lock_config($vmid, $phase);

    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        PVE::Storage::volume_snapshot_rollback($storecfg, $drive->{file}, $snapname);
    });

    $prepare = 0;
    lock_config($vmid, $phase);
}
4828
9dcf4909
DM
# Poll 'query-savevm' once per second until it reports status 'completed'.
# Dies if no status is reported or if the status is anything other than
# 'active' or 'completed'.
my $savevm_wait = sub {
    my ($vmid) = @_;

    while (1) {
        my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");
        my $status = $stat->{status};

        die "savevm not active\n" if !$status;
        return if $status eq 'completed';
        die "query-savevm returned status '$status'\n" if $status ne 'active';

        sleep(1);
    }
};
4846
# Create snapshot $snapname of VM $vmid.
#
# $save_vmstate - also save the state of a running VM
# $freezefs     - freeze guest file systems (via qga) while snapshotting
# $comment      - optional snapshot description
#
# Sequence: prepare the config entry, start savevm on a running VM, snapshot
# every non-cdrom drive, then unfreeze and end savevm. If anything failed,
# the drives snapshotted so far are handed to snapshot_delete and the error
# is re-thrown; otherwise the snapshot is committed.
sub snapshot_create {
    my ($vmid, $snapname, $save_vmstate, $freezefs, $comment) = @_;

    my $snap = $snapshot_prepare->($vmid, $snapname, $save_vmstate, $comment);

    if (!$snap->{vmstate}) { # vm is not running
        $save_vmstate = 0;
        $freezefs = 0;
    }

    # drives that already got their snapshot, needed for cleanup on error
    my $done_drives = {};

    my $running = check_running($vmid);

    eval {
        # create internal snapshots of all drives

        my $storecfg = PVE::Storage::config();

        if ($running && $snap->{vmstate}) {
            my $path = PVE::Storage::path($storecfg, $snap->{vmstate});
            vm_mon_cmd($vmid, "savevm-start", statefile => $path);
            $savevm_wait->($vmid);
        } elsif ($running) {
            vm_mon_cmd($vmid, "savevm-start");
        }

        qga_freezefs($vmid) if $running && $freezefs;

        foreach_drive($snap, sub {
            my ($ds, $drive) = @_;

            return if drive_is_cdrom($drive);

            qemu_volume_snapshot($vmid, "drive-$ds", $storecfg, $drive->{file}, $snapname);
            $done_drives->{$ds} = 1;
        });
    };
    my $err = $@;

    # the two steps below always run, failures only produce warnings
    eval { qga_unfreezefs($vmid) if $running && $freezefs; };
    warn $@ if $@;

    eval { vm_mon_cmd($vmid, "savevm-end") if $running; };
    warn $@ if $@;

    if ($err) {
        warn "snapshot create failed: starting cleanup\n";
        eval { snapshot_delete($vmid, $snapname, 0, $done_drives); };
        warn $@ if $@;
        die $err;
    }

    $snapshot_commit->($vmid, $snapname);
}
4904
# Delete snapshot $snapname of VM $vmid.
#
# Parameters:
#   $vmid      - id of the VM
#   $snapname  - name of the snapshot to remove
#   $force     - if true, errors while freeing the vmstate volume or a volume
#                snapshot are only warned about, and the intermediate config
#                updates are skipped
#   $drivehash - only set when called from snapshot_create (cleanup after a
#                failed create): hash of drive names whose volume snapshot
#                was created. Lock and template checks are skipped then, and
#                the config lock entry is removed at the end.
#
# Works in three phases: mark the snapshot with snapstate 'delete', remove
# the vmstate volume and the per-drive volume snapshots, and finally drop
# the snapshot section from the config.
sub snapshot_delete {
    my ($vmid, $snapname, $force, $drivehash) = @_;

    # state shared with the $updatefn closure below
    my $prepare = 1;
    my $snap;
    my $unused = [];

    # re-point (or drop) a 'parent' reference to the snapshot being deleted
    my $unlink_parent = sub {
        my ($confref, $new_parent) = @_;

        return if !$confref->{parent} || $confref->{parent} ne $snapname;

        if ($new_parent) {
            $confref->{parent} = $new_parent;
        } else {
            delete $confref->{parent};
        }
    };

    my $updatefn = sub {
        my ($remove_drive) = @_;

        my $conf = load_config($vmid);

        if (!$drivehash) {
            check_lock($conf);
            die "you can't delete a snapshot if vm is a template\n"
                if is_template($conf);
        }

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        # remove parent refs
        if (!$prepare) {
            my $grandparent = $snap->{parent};
            $unlink_parent->($conf, $grandparent);
            foreach my $other (keys %{$conf->{snapshots}}) {
                next if $other eq $snapname;
                $unlink_parent->($conf->{snapshots}->{$other}, $snap->{parent});
            }
        }

        if ($remove_drive) {
            if ($remove_drive eq 'vmstate') {
                delete $snap->{$remove_drive};
            } else {
                my $parsed = parse_drive($remove_drive, $snap->{$remove_drive});
                my $drive_volid = $parsed->{file};
                delete $snap->{$remove_drive};
                add_unused_volume($conf, $drive_volid);
            }
        }

        if ($prepare) {
            $snap->{snapstate} = 'delete';
        } else {
            delete $conf->{snapshots}->{$snapname};
            delete $conf->{lock} if $drivehash;
            add_unused_volume($conf, $_) foreach @$unused;
        }

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $updatefn);

    # now remove vmstate file

    my $storecfg = PVE::Storage::config();

    if ($snap->{vmstate}) {
        eval { PVE::Storage::vdisk_free($storecfg, $snap->{vmstate}); };
        if (my $err = $@) {
            die $err if !$force;
            warn $err;
        }
        # save changes (remove vmstate from snapshot)
        lock_config($vmid, $updatefn, 'vmstate') if !$force;
    }

    # now remove all internal snapshots
    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};

        if (!$drivehash || $drivehash->{$ds}) {
            eval { qemu_volume_snapshot_delete($vmid, "drive-$ds", $storecfg, $volid, $snapname); };
            if (my $err = $@) {
                die $err if !$force;
                warn $err;
            }
        }

        # save changes (remove drive from snapshot)
        lock_config($vmid, $updatefn, $ds) if !$force;
        push @$unused, $volid;
    });

    # now cleanup config
    $prepare = 0;
    lock_config($vmid, $updatefn);
}
5016
# Check whether every non-cdrom drive of $conf supports storage feature
# $feature.
#
# Parameters:
#   $feature  - feature name handed to PVE::Storage::volume_has_feature
#   $conf     - VM configuration whose drives are inspected
#   $storecfg - storage configuration
#   $snapname - passed through to volume_has_feature
#   $running  - passed through to volume_has_feature
#
# Returns 1 if all inspected volumes report the feature, 0 otherwise.
sub has_feature {
    my ($feature, $conf, $storecfg, $snapname, $running) = @_;

    my $all_supported = 1;

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $ok = PVE::Storage::volume_has_feature(
            $storecfg, $feature, $drive->{file}, $snapname, $running);
        $all_supported = 0 if !$ok;
    });

    return $all_supported;
}
04a69bb4
AD
5031
# Convert the disks of VM $vmid into base volumes.
#
# Parameters:
#   $vmid - id of the VM
#   $conf - VM configuration; updated in place and written after each
#           converted drive
#   $disk - optional drive name; when set, only that drive is converted
#
# CD-ROM drives and volumes whose storage lacks the 'template' feature are
# left untouched.
sub template_create {
    my ($vmid, $conf, $disk) = @_;

    my $storecfg = PVE::Storage::config();

    my $convert_drive = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);
        return if $disk && $ds ne $disk;

        my $volid = $drive->{file};
        return if !PVE::Storage::volume_has_feature($storecfg, 'template', $volid);

        # point the drive at the newly created base volume and persist it
        $drive->{file} = PVE::Storage::vdisk_create_base($storecfg, $volid);
        $conf->{$ds} = print_drive($vmid, $drive);
        update_config_nolock($vmid, $conf, 1);
    };

    foreach_drive($conf, $convert_drive);
}
5052
624361b3
AD
# Tell whether the VM configuration $conf describes a template.
#
# Returns 1 if $conf->{template} is defined and numerically equal to 1,
# otherwise 0. The false case is returned explicitly so that callers never
# receive the leftover value of the failed condition.
sub is_template {
    my ($conf) = @_;

    return 1 if defined($conf->{template}) && $conf->{template} == 1;

    return 0;
}
5058
5133de42
AD
# Copy volume $src_volid to the already existing volume $dst_volid using
# 'qemu-img convert', printing progress lines while the copy runs.
#
# Parameters:
#   $src_volid - source volume id
#   $dst_volid - destination volume id
#   $size      - total size in bytes, used only for the progress output
#   $snapname  - optional snapshot to read from (passed to qemu-img with
#                '-s' for qcow2 sources)
#
# Nothing is done unless both volume ids resolve to a storage id.
# Dies with "copy failed: ..." if the command fails.
sub qemu_img_convert {
    my ($src_volid, $dst_volid, $size, $snapname) = @_;

    my $storecfg = PVE::Storage::config();
    my ($src_storeid, $src_volname) = PVE::Storage::parse_volume_id($src_volid, 1);
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid, 1);

    if ($src_storeid && $dst_storeid) {
        my $src_scfg = PVE::Storage::storage_config($storecfg, $src_storeid);
        my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

        my $src_format = qemu_img_format($src_scfg, $src_volname);
        my $dst_format = qemu_img_format($dst_scfg, $dst_volname);

        my $src_path = PVE::Storage::path($storecfg, $src_volid, $snapname);
        my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

        my $cmd = ['/usr/bin/qemu-img', 'convert', '-t', 'writeback', '-p', '-n'];
        if ($snapname && $src_format eq "qcow2") {
            push @$cmd, '-s', $snapname;
        }
        push @$cmd, '-f', $src_format, '-O', $dst_format, $src_path, $dst_path;

        # turn qemu-img progress output "(NN.NN/100%)" into our own format
        my $parser = sub {
            my ($line) = @_;

            if ($line =~ m/\((\S+)\/100\%\)/) {
                my $percent = $1;
                my $transferred = int($size * $percent / 100);
                my $remaining = $size - $transferred;

                print "transferred: $transferred bytes remaining: $remaining bytes total: $size bytes progression: $percent %\n";
            }
        };

        eval { run_command($cmd, timeout => undef, outfunc => $parser); };
        my $err = $@;
        die "copy failed: $err" if $err;
    }
}
5098
# Determine the image format name to hand to qemu-img for a volume.
#
# Parameters:
#   $scfg    - storage configuration hash (uses the 'path' and 'type' keys)
#   $volname - volume name
#
# Returns the file extension (raw, qcow2, qed or vmdk) for storages with a
# 'path' setting, "host_device" for storages of type 'iscsi', and "raw" in
# every other case.
sub qemu_img_format {
    my ($scfg, $volname) = @_;

    return $1 if $scfg->{path} && $volname =~ m/\.(raw|qcow2|qed|vmdk)$/;

    return "host_device" if $scfg->{type} eq 'iscsi';

    return "raw";
}
5110
cfad42af
AD
# Mirror drive $drive of the running VM $vmid onto the existing volume
# $dst_volid using the 'drive-mirror' monitor command, and wait until the
# block job has copied everything.
#
# Parameters:
#   $vmid      - id of the source VM
#   $drive     - drive name (the device is addressed as "drive-$drive")
#   $dst_volid - destination volume id
#   $vmiddst   - id of the VM that will own the destination volume. If it
#                equals $vmid the job is completed (the VM switches to the
#                new volume), otherwise the job is cancelled once the copy
#                is done.
#   $maxwait   - optional number of polls without progress after which the
#                VM is suspended so that the mirror can catch up
#
# Nothing is done if $dst_volid does not resolve to a storage id.
# Dies with "mirroring error: ..." (after trying to cancel the job) if
# monitoring the job fails.
sub qemu_drive_mirror {
    my ($vmid, $drive, $dst_volid, $vmiddst, $maxwait) = @_;

    my $count = 1;
    my $old_len = 0;
    my $frozen = undef;

    # number of consecutive polls we tolerate a job that reports no length
    my $max_zero_len_polls = 10;
    my $zero_len_polls = 0;

    my $storecfg = PVE::Storage::config();
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid, 1);

    if ($dst_storeid) {
        my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

        my $format;
        if ($dst_volname =~ m/\.(raw|qcow2)$/) {
            $format = $1;
        }

        my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

        my @mirror_args = (
            timeout => 10,
            device => "drive-$drive",
            mode => "existing",
            sync => "full",
            target => $dst_path,
        );
        push @mirror_args, format => $format if $format;

        #fixme : sometime drive-mirror timeout, but works fine after.
        # (I have see the problem with big volume > 200GB), so we need to eval
        eval { vm_mon_cmd($vmid, "drive-mirror", @mirror_args); };

        eval {
            while (1) {
                my $stats = vm_mon_cmd($vmid, "query-block-jobs");
                my $stat = $stats->[0];
                die "mirroring job seem to have die. Maybe do you have bad sectors?" if !$stat;
                die "error job is not mirroring" if $stat->{type} ne "mirror";

                my $transferred = $stat->{offset};
                my $total = $stat->{len};

                if (!$total) {
                    # A length of 0 would make the percentage computation
                    # below die with a division by zero, and would also
                    # satisfy the completion check (0 == 0). Give the job
                    # a few polls to report a real length instead.
                    die "mirroring job does not report a length\n"
                        if ++$zero_len_polls > $max_zero_len_polls;
                    sleep 1;
                    next;
                }
                $zero_len_polls = 0;

                my $remaining = $total - $transferred;
                my $percent = sprintf "%.2f", ($transferred * 100 / $total);

                print "transferred: $transferred bytes remaining: $remaining bytes total: $total bytes progression: $percent %\n";

                last if ($stat->{len} == $stat->{offset});
                if ($old_len == $stat->{offset}) {
                    if ($maxwait && $count > $maxwait) {
                        # if writes to disk occurs the disk needs to be freezed
                        # to be able to complete the migration
                        vm_suspend($vmid, 1);
                        $count = 0;
                        $frozen = 1;
                    } else {
                        $count++ unless $frozen;
                    }
                } elsif ($frozen) {
                    # NOTE(review): $frozen is never cleared, so this resume
                    # is repeated on every poll that shows progress, and the
                    # VM is not resumed here if the loop ends while it is
                    # still suspended - confirm this is intended.
                    vm_resume($vmid, 1);
                    $count = 0;
                }
                $old_len = $stat->{offset};
                sleep 1;
            }

            if ($vmiddst == $vmid) {
                # switch the disk if source and destination are on the same guest
                vm_mon_cmd($vmid, "block-job-complete", device => "drive-$drive");
            }
        };
        if (my $err = $@) {
            eval { vm_mon_cmd($vmid, "block-job-cancel", device => "drive-$drive"); };
            die "mirroring error: $err";
        }

        if ($vmiddst != $vmid) {
            # if we clone a disk for a new target vm, we don't switch the disk
            vm_mon_cmd($vmid, "block-job-cancel", device => "drive-$drive");
        }
    }
}
5190
# Clone one drive of VM $vmid for VM $newvmid.
#
# Parameters:
#   $storecfg   - storage configuration
#   $vmid       - id of the source VM
#   $running    - true if the source VM is running
#   $drivename  - name of the drive being cloned
#   $drive      - parsed drive hash of the source drive (not modified)
#   $snapname   - optional snapshot to clone from
#   $newvmid    - id of the VM that will own the new volume
#   $storage    - optional target storage for a full clone (defaults to the
#                 storage of the source volume)
#   $format     - optional target format for a full clone; falls back to the
#                 drive's format or the storage default, and to the storage
#                 default if the requested format is not supported
#   $full       - create a full copy instead of a linked clone
#   $newvollist - array ref; the id of every newly created volume is pushed
#                 onto it
#
# Returns a new drive hash: a copy of $drive with 'file' set to the new
# volume, 'size' set to its size and 'format' reset to undef.
sub clone_disk {
    my ($storecfg, $vmid, $running, $drivename, $drive, $snapname,
        $newvmid, $storage, $format, $full, $newvollist) = @_;

    my $newvolid;

    if (!$full) {
        print "create linked clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_clone($storecfg, $drive->{file}, $newvmid, $snapname);
        push @$newvollist, $newvolid;
    } else {
        my ($storeid, $volname) = PVE::Storage::parse_volume_id($drive->{file});
        $storeid = $storage if $storage;

        my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($storecfg, $storeid);
        if (!$format) {
            $format = $drive->{format} || $defFormat;
        }

        # test if requested format is supported - else use default
        my $supported = grep { $_ eq $format } @$validFormats;
        $format = $defFormat if !$supported;

        my ($src_size) = PVE::Storage::volume_size_info($storecfg, $drive->{file}, 3);

        print "create full clone of drive $drivename ($drive->{file})\n";
        # volume_size_info's size is divided by 1024 for vdisk_alloc
        $newvolid = PVE::Storage::vdisk_alloc($storecfg, $storeid, $newvmid, $format, undef, ($src_size/1024));
        push @$newvollist, $newvolid;

        if (!$running || $snapname) {
            qemu_img_convert($drive->{file}, $newvolid, $src_size, $snapname);
        } else {
            qemu_drive_mirror($vmid, $drivename, $newvolid, $newvmid);
        }
    }

    my ($size) = PVE::Storage::volume_size_info($storecfg, $newvolid, 3);

    # work on a copy, so the caller's drive hash keeps describing the
    # source volume
    my $disk = { %$drive };
    $disk->{format} = undef;
    $disk->{file} = $newvolid;
    $disk->{size} = $size;

    return $disk;
}
5236
ff556cf2
DM
# Return the machine type name of VM $vmid as reported by the
# 'query-machines' QMP command.
#
# this only works if VM is running
#
# The entry flagged 'is-current' wins; otherwise the entry flagged
# 'is-default' is used, and 'pc' if neither is reported.
sub get_current_qemu_machine {
    my ($vmid) = @_;

    my $machines = PVE::QemuServer::vm_qmp_command(
        $vmid, { execute => 'query-machines', arguments => {} });

    my ($current, $default);
    for my $machine (@$machines) {
        my $name = $machine->{name};
        $default = $name if $machine->{'is-default'};
        $current = $name if $machine->{'is-current'};
    }

    # fallback to the default machine if current is not supported by qemu
    return $current || $default || 'pc';
}
5253
4543ecf0
AD
# List the PCI devices found below "$pcisysfs/devices".
#
# Returns a hash ref keyed by the "bus:slot" part of the device address;
# each value is an array ref of { id => "bus:slot", function => N } hashes,
# one per matching directory entry.
sub lspci {

    my $devices = {};

    # the two captures of the pattern arrive as second and third argument
    my $collect = sub {
        my (undef, $id, $function) = @_;
        push @{$devices->{$id}}, { id => $id, function => $function };
    };

    dir_glob_foreach("$pcisysfs/devices", '[a-f0-9]{4}:([a-f0-9]{2}:[a-f0-9]{2})\.([0-9])', $collect);

    return $devices;
}
5266
1e3baf05 52671;