]> git.proxmox.com Git - qemu-server.git/blame - PVE/QemuServer.pm
clone_vm: auto generate new uuid
[qemu-server.git] / PVE / QemuServer.pm
CommitLineData
1e3baf05
DM
1package PVE::QemuServer;
2
3use strict;
990fc5e2 4use warnings;
1e3baf05
DM
5use POSIX;
6use IO::Handle;
7use IO::Select;
8use IO::File;
9use IO::Dir;
10use IO::Socket::UNIX;
11use File::Basename;
12use File::Path;
13use File::stat;
14use Getopt::Long;
fc1ddcdc 15use Digest::SHA;
1e3baf05
DM
16use Fcntl ':flock';
17use Cwd 'abs_path';
18use IPC::Open3;
c971c4f2 19use JSON;
1e3baf05
DM
20use Fcntl;
21use PVE::SafeSyslog;
22use Storable qw(dclone);
23use PVE::Exception qw(raise raise_param_exc);
24use PVE::Storage;
4543ecf0 25use PVE::Tools qw(run_command lock_file lock_file_full file_read_firstline dir_glob_foreach);
b7ba6b79 26use PVE::JSONSchema qw(get_standard_option);
1e3baf05
DM
27use PVE::Cluster qw(cfs_register_file cfs_read_file cfs_write_file cfs_lock_file);
28use PVE::INotify;
29use PVE::ProcFSTools;
26f11676 30use PVE::QMPClient;
91bd6c90 31use PVE::RPCEnvironment;
6b64503e 32use Time::HiRes qw(gettimeofday);
1e3baf05 33
7f0b5beb 34my $cpuinfo = PVE::ProcFSTools::read_cpuinfo();
1e3baf05 35
# Note about locking: we use flock on the config file to protect
# against concurrent actions.
# Additionally, we have a 'lock' setting in the config file. This
# can be set to 'migrate', 'backup', 'snapshot' or 'rollback'. Most actions are not
# allowed when such a lock is set. But you can ignore this kind of
# lock with the --skiplock flag.
42
# Register the parse/write callbacks used for files below '/qemu-server/'.
cfs_register_file(
    '/qemu-server/',
    \&parse_vm_config,
    \&write_vm_config,
);

# Standard option: ignore the 'lock' setting of a VM configuration.
PVE::JSONSchema::register_standard_option(
    'skiplock',
    {
        type => 'boolean',
        optional => 1,
        description => "Ignore locks - only root is allowed to use this option.",
    },
);

# Standard option: location used to save/restore VM state.
PVE::JSONSchema::register_standard_option(
    'pve-qm-stateuri',
    {
        type => 'string',
        maxLength => 128,
        optional => 1,
        description => "Some command save/restore state from this location.",
    },
);

# Standard option: snapshot name (mandatory unless a user overrides 'optional').
PVE::JSONSchema::register_standard_option(
    'pve-snapshot-name',
    {
        type => 'string', format => 'pve-configid',
        maxLength => 40,
        description => "The name of the snapshot.",
    },
);
65
1e3baf05
DM
66#no warnings 'redefine';
67
# Define the fairsched/setluid/setublimit syscall numbers and the
# KVM_GET_API_VERSION ioctl request as constant subs, unless they are
# already defined. The syscall numbers depend on the architecture
# (x86_64 or i386); loading the module on any other architecture dies.
unless (defined(&_VZSYSCALLS_H_)) {
    eval 'sub _VZSYSCALLS_H_ () {1;}' unless defined(&_VZSYSCALLS_H_);
    require 'sys/syscall.ph';
    if (defined(&__x86_64__)) {
        eval 'sub __NR_fairsched_vcpus () {499;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_fairsched_mknod () {504;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {505;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {506;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {507;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {508;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_setluid () {501;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {502;}' unless defined(&__NR_setublimit);
    } elsif (defined(&__i386__)) {
        eval 'sub __NR_fairsched_mknod () {500;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {501;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {502;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {503;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {504;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_fairsched_vcpus () {505;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_setluid () {511;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {512;}' unless defined(&__NR_setublimit);
    } else {
        die("no fairsched syscall for this arch");
    }
    require 'asm/ioctl.ph';
    # Request number 0 within ioctl type 0xAE. Written as a complete hex
    # literal instead of the digit-less '0x' the code relied on before.
    eval 'sub KVM_GET_API_VERSION () { &_IO(0xAE, 0x00);}' unless defined(&KVM_GET_API_VERSION);
}
96
# Thin wrapper around the fairsched_mknod syscall.
# All three arguments are truncated to integers before the call.
# Returns whatever syscall() returns.
sub fairsched_mknod {
    my ($parent, $weight, $desired) = @_;

    my @int_args = (int($parent), int($weight), int($desired));

    return syscall(__NR_fairsched_mknod(), @int_args);
}
102
# Thin wrapper around the fairsched_rmnod syscall.
# $id is truncated to an integer; returns whatever syscall() returns.
sub fairsched_rmnod {
    my ($id) = @_;

    my $node_id = int($id);

    return syscall(__NR_fairsched_rmnod(), $node_id);
}
108
# Thin wrapper around the fairsched_mvpr syscall.
# Both arguments are truncated to integers; returns whatever syscall() returns.
sub fairsched_mvpr {
    my ($pid, $newid) = @_;

    my @int_args = (int($pid), int($newid));

    return syscall(__NR_fairsched_mvpr(), @int_args);
}
114
# Thin wrapper around the fairsched_vcpus syscall.
# Both arguments are truncated to integers; returns whatever syscall() returns.
sub fairsched_vcpus {
    my ($id, $vcpus) = @_;

    my @int_args = (int($id), int($vcpus));

    return syscall(__NR_fairsched_vcpus(), @int_args);
}
120
# Thin wrapper around the fairsched_rate syscall.
# $op is one of the FAIRSCHED_*_RATE operation codes; all arguments are
# truncated to integers. Returns whatever syscall() returns.
sub fairsched_rate {
    my ($id, $op, $rate) = @_;

    my @int_args = (int($id), int($op), int($rate));

    return syscall(__NR_fairsched_rate(), @int_args);
}
126
# Operation codes passed as $op to fairsched_rate().
use constant {
    FAIRSCHED_SET_RATE => 0,
    FAIRSCHED_DROP_RATE => 1,
    FAIRSCHED_GET_RATE => 2,
};

# Apply a CPU limit given in per cent to fairsched node $id.
# The percentage is converted to units of 1/1024; a resulting rate of zero
# drops the rate limit instead of setting one.
# Returns the result of fairsched_rate().
sub fairsched_cpulimit {
    my ($id, $limit) = @_;

    my $rate = int($limit * 1024 / 100);

    return fairsched_rate($id, FAIRSCHED_SET_RATE, $rate) if $rate;

    return fairsched_rate($id, FAIRSCHED_DROP_RATE, $rate);
}
139
# Paths used throughout this module.
my $nodename = PVE::INotify::nodename();
my $confdir = "/etc/pve/nodes/$nodename/qemu-server";
my $var_run_tmpdir = "/var/run/qemu-server";
my $lock_dir = "/var/lock/qemu-server";
my $pcisysfs = "/sys/bus/pci";

# Create the directories at load time. The result of mkdir is not checked,
# so a failure (for example because the directory already exists) is ignored.
mkdir $_ foreach ("/etc/pve/nodes/$nodename", $confdir, $var_run_tmpdir, $lock_dir);
153
1e3baf05
DM
# Schema of the VM configuration options. Each key is an option name and
# each value is the property description used for validation and for the
# generated documentation. The descriptions are user visible.
my $confdesc = {
    onboot => {
        optional => 1,
        type => 'boolean',
        description => "Specifies whether a VM will be started during system bootup.",
        default => 0,
    },
    autostart => {
        optional => 1,
        type => 'boolean',
        description => "Automatic restart after crash (currently ignored).",
        default => 0,
    },
    hotplug => {
        optional => 1,
        type => 'boolean',
        description => "Allow hotplug for disk and network device",
        default => 0,
    },
    reboot => {
        optional => 1,
        type => 'boolean',
        description => "Allow reboot. If set to '0' the VM exit on reboot.",
        default => 1,
    },
    lock => {
        optional => 1,
        type => 'string',
        description => "Lock/unlock the VM.",
        enum => [qw(migrate backup snapshot rollback)],
    },
    cpulimit => {
        optional => 1,
        type => 'integer',
        description => "Limit of CPU usage in per cent. Note if the computer has 2 CPUs, it has total of 200% CPU time. Value '0' indicates no CPU limit.\n\nNOTE: This option is currently ignored.",
        minimum => 0,
        default => 0,
    },
    cpuunits => {
        optional => 1,
        type => 'integer',
        description => "CPU weight for a VM. Argument is used in the kernel fair scheduler. The larger the number is, the more CPU time this VM gets. Number is relative to weights of all the other running VMs.\n\nNOTE: You can disable fair-scheduler configuration by setting this to 0.",
        minimum => 0,
        maximum => 500000,
        default => 1000,
    },
    memory => {
        optional => 1,
        type => 'integer',
        description => "Amount of RAM for the VM in MB. This is the maximum available memory when you use the balloon device.",
        minimum => 16,
        default => 512,
    },
    balloon => {
        optional => 1,
        type => 'integer',
        description => "Amount of target RAM for the VM in MB. Using zero disables the balloon driver.",
        minimum => 0,
    },
    shares => {
        optional => 1,
        type => 'integer',
        description => "Amount of memory shares for auto-ballooning. The larger the number is, the more memory this VM gets. Number is relative to weights of all other running VMs. Using zero disables auto-ballooning",
        minimum => 0,
        maximum => 50000,
        default => 1000,
    },
    keyboard => {
        optional => 1,
        type => 'string',
        description => "Keyboard layout for vnc server. Default is read from the datacenter configuration file.",
        enum => PVE::Tools::kvmkeymaplist(),
        default => 'en-us',
    },
    name => {
        optional => 1,
        type => 'string', format => 'dns-name',
        description => "Set a name for the VM. Only used on the configuration web interface.",
    },
    scsihw => {
        optional => 1,
        type => 'string',
        description => "scsi controller model",
        enum => [qw(lsi lsi53c810 virtio-scsi-pci megasas pvscsi)],
        default => 'lsi',
    },
    description => {
        optional => 1,
        type => 'string',
        description => "Description for the VM. Only used on the configuration web interface. This is saved as comment inside the configuration file.",
    },
    ostype => {
        optional => 1,
        type => 'string',
        enum => [qw(other wxp w2k w2k3 w2k8 wvista win7 win8 l24 l26 solaris)],
        description => <<EODESC,
Used to enable special optimization/features for specific
operating systems:

other => unspecified OS
wxp => Microsoft Windows XP
w2k => Microsoft Windows 2000
w2k3 => Microsoft Windows 2003
w2k8 => Microsoft Windows 2008
wvista => Microsoft Windows Vista
win7 => Microsoft Windows 7
win8 => Microsoft Windows 8/2012
l24 => Linux 2.4 Kernel
l26 => Linux 2.6/3.X Kernel
solaris => solaris/opensolaris/openindiana kernel

other|l24|l26|solaris ... no special behaviour
wxp|w2k|w2k3|w2k8|wvista|win7|win8 ... use --localtime switch
EODESC
    },
    boot => {
        optional => 1,
        type => 'string',
        description => "Boot on floppy (a), hard disk (c), CD-ROM (d), or network (n).",
        pattern => '[acdn]{1,4}',
        default => 'cdn',
    },
    bootdisk => {
        optional => 1,
        type => 'string', format => 'pve-qm-bootdisk',
        description => "Enable booting from specified disk.",
        pattern => '(ide|sata|scsi|virtio)\d+',
    },
    smp => {
        optional => 1,
        type => 'integer',
        description => "The number of CPUs. Please use option -sockets instead.",
        minimum => 1,
        default => 1,
    },
    sockets => {
        optional => 1,
        type => 'integer',
        description => "The number of CPU sockets.",
        minimum => 1,
        default => 1,
    },
    cores => {
        optional => 1,
        type => 'integer',
        description => "The number of cores per socket.",
        minimum => 1,
        default => 1,
    },
    maxcpus => {
        optional => 1,
        type => 'integer',
        description => "Maximum cpus for hotplug.",
        minimum => 1,
        default => 1,
    },
    acpi => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable ACPI.",
        default => 1,
    },
    agent => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable Qemu GuestAgent.",
        default => 0,
    },
    kvm => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable KVM hardware virtualization.",
        default => 1,
    },
    tdf => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable time drift fix.",
        default => 0,
    },
    localtime => {
        optional => 1,
        type => 'boolean',
        description => "Set the real time clock to local time. This is enabled by default if ostype indicates a Microsoft OS.",
    },
    freeze => {
        optional => 1,
        type => 'boolean',
        description => "Freeze CPU at startup (use 'c' monitor command to start execution).",
    },
    vga => {
        optional => 1,
        type => 'string',
        description => "Select VGA type. If you want to use high resolution modes (>= 1280x1024x16) then you should use option 'std' or 'vmware'. Default is 'std' for win8/win7/w2k8, and 'cirrus' for other OS types. Option 'qxl' enables the SPICE display server. You can also run without any graphic card using a serial device as terminal.",
        enum => [qw(std cirrus vmware qxl serial0 serial1 serial2 serial3 qxl2 qxl3 qxl4)],
    },
    watchdog => {
        optional => 1,
        type => 'string', format => 'pve-qm-watchdog',
        typetext => '[[model=]i6300esb|ib700] [,[action=]reset|shutdown|poweroff|pause|debug|none]',
        description => "Create a virtual hardware watchdog device. Once enabled (by a guest action), the watchdog must be periodically polled by an agent inside the guest or else the guest will be restarted (or execute the action specified)",
    },
    startdate => {
        optional => 1,
        type => 'string',
        typetext => "(now | YYYY-MM-DD | YYYY-MM-DDTHH:MM:SS)",
        description => "Set the initial date of the real time clock. Valid format for date are: 'now' or '2006-06-17T16:01:21' or '2006-06-17'.",
        pattern => '(now|\d{4}-\d{1,2}-\d{1,2}(T\d{1,2}:\d{1,2}:\d{1,2})?)',
        default => 'now',
    },
    startup => {
        optional => 1,
        type => 'string', format => 'pve-qm-startup',
        typetext => '[[order=]\d+] [,up=\d+] [,down=\d+] ',
        description => "Startup and shutdown behavior. Order is a non-negative number defining the general startup order. Shutdown is done with reverse ordering. Additionally you can set the 'up' or 'down' delay in seconds, which specifies a delay to wait before the next VM is started or stopped.",
    },
    template => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable Template.",
        default => 0,
    },
    args => {
        optional => 1,
        type => 'string',
        description => <<EODESCR,
Note: this option is for experts only. It allows you to pass arbitrary arguments to kvm, for example:

args: -no-reboot -no-hpet
EODESCR
    },
    tablet => {
        optional => 1,
        type => 'boolean',
        default => 1,
        description => "Enable/disable the usb tablet device. This device is usually needed to allow absolute mouse positioning with VNC. Else the mouse runs out of sync with normal VNC clients. If you're running lots of console-only guests on one host, you may consider disabling this to save some context switches. This is turned off by default if you use spice (vga=qxl).",
    },
    migrate_speed => {
        optional => 1,
        type => 'integer',
        description => "Set maximum speed (in MB/s) for migrations. Value 0 is no limit.",
        minimum => 0,
        default => 0,
    },
    migrate_downtime => {
        optional => 1,
        type => 'number',
        description => "Set maximum tolerated downtime (in seconds) for migrations.",
        minimum => 0,
        default => 0.1,
    },
    cdrom => {
        optional => 1,
        type => 'string', format => 'pve-qm-drive',
        typetext => 'volume',
        description => "This is an alias for option -ide2",
    },
    cpu => {
        optional => 1,
        description => "Emulated CPU type.",
        type => 'string',
        enum => [ qw(486 athlon pentium pentium2 pentium3 coreduo core2duo kvm32 kvm64 qemu32 qemu64 phenom Conroe Penryn Nehalem Westmere SandyBridge Haswell Broadwell Opteron_G1 Opteron_G2 Opteron_G3 Opteron_G4 Opteron_G5 host) ],
        default => 'kvm64',
    },
    parent => get_standard_option('pve-snapshot-name', {
        optional => 1,
        description => "Parent snapshot name. This is used internally, and should not be modified.",
    }),
    snaptime => {
        optional => 1,
        description => "Timestamp for snapshots.",
        type => 'integer',
        minimum => 0,
    },
    vmstate => {
        optional => 1,
        type => 'string', format => 'pve-volume-id',
        description => "Reference to a volume which stores the VM state. This is used internally for snapshots.",
    },
    machine => {
        description => "Specify the Qemu machine type.",
        type => 'string',
        pattern => '(pc|pc(-i440fx)?-\d+\.\d+|q35|pc-q35-\d+\.\d+)',
        maxLength => 40,
        optional => 1,
    },
    smbios1 => {
        description => "Specify SMBIOS type 1 fields.",
        type => 'string', format => 'pve-qm-smbios1',
        typetext => "[manufacturer=str][,product=str][,version=str][,serial=str] [,uuid=uuid][,sku=str][,family=str]",
        maxLength => 256,
        optional => 1,
    },
};
448
449# what about other qemu settings ?
450#cpu => 'string',
451#machine => 'string',
452#fda => 'file',
453#fdb => 'file',
454#mtdblock => 'file',
455#sd => 'file',
456#pflash => 'file',
457#snapshot => 'bool',
458#bootp => 'file',
459##tftp => 'dir',
460##smb => 'dir',
461#kernel => 'file',
462#append => 'string',
463#initrd => 'file',
464##soundhw => 'string',
465
# Publish every option defined so far as standard option 'pve-qm-<name>'.
foreach my $opt_name (keys %$confdesc) {
    PVE::JSONSchema::register_standard_option("pve-qm-$opt_name", $confdesc->{$opt_name});
}

# Upper bounds for the indexed option families (ide0..ideN-1, net0.., ...).
my $MAX_IDE_DISKS = 4;
my $MAX_SCSI_DISKS = 14;
my $MAX_VIRTIO_DISKS = 16;
my $MAX_SATA_DISKS = 6;
my $MAX_USB_DEVICES = 5;
my $MAX_NETS = 32;
my $MAX_UNUSED_DISKS = 8;
my $MAX_HOSTPCI_DEVICES = 4;
my $MAX_SERIAL_PORTS = 4;
my $MAX_PARALLEL_PORTS = 3;

# Supported NIC models, plus a sorted, space separated form for help texts.
my $nic_model_list = [
    qw(rtl8139 ne2k_pci e1000 pcnet virtio ne2k_isa i82551 i82557b i82559er vmxnet3)
];
my $nic_model_list_txt = join(' ', sort @$nic_model_list);
1e3baf05 484
1e3baf05
DM
# Schema shared by all netN options; the description lists the NIC models.
my $netdesc = {
    type => 'string', format => 'pve-qm-net',
    optional => 1,
    typetext => "MODEL=XX:XX:XX:XX:XX:XX [,bridge=<dev>][,queues=<nbqueues>][,rate=<mbps>][,tag=<vlanid>][,firewall=0|1]",
    description => <<EODESCR,
Specify network devices.

MODEL is one of: $nic_model_list_txt

XX:XX:XX:XX:XX:XX should be an unique MAC address. This is
automatically generated if not specified.

The bridge parameter can be used to automatically add the interface to a bridge device. The Proxmox VE standard bridge is called 'vmbr0'.

Option 'rate' is used to limit traffic bandwidth from and to this interface. It is specified as floating point number, unit is 'Megabytes per second'.

If you specify no bridge, we create a kvm 'user' (NATed) network device, which provides DHCP and DNS services. The following addresses are used:

10.0.2.2 Gateway
10.0.2.3 DNS Server
10.0.2.4 SMB Server

The DHCP server assign addresses to the guest starting from 10.0.2.15.

EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-net", $netdesc);

# net0 .. net<$MAX_NETS - 1> all share the same schema
foreach my $idx (0 .. $MAX_NETS - 1) {
    $confdesc->{"net$idx"} = $netdesc;
}
516
# Set of valid drive option names; filled where the ideN/sataN/scsiN/virtioN
# options are registered.
my $drivename_hash;

# Syntax summary shared by all drive options (ide, scsi, sata, virtio).
# Kept in one place so the four descriptors cannot drift apart.
my $drive_typetext = '[volume=]volume [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]';

# Schema for the ideN options.
my $idedesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as IDE hard disk or CD-ROM (n is 0 to " .($MAX_IDE_DISKS -1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-ide", $idedesc);

# Schema for the scsiN options.
my $scsidesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as SCSI hard disk or CD-ROM (n is 0 to " . ($MAX_SCSI_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-scsi", $scsidesc);

# Schema for the sataN options.
my $satadesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as SATA hard disk or CD-ROM (n is 0 to " . ($MAX_SATA_DISKS - 1). ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-sata", $satadesc);

# Schema for the virtioN options.
my $virtiodesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as VIRTIO hard disk (n is 0 to " . ($MAX_VIRTIO_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-virtio", $virtiodesc);
550
# Schema shared by all usbN options. The index range in the description is
# derived from $MAX_USB_DEVICES so it cannot go stale.
my $usbdesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-usb-device',
    typetext => 'host=HOSTUSBDEVICE|spice',
    description => <<EODESCR,
Configure a USB device (n is 0 to @{[ $MAX_USB_DEVICES - 1 ]}). This can be used to
pass-through usb devices to the guest. HOSTUSBDEVICE syntax is:

'bus-port(.port)*' (decimal numbers) or
'vendor_id:product_id' (hexadecimal numbers)

You can use the 'lsusb -t' command to list existing usb devices.

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

The value 'spice' can be used to add a usb redirection device for spice.

EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-usb", $usbdesc);
571
040b06b7
DA
# Schema shared by all hostpciN options (PCI pass-through).
my $hostpcidesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-hostpci',
    typetext => "[host=]HOSTPCIDEVICE [,driver=kvm|vfio] [,rombar=on|off] [,pcie=0|1] [,x-vga=on|off]",
    description => <<EODESCR,
Map host pci devices. HOSTPCIDEVICE syntax is:

'bus:dev.func' (hexadecimal numbers)

You can use the 'lspci' command to list existing pci devices.

The 'rombar' option determines whether or not the device's ROM will be visible in the guest's memory map (default is 'on').

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-hostpci", $hostpcidesc);
591
bae179aa
DA
# Schema shared by all serialN options: either a host serial device
# (/dev/ttyS<n>) or the keyword 'socket'.
my $serialdesc = {
    type => 'string',
    pattern => '(/dev/ttyS\d+|socket)',
    optional => 1,
    description => <<EODESCR,
Create a serial device inside the VM (n is 0 to 3), and pass through a host serial device, or create a unix socket on the host side (use 'qm terminal' to open a terminal connection).

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};
bae179aa 604
1989a89c
DA
# Schema shared by all parallelN options.
my $paralleldesc = {
    optional => 1,
    type => 'string',
    # The alternation is grouped, like every other alternation pattern in
    # this file, so that anchors added around the pattern apply to both
    # branches. NOTE(review): assumes the schema validator anchors the
    # pattern - confirm against PVE::JSONSchema.
    pattern => '(/dev/parport\d+|/dev/usb/lp\d+)',
    description => <<EODESCR,
Map host parallel devices (n is 0 to 2).

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};
1989a89c
DA
617
# Add the indexed option families to the config schema. Every index of a
# family shares one descriptor.
$confdesc->{"parallel$_"} = $paralleldesc foreach (0 .. $MAX_PARALLEL_PORTS - 1);

$confdesc->{"serial$_"} = $serialdesc foreach (0 .. $MAX_SERIAL_PORTS - 1);

$confdesc->{"hostpci$_"} = $hostpcidesc foreach (0 .. $MAX_HOSTPCI_DEVICES - 1);

# Drive families are additionally recorded in $drivename_hash.
foreach my $idx (0 .. $MAX_IDE_DISKS - 1) {
    my $drive = "ide$idx";
    $drivename_hash->{$drive} = 1;
    $confdesc->{$drive} = $idedesc;
}

foreach my $idx (0 .. $MAX_SATA_DISKS - 1) {
    my $drive = "sata$idx";
    $drivename_hash->{$drive} = 1;
    $confdesc->{$drive} = $satadesc;
}

foreach my $idx (0 .. $MAX_SCSI_DISKS - 1) {
    my $drive = "scsi$idx";
    $drivename_hash->{$drive} = 1;
    $confdesc->{$drive} = $scsidesc;
}

foreach my $idx (0 .. $MAX_VIRTIO_DISKS - 1) {
    my $drive = "virtio$idx";
    $drivename_hash->{$drive} = 1;
    $confdesc->{$drive} = $virtiodesc;
}

$confdesc->{"usb$_"} = $usbdesc foreach (0 .. $MAX_USB_DEVICES - 1);
653
# Schema shared by all unusedN options.
my $unuseddesc = {
    type => 'string', format => 'pve-volume-id',
    optional => 1,
    description => "Reference to unused volumes.",
};

$confdesc->{"unused$_"} = $unuseddesc foreach (0 .. $MAX_UNUSED_DISKS - 1);
663
# Cached result of kvm_version(); 0 means "not determined yet".
my $kvm_api_version = 0;

# Return the KVM API version reported by /dev/kvm.
# Returns 0 if /dev/kvm cannot be opened. A true ioctl result is cached,
# so the device is only queried until the first success.
sub kvm_version {

    if (!$kvm_api_version) {
        my $dev = IO::File->new("</dev/kvm");
        return 0 if !$dev;

        my $reported = $dev->ioctl(KVM_GET_API_VERSION(), 0);
        $kvm_api_version = $reported if $reported;

        $dev->close();
    }

    return $kvm_api_version;
}
681
# Cached result of kvm_user_version().
my $kvm_user_version;

# Return the version of the 'kvm' binary as printed by 'kvm -help',
# or the string 'unknown' if the output does not start with the expected
# version banner. The result is cached after the first call.
sub kvm_user_version {

    return $kvm_user_version if $kvm_user_version;

    my $help_text = `kvm -help 2>/dev/null`;

    my $banner_found = $help_text =~ m/^QEMU( PC)? emulator version (\d+\.\d+(\.\d+)?)[,\s]/;
    $kvm_user_version = $banner_found ? $2 : 'unknown';

    return $kvm_user_version;
}
699
700my $kernel_has_vhost_net = -c '/dev/vhost-net';
701
# Return the names of all possible drive options.
# The order (ide, scsi, virtio, sata) is important - it is used to
# autoselect the boot disk.
sub disknames {
    return (
        (map("ide$_", 0 .. $MAX_IDE_DISKS - 1)),
        (map("scsi$_", 0 .. $MAX_SCSI_DISKS - 1)),
        (map("virtio$_", 0 .. $MAX_VIRTIO_DISKS - 1)),
        (map("sata$_", 0 .. $MAX_SATA_DISKS - 1)),
    );
}
709
# Return true if $dev is one of the registered drive option names
# (a key of $drivename_hash with a defined value).
sub valid_drivename {
    my ($dev) = @_;

    my $entry = $drivename_hash->{$dev};

    return defined($entry);
}
715
# Return true if $key is a known configuration option
# (a key of $confdesc with a defined value).
sub option_exists {
    my ($key) = @_;

    my $schema = $confdesc->{$key};

    return defined($schema);
}
1e3baf05
DM
720
# Return the array reference holding the supported NIC model names.
# This is the module's own list, not a copy.
sub nic_models {
    my $models = $nic_model_list;

    return $models;
}
724
# Return a hash reference mapping each ostype value to a short,
# human readable name. Every value accepted by the 'ostype' option has an
# entry, including 'solaris'.
sub os_list_description {

    return {
        other => 'Other',
        wxp => 'Windows XP',
        w2k => 'Windows 2000',
        w2k3 => 'Windows 2003',
        w2k8 => 'Windows 2008',
        wvista => 'Windows Vista',
        win7 => 'Windows 7',
        win8 => 'Windows 8/2012',
        l24 => 'Linux 2.4',
        l26 => 'Linux 2.6',
        solaris => 'Solaris/OpenSolaris/OpenIndiana',
    };
}
740
1e3baf05
DM
# Cached result of get_cdrom_path().
my $cdrom_path;

# Return the path of the host CD-ROM device: the first of /dev/cdrom,
# /dev/cdrom1 and /dev/cdrom2 that is a symbolic link. A hit is cached.
# Returns undef if none of them exists as a symlink.
sub get_cdrom_path {

    return $cdrom_path if $cdrom_path;

    foreach my $candidate ('/dev/cdrom', '/dev/cdrom1', '/dev/cdrom2') {
        return $cdrom_path = $candidate if -l $candidate;
    }

    # Explicit result instead of falling off the end of the sub. 'return undef'
    # (not a bare return) keeps a single element in list context, as before.
    return undef;
}
751
# Resolve the 'file' value of a CD-ROM drive to a path:
#   'cdrom'       -> result of get_cdrom_path()
#   'none'        -> empty string
#   absolute path -> returned unchanged
#   anything else -> looked up with PVE::Storage::path()
sub get_iso_path {
    my ($storecfg, $vmid, $cdrom) = @_;

    return get_cdrom_path() if $cdrom eq 'cdrom';

    return '' if $cdrom eq 'none';

    return $cdrom if $cdrom =~ m|^/|;

    return PVE::Storage::path($storecfg, $cdrom);
}
765
# Try to convert old style file names to volume IDs.
# 'none', 'cdrom', /dev/... paths and values that already look like
# 'storage:volume' are returned unchanged. Any other value containing a
# slash yields undef; a plain file name is mapped to the 'local' storage
# ('local:iso/<file>' for cdrom media, 'local:<vmid>/<file>' otherwise).
sub filename_to_volume_id {
    my ($vmid, $file, $media) = @_;

    # nothing to convert
    return $file if $file eq 'none' || $file eq 'cdrom';
    return $file if $file =~ m|^/dev/.+| || $file =~ m/^([^:]+):(.+)$/;

    return undef if $file =~ m|/|;

    my $is_cdrom = $media && $media eq 'cdrom';

    return $is_cdrom ? "local:iso/$file" : "local:$vmid/$file";
}
784
# Check that the content type of a volume ($vtype) fits the drive's media
# setting: 'disk' expects 'images', 'cdrom' expects 'iso'.
# Does nothing when $media is not set. Dies with "internal error" for any
# other media value and raises a parameter exception for $opt on mismatch.
sub verify_media_type {
    my ($opt, $vtype, $media) = @_;

    return if !$media;

    my %expected_for = (disk => 'images', cdrom => 'iso');

    my $etype = $expected_for{$media};
    die "internal error" if !defined($etype);

    return if ($vtype eq $etype);

    raise_param_exc({ $opt => "unexpected media type ($vtype != $etype)" });
}
803
# Normalize the 'file' and 'media' entries of a parsed drive in place.
# A plain filesystem path is converted to a volume ID with
# PVE::Storage::path_to_volume_id(); a parameter exception for $opt is
# raised if no storage matches. Media defaults to 'cdrom' for iso volumes
# and for the special files 'cdrom' and 'none'.
sub cleanup_drive_path {
    my ($opt, $storecfg, $drive) = @_;

    my $file = $drive->{file};

    # values that are not filesystem paths: keywords, devices,
    # volume IDs and plain numbers
    my $keep_as_is = $file =~ m/^(cdrom|none)$/
        || $file =~ m|^/dev/.+|
        || $file =~ m/^([^:]+):(.+)$/
        || $file =~ m/^\d+$/;

    if (!$keep_as_is) {
        # try to convert filesystem paths to volume IDs
        my ($vtype, $volid) = PVE::Storage::path_to_volume_id($storecfg, $drive->{file});
        if (!$vtype) {
            raise_param_exc({ $opt => "unable to associate path '$drive->{file}' to any storage"});
        }
        if (!$drive->{media} && $vtype eq 'iso') {
            $drive->{media} = 'cdrom';
        }
        verify_media_type($opt, $vtype, $drive->{media});
        $drive->{file} = $volid;
    }

    $drive->{media} = 'cdrom' if !$drive->{media} && $drive->{file} =~ m/^(cdrom|none)$/;
}
822
# Write a new configuration file for $vmid from the $settings hash,
# without taking any lock.
# Dies if the file already exists. Missing 'name' and 'memory' settings
# are filled in (this modifies the caller's $settings hash). Only known
# options with a true value are written, one "key: value" line each.
sub create_conf_nolock {
    my ($vmid, $settings) = @_;

    my $filename = config_file($vmid);

    die "configuration file '$filename' already exists\n" if -f $filename;

    my $defaults = load_defaults();

    $settings->{name} ||= "vm$vmid";
    $settings->{memory} ||= $defaults->{memory};

    my @lines =
        map { "$_: $settings->{$_}\n" }
        grep { $confdesc->{$_} && $settings->{$_} }
        keys %$settings;

    my $data = join('', @lines);

    PVE::Tools::file_set_contents($filename, $data);
}
847
f36ed4f4
DM
# Parse a size such as '512', '1.5M' or '2G' into an integer byte count.
# The optional suffix K, M or G multiplies by 1024, 1024^2 or 1024^3.
# Returns undef if the value does not have that form.
my $parse_size = sub {
    my ($value) = @_;

    return undef unless $value =~ m/^(\d+(\.\d+)?)([KMG])?$/;
    my ($number, $suffix) = ($1, $3);

    my %factor_for = (
        K => 1024,
        M => 1024 * 1024,
        G => 1024 * 1024 * 1024,
    );

    $number = $number * $factor_for{$suffix} if $suffix;

    return int($number);
};
864
# Format a byte count using the largest of the units K, M, G that divides
# it evenly (factor 1024 per step). A value that is not a multiple of 1024
# is returned as a plain number. Note that 0 is formatted as '0G'.
my $format_size = sub {
    my ($size) = @_;

    my $amount = int($size);
    my $suffix = '';

    foreach my $unit ('K', 'M', 'G') {
        my $scaled = int($amount / 1024);
        last if $scaled * 1024 != $amount;
        ($amount, $suffix) = ($scaled, $unit);
    }

    return $suffix eq '' ? $amount : "${amount}${suffix}";
};
881
1e3baf05
DM
# ideX = [volume=]volume-id[,media=d][,cyls=c,heads=h,secs=s[,trans=t]]
#        [,snapshot=on|off][,format=f][,backup=yes|no]
#        [,cache=off|none|writethrough|writeback|unsafe|directsync]
#        [,rerror=ignore|report|stop][,werror=enospc|ignore|report|stop]
#        [,aio=native|threads][,discard=ignore|on][,size=n[K|M|G]]
#        [,mbps*=f][,bps*=n][,iops*=n]
#
# Parse a drive property string into a hash reference.
#
# $key  - configuration key such as 'ide0' or 'virtio1'; it is split into
#         {interface} and {index}. May be undef when only the property
#         string itself is to be verified.
# $data - the comma separated property string.
#
# Returns the parsed hash (always containing {file}) or undef when the key
# or any option is invalid. 'volume' is stored as {file}; 'bps', 'bps_rd'
# and 'bps_wr' are stored as 'mbps*' (megabytes, three decimals); {size} is
# converted to bytes.
sub parse_drive {
    my ($key, $data) = @_;

    my $res = {};

    # $key may be undefined - used to verify JSON parameters
    if (!defined($key)) {
        $res->{interface} = 'unknown'; # should not harm when used to verify parameters
        $res->{index} = 0;
    } elsif ($key =~ m/^([^\d]+)(\d+)$/) {
        $res->{interface} = $1;
        $res->{index} = $2;
    } else {
        return undef;
    }

    foreach my $p (split (/,/, $data)) {
        next if $p =~ m/^\s*$/;

        if ($p =~ m/^(file|volume|cyls|heads|secs|trans|media|snapshot|cache|format|rerror|werror|backup|aio|bps|mbps|mbps_max|bps_rd|mbps_rd|mbps_rd_max|bps_wr|mbps_wr|mbps_wr_max|iops|iops_max|iops_rd|iops_rd_max|iops_wr|iops_wr_max|size|discard)=(.+)$/) {
            my ($k, $v) = ($1, $2);

            $k = 'file' if $k eq 'volume';

            if ($k eq 'bps' || $k eq 'bps_rd' || $k eq 'bps_wr') {
                # the whole value has to be numeric, not just its beginning
                return undef if !$v || $v !~ m/^\d+(\.\d+)?$/;
                $k = "m$k";
                $v = sprintf("%.3f", $v / (1024*1024));
            }

            # checked after alias handling, so that e.g. 'bps' and 'mbps'
            # are recognized as the same option given twice
            return undef if defined $res->{$k};

            $res->{$k} = $v;
        } else {
            # a single value without '=' is the volume itself
            if (!$res->{file} && $p !~ m/=/) {
                $res->{file} = $p;
            } else {
                return undef;
            }
        }
    }

    return undef if !$res->{file};

    # a known file extension determines the image format
    if ($res->{file} =~ m/\.(raw|cow|qcow|qcow2|vmdk|cloop)$/) {
        $res->{format} = $1;
    }

    my $integer = qr/^\d+$/;
    my $decimal = qr/^\d+(\.\d+)?$/;
    my %pattern_for = (
        cache => qr/^(off|none|writethrough|writeback|unsafe|directsync)$/,
        snapshot => qr/^(on|off)$/,
        cyls => $integer,
        heads => $integer,
        secs => $integer,
        media => qr/^(disk|cdrom)$/,
        trans => qr/^(none|lba|auto)$/,
        format => qr/^(raw|cow|qcow|qcow2|vmdk|cloop)$/,
        rerror => qr/^(ignore|report|stop)$/,
        werror => qr/^(enospc|ignore|report|stop)$/,
        backup => qr/^(yes|no)$/,
        aio => qr/^(native|threads)$/,
        discard => qr/^(ignore|on)$/,
        mbps => $decimal,
        mbps_max => $decimal,
        mbps_rd => $decimal,
        mbps_rd_max => $decimal,
        mbps_wr => $decimal,
        mbps_wr_max => $decimal,
        iops => $integer,
        iops_max => $integer,
        iops_rd => $integer,
        iops_rd_max => $integer,
        iops_wr => $integer,
        iops_wr_max => $integer,
    );

    # only options with a true value are validated
    foreach my $opt (keys %pattern_for) {
        my $value = $res->{$opt};
        return undef if $value && $value !~ $pattern_for{$opt};
    }

    # a total limit excludes separate read/write limits
    return undef if $res->{mbps_rd} && $res->{mbps};
    return undef if $res->{mbps_wr} && $res->{mbps};
    return undef if $res->{iops_rd} && $res->{iops};
    return undef if $res->{iops_wr} && $res->{iops};

    if ($res->{size}) {
        return undef if !defined($res->{size} = &$parse_size($res->{size}));
    }

    if ($res->{media} && ($res->{media} eq 'cdrom')) {
        return undef if $res->{snapshot} || $res->{trans} || $res->{format};
        return undef if $res->{heads} || $res->{secs} || $res->{cyls};
        return undef if $res->{interface} eq 'virtio';
    }

    # rerror does not work with scsi drives
    if ($res->{rerror}) {
        return undef if $res->{interface} eq 'scsi';
    }

    return $res;
}
988
my @qemu_drive_options = qw(heads secs cyls trans media format cache snapshot rerror werror aio discard iops iops_rd iops_wr iops_max iops_rd_max iops_wr_max);

# Serialize a parsed drive hash back into its configuration file form:
# the volume followed by ",option=value" for every option with a true
# value, and the size (formatted with a unit suffix) last.
sub print_drive {
    my ($vmid, $drive) = @_;

    my @names = (
        @qemu_drive_options,
        'mbps', 'mbps_rd', 'mbps_wr', 'mbps_max', 'mbps_rd_max', 'mbps_wr_max', 'backup',
    );

    my @settings = map { "$_=$drive->{$_}" } grep { $drive->{$_} } @names;

    push @settings, "size=" . &$format_size($drive->{size}) if $drive->{size};

    return join(',', "$drive->{file}", @settings);
}
1005
28ef82d3
DM
# Send a SCSI INQUIRY to an open file handle using the Linux SG_IO ioctl.
#
# $fh    - open handle of the device to query
# $noerr - when true, failures return undef instead of raising an error
#
# Returns a hash with vendor, product, revision, removable (0/1) and type
# (the low five bits of the first response byte).
sub scsi_inquiry {
    my($fh, $noerr) = @_;

    my $SG_IO = 0x2285;
    my $SG_GET_VERSION_NUM = 0x2282;

    # common failure path: raise the error unless the caller asked for silence
    my $fail = sub {
        my ($msg) = @_;
        die $msg if !$noerr;
        return undef;
    };

    my $versionbuf = "\x00" x 8;
    ioctl($fh, $SG_GET_VERSION_NUM, $versionbuf)
        or return $fail->("scsi ioctl SG_GET_VERSION_NUM failoed - $!\n");

    my $version = unpack("I", $versionbuf);
    return $fail->("scsi generic interface too old\n") if $version < 30000;

    my $buf = "\x00" x 36;
    my $sensebuf = "\x00" x 8;
    my $cmd = pack("C x3 C x1", 0x12, 36);

    # see /usr/include/scsi/sg.h
    my $sg_io_hdr_t = "i i C C s I P P P I I i P C C C C S S i I I";

    my $packet = pack($sg_io_hdr_t, ord('S'), -3, length($cmd),
                      length($sensebuf), 0, length($buf), $buf,
                      $cmd, $sensebuf, 6000);

    ioctl($fh, $SG_IO, $packet)
        or return $fail->("scsi ioctl SG_IO failed - $!\n");

    my @hdr = unpack($sg_io_hdr_t, $packet);
    return $fail->("scsi ioctl SG_IO status error - $!\n") if $hdr[17] || $hdr[18];

    my ($byte0, $byte1, $vendor, $product, $revision) =
        unpack("C C x6 A8 A16 A4", $buf);

    return {
        vendor => $vendor,
        product => $product,
        revision => $revision,
        removable => ($byte1 & 128) ? 1 : 0,
        type => $byte0 & 31,
    };
}
1056
# Probe whether $path refers to a SCSI device.
#
# Opens the path read/write and runs scsi_inquiry() on it with errors
# suppressed. Returns the inquiry result hash, or undef when the path
# cannot be opened or the inquiry fails.
sub path_is_scsi {
    my ($path) = @_;

    # Pass the mode as a separate argument: IO::File then uses a
    # three-argument open, so characters in $path are never interpreted
    # as part of the open mode.
    my $fh = IO::File->new($path, '+<') || return undef;
    my $res = scsi_inquiry($fh, 1);
    close($fh);

    return $res;
}
1066
db656e5f
DM
# Returns 1 when the configured machine type contains 'q35', otherwise 0.
sub machine_type_is_q35 {
    my ($conf) = @_;

    my $machine = $conf->{machine};
    return 0 if !$machine;

    return ($machine =~ m/q35/) ? 1 : 0;
}
1072
# Build the device string for the USB tablet (absolute pointer) device.
sub print_tabletdevice_full {
    my ($conf) = @_;

    # we use uhci for old VMs because tablet driver was buggy in older qemu
    my $usbbus = 'uhci';
    $usbbus = 'ehci' if machine_type_is_q35($conf);

    return "usb-tablet,id=tablet,bus=$usbbus.0,port=1";
}
1083
# Build the device string for a drive.
#
# The result depends on the drive interface (virtio, scsi, ide, sata).
# For scsi drives the device type is chosen from the media type, the
# volume path and, for other paths, a SCSI inquiry of the path. Dies for
# 'usb' (not implemented) and for unknown interfaces.
sub print_drivedevice_full {
    my ($storecfg, $conf, $vmid, $drive, $bridges) = @_;

    my $interface = $drive->{interface};
    my $index = $drive->{index};
    my $id = "$interface$index";

    my $device = '';

    if ($interface eq 'virtio') {
        my $pciaddr = print_pci_addr($id, $bridges);
        $device = "virtio-blk-pci,drive=drive-$id,id=$id$pciaddr";
    } elsif ($interface eq 'scsi') {
        # lsi controllers (the default) are limited to 7 devices each
        my $lsi = !$conf->{scsihw} || ($conf->{scsihw} =~ m/^lsi/);
        my $maxdev = $lsi ? 7 : 256;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;

        my $devicetype = 'hd';
        if (drive_is_cdrom($drive)) {
            $devicetype = 'cd';
        } else {
            my $file = $drive->{file};
            my $path = ($file =~ m|^/|) ? $file : PVE::Storage::path($storecfg, $file);

            if ($path =~ m/^iscsi\:\/\//) {
                $devicetype = 'generic';
            } elsif (my $info = path_is_scsi($path)) {
                if ($info->{type} == 0) {
                    $devicetype = 'block';
                } elsif ($info->{type} == 1) { # tape
                    $devicetype = 'generic';
                }
            }
        }

        if ($lsi) {
            $device = "scsi-$devicetype,bus=scsihw$controller.0,scsi-id=$unit,drive=drive-$id,id=$id";
        } else {
            $device = "scsi-$devicetype,bus=scsihw$controller.0,channel=0,scsi-id=0,lun=$index,drive=drive-$id,id=$id";
        }
    } elsif ($interface eq 'ide') {
        my $maxdev = 2;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;
        my $devicetype = ($drive->{media} && $drive->{media} eq 'cdrom') ? "cd" : "hd";

        $device = "ide-$devicetype,bus=ide.$controller,unit=$unit,drive=drive-$id,id=$id";
    } elsif ($interface eq 'sata') {
        my $controller = int($index / $MAX_SATA_DISKS);
        my $unit = $index % $MAX_SATA_DISKS;
        $device = "ide-drive,bus=ahci$controller.$unit,drive=drive-$id,id=$id";
    } elsif ($interface eq 'usb') {
        die "implement me";
        # -device ide-drive,bus=ide.1,unit=0,drive=drive-ide0-1-0,id=ide0-1-0
    } else {
        die "unsupported interface type";
    }

    $device .= ",bootindex=$drive->{bootindex}" if $drive->{bootindex};

    return $device;
}
1149
# Read the iSCSI initiator name from /etc/iscsi/initiatorname.iscsi.
# Returns the first InitiatorName value found, or undef when the file
# cannot be opened or contains no such entry.
sub get_initiator_name {
    my $fh = IO::File->new('/etc/iscsi/initiatorname.iscsi') || return undef;

    my $initiator;
    while (defined(my $line = <$fh>)) {
        if ($line =~ m/^\s*InitiatorName\s*=\s*([\.\-:\w]+)/) {
            $initiator = $1;
            last;
        }
    }
    $fh->close();

    return $initiator;
}
1163
1e3baf05
DM
# Build the drive definition string ("file=...,if=none,id=drive-...") for
# a parsed drive hash.
#
# Throughput limits stored as 'mbps*' are converted back to bytes per
# second, 'aio=native' and (for non-cdrom drives) 'cache=none' are added
# when not set explicitly.
sub print_drive_full {
    my ($storecfg, $vmid, $drive) = @_;

    my @settings;
    foreach my $name (grep { $_ ne 'bootindex' } @qemu_drive_options) {
        push @settings, "$name=$drive->{$name}" if $drive->{$name};
    }

    foreach my $limit (qw(bps bps_rd bps_wr)) {
        my $mbytes = $drive->{"m$limit"};
        push @settings, "$limit=" . int($mbytes*1024*1024) if $mbytes;
    }

    # use linux-aio by default (qemu default is threads)
    push @settings, "aio=native" if !$drive->{aio};

    my $volid = $drive->{file};
    my $path;
    if (drive_is_cdrom($drive)) {
        $path = get_iso_path($storecfg, $vmid, $volid);
    } elsif ($volid =~ m|^/|) {
        $path = $volid;
    } else {
        $path = PVE::Storage::path($storecfg, $volid);
    }

    push @settings, "cache=none" if !$drive->{cache} && !drive_is_cdrom($drive);

    # the file part is omitted when no path is available
    my @file_part = $path ? ("file=$path") : ();

    return join(',', @file_part, "if=none",
                "id=drive-$drive->{interface}$drive->{index}", @settings);
}
1199
# Build the device string for a network card.
#
# 'virtio' is mapped to 'virtio-net-pci'. The PXE rom is disabled unless
# the boot order contains 'n'. Multiqueue virtio cards get matching
# 'vectors' and 'mq=on' settings.
sub print_netdevice_full {
    my ($vmid, $conf, $net, $netid, $bridges) = @_;

    my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};

    my $is_virtio = $net->{model} eq 'virtio';
    my $device = $is_virtio ? 'virtio-net-pci' : $net->{model};

    # qemu > 0.15 always try to boot from network - we disable that by
    # not loading the pxe rom file
    my $extra = '';
    $extra = "romfile=," if $bootorder !~ m/n/;

    my $pciaddr = print_pci_addr("$netid", $bridges);
    my $tmpstr = "$device,${extra}mac=$net->{macaddr},netdev=$netid$pciaddr,id=$netid";

    if ($net->{queues} && $net->{queues} > 1 && $is_virtio) {
        #Consider we have N queues, the number of vectors needed is 2*N + 2 (plus one config interrupt and control vq)
        my $vectors = $net->{queues} * 2 + 2;
        $tmpstr .= ",vectors=$vectors,mq=on";
    }

    $tmpstr .= ",bootindex=$net->{bootindex}" if $net->{bootindex};

    return $tmpstr;
}
1223
# Build the netdev definition string for a network card.
#
# $netid must have the form 'net<N>' with N below $MAX_NETS. Bridged
# cards use a tap device named "tap<vmid>i<N>", everything else uses user
# mode networking. Dies when the id is invalid or the resulting interface
# name is too long.
sub print_netdev_full {
    my ($vmid, $conf, $net, $netid) = @_;

    # An id that does not look like 'net<N>' must be rejected as well,
    # otherwise an interface name without index would be generated.
    my ($i) = $netid =~ m/^net(\d+)$/;
    die "got strange net id '$netid'\n" if !defined($i) || $i >= $MAX_NETS;
    $i = int($i);

    my $ifname = "tap${vmid}i$i";

    # kvm uses TUNSETIFF ioctl, and that limits ifname length
    die "interface name '$ifname' is too long (max 15 character)\n"
        if length($ifname) >= 16;

    my $vhostparam = '';
    $vhostparam = ',vhost=on' if $kernel_has_vhost_net && $net->{model} eq 'virtio';

    my $vmname = $conf->{name} || "vm$vmid";

    my $netdev = "";

    if ($net->{bridge}) {
        $netdev = "type=tap,id=$netid,ifname=${ifname},script=/var/lib/qemu-server/pve-bridge,downscript=/var/lib/qemu-server/pve-bridgedown$vhostparam";
    } else {
        $netdev = "type=user,id=$netid,hostname=$vmname";
    }

    $netdev .= ",queues=$net->{queues}" if ($net->{queues} && $net->{model} eq 'virtio');

    return $netdev;
}
1e3baf05
DM
1257
# True when the parsed drive hash describes a cdrom (media eq 'cdrom').
# A missing drive or media yields that false value unchanged.
sub drive_is_cdrom {
    my ($drive) = @_;

    return $drive if !$drive;

    my $media = $drive->{media};
    return $media if !$media;

    return $media eq 'cdrom';
}
1264
040b06b7
DA
# Parse a hostpci property string.
#
# Recognized parts: [host=]<bus>:<slot>[.<function>], driver=kvm|vfio,
# rombar=on|off, x-vga=on|off and pcie=<number>. Unknown parts only
# produce a warning. Without an explicit function the device list is
# taken from lspci().
#
# Returns the parsed hash, or undef when the value is empty or contains
# no PCI address.
sub parse_hostpci {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};
    my $found;

    foreach my $kv (split(/,/, $value)) {
        if ($kv =~ m/^(host=)?([a-f0-9]{2}:[a-f0-9]{2})(\.([a-f0-9]))?$/) {
            my ($id, $function) = ($2, $4);
            $found = 1;
            if (defined($function)) {
                push @{$res->{pciid}}, { id => $id , function => $function};
            } else {
                my $pcidevices = lspci($id);
                $res->{pciid} = $pcidevices->{$id};
            }
            next;
        }

        if ($kv =~ m/^driver=(kvm|vfio)$/) {
            $res->{driver} = $1;
        } elsif ($kv =~ m/^rombar=(on|off)$/) {
            $res->{rombar} = $1;
        } elsif ($kv =~ m/^x-vga=(on|off)$/) {
            $res->{'x-vga'} = $1;
        } elsif ($kv =~ m/^pcie=(\d+)$/) {
            $res->{pcie} = 1 if $1 == 1;
        } else {
            warn "unknown hostpci setting '$kv'\n";
        }
    }

    return undef if !$found;

    return $res;
}
1303
1e3baf05
DM
# netX: e1000=XX:XX:XX:XX:XX:XX,bridge=vmbr0,rate=<mbps>
#
# Parse a network card property string. The model part is mandatory; a
# missing MAC address is replaced by a random one. Returns the parsed
# hash, or undef on any unknown or malformed part.
sub parse_net {
    my ($data) = @_;

    # simple "name=value" parts and the pattern their value has to match
    my @simple_options = (
        [ bridge => qr/^bridge=(\S+)$/ ],
        [ queues => qr/^queues=(\d+)$/ ],
        [ rate => qr/^rate=(\d+(\.\d+)?)$/ ],
        [ tag => qr/^tag=(\d+)$/ ],
        [ firewall => qr/^firewall=(\d+)$/ ],
    );

    my $res = {};

    PART: foreach my $kvp (split(/,/, $data)) {
        if ($kvp =~ m/^(ne2k_pci|e1000|rtl8139|pcnet|virtio|ne2k_isa|i82551|i82557b|i82559er|vmxnet3)(=([0-9a-f]{2}(:[0-9a-f]{2}){5}))?$/i) {
            $res->{model} = lc($1);
            $res->{macaddr} = defined($3) ? uc($3) : PVE::Tools::random_ether_addr();
            next PART;
        }

        foreach my $option (@simple_options) {
            my ($name, $pattern) = @$option;
            if ($kvp =~ $pattern) {
                $res->{$name} = $1;
                next PART;
            }
        }

        return undef;
    }

    return undef if !$res->{model};

    return $res;
}
1337
# Serialize a parsed network card hash (see parse_net) back into its
# configuration file form. Only options with a true value are written.
sub print_net {
    my $net = shift;

    my $res = "$net->{model}";
    $res .= "=$net->{macaddr}" if $net->{macaddr};
    $res .= ",bridge=$net->{bridge}" if $net->{bridge};
    $res .= ",rate=$net->{rate}" if $net->{rate};
    $res .= ",tag=$net->{tag}" if $net->{tag};
    $res .= ",firewall=$net->{firewall}" if $net->{firewall};
    # parse_net accepts 'queues', so it has to survive a parse/print round trip
    $res .= ",queues=$net->{queues}" if $net->{queues};

    return $res;
}
1350
# Rewrite every parsable 'netN' entry of $settings through
# parse_net()/print_net(), which fills in a MAC address where none was
# given. Entries that cannot be parsed are left untouched.
sub add_random_macs {
    my ($settings) = @_;

    my @net_keys = grep { $_ =~ m/^net(\d+)$/ } keys %$settings;

    foreach my $opt (@net_keys) {
        my $net = parse_net($settings->{$opt});
        $settings->{$opt} = print_net($net) if $net;
    }
}
1361
# Record $volid under the lowest free 'unusedN' key of $config.
#
# Returns the key used. Returns nothing when the volume is already
# recorded, and dies when all slots are occupied.
sub add_unused_volume {
    my ($config, $volid) = @_;

    my $free_key;

    # walk downwards, so that the last free slot seen is the lowest one
    foreach my $ind (reverse(0 .. $MAX_UNUSED_DISKS - 1)) {
        my $candidate = "unused$ind";
        my $vid = $config->{$candidate};
        if (!$vid) {
            $free_key = $candidate;
            next;
        }
        return if $vid eq $volid; # do not add duplicates
    }

    die "To many unused volume - please delete them first.\n" if !$free_key;

    $config->{$free_key} = $volid;

    return $free_key;
}
1381
2796e7d5
DM
# Allowed smbios (type 1) options and the pattern their value has to match.
my $valid_smbios1_options = {
    manufacturer => '\S+',
    product => '\S+',
    version => '\S+',
    serial => '\S+',
    uuid => '[a-fA-F0-9]{8}(?:-[a-fA-F0-9]{4}){3}-[a-fA-F0-9]{12}',
    sku => '\S+',
    family => '\S+',
};

# smbios: [manufacturer=str][,product=str][,version=str][,serial=str][,uuid=uuid][,sku=str][,family=str]
#
# Parse an smbios (type 1) property string into a hash of option => value.
# Returns undef when a part is malformed, names an unknown option or has a
# value that does not match the pattern of that option.
sub parse_smbios1 {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        return undef if $kvp !~ m/^(\S+)=(.+)$/;
        # split at the first '=' only - the value itself may contain '='
        my ($k, $v) = split(/=/, $kvp, 2);
        return undef if !defined($k) || !defined($v);
        return undef if !$valid_smbios1_options->{$k};
        return undef if $v !~ m/^$valid_smbios1_options->{$k}$/;
        $res->{$k} = $v;
    }

    return $res;
}
1409
cd11416f
DM
# Serialize an smbios (type 1) hash into its "key=value,..." form.
# Undefined values and unknown options are skipped. Keys are written in
# sorted order, so that the same settings always give the same string.
sub print_smbios1 {
    my ($smbios1) = @_;

    my @pairs;
    foreach my $k (sort keys %$smbios1) {
        next if !defined($smbios1->{$k});
        next if !$valid_smbios1_options->{$k};
        push @pairs, "$k=$smbios1->{$k}";
    }

    return join(',', @pairs);
}
1422
2796e7d5
DM
PVE::JSONSchema::register_format('pve-qm-smbios1', \&verify_smbios1);
# Format check for 'pve-qm-smbios1': returns $value when it parses,
# otherwise dies - or returns undef when $noerr is set.
sub verify_smbios1 {
    my ($value, $noerr) = @_;

    if (!parse_smbios1($value)) {
        die "unable to parse smbios (type 1) options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1433
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-bootdisk', \&verify_bootdisk);
# Format check for 'pve-qm-bootdisk': returns $value when it is a valid
# drive name, otherwise dies - or returns undef when $noerr is set.
sub verify_bootdisk {
    my ($value, $noerr) = @_;

    if (!valid_drivename($value)) {
        die "invalid boot disk '$value'\n" if !$noerr;
        return undef;
    }

    return $value;
}
1444
PVE::JSONSchema::register_format('pve-qm-net', \&verify_net);
# Format check for 'pve-qm-net': returns $value when it parses,
# otherwise dies - or returns undef when $noerr is set.
sub verify_net {
    my ($value, $noerr) = @_;

    if (!parse_net($value)) {
        die "unable to parse network options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1455
PVE::JSONSchema::register_format('pve-qm-drive', \&verify_drive);
# Format check for 'pve-qm-drive': returns $value when it parses (without
# a drive key), otherwise dies - or returns undef when $noerr is set.
sub verify_drive {
    my ($value, $noerr) = @_;

    if (!parse_drive(undef, $value)) {
        die "unable to parse drive options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1466
PVE::JSONSchema::register_format('pve-qm-hostpci', \&verify_hostpci);
# Format check for 'pve-qm-hostpci': returns $value when it parses,
# otherwise dies - or returns undef when $noerr is set.
sub verify_hostpci {
    my ($value, $noerr) = @_;

    if (!parse_hostpci($value)) {
        die "unable to parse pci id\n" if !$noerr;
        return undef;
    }

    return $value;
}
1477
0ea9541d
DM
PVE::JSONSchema::register_format('pve-qm-watchdog', \&verify_watchdog);
# Format check for 'pve-qm-watchdog': returns $value when it parses,
# otherwise dies - or returns undef when $noerr is set.
sub verify_watchdog {
    my ($value, $noerr) = @_;

    if (!parse_watchdog($value)) {
        die "unable to parse watchdog options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1488
# Parse a watchdog property string: [model=]i6300esb|ib700 and
# [action=]reset|shutdown|poweroff|pause|debug|none, comma separated.
# Returns the parsed hash, or undef when the value is empty or contains
# an unknown part.
sub parse_watchdog {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};

    foreach my $part (grep { $_ !~ m/^\s*$/ } split(/,/, $value)) {
        if ($part =~ m/^(model=)?(i6300esb|ib700)$/) {
            $res->{model} = $2;
            next;
        }
        if ($part =~ m/^(action=)?(reset|shutdown|poweroff|pause|debug|none)$/) {
            $res->{action} = $2;
            next;
        }
        return undef;
    }

    return $res;
}
1510
59411c4e
DM
PVE::JSONSchema::register_format('pve-qm-startup', \&verify_startup);
# Format check for 'pve-qm-startup': returns $value when it parses,
# otherwise dies - or returns undef when $noerr is set.
sub verify_startup {
    my ($value, $noerr) = @_;

    if (!parse_startup($value)) {
        die "unable to parse startup options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1521
# Parse a startup property string: [order=]<n>, up=<n> and down=<n>,
# comma separated. Returns the parsed hash, or undef when the value is
# empty or contains an unknown part.
sub parse_startup {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};

    foreach my $part (grep { $_ !~ m/^\s*$/ } split(/,/, $value)) {
        if ($part =~ m/^(order=)?(\d+)$/) {
            $res->{order} = $2;
            next;
        }
        if ($part =~ m/^up=(\d+)$/) {
            $res->{up} = $1;
            next;
        }
        if ($part =~ m/^down=(\d+)$/) {
            $res->{down} = $1;
            next;
        }
        return undef;
    }

    return $res;
}
1545
1e3baf05
DM
# Parse a USB device property string.
#
# Accepted parts: host=<vendor>:<product> (hex, optional 0x prefix),
# host=<bus>-<port>[.<port>...] and 'spice'. Returns the parsed hash, or
# undef when the value is empty or contains any other part.
sub parse_usb_device {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};
    my $found;

    foreach my $part (split(/,/, $value)) {
        if ($part =~ m/^host=(0x)?([0-9A-Fa-f]{4}):(0x)?([0-9A-Fa-f]{4})$/) {
            @$res{qw(vendorid productid)} = ($2, $4);
        } elsif ($part =~ m/^host=(\d+)\-(\d+(\.\d+)*)$/) {
            @$res{qw(hostbus hostport)} = ($1, $2);
        } elsif ($part =~ m/^spice$/) {
            $res->{spice} = 1;
        } else {
            return undef;
        }
        $found = 1;
    }

    return undef if !$found;

    return $res;
}
19672434 1575
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-usb-device', \&verify_usb_device);
# Format check for 'pve-qm-usb-device': returns $value when it parses,
# otherwise dies - or returns undef when $noerr is set.
sub verify_usb_device {
    my ($value, $noerr) = @_;

    if (!parse_usb_device($value)) {
        die "unable to parse usb device\n" if !$noerr;
        return undef;
    }

    return $value;
}
1586
1e3baf05
DM
# add JSON properties for create and set function
#
# Copies every entry of $confdesc except 'parent', 'snaptime' and
# 'vmstate' into the given property hash and returns that hash.
sub json_config_properties {
    my $prop = shift;

    my %excluded = map { $_ => 1 } qw(parent snaptime vmstate);

    foreach my $opt (grep { !$excluded{$_} } keys %$confdesc) {
        $prop->{$opt} = $confdesc->{$opt};
    }

    return $prop;
}
1598
# Validate $value against the type (and format) declared for $key in
# $confdesc and return the normalized value.
#
# Booleans become 1/0, integers are converted with int(), plain strings
# lose one pair of surrounding double quotes. Dies on unknown keys,
# undefined values, values containing line breaks and failed checks.
sub check_type {
    my ($key, $value) = @_;

    my $desc = $confdesc->{$key};
    die "unknown setting '$key'\n" if !$desc;

    my $type = $desc->{type};

    die "got undefined value\n" if !defined($value);
    die "property contains a line feed\n" if $value =~ m/[\n\r]/;

    if ($type eq 'boolean') {
        return 1 if ($value eq '1') || ($value =~ m/^(on|yes|true)$/i);
        return 0 if ($value eq '0') || ($value =~ m/^(off|no|false)$/i);
        die "type check ('boolean') failed - got '$value'\n";
    }

    if ($type eq 'integer') {
        return int($1) if $value =~ m/^(\d+)$/;
        die "type check ('integer') failed - got '$value'\n";
    }

    if ($type eq 'number') {
        return $value if $value =~ m/^(\d+)(\.\d+)?$/;
        die "type check ('number') failed - got '$value'\n";
    }

    if ($type eq 'string') {
        my $fmt = $desc->{format};
        if (!$fmt) {
            $value =~ s/^\"(.*)\"$/$1/;
            return $value;
        }
        if ($fmt eq 'pve-qm-drive') {
            # special case - we need to pass $key to parse_drive()
            return $value if parse_drive($key, $value);
            die "unable to parse drive options\n";
        }
        PVE::JSONSchema::check_format($fmt, $value);
        return $value;
    }

    die "internal error"
}
1641
191435c6
DM
# Call lock_file() on the lock file of VM $vmid with the given timeout,
# code reference and parameters. Re-raises any error left in $@ and
# returns the result of lock_file().
sub lock_config_full {
    my ($vmid, $timeout, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);
    my $result = lock_file($lockfile, $timeout, $code, @param);

    die $@ if $@;

    return $result;
}
1653
4e4f83fe
DM
# Like lock_config_full(), but calls lock_file_full() and passes the
# $shared flag on to it.
sub lock_config_mode {
    my ($vmid, $timeout, $shared, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);
    my $result = lock_file_full($lockfile, $timeout, $shared, $code, @param);

    die $@ if $@;

    return $result;
}
1665
191435c6
DM
# Shortcut for lock_config_full() with a timeout of 10.
sub lock_config {
    my ($vmid, $code, @param) = @_;

    my $timeout = 10;
    return lock_config_full($vmid, $timeout, $code, @param);
}
1671
# Path of the configuration file of VM $vmid relative to the cluster file
# system. $node defaults to $nodename.
sub cfs_config_path {
    my ($vmid, $node) = @_;

    $node ||= $nodename;

    return "nodes/$node/qemu-server/$vmid.conf";
}
1678
040b06b7
DA
# Placeholder: always reports IOMMU support as available.
sub check_iommu_support {
    #fixme : need to check IOMMU support
    #http://www.linux-kvm.org/page/How_to_assign_devices_with_VT-d_in_KVM

    return 1;
}
1687
# Absolute path (below /etc/pve) of the configuration file of VM $vmid on
# $node.
sub config_file {
    my ($vmid, $node) = @_;

    return "/etc/pve/" . cfs_config_path($vmid, $node);
}
1694
# Path of the lock file used to serialize changes to the configuration of
# VM $vmid.
sub config_file_lock {
    my ($vmid) = @_;

    return join('/', $lock_dir, "lock-$vmid.conf");
}
1700
# Set access and modification time of the configuration file of VM $vmid
# to the current time.
sub touch_config {
    my ($vmid) = @_;

    my $path = config_file($vmid);
    utime(undef, undef, $path);
}
1707
# Remove VM $vmid: free the volumes owned by it and delete its
# configuration file (or replace it by a minimal one when
# $keep_empty_config is set). Dies when the configuration is locked;
# errors while freeing leftover volumes only produce warnings.
sub destroy_vm {
    my ($storecfg, $vmid, $keep_empty_config) = @_;

    my $conffile = config_file($vmid);
    my $conf = load_config($vmid);

    check_lock($conf);

    # only remove disks owned by this VM
    my $free_owned_volume = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};
        return if !$volid || $volid =~ m|^/|;

        my ($path, $owner) = PVE::Storage::path($storecfg, $volid);
        return if !$path || !$owner || ($owner != $vmid);

        PVE::Storage::vdisk_free($storecfg, $volid);
    };
    foreach_drive($conf, $free_owned_volume);

    if ($keep_empty_config) {
        PVE::Tools::file_set_contents($conffile, "memory: 128\n");
    } else {
        unlink $conffile;
    }

    # also remove unused disk
    eval {
        my $dl = PVE::Storage::vdisk_list($storecfg, undef, $vmid);

        eval {
            PVE::Storage::foreach_volid($dl, sub {
                my ($volid, $sid, $volname, $d) = @_;
                PVE::Storage::vdisk_free($storecfg, $volid);
            });
        };
        warn $@ if $@;
    };
    warn $@ if $@;
}
1754
# Read the configuration of VM $vmid (optionally from $node) through
# PVE::Cluster::cfs_read_file. Dies when no configuration is returned.
sub load_config {
    my ($vmid, $node) = @_;

    my $conf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid, $node));
    return $conf if defined($conf);

    die "no such VM ('$vmid')\n";
}
1e3baf05
DM
1766
# Parse the raw text of a VM configuration file.
#
# $filename - path of the file; has to end in /qemu-server/<vmid>.conf
# $raw      - file content, undef yields undef
#
# Returns a hash with the settings of the current configuration, a
# 'digest' (SHA1 of the raw text) and 'snapshots', which maps each
# "[name]" section to its own settings hash. Comment lines and
# 'description' entries are collected into {description}. Values that
# fail the type check are skipped with a warning.
sub parse_vm_config {
    my ($filename, $raw) = @_;

    return undef if !defined($raw);

    my $res = {
        digest => Digest::SHA::sha1_hex($raw),
        snapshots => {},
    };

    $filename =~ m|/qemu-server/(\d+)\.conf$|
        || die "got strange filename '$filename'";

    my $vmid = $1;

    # $conf points to the section currently being filled
    my $conf = $res;
    my $descr = '';

    my @lines = split(/\n/, $raw);
    foreach my $line (@lines) {
        next if $line =~ m/^\s*$/;

        if ($line =~ m/^\[([a-z][a-z0-9_\-]+)\]\s*$/i) {
            # start of a snapshot section - close the previous section
            my $snapname = $1;
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{snapshots}->{$snapname} = {};
            next;
        }

        if ($line =~ m/^\#(.*)\s*$/) {
            $descr .= PVE::Tools::decode_text($1) . "\n";
            next;
        }

        if ($line =~ m/^(description):\s*(.*\S)\s*$/) {
            $descr .= PVE::Tools::decode_text($2);
        } elsif ($line =~ m/^snapstate:\s*(prepare|delete)\s*$/) {
            # anchored, so that other settings whose value merely ends in
            # "snapstate: ..." are not mistaken for a snapstate entry
            $conf->{snapstate} = $1;
        } elsif ($line =~ m/^(args):\s*(.*\S)\s*$/) {
            my $key = $1;
            my $value = $2;
            $conf->{$key} = $value;
        } elsif ($line =~ m/^([a-z][a-z_]*\d*):\s*(\S+)\s*$/) {
            my $key = $1;
            my $value = $2;
            eval { $value = check_type($key, $value); };
            if ($@) {
                warn "vm $vmid - unable to parse value of '$key' - $@";
            } else {
                my $fmt = $confdesc->{$key}->{format};
                if ($fmt && $fmt eq 'pve-qm-drive') {
                    # normalize the volume of drive entries
                    my $v = parse_drive($key, $value);
                    if (my $volid = filename_to_volume_id($vmid, $v->{file}, $v->{media})) {
                        $v->{file} = $volid;
                        $value = print_drive($vmid, $v);
                    } else {
                        warn "vm $vmid - unable to parse value of '$key'\n";
                        next;
                    }
                }

                if ($key eq 'cdrom') {
                    $conf->{ide2} = $value;
                } else {
                    $conf->{$key} = $value;
                }
            }
        }
    }

    $conf->{description} = $descr if $descr;

    delete $res->{snapstate}; # just to be sure

    return $res;
}
1844
1858638f
DM
# Convert a VM configuration hash into the raw text of its configuration
# file.
#
# The hash is normalized in place: 'cdrom' is stored as 'ide2', 'smp' is
# replaced by 'sockets', all values are type checked, and 'unusedN'
# entries for volumes that are in use by a drive of the current
# configuration are removed. Snapshot sections are appended as "[name]"
# blocks. Dies when a value fails the type check.
sub write_vm_config {
    my ($filename, $conf) = @_;

    delete $conf->{snapstate}; # just to be sure

    if ($conf->{cdrom}) {
        die "option ide2 conflicts with cdrom\n" if $conf->{ide2};
        $conf->{ide2} = delete $conf->{cdrom};
    }

    # we do not use 'smp' any longer
    if (!$conf->{sockets} && $conf->{smp}) {
        $conf->{sockets} = $conf->{smp};
        delete $conf->{cores};
    }
    delete $conf->{smp} if $conf->{sockets};

    delete $conf->{sockets} if $conf->{maxcpus} && $conf->{sockets};

    my $used_volids = {};

    my %not_a_setting = map { $_ => 1 } qw(digest description snapshots snapstate);

    # type check all settings of one section; remember the volumes used
    # by drives of the current configuration (not of snapshots)
    my $normalize_section = sub {
        my ($section, $snapname) = @_;

        foreach my $key (keys %$section) {
            next if $not_a_setting{$key};

            my $value = $section->{$key};
            eval { $value = check_type($key, $value); };
            die "unable to parse value of '$key' - $@" if $@;

            $section->{$key} = $value;

            next if $snapname || !valid_drivename($key);

            my $drive = parse_drive($key, $value);
            $used_volids->{$drive->{file}} = 1 if $drive && $drive->{file};
        }
    };

    $normalize_section->($conf);
    foreach my $snapname (keys %{$conf->{snapshots}}) {
        $normalize_section->($conf->{snapshots}->{$snapname}, $snapname);
    }

    # remove 'unusedX' settings if we re-add a volume
    foreach my $key (keys %$conf) {
        my $value = $conf->{$key};
        delete $conf->{$key} if $key =~ m/^unused/ && $used_volids->{$value};
    }

    my %not_written = map { $_ => 1 } qw(digest description snapshots);

    my $section_to_text = sub {
        my ($section) = @_;

        # add description as comment to top of file
        my $descr = $section->{description} || '';
        my $text = join('', map { '#' . PVE::Tools::encode_text($_) . "\n" } split(/\n/, $descr));

        foreach my $key (sort keys %$section) {
            next if $not_written{$key};
            $text .= "$key: $section->{$key}\n";
        }

        return $text;
    };

    my $raw = $section_to_text->($conf);
    foreach my $snapname (sort keys %{$conf->{snapshots}}) {
        $raw .= "\n[$snapname]\n";
        $raw .= $section_to_text->($conf->{snapshots}->{$snapname});
    }

    return $raw;
}
1e3baf05 1929
1858638f
DM
# Store $conf as the configuration of VM $vmid without taking the config
# file lock. Unless $skiplock is true, check_lock() is consulted first and
# may refuse the update.
sub update_config_nolock {
    my ($vmid, $conf, $skiplock) = @_;

    check_lock($conf) unless $skiplock;

    return PVE::Cluster::cfs_write_file(cfs_config_path($vmid), $conf);
}
1e3baf05 1939
1858638f
DM
# Store $conf as the configuration of VM $vmid through lock_config().
#
# The worker is handed over as a closure. The previous form,
# '&update_config_nolock' without a backslash, called the sub right away
# with the caller's @_ (so the write happened before lock_config() ran)
# and passed its return value on instead of a code reference.
#
# NOTE(review): assumes the second argument of lock_config() is a code
# reference that is executed while the lock is held - confirm against
# lock_config().
sub update_config {
    my ($vmid, $conf, $skiplock) = @_;

    lock_config($vmid, sub {
        update_config_nolock($vmid, $conf, $skiplock);
    });
}
1945
# Return a hash ref with the default value of every option in $confdesc
# that declares one. The 'keyboard' entry is overridden by the value
# found in datacenter.cfg, if that file sets one.
sub load_defaults {

    # static defaults taken from our JSON schema configuration
    my %defaults =
        map  { $_ => $confdesc->{$_}->{default} }
        grep { defined($confdesc->{$_}->{default}) }
        keys %$confdesc;

    my $dccfg = PVE::Cluster::cfs_read_file('datacenter.cfg');
    if ($dccfg->{keyboard}) {
        $defaults{keyboard} = $dccfg->{keyboard};
    }

    return \%defaults;
}
1962
# Return { $vmid => { exists => 1 } } for every entry of the cluster VM
# list whose node equals $nodename and whose type is 'qemu'.
sub config_list {
    my $found = {};

    my $vmlist = PVE::Cluster::get_vmlist();
    return $found unless $vmlist && $vmlist->{ids};

    my $ids = $vmlist->{ids};
    for my $vmid (keys %$ids) {
        my $entry = $ids->{$vmid};

        my $on_this_node = $entry->{node} && $entry->{node} eq $nodename;
        next unless $on_this_node;

        my $is_qemu = $entry->{type} && $entry->{type} eq 'qemu';
        next unless $is_qemu;

        $found->{$vmid}->{exists} = 1;
    }

    return $found;
}
1977
64e13401
DM
# Test whether the VM configuration references local resources (which
# prevents migration). Returns 1 if it does and 0 otherwise; dies with
# "VM uses local resources" instead of returning 1 unless $noerr is true.
sub check_local_resources {
    my ($conf, $noerr) = @_;

    # old syntax: un-numbered hostusb/hostpci keys
    my $uses_local = ($conf->{hostusb} || $conf->{hostpci}) ? 1 : 0;

    for my $key (keys %$conf) {
        # keys starting with 'usb' whose value is 'spice' are not counted
        next if $key =~ m/^usb/ && $conf->{$key} eq 'spice';
        next if $key !~ m/^(usb|hostpci|serial|parallel)\d+$/;
        $uses_local = 1;
    }

    if ($uses_local && !$noerr) {
        die "VM uses local resources\n";
    }

    return $uses_local;
}
1996
# Check that the storages used by the drives of $conf are available on
# all involved nodes (used by migrate). Drives without a file, or whose
# file does not parse as a storage volume id, are ignored.
sub check_storage_availability {
    my ($storecfg, $conf, $node) = @_;

    my $check_drive = sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file} or return;

        my ($storeid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return unless $storeid;

        # the storage has to pass the node check twice: once without a
        # node argument and once for the requested $node
        my $scfg = PVE::Storage::storage_check_node($storecfg, $storeid);
        PVE::Storage::storage_check_node($storecfg, $storeid, $node);
    };

    foreach_drive($conf, $check_drive);
}
2015
719893a9
DM
# List the nodes where all VM images are available (used by the
# has_feature API). Returns a hash ref { $node => 1 }.
sub shared_nodes {
    my ($conf, $storecfg) = @_;

    my $nodelist = PVE::Cluster::get_nodelist();
    my $nodehash = {};
    $nodehash->{$_} = 1 for @$nodelist;
    my $nodename = PVE::INotify::nodename();

    my $restrict_by_drive = sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($storeid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        my $scfg = PVE::Storage::storage_config($storecfg, $storeid);

        # a disabled storage leaves no candidate node at all
        if ($scfg->{disable}) {
            $nodehash = {};
            return;
        }

        # storage restricted to a node list: keep only those nodes
        if (my $avail = $scfg->{nodes}) {
            delete @{$nodehash}{ grep { !$avail->{$_} } keys %$nodehash };
            return;
        }

        # storage not marked shared: only this node remains
        return if $scfg->{shared};
        delete @{$nodehash}{ grep { $_ ne $nodename } keys %$nodehash };
    };

    foreach_drive($conf, $restrict_by_drive);

    return $nodehash;
}
2049
1e3baf05
DM
# Die with "VM is locked (<lock>)" if the configuration carries a 'lock'
# setting.
sub check_lock {
    my ($conf) = @_;

    my $lock = $conf->{lock};
    die "VM is locked ($lock)\n" if $lock;
}
2055
# Inspect /proc/$pid/cmdline and return 1 if the process is a kvm /
# qemu-system-x86_64 binary that was started with '-pidfile $pidfile'
# (or '--pidfile $pidfile'). Any other outcome yields a false value.
sub check_cmdline {
    my ($pidfile, $pid) = @_;

    my $fh = IO::File->new("/proc/$pid/cmdline", "r");
    return undef if !defined($fh);

    my $line = <$fh>;
    $fh->close;
    return undef if !$line;

    # the arguments are NUL separated
    my @argv = split(/\0/, $line);

    my $binary = $argv[0];
    return if !$binary;
    return if $binary !~ m|kvm$| && $binary !~ m|qemu-system-x86_64$|;

    foreach my $idx (0 .. $#argv) {
        my $arg = $argv[$idx];
        next if !$arg;
        next if $arg ne '-pidfile' && $arg ne '--pidfile';

        # only the first pidfile option is considered
        my $value = $argv[$idx + 1];
        return 1 if $value && ($value eq $pidfile);
        return undef;
    }

    return undef;
}
2081
# Return the pid of the running kvm process of VM $vmid, or undef if the
# VM is not running.
#
# Unless $nocheck is true, dies when the configuration file returned by
# config_file($vmid, $node) does not exist. The pid read from the pid
# file is only reported if check_cmdline() confirms that the process was
# started with this pid file and the process is still running.
sub check_running {
    my ($vmid, $nocheck, $node) = @_;

    my $filename = config_file($vmid, $node);

    die "unable to find configuration file for VM $vmid - no such machine\n"
        if !$nocheck && ! -f $filename;

    my $pidfile = pidfile_name($vmid);

    # explicit read mode instead of a "<$pidfile" mode string
    my $fd = IO::File->new($pidfile, 'r');
    return undef if !$fd;

    my $st = stat($fd);
    my $line = <$fd>;
    close($fd);

    # the timestamp checked here belongs to the pid file, so that is the
    # file the warning has to name; a failed stat is simply skipped
    if ($st && $st->mtime > time()) {
        warn "file '$pidfile' modified in future\n";
    }

    # an empty pid file yields no line at all
    return undef if !defined($line);

    if ($line =~ m/^(\d+)$/) {
        my $pid = $1;
        if (check_cmdline($pidfile, $pid)) {
            if (my $pinfo = PVE::ProcFSTools::check_process_running($pid)) {
                return $pid;
            }
        }
    }

    return undef;
}
2114
# Return the result of config_list(), with a 'pid' entry added for every
# listed VM that has a '<vmid>.pid' file in $var_run_tmpdir and for which
# check_running() reports a pid.
sub vzlist {

    my $vms = config_list();

    my $dir = IO::Dir->new($var_run_tmpdir);
    return $vms if !$dir;

    while (defined(my $entry = $dir->read)) {
        my ($vmid) = $entry =~ m/^(\d+)\.pid$/;
        next if !defined($vmid);
        next if !defined($vms->{$vmid});

        my $pid = check_running($vmid);
        $vms->{$vmid}->{pid} = $pid if $pid;
    }

    return $vms;
}
2132
1e3baf05
DM
# Return the 'size' property of the boot disk configured in $conf, or
# undef if there is no valid boot disk entry, the drive cannot be parsed,
# it is a cdrom, or it has no file. $storecfg is accepted but not used.
sub disksize {
    my ($storecfg, $conf) = @_;

    my $bootdisk = $conf->{bootdisk};
    return undef unless $bootdisk && valid_drivename($bootdisk);
    return undef unless $conf->{$bootdisk};

    my $drive = parse_drive($bootdisk, $conf->{$bootdisk});
    return undef if !defined($drive) || drive_is_cdrom($drive);
    return undef if !$drive->{file};

    return $drive->{size};
}
2152
2153my $last_proc_pid_stat;
2154
03a33f30
DM
# Collect status information for all VMs returned by vzlist(), or only
# for $opt_vmid if given. Returns a hash ref indexed by vmid.
#
# With $full == false this must be fast and must not block: only the
# configuration and /proc data are used. KVM is queried over QMP only
# when $full is true (this can be slow).
sub vmstatus {
    my ($opt_vmid, $full) = @_;

    my $res = {};

    my $storecfg = PVE::Storage::config();

    my $list = vzlist();
    my ($uptime) = PVE::ProcFSTools::read_proc_uptime(1);

    my $cpucount = $cpuinfo->{cpus} || 1;
    my $mib = 1024*1024;

    # pass 1: static data from the configuration
    for my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);

        my $conf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid)) || {};

        my $pid = $list->{$vmid}->{pid};
        my $size = disksize($storecfg, $conf);

        # never report more cpus than the host has
        my $cpus = ($conf->{sockets} || 1) * ($conf->{cores} || 1);
        $cpus = $cpucount if $cpus > $cpucount;

        my $d = {
            pid => $pid,
            status => $pid ? 'running' : 'stopped', # fixme: better status?
            disk => 0, # no info available
            maxdisk => defined($size) ? $size : 0,
            cpus => $cpus,
            name => $conf->{name} || "VM $vmid",
            maxmem => $conf->{memory} ? $conf->{memory}*$mib : 0,
            uptime => 0,
            cpu => 0,
            mem => 0,
            netout => 0,
            netin => 0,
            diskread => 0,
            diskwrite => 0,
        };

        if (my $balloon = $conf->{balloon}) {
            $d->{balloon_min} = $balloon*$mib;
            $d->{shares} = defined($conf->{shares}) ? $conf->{shares} : 1000;
        }

        $d->{template} = is_template($conf);

        $res->{$vmid} = $d;
    }

    # pass 2: network counters of the tap<vmid>i<n> devices; the
    # 'receive' counter is added to netout and 'transmit' to netin
    my $netdev = PVE::ProcFSTools::read_proc_net_dev();
    for my $dev (keys %$netdev) {
        my ($vmid) = $dev =~ m/^tap([1-9]\d*)i/;
        next if !defined($vmid);

        my $d = $res->{$vmid};
        next if !$d;

        my $counters = $netdev->{$dev};
        $d->{netout} += $counters->{receive};
        $d->{netin} += $counters->{transmit};
    }

    # pass 3: uptime, memory and cpu usage from /proc/<pid>/stat
    my $ctime = gettimeofday;

    for my $vmid (keys %$list) {

        my $d = $res->{$vmid};
        my $pid = $d->{pid};
        next if !$pid;

        my $pstat = PVE::ProcFSTools::read_proc_pid_stat($pid);
        next if !$pstat; # not running

        my $used = $pstat->{utime} + $pstat->{stime};

        $d->{uptime} = int(($uptime - $pstat->{starttime})/$cpuinfo->{user_hz});

        if ($pstat->{vsize}) {
            $d->{mem} = int(($pstat->{rss}/$pstat->{vsize})*$d->{maxmem});
        }

        # first sample for this pid: nothing to compare against yet
        my $prev = $last_proc_pid_stat->{$pid};
        if (!$prev) {
            $last_proc_pid_stat->{$pid} = { time => $ctime, used => $used, cpu => 0 };
            next;
        }

        my $dtime = ($ctime - $prev->{time}) * $cpucount * $cpuinfo->{user_hz};

        # interval too short: keep reporting the previously computed value
        if (!($dtime > 1000)) {
            $d->{cpu} = $prev->{cpu};
            next;
        }

        my $dutime = $used - $prev->{used};
        $d->{cpu} = (($dutime/$dtime)* $cpucount) / $d->{cpus};
        $last_proc_pid_stat->{$pid} = { time => $ctime, used => $used, cpu => $d->{cpu} };
    }

    return $res if !$full;

    # pass 4 ($full only): ask the running VMs over QMP
    my $qmpclient = PVE::QMPClient->new();

    my $ballooncb = sub {
        my ($vmid, $resp) = @_;

        my $info = $resp->{'return'};
        return if !$info->{max_mem};

        my $d = $res->{$vmid};

        # use memory assigned to VM
        $d->{maxmem} = $info->{max_mem};
        $d->{balloon} = $info->{actual};

        my ($total, $free) = ($info->{total_mem}, $info->{free_mem});
        if (defined($total) && defined($free)) {
            $d->{mem} = $total - $free;
            $d->{freemem} = $free;
        }
    };

    my $blockstatscb = sub {
        my ($vmid, $resp) = @_;

        my ($rdbytes, $wrbytes) = (0, 0);
        for my $blockstat (@{ $resp->{'return'} || [] }) {
            $rdbytes += $blockstat->{stats}->{rd_bytes};
            $wrbytes += $blockstat->{stats}->{wr_bytes};
        }

        $res->{$vmid}->{diskread} = $rdbytes;
        $res->{$vmid}->{diskwrite} = $wrbytes;
    };

    my $statuscb = sub {
        my ($vmid, $resp) = @_;

        $qmpclient->queue_cmd($vmid, $blockstatscb, 'query-blockstats');
        # query-balloon fails if the balloon driver is not loaded, so it
        # must be the last command (commands following a failed one are
        # aborted).
        $qmpclient->queue_cmd($vmid, $ballooncb, 'query-balloon');

        my $status = $resp->{'return'}->{status};
        if (!defined($status)) {
            warn "unable to get VM status\n";
            return;
        }

        $res->{$vmid}->{qmpstatus} = $status;
    };

    for my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        next if !$res->{$vmid}->{pid}; # not running
        $qmpclient->queue_cmd($vmid, $statuscb, 'query-status');
    }

    $qmpclient->queue_execute();

    # fall back to the plain status where QMP delivered nothing
    for my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        my $d = $res->{$vmid};
        $d->{qmpstatus} = $d->{status} if !$d->{qmpstatus};
    }

    return $res;
}
2341
# Call $func->($key, $drive) for every key of $conf that is a valid drive
# name and whose value parse_drive() can parse.
sub foreach_drive {
    my ($conf, $func) = @_;

    for my $key (keys %$conf) {
        if (valid_drivename($key)) {
            my $drive = parse_drive($key, $conf->{$key});
            $func->($key, $drive) if $drive;
        }
    }
}
2354
d5769dc2
DM
# Call $func->($volid, $is_cdrom) once for every distinct volume id found
# in the drives of $conf, in the drives of its snapshots and in the
# snapshots' 'vmstate' entries. If a volume id shows up several times,
# the cdrom flag recorded last is the one passed on.
sub foreach_volid {
    my ($conf, $func) = @_;

    my %cdrom_flag_of;

    my $remember = sub {
        my ($volid, $is_cdrom) = @_;

        return if !$volid;

        $cdrom_flag_of{$volid} = $is_cdrom || 0;
    };

    my $remember_drive = sub {
        my ($ds, $drive) = @_;
        $remember->($drive->{file}, drive_is_cdrom($drive));
    };

    foreach_drive($conf, $remember_drive);

    for my $snapname (keys %{$conf->{snapshots}}) {
        my $snap = $conf->{snapshots}->{$snapname};
        $remember->($snap->{vmstate}, 0);
        foreach_drive($snap, $remember_drive);
    }

    for my $volid (keys %cdrom_flag_of) {
        $func->($volid, $cdrom_flag_of{$volid});
    }
}
2386
86b8228b
DM
# Map a 'vga' setting to the number attached to 'qxl': 'qxl' gives 1,
# 'qxl2' .. 'qxl4' give 2 .. 4, and anything else (including an unset
# value) gives 0.
sub vga_conf_has_spice {
    my ($vga) = @_;

    return 0 unless $vga;

    if ($vga =~ m/^qxl([234])?$/) {
        return $1 || 1;
    }

    return 0;
}
2394
# Build the kvm command line for VM $vmid from its configuration.
#
# Parameters:
#   $storecfg     - storage configuration, handed to the drive helpers
#   $vmid         - id of the VM
#   $conf         - VM configuration hash
#   $defaults     - fallback values for options not set in $conf
#   $forcemachine - optional machine type overriding $conf->{machine}
#
# Returns ($cmd, $vollist, $spice_port) in list context and only $cmd in
# scalar context. $cmd is the argument list (array ref), $vollist the
# list of drive files that parse as storage volume ids, and $spice_port
# the port obtained for spice (undef if spice is not used).
#
# Dies if the kvm version is older than 0.15, if a configured serial or
# parallel device is not a character device, if a pcie host device is
# configured without the q35 machine type, or if kvm is not disabled and
# $cpuinfo reports no hvm support.
sub config_to_command {
    my ($storecfg, $vmid, $conf, $defaults, $forcemachine) = @_;

    my $cmd = [];
    my $globalFlags = [];
    my $machineFlags = [];
    my $rtcFlags = [];
    my $cpuFlags = [];
    my $devices = [];
    my $pciaddr = '';
    my $bridges = {};

    # encode the version as major*1000000 + minor*1000 + patch
    my $kvmver = kvm_user_version();
    my $vernum = 0; # unknown
    if ($kvmver =~ m/^(\d+)\.(\d+)$/) {
        $vernum = $1*1000000+$2*1000;
    } elsif ($kvmver =~ m/^(\d+)\.(\d+)\.(\d+)$/) {
        $vernum = $1*1000000+$2*1000+$3;
    }

    die "detected old qemu-kvm binary ($kvmver)\n" if $vernum < 15000;

    my $have_ovz = -f '/proc/vz/vestat';

    my $q35 = machine_type_is_q35($conf);

    # Normalized once so that the string comparisons below never see an
    # undefined value when no ostype is configured.
    my $ostype = defined($conf->{ostype}) ? $conf->{ostype} : '';

    push @$cmd, '/usr/bin/kvm';

    push @$cmd, '-id', $vmid;

    my $use_virtio = 0;

    my $qmpsocket = qmp_socket($vmid);
    push @$cmd, '-chardev', "socket,id=qmp,path=$qmpsocket,server,nowait";
    push @$cmd, '-mon', "chardev=qmp,mode=control";

    my $socket = vnc_socket($vmid);
    push @$cmd, '-vnc', "unix:$socket,x509,password";

    push @$cmd, '-pidfile' , pidfile_name($vmid);

    push @$cmd, '-daemonize';

    if ($conf->{smbios1}) {
        push @$cmd, '-smbios', "type=1,$conf->{smbios1}";
    }

    if ($q35) {
        # the q35 chipset support native usb2, so we enable usb controller
        # by default for this machine type
        push @$devices, '-readconfig', '/usr/share/qemu-server/pve-q35.cfg';
    } else {
        $pciaddr = print_pci_addr("piix3", $bridges);
        push @$devices, '-device', "piix3-usb-uhci,id=uhci$pciaddr.0x2";

        my $use_usb2 = 0;
        for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
            next if !$conf->{"usb$i"};
            $use_usb2 = 1;
        }
        # include usb device config
        push @$devices, '-readconfig', '/usr/share/qemu-server/pve-usb.cfg' if $use_usb2;
    }

    my $vga = $conf->{vga};

    my $qxlnum = vga_conf_has_spice($vga);
    $vga = 'qxl' if $qxlnum;

    if (!$vga) {
        if ($conf->{ostype} && ($conf->{ostype} eq 'win8' ||
                                $conf->{ostype} eq 'win7' ||
                                $conf->{ostype} eq 'w2k8')) {
            $vga = 'std';
        } else {
            $vga = 'cirrus';
        }
    }

    # enable absolute mouse coordinates (needed by vnc)
    my $tablet;
    if (defined($conf->{tablet})) {
        $tablet = $conf->{tablet};
    } else {
        $tablet = $defaults->{tablet};
        $tablet = 0 if $qxlnum; # disable for spice because it is not needed
        $tablet = 0 if $vga =~ m/^serial\d+$/; # disable if we use serial terminal (no vga card)
    }

    push @$devices, '-device', print_tabletdevice_full($conf) if $tablet;

    # host pci devices
    for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
        my $d = parse_hostpci($conf->{"hostpci$i"});
        next if !$d;

        my $pcie = $d->{pcie};
        if ($pcie) {
            die "q35 machine model is not enabled" if !$q35;
            $pciaddr = print_pcie_addr("hostpci$i");
        } else {
            $pciaddr = print_pci_addr("hostpci$i", $bridges);
        }

        my $rombar = $d->{rombar} && $d->{rombar} eq 'off' ? ",rombar=0" : "";
        my $driver = $d->{driver} && $d->{driver} eq 'vfio' ? "vfio-pci" : "pci-assign";
        my $xvga = $d->{'x-vga'} && $d->{'x-vga'} eq 'on' ? ",x-vga=on" : "";
        if ($xvga && $xvga ne '') {
            push @$cpuFlags, 'kvm=off';
            $vga = 'none';
        }
        $driver = "vfio-pci" if $xvga ne '';
        my $pcidevices = $d->{pciid};

        # Plain assignment: the behaviour of 'my $x = ... if COND' is
        # undefined in Perl (see perlsyn), so it is not used here.
        my $multifunction = (@$pcidevices > 1) ? 1 : 0;

        my $j=0;
        foreach my $pcidevice (@$pcidevices) {

            my $id = "hostpci$i";
            $id .= ".$j" if $multifunction;
            my $addr = $pciaddr;
            $addr .= ".$j" if $multifunction;
            my $devicestr = "$driver,host=$pcidevice->{id}.$pcidevice->{function},id=$id$addr";

            # rombar, x-vga and multifunction are only added for the
            # first function
            if ($j == 0) {
                $devicestr .= "$rombar$xvga";
                $devicestr .= ",multifunction=on" if $multifunction;
            }

            push @$devices, '-device', $devicestr;
            $j++;
        }
    }

    # usb devices
    for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
        my $d = parse_usb_device($conf->{"usb$i"});
        next if !$d;
        if ($d->{vendorid} && $d->{productid}) {
            push @$devices, '-device', "usb-host,vendorid=0x$d->{vendorid},productid=0x$d->{productid}";
        } elsif (defined($d->{hostbus}) && defined($d->{hostport})) {
            push @$devices, '-device', "usb-host,hostbus=$d->{hostbus},hostport=$d->{hostport}";
        } elsif ($d->{spice}) {
            # usb redir support for spice
            push @$devices, '-chardev', "spicevmc,id=usbredirchardev$i,name=usbredir";
            push @$devices, '-device', "usb-redir,chardev=usbredirchardev$i,id=usbredirdev$i,bus=ehci.0";
        }
    }

    # serial devices
    for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
        if (my $path = $conf->{"serial$i"}) {
            if ($path eq 'socket') {
                my $socket = "/var/run/qemu-server/${vmid}.serial$i";
                push @$devices, '-chardev', "socket,id=serial$i,path=$socket,server,nowait";
                push @$devices, '-device', "isa-serial,chardev=serial$i";
            } else {
                die "no such serial device\n" if ! -c $path;
                push @$devices, '-chardev', "tty,id=serial$i,path=$path";
                push @$devices, '-device', "isa-serial,chardev=serial$i";
            }
        }
    }

    # parallel devices
    for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
        if (my $path = $conf->{"parallel$i"}) {
            die "no such parallel device\n" if ! -c $path;
            my $devtype = $path =~ m!^/dev/usb/lp! ? 'tty' : 'parport';
            push @$devices, '-chardev', "$devtype,id=parallel$i,path=$path";
            push @$devices, '-device', "isa-parallel,chardev=parallel$i";
        }
    }

    my $vmname = $conf->{name} || "vm$vmid";

    push @$cmd, '-name', $vmname;

    my $sockets = 1;
    $sockets = $conf->{smp} if $conf->{smp}; # old style - no longer used
    $sockets = $conf->{sockets} if $conf->{sockets};

    my $cores = $conf->{cores} || 1;

    # Plain assignment instead of 'my ... if ...' (undefined behaviour);
    # an unset or zero value still selects the sockets/cores form below.
    my $maxcpus = $conf->{maxcpus};

    if ($maxcpus) {
        push @$cmd, '-smp', "cpus=$cores,maxcpus=$maxcpus";
    } else {
        push @$cmd, '-smp', "sockets=$sockets,cores=$cores";
    }

    push @$cmd, '-nodefaults';

    my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};

    # every letter of the boot order gets a base index of 100, 200, ...
    # in the order the letters appear; devices of that class then count
    # upwards from the base index
    my $bootindex_hash = {};
    my $i = 1;
    foreach my $o (split(//, $bootorder)) {
        $bootindex_hash->{$o} = $i*100;
        $i++;
    }

    push @$cmd, '-boot', "menu=on";

    push @$cmd, '-no-acpi' if defined($conf->{acpi}) && $conf->{acpi} == 0;

    push @$cmd, '-no-reboot' if defined($conf->{reboot}) && $conf->{reboot} == 0;

    push @$cmd, '-vga', $vga if $vga && $vga !~ m/^serial\d+$/; # for kvm 77 and later

    # time drift fix
    my $tdf = defined($conf->{tdf}) ? $conf->{tdf} : $defaults->{tdf};

    my $nokvm = defined($conf->{kvm}) && $conf->{kvm} == 0 ? 1 : 0;
    my $useLocaltime = $conf->{localtime};

    if (my $ost = $conf->{ostype}) {
        # other, wxp, w2k, w2k3, w2k8, wvista, win7, win8, l24, l26, solaris

        if ($ost =~ m/^w/) { # windows
            $useLocaltime = 1 if !defined($conf->{localtime});

            # use time drift fix when acpi is enabled
            if (!(defined($conf->{acpi}) && $conf->{acpi} == 0)) {
                $tdf = 1 if !defined($conf->{tdf});
            }
        }

        if ($ost eq 'win7' || $ost eq 'win8' || $ost eq 'w2k8' ||
            $ost eq 'wvista') {
            push @$globalFlags, 'kvm-pit.lost_tick_policy=discard';
            push @$cmd, '-no-hpet';
            #push @$cpuFlags , 'hv_vapic' if !$nokvm; #fixme, my win2008R2 hang at boot with this
            push @$cpuFlags , 'hv_spinlocks=0xffff' if !$nokvm;
        }

        if ($ost eq 'win7' || $ost eq 'win8') {
            push @$cpuFlags , 'hv_relaxed' if !$nokvm;
        }
    }

    push @$rtcFlags, 'driftfix=slew' if $tdf;

    if ($nokvm) {
        push @$machineFlags, 'accel=tcg';
    } else {
        die "No accelerator found!\n" if !$cpuinfo->{hvm};
    }

    my $machine_type = $forcemachine || $conf->{machine};
    if ($machine_type) {
        push @$machineFlags, "type=${machine_type}";
    }

    if ($conf->{startdate}) {
        push @$rtcFlags, "base=$conf->{startdate}";
    } elsif ($useLocaltime) {
        push @$rtcFlags, 'base=localtime';
    }

    my $cpu = $nokvm ? "qemu64" : "kvm64";
    $cpu = $conf->{cpu} if $conf->{cpu};

    push @$cpuFlags , '+lahf_lm' if $cpu eq 'kvm64';

    # uses the normalized $ostype: an unset ostype counts as "not solaris"
    push @$cpuFlags , '+x2apic' if !$nokvm && $ostype ne 'solaris';

    push @$cpuFlags , '-x2apic' if $ostype eq 'solaris';

    push @$cpuFlags, '+sep' if $cpu eq 'kvm64' || $cpu eq 'kvm32';

    $cpu .= "," . join(',', @$cpuFlags) if scalar(@$cpuFlags);

    # Note: enforce needs kernel 3.10, so we do not use it for now
    # push @$cmd, '-cpu', "$cpu,enforce";
    push @$cmd, '-cpu', $cpu;

    push @$cmd, '-S' if $conf->{freeze};

    # set keyboard layout
    my $kb = $conf->{keyboard} || $defaults->{keyboard};
    push @$cmd, '-k', $kb if $kb;

    # enable sound
    #my $soundhw = $conf->{soundhw} || $defaults->{soundhw};
    #push @$cmd, '-soundhw', 'es1370';
    #push @$cmd, '-soundhw', $soundhw if $soundhw;

    if ($conf->{agent}) {
        my $qgasocket = qga_socket($vmid);
        my $pciaddr = print_pci_addr("qga0", $bridges);
        push @$devices, '-chardev', "socket,path=$qgasocket,server,nowait,id=qga0";
        push @$devices, '-device', "virtio-serial,id=qga0$pciaddr";
        push @$devices, '-device', 'virtserialport,chardev=qga0,name=org.qemu.guest_agent.0';
    }

    my $spice_port;

    if ($qxlnum) {
        if ($qxlnum > 1) {
            if ($conf->{ostype} && $conf->{ostype} =~ m/^w/) {
                # windows: one additional qxl device per extra display
                for (my $i = 1; $i < $qxlnum; $i++) {
                    my $pciaddr = print_pci_addr("vga$i", $bridges);
                    push @$cmd, '-device', "qxl,id=vga$i,ram_size=67108864,vram_size=33554432$pciaddr";
                }
            } else {
                # assume other OS works like Linux
                push @$cmd, '-global', 'qxl-vga.ram_size=134217728';
                push @$cmd, '-global', 'qxl-vga.vram_size=67108864';
            }
        }

        my $pciaddr = print_pci_addr("spice", $bridges);

        $spice_port = PVE::Tools::next_spice_port();

        push @$devices, '-spice', "tls-port=${spice_port},addr=127.0.0.1,tls-ciphers=DES-CBC3-SHA,seamless-migration=on";

        push @$devices, '-device', "virtio-serial,id=spice$pciaddr";
        push @$devices, '-chardev', "spicevmc,id=vdagent,name=vdagent";
        push @$devices, '-device', "virtserialport,chardev=vdagent,name=com.redhat.spice.0";
    }

    # enable balloon by default, unless explicitly disabled
    if (!defined($conf->{balloon}) || $conf->{balloon}) {
        $pciaddr = print_pci_addr("balloon0", $bridges);
        push @$devices, '-device', "virtio-balloon-pci,id=balloon0$pciaddr";
    }

    if ($conf->{watchdog}) {
        my $wdopts = parse_watchdog($conf->{watchdog});
        $pciaddr = print_pci_addr("watchdog", $bridges);
        my $watchdog = $wdopts->{model} || 'i6300esb';
        push @$devices, '-device', "$watchdog$pciaddr";
        push @$devices, '-watchdog-action', $wdopts->{action} if $wdopts->{action};
    }

    my $vollist = [];
    my $scsicontroller = {};
    my $ahcicontroller = {};
    my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : $defaults->{scsihw};

    # Add iscsi initiator name if available
    if (my $initiator = get_initiator_name()) {
        push @$devices, '-iscsi', "initiator-name=$initiator";
    }

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        if (PVE::Storage::parse_volume_id($drive->{file}, 1)) {
            push @$vollist, $drive->{file};
        }

        $use_virtio = 1 if $ds =~ m/^virtio/;

        if (drive_is_cdrom ($drive)) {
            if ($bootindex_hash->{d}) {
                $drive->{bootindex} = $bootindex_hash->{d};
                $bootindex_hash->{d} += 1;
            }
        } else {
            if ($bootindex_hash->{c}) {
                # only the configured boot disk gets a boot index
                $drive->{bootindex} = $bootindex_hash->{c} if $conf->{bootdisk} && ($conf->{bootdisk} eq $ds);
                $bootindex_hash->{c} += 1;
            }
        }

        if ($drive->{interface} eq 'scsi') {

            # add each scsi controller only once
            my $maxdev = ($scsihw !~ m/^lsi/) ? 256 : 7;
            my $controller = int($drive->{index} / $maxdev);
            $pciaddr = print_pci_addr("scsihw$controller", $bridges);
            push @$devices, '-device', "$scsihw,id=scsihw$controller$pciaddr" if !$scsicontroller->{$controller};
            $scsicontroller->{$controller}=1;
        }

        if ($drive->{interface} eq 'sata') {
            # add each ahci controller only once
            my $controller = int($drive->{index} / $MAX_SATA_DISKS);
            $pciaddr = print_pci_addr("ahci$controller", $bridges);
            push @$devices, '-device', "ahci,id=ahci$controller,multifunction=on$pciaddr" if !$ahcicontroller->{$controller};
            $ahcicontroller->{$controller}=1;
        }

        my $drive_cmd = print_drive_full($storecfg, $vmid, $drive);
        push @$devices, '-drive',$drive_cmd;
        push @$devices, '-device', print_drivedevice_full($storecfg, $conf, $vmid, $drive, $bridges);
    });

    push @$cmd, '-m', $conf->{memory} || $defaults->{memory};

    for (my $i = 0; $i < $MAX_NETS; $i++) {
        next if !$conf->{"net$i"};
        my $d = parse_net($conf->{"net$i"});
        next if !$d;

        $use_virtio = 1 if $d->{model} eq 'virtio';

        if ($bootindex_hash->{n}) {
            $d->{bootindex} = $bootindex_hash->{n};
            $bootindex_hash->{n} += 1;
        }

        my $netdevfull = print_netdev_full($vmid,$conf,$d,"net$i");
        push @$devices, '-netdev', $netdevfull;

        my $netdevicefull = print_netdevice_full($vmid,$conf,$d,"net$i",$bridges);
        push @$devices, '-device', $netdevicefull;
    }

    if (!$q35) {
        # add pci bridges; they are put in front of the other devices
        while (my ($k, $v) = each %$bridges) {
            $pciaddr = print_pci_addr("pci.$k");
            unshift @$devices, '-device', "pci-bridge,id=pci.$k,chassis_nr=$k$pciaddr" if $k > 0;
        }
    }

    # hack: virtio with fairsched is unreliable, so we do not use fairsched
    # when the VM uses virtio devices.
    if (!$use_virtio && $have_ovz) {

        my $cpuunits = defined($conf->{cpuunits}) ?
            $conf->{cpuunits} : $defaults->{cpuunits};

        push @$cmd, '-cpuunits', $cpuunits if $cpuunits;

        # fixme: cpulimit is currently ignored
        #push @$cmd, '-cpulimit', $conf->{cpulimit} if $conf->{cpulimit};
    }

    # add custom args
    if ($conf->{args}) {
        my $aa = PVE::Tools::split_args($conf->{args});
        push @$cmd, @$aa;
    }

    push @$cmd, @$devices;
    push @$cmd, '-rtc', join(',', @$rtcFlags)
        if scalar(@$rtcFlags);
    push @$cmd, '-machine', join(',', @$machineFlags)
        if scalar(@$machineFlags);
    push @$cmd, '-global', join(',', @$globalFlags)
        if scalar(@$globalFlags);

    return wantarray ? ($cmd, $vollist, $spice_port) : $cmd;
}
19672434 2841
1e3baf05
DM
# Path of the VNC unix socket of VM $vmid below $var_run_tmpdir.
sub vnc_socket {
    my $vmid = shift;

    return $var_run_tmpdir . "/" . $vmid . ".vnc";
}
2846
# Ask the monitor of VM $vmid ('query-spice') for its spice port. The
# 'tls-port' value is preferred over 'port'; dies with "no spice port"
# if neither is set.
sub spice_port {
    my ($vmid) = @_;

    my $info = vm_mon_cmd($vmid, 'query-spice');

    for my $key ('tls-port', 'port') {
        return $info->{$key} if $info->{$key};
    }

    die "no spice port\n";
}
2854
c971c4f2
AD
# Path of the QMP unix socket of VM $vmid below $var_run_tmpdir.
sub qmp_socket {
    my $vmid = shift;

    return $var_run_tmpdir . "/" . $vmid . ".qmp";
}
2859
ab6a046f
AD
# Path of the guest agent unix socket of VM $vmid below $var_run_tmpdir.
sub qga_socket {
    my $vmid = shift;

    return $var_run_tmpdir . "/" . $vmid . ".qga";
}
2864
1e3baf05
DM
# Path of the pid file of VM $vmid below $var_run_tmpdir.
sub pidfile_name {
    my $vmid = shift;

    return $var_run_tmpdir . "/" . $vmid . ".pid";
}
2869
86fdcfb2
DA
# Run 'query-pci' on the monitor of VM $vmid and return a hash ref that
# maps the 'qdev_id' of each reported device to its device entry.
# Devices without a qdev_id are left out.
sub vm_devices_list {
    my ($vmid) = @_;

    my $buses = vm_mon_cmd($vmid, 'query-pci');

    my %device_by_id;
    for my $bus (@$buses) {
        for my $dev (@{$bus->{devices}}) {
            my $id = $dev->{'qdev_id'};
            $device_by_id{$id} = $dev if $id;
        }
    }

    return \%device_by_id;
}
2885
# Hot-plug device $deviceid into VM $vmid.
#
# Returns 1 when nothing has to be done (VM not running, 'hotplug' not set
# in $conf, device already reported by vm_devices_list) or when the device
# was added. Returns undef when one of the add/verify steps fails.
# The device kind is derived from the $deviceid name (tablet, virtioN,
# scsihwN, scsiN, netN, pci.N); the patterns are mutually exclusive.
sub vm_deviceplug {
    my ($storecfg, $conf, $vmid, $deviceid, $device) = @_;

    return 1 if !check_running($vmid);

    my $q35 = machine_type_is_q35($conf);

    # the tablet is handled before the 'hotplug' setting is consulted
    if ($deviceid eq 'tablet') {
        qemu_deviceadd($vmid, print_tabletdevice_full($conf));
        return 1;
    }

    return 1 if !$conf->{hotplug};

    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$deviceid});

    qemu_bridgeadd($storecfg, $conf, $vmid, $deviceid); #add bridge if we need it for the device

    if ($deviceid =~ m/^(virtio)(\d+)$/) {
        return undef if !qemu_driveadd($storecfg, $vmid, $device);

        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);
        qemu_deviceadd($vmid, $devicefull);

        # roll the drive back when the device never shows up
        unless (qemu_deviceaddverify($vmid, $deviceid)) {
            qemu_drivedel($vmid, $deviceid);
            return undef;
        }
    }
    elsif ($deviceid =~ m/^(scsihw)(\d+)$/) {
        my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : "lsi";
        my $pciaddr = print_pci_addr($deviceid);
        my $devicefull = "$scsihw,id=$deviceid$pciaddr";

        qemu_deviceadd($vmid, $devicefull);
        return undef if(!qemu_deviceaddverify($vmid, $deviceid));
    }
    elsif ($deviceid =~ m/^(scsi)(\d+)$/) {
        return 1 if ($conf->{scsihw} && ($conf->{scsihw} !~ m/^lsi/)); #virtio-scsi not yet support hotplug
        return undef if !qemu_findorcreatescsihw($storecfg,$conf, $vmid, $device);
        return undef if !qemu_driveadd($storecfg, $vmid, $device);

        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);
        unless (qemu_deviceadd($vmid, $devicefull)) {
            qemu_drivedel($vmid, $deviceid);
            return undef;
        }
    }
    elsif ($deviceid =~ m/^(net)(\d+)$/) {
        return undef if !qemu_netdevadd($vmid, $conf, $device, $deviceid);

        my $netdevicefull = print_netdevice_full($vmid, $conf, $device, $deviceid);
        qemu_deviceadd($vmid, $netdevicefull);

        # roll the netdev back when the device never shows up
        unless (qemu_deviceaddverify($vmid, $deviceid)) {
            qemu_netdevdel($vmid, $deviceid);
            return undef;
        }
    }
    elsif (!$q35 && $deviceid =~ m/^(pci\.)(\d+)$/) {
        my $bridgeid = $2;
        my $pciaddr = print_pci_addr($deviceid);
        my $devicefull = "pci-bridge,id=pci.$bridgeid,chassis_nr=$bridgeid$pciaddr";

        qemu_deviceadd($vmid, $devicefull);
        return undef if !qemu_deviceaddverify($vmid, $deviceid);
    }

    return 1;
}
2955
# Hot-unplug device $deviceid from VM $vmid.
#
# Returns 1 when nothing has to be done (VM not running, 'hotplug' not set
# in $conf, device not reported by vm_devices_list) or when the device was
# removed. Returns undef when a delete/verify step fails. Dies when asked
# to unplug the configured boot disk.
sub vm_deviceunplug {
    my ($vmid, $conf, $deviceid) = @_;

    return 1 if !check_running ($vmid);

    # the tablet is handled before the 'hotplug' setting is consulted
    if ($deviceid eq 'tablet') {
        qemu_devicedel($vmid, $deviceid);
        return 1;
    }

    return 1 if !$conf->{hotplug};

    my $present = vm_devices_list($vmid);
    return 1 if !defined($present->{$deviceid});

    die "can't unplug bootdisk" if $conf->{bootdisk} && $conf->{bootdisk} eq $deviceid;

    if ($deviceid =~ m/^(virtio)(\d+)$/) {
        qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_devicedelverify($vmid, $deviceid);
        return undef if !qemu_drivedel($vmid, $deviceid);
    }
    elsif ($deviceid =~ m/^(lsi)(\d+)$/) {
        return undef if !qemu_devicedel($vmid, $deviceid);
    }
    elsif ($deviceid =~ m/^(scsi)(\d+)$/) {
        return undef if !qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_drivedel($vmid, $deviceid);
    }
    elsif ($deviceid =~ m/^(net)(\d+)$/) {
        qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_devicedelverify($vmid, $deviceid);
        return undef if !qemu_netdevdel($vmid, $deviceid);
    }

    return 1;
}
2996
# Send a QMP 'device_add' for the device description $devicefull.
#
# The description is a "driver,key=value,..." string; it is prefixed with
# "driver=" and split on '=' and ',' into the argument hash. Always
# returns 1 (errors surface as exceptions from vm_mon_cmd).
sub qemu_deviceadd {
    my ($vmid, $devicefull) = @_;

    my %options = split(/[=,]/, "driver=".$devicefull);

    vm_mon_cmd($vmid, "device_add" , %options);

    return 1;
}
afdb31d5 3006
5e5dcb73
DA
# Send a QMP 'device_del' for $deviceid. Always returns 1; the reply of the
# monitor is not inspected.
sub qemu_devicedel {
    my ($vmid, $deviceid) = @_;

    vm_mon_cmd($vmid, "device_del", id => $deviceid);

    return 1;
}
3012
# Add the drive backend for $device through the human monitor command
# 'drive_add'. Returns 1 on success; logs the monitor output to syslog and
# returns undef otherwise.
sub qemu_driveadd {
    my ($storecfg, $vmid, $device) = @_;

    my $drive = print_drive_full($storecfg, $vmid, $device);
    my $reply = vm_human_monitor_command($vmid, "drive_add auto $drive");

    # If the command succeeds qemu prints: "OK"
    return 1 if $reply =~ m/OK/s;

    syslog("err", "adding drive failed: $reply");
    return undef;
}
afdb31d5 3025
5e5dcb73
DA
# Remove the drive backend "drive-$deviceid" through the human monitor
# command 'drive_del'. Returns 1 on success; logs the monitor output to
# syslog and returns undef otherwise.
sub qemu_drivedel {
    my ($vmid, $deviceid) = @_;

    my $reply = vm_human_monitor_command($vmid, "drive_del drive-$deviceid");
    $reply =~ s/^\s+//;

    # NB: device not found errors mean the drive was auto-deleted and we ignore the error
    return 1 if $reply =~ m/Device \'.*?\' not found/s;

    # empty output means success
    return 1 if $reply eq "";

    syslog("err", "deleting drive $deviceid failed : $reply");
    return undef;
}
f19d1c47 3040
5e5dcb73
DA
# Poll the device list (six attempts, one second apart) until $deviceid
# shows up. Returns 1 once it is listed; logs to syslog and returns undef
# when it never appears.
sub qemu_deviceaddverify {
    my ($vmid,$deviceid) = @_;

    for my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if defined($present->{$deviceid});
        sleep 1;
    }

    syslog("err", "error on hotplug device $deviceid");
    return undef;
}
afdb31d5 3052
5e5dcb73
DA
3053
# Poll the device list (six attempts, one second apart) until $deviceid is
# gone. Returns 1 once it is no longer listed; logs to syslog and returns
# undef when it stays present.
sub qemu_devicedelverify {
    my ($vmid,$deviceid) = @_;

    # device_del is asynchronous and its empty reply is not a reliable
    # success indicator, so check the device list instead
    for my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if !defined($present->{$deviceid});
        sleep 1;
    }

    syslog("err", "error on hot-unplugging device $deviceid");
    return undef;
}
3066
# Make sure the SCSI controller serving $device exists in the running VM.
#
# The controller number is $device->{index} divided by the number of
# devices per controller (7 when scsihw is unset or starts with "lsi",
# 256 otherwise). Returns 1 when the controller is present or could be
# plugged, undef when plugging it failed.
sub qemu_findorcreatescsihw {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $is_lsi = !($conf->{scsihw} && ($conf->{scsihw} !~ m/^lsi/));
    my $maxdev = $is_lsi ? 7 : 256;

    my $controller = int($device->{index} / $maxdev);
    my $scsihwid = "scsihw$controller";

    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$scsihwid});

    return vm_deviceplug($storecfg, $conf, $vmid, $scsihwid) ? 1 : undef;
}
3080
40f28a9f
AD
# Make sure the PCI bridge that $device sits on exists in the running VM.
#
# print_pci_addr records the bus of $device in a scratch hash; when that
# bus is 1 or higher the bridge "pci.<bus>" is plugged unless it is already
# listed. Returns nothing when no bridge is required, 1 when the bridge is
# present or was plugged, undef when plugging it failed.
sub qemu_bridgeadd {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $bridges = {};
    print_pci_addr($device, $bridges);

    # last key recorded (undef when the device has no known address)
    my $bridgeid = (keys %$bridges)[-1];

    return if !$bridgeid || $bridgeid < 1;

    my $bridge = "pci.$bridgeid";
    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$bridge});

    return vm_deviceplug($storecfg, $conf, $vmid, $bridge) ? 1 : undef;
}
3100
2630d2a9
DA
# Send a QMP 'netdev_add' for network device $deviceid.
#
# The "key=value,..." string from print_netdev_full is split on '=' and ','
# into the argument hash. Always returns 1 (errors surface as exceptions
# from vm_mon_cmd).
sub qemu_netdevadd {
    my ($vmid, $conf, $device, $deviceid) = @_;

    my $netdev_spec = print_netdev_full($vmid, $conf, $device, $deviceid);
    my %options = split(/[=,]/, $netdev_spec);

    vm_mon_cmd($vmid, "netdev_add", %options);

    return 1;
}
3110
# Send a QMP 'netdev_del' for $deviceid. Always returns 1 (errors surface
# as exceptions from vm_mon_cmd).
sub qemu_netdevdel {
    my ($vmid, $deviceid) = @_;

    my @args = (id => $deviceid);
    vm_mon_cmd($vmid, "netdev_del", @args);

    return 1;
}
3117
838776ab
AD
# Raise the number of online cores of a running VM to $cores.
#
# Dies when $cores is unset or exceeds $conf->{maxcpus}. Returns without
# doing anything when the VM is not running. For a running VM it dies when
# 'cores' or 'maxcpus' is missing from $conf and raises a parameter
# exception when $cores is lower than the configured value (no unplug) or
# when the number of CPUs reported by 'query-cpus' differs from the
# configuration. Otherwise it issues one 'cpu-add' per missing core.
sub qemu_cpu_hotplug {
    my ($vmid, $conf, $cores) = @_;

    die "new cores config is not defined" if !$cores;
    die "you can't add more cores than maxcpus"
        if $conf->{maxcpus} && ($cores > $conf->{maxcpus});
    return if !check_running($vmid);

    # plain assignment: 'my $x = ... if COND' has undefined behaviour in
    # Perl, and a false or missing value is rejected right below anyway
    my $currentcores = $conf->{cores};
    die "current cores is not defined" if !$currentcores;
    die "maxcpus is not defined" if !$conf->{maxcpus};
    raise_param_exc({ 'cores' => "online cpu unplug is not yet possible" })
        if($cores < $currentcores);

    my $currentrunningcores = vm_mon_cmd($vmid, "query-cpus");
    raise_param_exc({ 'cores' => "cores number if running vm is different than configuration" })
        if scalar (@{$currentrunningcores}) != $currentcores;

    # cpu ids are zero based, so the first new cpu has id $currentcores
    for(my $i = $currentcores; $i < $cores; $i++) {
        vm_mon_cmd($vmid, "cpu-add", id => int($i));
    }
}
3140
affd2f88
AD
# Apply I/O throttling limits to block device $deviceid of a running VM via
# QMP 'block_set_io_throttle'. Does nothing when the VM is not running.
# All six limits are passed through int().
sub qemu_block_set_io_throttle {
    my ($vmid, $deviceid, $bps, $bps_rd, $bps_wr, $iops, $iops_rd, $iops_wr) = @_;

    return if !check_running($vmid) ;

    my @limits = (
        bps     => int($bps),
        bps_rd  => int($bps_rd),
        bps_wr  => int($bps_wr),
        iops    => int($iops),
        iops_rd => int($iops_rd),
        iops_wr => int($iops_wr),
    );

    return vm_mon_cmd($vmid, "block_set_io_throttle", device => $deviceid, @limits);
}
3149
# old code, only used to shutdown old VM after update
#
# Read from $fh until a chunk ends with the "(qemu) " prompt or EOF is
# reached, waiting at most $timeout seconds for each chunk. Returns the
# collected text without the prompt. Dies with "monitor read timeout" when
# no data arrives in time, and with the system error when sysread fails.
sub __read_avail {
    my ($fh, $timeout) = @_;

    my $selector = IO::Select->new();
    $selector->add($fh);

    my $collected = '';
    my $chunk;

    my @ready;
    while (scalar (@ready = $selector->can_read($timeout))) {
        my $nread = $fh->sysread($chunk, 8192);

        die "$!\n" if !defined($nread);
        last if !$nread;    # EOF

        if ($chunk =~ /^(.*)\(qemu\) $/s) {
            # prompt seen: keep everything in front of it and stop
            $collected .= $1;
            last;
        }

        $collected .= $chunk;
    }

    # an empty @ready means can_read() gave up waiting
    die "monitor read timeout\n" if !scalar(@ready);

    return $collected;
}
3182
# old code, only used to shutdown old VM after update
#
# Send $cmdstr to the human monitor socket "$vmid.mon" of the VM and return
# the reply text (echo line removed, newline terminated). For 'q'/'quit' no
# reply is read and undef is returned. Any failure is logged to syslog and
# re-thrown.
sub vm_monitor_command {
    my ($vmid, $cmdstr, $nocheck) = @_;

    my $res;

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);

        my $sname = "${var_run_tmpdir}/$vmid.mon";

        my $sock = IO::Socket::UNIX->new( Peer => $sname ) ||
            die "unable to connect to VM $vmid socket - $!\n";

        # hack: migrate sometime blocks the monitor (when migrate_downtime
        # is set)
        my $is_migrate = ($cmdstr =~ m/^(info\s+migrate|migrate\s)/);
        my $timeout = $is_migrate ? 60*60 : 3;

        # read banner;
        my $banner = __read_avail($sock, $timeout);
        die "got unexpected qemu monitor banner\n"
            if $banner !~ m/^QEMU\s+(\S+)\s+monitor\s/;

        my $selector = IO::Select->new();
        $selector->add($sock);

        my @writable = $selector->can_write($timeout);
        die "monitor write error - timeout" if !scalar(@writable);

        my $fullcmd = "$cmdstr\r";

        # syslog('info', "VM $vmid monitor command: $cmdstr");

        my $written = $sock->syswrite($fullcmd);
        if (!$written || ($written != length($fullcmd))) {
            die "monitor write error - $!";
        }

        # the VM goes away on quit, there is no reply to wait for
        return if ($cmdstr eq 'q') || ($cmdstr eq 'quit');

        if ($is_migrate) {
            $timeout = 60*60; # 1 hour
        } elsif ($cmdstr =~ m/^(eject|change)/) {
            $timeout = 60; # note: cdrom mount command is slow
        } else {
            $timeout = 20;
        }

        if ($res = __read_avail($sock, $timeout)) {
            my @lines = split("\r?\n", $res);

            shift @lines if $lines[0] !~ m/^unknown command/; # skip echo

            $res = join("\n", @lines) . "\n";
        }
    };

    if (my $err = $@) {
        syslog("err", "VM $vmid monitor command failed - $err");
        die $err;
    }

    return $res;
}
3257
c1175c92
AD
# Resize volume $volid to $size on the storage layer and, when the VM is
# running, tell qemu about the new size via QMP 'block_resize'.
# Returns nothing when the storage resize reports failure or the VM is not
# running.
sub qemu_block_resize {
    my ($vmid, $deviceid, $storecfg, $volid, $size) = @_;

    my $running = check_running($vmid);

    # storage first; the monitor is only involved for a running VM
    return unless PVE::Storage::volume_resize($storecfg, $volid, $size, $running) && $running;

    return vm_mon_cmd($vmid, "block_resize", device => $deviceid, size => int($size));
}
3270
1ab0057c
AD
# Create snapshot $snap of volume $volid on the storage layer and, when the
# VM is running, issue QMP 'snapshot-drive' for $deviceid.
# Returns nothing when the storage call reports failure or the VM is not
# running.
sub qemu_volume_snapshot {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $running = check_running($vmid);

    # storage first; the monitor is only involved for a running VM
    return unless PVE::Storage::volume_snapshot($storecfg, $volid, $snap, $running) && $running;

    return vm_mon_cmd($vmid, "snapshot-drive", device => $deviceid, name => $snap);
}
3283
fc46aff9
AD
# Delete snapshot $snap of volume $volid on the storage layer and, when the
# VM is running, issue QMP 'delete-drive-snapshot' for $deviceid.
# Returns nothing when the storage call reports failure or the VM is not
# running.
sub qemu_volume_snapshot_delete {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $running = check_running($vmid);

    # storage first; the monitor is only involved for a running VM
    return unless PVE::Storage::volume_snapshot_delete($storecfg, $volid, $snap, $running) && $running;

    return vm_mon_cmd($vmid, "delete-drive-snapshot", device => $deviceid, name => $snap);
}
3295
3d5149c9
AD
# Placeholder: freezing the guest file systems is not implemented yet.
sub qga_freezefs {
    my ($vmid) = @_;

    # TODO: implement the call to qemu-ga
}
3301
e8f3f18e
AD
# Placeholder: thawing the guest file systems is not implemented yet.
sub qga_unfreezefs {
    my ($vmid) = @_;

    # TODO: implement the call to qemu-ga
}
3307
264e519f
DM
# Set the migration capabilities of VM $vmid.
#
# Every capability reported by 'query-migrate-capabilities' is sent back
# through 'migrate-set-capabilities' with an explicit state: true for the
# ones switched on in the table below, false for everything else.
sub set_migration_caps {
    my ($vmid) = @_;

    my %want_enabled = (
        "auto-converge" => 1,
        "xbzrle" => 0,
        "x-rdma-pin-all" => 0,
        "zero-blocks" => 0,
    );

    my $supported = vm_mon_cmd_nocheck($vmid, "query-migrate-capabilities");

    my @settings;
    for my $entry (@$supported) {
        my $name = $entry->{capability};
        push @settings, {
            capability => $name,
            state => $want_enabled{$name} ? JSON::true : JSON::false,
        };
    }

    return vm_mon_cmd_nocheck($vmid, "migrate-set-capabilities", capabilities => \@settings);
}
a89fded1 3331
# Start VM $vmid while holding its config lock.
#
# $statefile:    'tcp' makes qemu listen for an incoming migration (and
#                start paused); any other true value is passed to
#                '-loadstate'
# $skiplock:     do not call check_lock on the config
# $migratedfrom: passed to load_config/check_running and exported to the
#                environment as PVE_MIGRATED_FROM
# $paused:       start with '-S' when no state file is given
# $forcemachine: passed on to config_to_command
# $spice_ticket: spice password set after an incoming migration start
#
# Dies when the VM is a template, is already running, a host PCI device
# cannot be prepared, or the qemu command fails.
sub vm_start {
    my ($storecfg, $vmid, $statefile, $skiplock, $migratedfrom, $paused, $forcemachine, $spice_ticket) = @_;

    lock_config($vmid, sub {
        my $conf = load_config($vmid, $migratedfrom);

        die "you can't start a vm if it's a template\n" if is_template($conf);

        check_lock($conf) if !$skiplock;

        die "VM $vmid already running\n" if check_running($vmid, undef, $migratedfrom);

        my $defaults = load_defaults();

        # set environment variable useful inside network script
        $ENV{PVE_MIGRATED_FROM} = $migratedfrom if $migratedfrom;

        my ($cmd, $vollist, $spice_port) = config_to_command($storecfg, $vmid, $conf, $defaults, $forcemachine);

        my $migrate_uri;
        if ($statefile && $statefile eq 'tcp') {
            # incoming migration: listen on the next free migration port
            my $localip = "localhost";
            my $datacenterconf = PVE::Cluster::cfs_read_file('datacenter.cfg');
            if ($datacenterconf->{migration_unsecure}) {
                my $nodename = PVE::INotify::nodename();
                $localip = PVE::Cluster::remote_node_ip($nodename, 1);
            }
            my $migrate_port = PVE::Tools::next_migrate_port();
            $migrate_uri = "tcp:${localip}:${migrate_port}";
            push @$cmd, '-incoming', $migrate_uri, '-S';
        } elsif ($statefile) {
            push @$cmd, '-loadstate', $statefile;
        } elsif ($paused) {
            push @$cmd, '-S';
        }

        # host pci devices
        for my $i (0 .. $MAX_HOSTPCI_DEVICES - 1) {
            my $d = parse_hostpci($conf->{"hostpci$i"});
            next if !$d;

            my $use_vfio = $d->{driver} && $d->{driver} eq "vfio";

            foreach my $pcidevice (@{ $d->{pciid} }) {
                my $pciid = $pcidevice->{id}.".".$pcidevice->{function};

                my $info = pci_device_info("0000:$pciid");
                die "IOMMU not present\n" if !check_iommu_support();
                die "no pci device info for device '$pciid'\n" if !$info;

                if ($use_vfio) {
                    die "can't unbind/bind pci group to vfio '$pciid'\n" if !pci_dev_group_bind_to_vfio($pciid);
                } else {
                    die "can't unbind/bind to stub pci device '$pciid'\n" if !pci_dev_bind_to_stub($info);
                }

                die "can't reset pci device '$pciid'\n" if $info->{has_fl_reset} and !pci_dev_reset($info);
            }
        }

        PVE::Storage::activate_volumes($storecfg, $vollist);

        # no timeout when a state file or incoming migration is involved
        my $start_timeout = $statefile ? undef : 30;
        eval { run_command($cmd, timeout => $start_timeout, umask => 0077); };
        if (my $err = $@) {
            die "start failed: $err";
        }

        print "migration listens on $migrate_uri\n" if $migrate_uri;

        # a VM restored from a state file has to be continued explicitly
        if ($statefile && $statefile ne 'tcp') {
            eval { vm_mon_cmd_nocheck($vmid, "cont"); };
            warn $@ if $@;
        }

        if ($migratedfrom) {

            eval {
                PVE::QemuServer::set_migration_caps($vmid);
            };
            warn $@ if $@;

            if ($spice_port) {
                print "spice listens on port $spice_port\n";
                if ($spice_ticket) {
                    PVE::QemuServer::vm_mon_cmd_nocheck($vmid, "set_password", protocol => 'spice', password => $spice_ticket);
                    PVE::QemuServer::vm_mon_cmd_nocheck($vmid, "expire_password", protocol => 'spice', time => "+30");
                }
            }

        } else {

            # balloon setup, skipped when 'balloon' is explicitly set to 0
            if (!$statefile && (!defined($conf->{balloon}) || $conf->{balloon})) {
                vm_mon_cmd_nocheck($vmid, "balloon", value => $conf->{balloon}*1024*1024)
                    if $conf->{balloon};
                vm_mon_cmd_nocheck($vmid, 'qom-set',
                                   path => "machine/peripheral/balloon0",
                                   property => "guest-stats-polling-interval",
                                   value => 2);
            }
        }
    });
}
3436
0eedc444
AD
# Run QMP command $execute with the named arguments %params on VM $vmid and
# return the result of vm_qmp_command.
sub vm_mon_cmd {
    my ($vmid, $execute, %params) = @_;

    return vm_qmp_command($vmid, { execute => $execute, arguments => \%params });
}
3443
# Same as vm_mon_cmd, but passes a true $nocheck flag to vm_qmp_command.
sub vm_mon_cmd_nocheck {
    my ($vmid, $execute, %params) = @_;

    return vm_qmp_command($vmid, { execute => $execute, arguments => \%params }, 1);
}
3450
# Execute the QMP command structure $cmd ({ execute => ..., arguments =>
# {...} }) on VM $vmid and return the reply.
#
# A true 'timeout' entry in the arguments is removed from $cmd and passed
# to the QMP client as timeout instead. When only the old "$vmid.mon"
# monitor socket exists, argument-less commands are forwarded to
# vm_monitor_command (its reply is not returned). Errors are logged to
# syslog and re-thrown.
sub vm_qmp_command {
    my ($vmid, $cmd, $nocheck) = @_;

    my $res;

    my $timeout;
    my $arguments = $cmd->{arguments};
    if ($arguments && $arguments->{timeout}) {
        $timeout = delete $arguments->{timeout};
    }

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);

        my $sname = qmp_socket($vmid);
        if (-e $sname) {
            my $qmpclient = PVE::QMPClient->new();

            $res = $qmpclient->cmd($vmid, $cmd, $timeout);
        } elsif (-e "${var_run_tmpdir}/$vmid.mon") {
            # old style human monitor: plain command names only
            die "can't execute complex command on old monitor - stop/start your vm to fix the problem\n"
                if scalar(%{$cmd->{arguments}});
            vm_monitor_command($vmid, $cmd->{execute}, $nocheck);
        } else {
            die "unable to open monitor socket\n";
        }
    };
    my $err = $@;
    if ($err) {
        syslog("err", "VM $vmid qmp command failed - $err");
        die $err;
    }

    return $res;
}
3484
9df5cbcc
DM
# Run the human monitor command line $cmdline through the QMP command
# 'human-monitor-command' and return the result of vm_qmp_command.
sub vm_human_monitor_command {
    my ($vmid, $cmdline) = @_;

    my %request = (
        execute => 'human-monitor-command',
        arguments => { 'command-line' => $cmdline},
    );

    return vm_qmp_command($vmid, \%request);
}
3497
1e3baf05
DM
# Return the command line that config_to_command builds for VM $vmid, as
# one string with the arguments joined by single spaces.
sub vm_commandline {
    my ($storecfg, $vmid) = @_;

    my $conf = load_config($vmid);
    my $defaults = load_defaults();

    # scalar assignment on purpose: only the command array is wanted
    my $argv = config_to_command($storecfg, $vmid, $conf, $defaults);

    return join(' ', @$argv);
}
3509
# Reset VM $vmid (QMP 'system_reset') while holding its config lock.
# check_lock is applied to the config unless $skiplock is set.
sub vm_reset {
    my ($vmid, $skiplock) = @_;

    my $do_reset = sub {
        my $conf = load_config($vmid);

        check_lock($conf) unless $skiplock;

        vm_mon_cmd($vmid, "system_reset");
    };

    return lock_config($vmid, $do_reset);
}
3522
# Collect the storage volume IDs referenced by $conf.
#
# Absolute paths (starting with '/') and IDs for which
# PVE::Storage::parse_volume_id yields no storage ID are skipped.
# Returns an array reference.
sub get_vm_volumes {
    my ($conf) = @_;

    my @volids;

    foreach_volid($conf, sub {
        my ($volid, $is_cdrom) = @_;

        return if $volid =~ m|^/|;

        my ($sid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        push @volids, $volid;
    });

    return \@volids;
}
3540
# Clean up after a stopped VM: remove the fairsched group, deactivate the
# VM volumes (unless $keepActive is set) and unlink the mon/qmp/pid/vnc/qga
# files of the VM. Errors are only reported as warnings.
sub vm_stop_cleanup {
    my ($storecfg, $vmid, $conf, $keepActive) = @_;

    eval {
        fairsched_rmnod($vmid); # try to destroy group

        unless ($keepActive) {
            my $vollist = get_vm_volumes($conf);
            PVE::Storage::deactivate_volumes($storecfg, $vollist);
        }

        for my $ext (qw(mon qmp pid vnc qga)) {
            unlink "/var/run/qemu-server/${vmid}.$ext";
        }
    };
    warn $@ if $@; # avoid errors - just warn
}
3558
# Stop VM $vmid.
#
# Note: with $nocheck set the VM configuration is not loaded (and no lock
# check or cleanup based on it is done). We need that when migrating VMs to
# other nodes (files already moved).
# Note: we set $keepActive in vzdump stop mode - volumes need to stay active
#
# $shutdown selects 'system_powerdown' instead of 'quit'. $force defaults
# to 1 for a plain stop; with $force the process gets SIGTERM when the
# monitor command fails or the timeout expires, and SIGKILL when it is
# still running ten seconds later. Without $force those situations die.
# $timeout defaults to the 'down' value of the startup option (shutdown
# only) and otherwise to 60 seconds.
sub vm_stop {
    my ($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive, $migratedfrom) = @_;

    $force = 1 if !defined($force) && !$shutdown;

    if ($migratedfrom){
        # no config lock here: just terminate the process and clean up
        my $pid = check_running($vmid, $nocheck, $migratedfrom);
        kill 15, $pid if $pid;
        my $conf = load_config($vmid, $migratedfrom);
        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive);
        return;
    }

    lock_config($vmid, sub {

        my $pid = check_running($vmid, $nocheck);
        return if !$pid;

        my $conf;
        if (!$nocheck) {
            $conf = load_config($vmid);
            check_lock($conf) if !$skiplock;
            if (!defined($timeout) && $shutdown && $conf->{startup}) {
                my $opts = parse_startup($conf->{startup});
                $timeout = $opts->{down} if $opts->{down};
            }
        }

        $timeout = 60 if !defined($timeout);

        # poll once per second while the VM is running; returns the number
        # of seconds waited, which equals $limit when the wait timed out
        my $wait_for_exit = sub {
            my ($limit) = @_;
            my $waited = 0;
            while (($waited < $limit) && check_running($vmid, $nocheck)) {
                $waited++;
                sleep 1;
            }
            return $waited;
        };

        eval {
            my $send = $nocheck ? \&vm_mon_cmd_nocheck : \&vm_mon_cmd;
            $send->($vmid, $shutdown ? "system_powerdown" : "quit");
        };
        my $err = $@;

        if ($err) {
            die "VM quit/powerdown failed\n" if !$force;
            warn "VM quit/powerdown failed - terminating now with SIGTERM\n";
            kill 15, $pid;
        } else {
            if ($wait_for_exit->($timeout) < $timeout) {
                # the VM went away in time
                vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
                return;
            }
            die "VM quit/powerdown failed - got timeout\n" if !$force;
            warn "VM still running - terminating now with SIGTERM\n";
            kill 15, $pid;
        }

        # wait again
        $timeout = 10;

        if ($wait_for_exit->($timeout) >= $timeout) {
            warn "VM still running - terminating now with SIGKILL\n";
            kill 9, $pid;
            sleep 1;
        }

        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
    });
}
3647
# Pause VM $vmid (QMP 'stop') while holding its config lock.
# check_lock is skipped when $skiplock is set or the config carries the
# 'backup' lock.
sub vm_suspend {
    my ($vmid, $skiplock) = @_;

    lock_config($vmid, sub {

        my $conf = load_config($vmid);

        my $backup_locked = $conf->{lock} && $conf->{lock} eq 'backup';
        check_lock($conf) unless $skiplock || $backup_locked;

        vm_mon_cmd($vmid, "stop");
    });
}
3660
# Resume VM $vmid (QMP 'cont') while holding its config lock.
# check_lock is skipped when $skiplock is set or the config carries the
# 'backup' lock.
sub vm_resume {
    my ($vmid, $skiplock) = @_;

    lock_config($vmid, sub {

        my $conf = load_config($vmid);

        my $backup_locked = $conf->{lock} && $conf->{lock} eq 'backup';
        check_lock($conf) unless $skiplock || $backup_locked;

        vm_mon_cmd($vmid, "cont");
    });
}
3673
5fdbe4f0
DM
# Send key $key to VM $vmid while holding its config lock.
# The configuration is loaded but not consulted; $skiplock is accepted but
# not used.
sub vm_sendkey {
    my ($vmid, $skiplock, $key) = @_;

    my $send_key = sub {
        my $conf = load_config($vmid);

        # there is no qmp command, so we use the human monitor command
        vm_human_monitor_command($vmid, "sendkey $key");
    };

    return lock_config($vmid, $send_key);
}
3685
# Destroy VM $vmid while holding its config lock.
# check_lock is applied unless $skiplock is set; dies when the VM is still
# running.
sub vm_destroy {
    my ($storecfg, $vmid, $skiplock) = @_;

    lock_config($vmid, sub {

        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        die "VM $vmid is running - destroy failed\n" if check_running($vmid);

        fairsched_rmnod($vmid); # try to destroy group
        destroy_vm($storecfg, $vmid);
    });
}
3703
1e3baf05
DM
3704# pci helpers
3705
# Write $buf to $filename (opened for writing, truncating).
#
# Returns undef when the file cannot be opened, 1 when the data was written
# and the file closed without error, 0 otherwise.
sub file_write {
    my ($filename, $buf) = @_;

    my $fh = IO::File->new($filename, "w");
    return undef if !$fh;

    # Unbuffered write: with print() the data only reaches the kernel when
    # the handle is flushed on close, so a write rejected by the kernel
    # (e.g. by a sysfs attribute) was reported as success.
    my $written = syswrite($fh, $buf);

    my $closed = $fh->close();

    return (defined($written) && $closed) ? 1 : 0;
}
3718
# Read basic information about PCI device $name ("dddd:bb:ss.f", lower case
# hex) from sysfs.
#
# Returns undef when the name is malformed, the 'irq' entry is not a plain
# number, or the 'vendor'/'device' entries do not start with "0x".
# Otherwise returns a hash reference with name, vendor and product (without
# the "0x" prefix), domain, bus, slot, func, irq and has_fl_reset (true
# when the device has a 'reset' file).
sub pci_device_info {
    my ($name) = @_;

    return undef if $name !~ m/^([a-f0-9]{4}):([a-f0-9]{2}):([a-f0-9]{2})\.([a-f0-9])$/;
    my ($domain, $bus, $slot, $func) = ($1, $2, $3, $4);

    my $devdir = "$pcisysfs/devices/$name";

    my $irq = file_read_firstline("$devdir/irq");
    return undef if !defined($irq) || $irq !~ m/^\d+$/;

    # the substitutions strip the "0x" prefix and double as format check
    my $vendor = file_read_firstline("$devdir/vendor");
    return undef if !defined($vendor) || $vendor !~ s/^0x//;

    my $product = file_read_firstline("$devdir/device");
    return undef if !defined($product) || $product !~ s/^0x//;

    return {
        name => $name,
        vendor => $vendor,
        product => $product,
        domain => $domain,
        bus => $bus,
        slot => $slot,
        func => $func,
        irq => $irq,
        has_fl_reset => -f "$devdir/reset" || 0,
    };
}
3750
# Trigger a reset of PCI device $dev (hash with a 'name' entry) by writing
# "1" to its sysfs 'reset' file. Returns the result of file_write.
sub pci_dev_reset {
    my ($dev) = @_;

    my $reset_file = "$pcisysfs/devices/$dev->{name}/reset";

    return file_write($reset_file, "1");
}
3760
# Bind PCI device $dev (hash with name, vendor, product) to the pci-stub
# driver through sysfs.
#
# Returns 1 when the device is already bound, undef when one of the sysfs
# writes fails, and otherwise whether the device directory shows up below
# the pci-stub driver.
sub pci_dev_bind_to_stub {
    my ($dev) = @_;

    my $name = $dev->{name};

    my $stub_dir = "$pcisysfs/drivers/pci-stub";
    my $bound_dir = "$stub_dir/$name";
    return 1 if -d $bound_dir;

    # announce the vendor/product pair to the stub driver
    my $ids = "$dev->{vendor} $dev->{product}";
    return undef if !file_write("$stub_dir/new_id", $ids);

    # a failed unbind only counts when an unbind file exists, i.e. the
    # device currently has a driver
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    # bind explicitly unless the steps above already bound the device
    return undef if !-d $bound_dir && !file_write("$stub_dir/bind", $name);

    return -d $bound_dir;
}
3784
000fc0a2
SP
# Bind PCI device $dev (hash with name, vendor, product) to the vfio-pci
# driver through sysfs, loading the module with modprobe when the driver
# directory is missing.
#
# Dies when the driver directory is still missing after modprobe. Returns 1
# when the device is already bound, undef when one of the sysfs writes
# fails, and otherwise whether the device directory shows up below the
# vfio-pci driver.
sub pci_dev_bind_to_vfio {
    my ($dev) = @_;

    my $name = $dev->{name};

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null") if !-d $vfio_basedir;
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    my $bound_dir = "$vfio_basedir/$name";
    return 1 if -d $bound_dir;

    # announce the vendor/product pair to the vfio driver
    my $ids = "$dev->{vendor} $dev->{product}";
    return undef if !file_write("$vfio_basedir/new_id", $ids);

    # a failed unbind only counts when an unbind file exists, i.e. the
    # device currently has a driver
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    # bind explicitly unless the steps above already bound the device
    return undef if !-d $bound_dir && !file_write("$vfio_basedir/bind", $name);

    return -d $bound_dir;
}
3815
# Bind every device in the IOMMU group of PCI device $pciid ("bb:ss.f",
# domain 0000 is assumed) to the vfio-pci driver.
#
# Loads the vfio-pci module with modprobe when its driver directory is
# missing. Dies when the module cannot be found, the IOMMU group cannot be
# listed, a group member has an invalid ID or no readable device info, or
# binding a member fails. Returns 1 on success.
sub pci_dev_group_bind_to_vfio {
    my ($pciid) = @_;

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    if (!-d $vfio_basedir) {
        system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null");
    }
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    # get IOMMU group devices
    opendir(my $D, "$pcisysfs/devices/0000:$pciid/iommu_group/devices/") || die "Cannot open iommu_group: $!\n";
    my @devs = grep /^0000:/, readdir($D);
    closedir($D);

    foreach my $member (@devs) {
        $member =~ m/^([:\.\da-f]+)$/ or die "PCI ID $member not valid!\n";
        my $info = pci_device_info($1);

        # Without device info the bind helper would test the driver
        # directory itself and report success without binding anything.
        die "no pci device info for device '$member'\n" if !$info;

        pci_dev_bind_to_vfio($info) || die "Cannot bind $member to vfio\n";
    }

    return 1;
}
3839
# Return the ",bus=pci.N,addr=0xNN" suffix for the fixed PCI slot assigned
# to device $id, or an empty string when $id has no assigned slot.
# When a $bridges hash reference is passed, the bus number of a known
# device is recorded in it as a key with value 1.
sub print_pci_addr {
    my ($id, $bridges) = @_;

    # device id => [ bus, addr ]
    my %slot_of = (
        piix3 => [0, 1],
        #addr2 : first videocard
        balloon0 => [0, 3],
        watchdog => [0, 4],
        scsihw0 => [0, 5],
        scsihw1 => [0, 6],
        ahci0 => [0, 7],
        qga0 => [0, 8],
        spice => [0, 9],
        hostpci0 => [0, 16],
        hostpci1 => [0, 17],
        vga1 => [0, 24],
        vga2 => [0, 25],
        vga3 => [0, 26],
        hostpci2 => [0, 27],
        hostpci3 => [0, 28],
        #addr29 : usb-host (pve-usb.cfg)
        'pci.1' => [0, 30],
        'pci.2' => [0, 31],
    );

    # virtio0-5 and net0-5 sit on bus 0, the remaining ones on the bridges
    $slot_of{"virtio$_"} = [0, 10 + $_] for 0 .. 5;
    $slot_of{"net$_"} = [0, 18 + $_] for 0 .. 5;
    $slot_of{"net$_"} = [1, $_ - 5] for 6 .. 31;
    $slot_of{"virtio$_"} = [2, $_ - 5] for 6 .. 15;

    my $slot = $slot_of{$id};
    return '' if !$slot;

    my ($bus, $addr) = @$slot;
    $bridges->{$bus} = 1 if $bridges;

    return sprintf(",bus=pci.%s,addr=0x%x", $bus, $addr);
}
3923
2e3b7e2a
AD
# Return the ",bus=...,addr=..." device-option suffix for a passthrough
# device that is plugged into one of the ich9 PCIe root ports.
#
# $id - device id (only 'hostpci0' .. 'hostpci3' have a slot assigned)
#
# Returns an empty string for any id without a fixed slot.
sub print_pcie_addr {
    my ($id) = @_;

    # fixed id => root port assignment
    my $pcie_slots = {
        hostpci0 => { bus => "ich9-pcie-port-1", addr => 0 },
        hostpci1 => { bus => "ich9-pcie-port-2", addr => 0 },
        hostpci2 => { bus => "ich9-pcie-port-3", addr => 0 },
        hostpci3 => { bus => "ich9-pcie-port-4", addr => 0 },
    };

    my $slot = $pcie_slots->{$id};
    return '' if !$slot;
    return '' if !defined($slot->{bus}) || !defined($slot->{addr});

    return sprintf(",bus=%s,addr=0x%x", $slot->{bus}, $slot->{addr});
}
3943
3e16d5fc
DM
# vzdump restore implementation
3945
# Return the name of the first member of a tar archive.
#
# $archive - path of an existing regular file
#
# Dies if the file does not exist, if 'tar' cannot be started, or if the
# listing is empty.
sub tar_archive_read_firstfile {
    my $archive = shift;

    die "ERROR: file '$archive' does not exist\n" if ! -f $archive;

    # try to detect archive type first
    # List-form pipe open: the archive name is passed to tar as a plain
    # argument and never parsed by a shell, so quotes or other shell
    # metacharacters in the file name are harmless.
    my $pid = open(my $fh, '-|', 'tar', 'tf', $archive) ||
        die "unable to open file '$archive'\n";
    my $firstfile = <$fh>;
    # we only need the first line - stop tar instead of listing everything
    kill 15, $pid;
    close($fh);

    die "ERROR: archive contaions no data\n" if !$firstfile;
    chomp $firstfile;

    return $firstfile;
}
3963
ed221350
DM
# Remove all volumes that are recorded in a restore stat file.
#
# $storecfg - storage configuration, passed through to
#             PVE::Storage::vdisk_free
# $statfile - file with lines ending in "vzdump:<name>:<volid>"
#
# Absolute paths are unlinked directly, everything else is freed through
# the storage layer. This is best effort: each failure is reported on
# STDERR and the remaining entries are still processed. A stat file that
# cannot be opened is silently ignored.
sub tar_restore_cleanup {
    my ($storecfg, $statfile) = @_;

    print STDERR "starting cleanup\n";

    if (my $fd = IO::File->new($statfile, "r")) {
        while (defined(my $line = <$fd>)) {
            if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                my $volid = $2;
                eval {
                    if ($volid =~ m|^/|) {
                        # parentheses are required: without them '||' binds
                        # to $volid and a failed unlink goes unnoticed
                        unlink($volid) || die "unlink failed - $!\n";
                    } else {
                        PVE::Storage::vdisk_free($storecfg, $volid);
                    }
                    print STDERR "temporary volume '$volid' sucessfuly removed\n";
                };
                print STDERR "unable to cleanup '$volid' - $@" if $@;
            } else {
                print STDERR "unable to parse line in statfile - $line";
            }
        }
        $fd->close();
    }
}
3989
# Restore a VM from a backup archive, dispatching on the archive format.
#
# $archive - archive file name
# $vmid    - ID of the VM to restore
# $user    - user on whose behalf the restore runs
# $opts    - option hash; $opts->{format} ('tar' or 'vma') overrides the
#            format guessed from the file name
#
# The compression method is always derived from the file name. If the
# name has no known extension and no format is given, 'vma' is assumed.
sub restore_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    my $format = $opts->{format};
    my $comp;

    # guess format and compression from the file extension
    if ($archive =~ m/\.tgz$/ || $archive =~ m/\.tar\.gz$/) {
        $format = 'tar' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.tar$/) {
        $format = 'tar' if !$format;
    } elsif ($archive =~ m/\.tar\.lzo$/) {
        # dots are escaped so that only a real '.tar.lzo' suffix matches
        $format = 'tar' if !$format;
        $comp = 'lzop';
    } elsif ($archive =~ m/\.vma$/) {
        $format = 'vma' if !$format;
    } elsif ($archive =~ m/\.vma\.gz$/) {
        $format = 'vma' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.vma\.lzo$/) {
        $format = 'vma' if !$format;
        $comp = 'lzop';
    } else {
        $format = 'vma' if !$format; # default
    }

    # $comp is only passed on to the vma restore; the tar restore is
    # called without it
    if ($format eq 'tar') {
        return restore_tar_archive($archive, $vmid, $user, $opts);
    } else {
        return restore_vma_archive($archive, $vmid, $user, $opts, $comp);
    }
}
4023
# Copy one line of an archived VM configuration to $outfd, rewriting it
# for the restored VM where necessary.
#
# $outfd  - output file handle of the new configuration
# $cookie - state shared between calls; $cookie->{netcount} is the index
#           used for the next converted 'vlanN' device
# $vmid   - ID of the restored VM (passed to print_drive)
# $map    - hash: drive name => newly allocated volume id
# $line   - config line, including its line terminator
# $unique - if true, replace MAC addresses by random ones
sub restore_update_config_line {
    my ($outfd, $cookie, $vmid, $map, $line, $unique) = @_;

    # lines that are never carried over into the restored config
    my @dropped = (
        qr/^\#qmdump\#/,
        qr/^\#vzdump\#/,
        qr/^lock:/,
        qr/^unused\d+:/,
        qr/^parent:/,
        qr/^template:/, # restored VM is never a template
    );
    foreach my $pattern (@dropped) {
        return if $line =~ $pattern;
    }

    if ($line =~ m/^(vlan(\d+)):\s*(\S+)\s*$/) {
        # try to convert old 1.X settings: every device listed on a
        # 'vlanN' line becomes its own 'netX' entry on bridge vmbrN
        my ($bridge_index, $ethcfg) = ($2, $3);
        foreach my $devconfig (PVE::Tools::split_list($ethcfg)) {
            my ($model, $macaddr) = split(/\=/, $devconfig);
            if (!$macaddr || $unique) {
                $macaddr = PVE::Tools::random_ether_addr();
            }
            my $netstr = print_net({
                model => $model,
                bridge => "vmbr$bridge_index",
                macaddr => $macaddr,
            });

            my $index = $cookie->{netcount}++;
            print $outfd "net$index: $netstr\n";
        }
    } elsif ($unique && $line =~ m/^(net\d+):\s*(\S+)\s*$/) {
        my ($id, $netstr) = ($1, $2);
        my $net = parse_net($netstr);
        # only replace a MAC address that is actually configured
        if ($net->{macaddr}) {
            $net->{macaddr} = PVE::Tools::random_ether_addr();
        }
        print $outfd "$id: " . print_net($net) . "\n";
    } elsif ($line =~ m/^((ide|scsi|virtio|sata)\d+):\s*(\S+)\s*$/) {
        my ($virtdev, $value) = ($1, $3);
        if ($line =~ m/backup=no/) {
            # keep the entry, but commented out
            print $outfd "#$line";
        } elsif (my $new_volid = $map->{$virtdev}) {
            my $di = parse_drive($virtdev, $value);
            delete $di->{format}; # format can change on restore
            $di->{file} = $new_volid;
            print $outfd "$virtdev: " . print_drive($vmid, $di) . "\n";
        } else {
            print $outfd $line;
        }
    } else {
        print $outfd $line;
    }
}
4074
# Collect the volumes reported by PVE::Storage::vdisk_list for a VM.
#
# $cfg  - storage configuration
# $vmid - VM ID passed to vdisk_list
#
# Returns a hash reference: volid => volume info. Each info hash gets an
# additional 'path' entry. Entries without a volid or size are skipped.
sub scan_volids {
    my ($cfg, $vmid) = @_;

    my $info = PVE::Storage::vdisk_list($cfg, undef, $vmid);

    my %by_volid;
    foreach my $volumes (values %$info) {
        foreach my $vol (@$volumes) {
            my $volid = $vol->{volid};
            next unless $volid && $vol->{size};

            # scalar assignment on purpose, so path() is called in
            # scalar context exactly as before
            my $path = PVE::Storage::path($cfg, $volid);
            $vol->{path} = $path;

            $by_volid{$volid} = $vol;
        }
    }

    return \%by_volid;
}
4091
a8e2f942
DM
# Count how often each disk path is referenced by a VM configuration.
#
# $vmid           - VM ID (not used by this function)
# $storecfg       - storage configuration
# $conf           - VM configuration
# $scan_snapshots - if true, also scan all entries of $conf->{snapshots}
# $skip_drive     - optional drive name to ignore in the current config
#                   (snapshot sections are always scanned completely)
#
# Returns a hash reference: path => number of references. CD-ROM drives,
# drives without a file and volumes on unknown storages are ignored.
sub get_used_paths {
    my ($vmid, $storecfg, $conf, $scan_snapshots, $skip_drive) = @_;

    my $used_path = {};

    my $scan_section = sub {
        my ($section, $snapname, $skip) = @_;

        foreach my $key (keys %$section) {
            next if !valid_drivename($key);
            next if $skip && $key eq $skip;

            my $drive = parse_drive($key, $section->{$key});
            next if !$drive || !$drive->{file} || drive_is_cdrom($drive);

            my $file = $drive->{file};
            my $path;
            if ($file =~ m!^/!) {
                # absolute path - use it as is
                $path = $file;
            } else {
                my ($storeid, $volname) = PVE::Storage::parse_volume_id($file, 1);
                next if !$storeid;
                my $scfg = PVE::Storage::storage_config($storecfg, $storeid, 1);
                next if !$scfg;
                $path = PVE::Storage::path($storecfg, $file, $snapname);
            }
            $used_path->{$path}++;
        }
    };

    # current config: honour $skip_drive, no snapshot name
    $scan_section->($conf, undef, $skip_drive);

    if ($scan_snapshots) {
        foreach my $snapname (keys %{$conf->{snapshots}}) {
            $scan_section->($conf->{snapshots}->{$snapname}, $snapname);
        }
    }

    return $used_path;
}
4132
91bd6c90
DM
# Synchronize a VM configuration with the volumes found on storage.
#
# $vmid       - VM ID
# $conf       - VM configuration; modified in place
# $volid_hash - hash: volid => volume info with 'size' and 'path'
#               (the structure returned by scan_volids)
#
# Three things happen:
#  - the 'size' of every non-CD-ROM drive is set from the scanned volume
#  - 'unusedX' entries pointing to a volume that is in use are removed
#  - scanned volumes that are referenced nowhere are added as unused
#    (volumes named vm-<vmid>-state-* are never added)
#
# Returns 1 if $conf was changed, undef otherwise.
sub update_disksize {
    my ($vmid, $conf, $volid_hash) = @_;

    my $changes;

    my $used = {};

    # Note: it is allowed to define multiple storages with same path (alias), so
    # we need to check both 'volid' and real 'path' (two different volid can point
    # to the same path).

    my $usedpath = {};

    # update size info
    foreach my $opt (keys %$conf) {
        next if !valid_drivename($opt);

        my $drive = parse_drive($opt, $conf->{$opt});
        my $volid = $drive->{file};
        next if !$volid;

        $used->{$volid} = 1;
        if ($volid_hash->{$volid} &&
            (my $path = $volid_hash->{$volid}->{path})) {
            $usedpath->{$path} = 1;
        }

        next if drive_is_cdrom($drive);
        next if !$volid_hash->{$volid};

        $drive->{size} = $volid_hash->{$volid}->{size};
        my $new = print_drive($vmid, $drive);
        if ($new ne $conf->{$opt}) {
            $changes = 1;
            $conf->{$opt} = $new;
        }
    }

    # remove 'unusedX' entry if volume is used
    foreach my $opt (keys %$conf) {
        next if $opt !~ m/^unused\d+$/;
        my $volid = $conf->{$opt};
        # explicit lookup instead of 'my $path = ... if COND', whose
        # behaviour is undefined when the condition is false
        my $info = $volid_hash->{$volid};
        my $path = $info ? $info->{path} : undef;
        if ($used->{$volid} || ($path && $usedpath->{$path})) {
            $changes = 1;
            delete $conf->{$opt};
        }
    }

    # add volumes that are referenced nowhere as unused
    foreach my $volid (sort keys %$volid_hash) {
        next if $volid =~ m/vm-$vmid-state-/;
        next if $used->{$volid};
        my $path = $volid_hash->{$volid}->{path};
        next if !$path; # just to be sure
        next if $usedpath->{$path};
        $changes = 1;
        add_unused_volume($conf, $volid);
        $usedpath->{$path} = 1; # avoid to add more than once (aliases)
    }

    return $changes;
}
4195
# Rescan the storages and update disk sizes and unused-volume entries in
# VM configurations.
#
# $vmid   - VM to update; if undefined, all VMs returned by config_list()
#           are processed
# $nolock - if true, update directly; otherwise each update runs inside
#           lock_config
sub rescan {
    my ($vmid, $nolock) = @_;

    my $cfg = PVE::Cluster::cfs_read_file("storage.cfg");

    my $volid_hash = scan_volids($cfg, $vmid);

    # update the configuration of a single VM
    my $sync_config = sub {
        my ($id) = @_;

        my $conf = load_config($id);

        check_lock($conf);

        # only look at volumes owned by this VM
        my $vm_volids = {};
        foreach my $volid (keys %$volid_hash) {
            my $info = $volid_hash->{$volid};
            next if !$info->{vmid} || $info->{vmid} != $id;
            $vm_volids->{$volid} = $info;
        }

        my $changes = update_disksize($id, $conf, $vm_volids);

        update_config_nolock($id, $conf, 1) if $changes;
    };

    # run the update for one VM, with or without taking the config lock
    my $run = sub {
        my ($id) = @_;
        return $nolock ? $sync_config->($id) : lock_config($id, $sync_config, $id);
    };

    if (defined($vmid)) {
        $run->($vmid);
    } else {
        my $vmlist = config_list();
        foreach my $id (keys %$vmlist) {
            $run->($id);
        }
    }
}
4238
# Restore a VM from a VMA archive.
#
# $archive - archive file name, or '-' to read from STDIN
# $vmid    - ID of the VM to restore
# $user    - user on whose behalf the restore runs; anyone but 'root@pam'
#            needs 'Datastore.AllocateSpace' on each target storage
# $opts    - option hash; 'storage', 'pool' and 'unique' are read here
# $comp    - optional compression method: 'gzip' or 'lzop'
#
# 'vma extract' is run with a fifo: once the archive header has been
# parsed, the target volumes are allocated and the device mapping is
# written to the fifo. The new configuration is written to a temporary
# file and renamed into place at the end. On error all newly allocated
# volumes are removed again and the error is rethrown.
sub restore_vma_archive {
    my ($archive, $vmid, $user, $opts, $comp) = @_;

    my $input = $archive eq '-' ? "<&STDIN" : undef;
    # the archive name ends up in a shell command line, so quote it
    my $readfrom = $archive eq '-' ? '-' : PVE::Tools::shellquote($archive);

    my $uncomp = '';
    if ($comp) {
        $readfrom = '-';
        my $qarchive = PVE::Tools::shellquote($archive);
        if ($comp eq 'gzip') {
            $uncomp = "zcat $qarchive|";
        } elsif ($comp eq 'lzop') {
            $uncomp = "lzop -d -c $qarchive|";
        } else {
            die "unknown compression method '$comp'\n";
        }
    }

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    rmtree $tmpdir;

    # disable interrupts (always do cleanups)
    # Every handler needs its own 'local': in a chained assignment only
    # the first element is localized, the others would stay changed.
    local $SIG{INT} =
        local $SIG{TERM} =
        local $SIG{QUIT} =
        local $SIG{HUP} = sub { warn "got interrupt - ignored\n"; };

    my $mapfifo = "/var/tmp/vzdumptmp$$.fifo";
    POSIX::mkfifo($mapfifo, 0600);
    my $fifofh;

    # passed to run_command as 'afterfork' callback
    my $openfifo = sub {
        open($fifofh, '>', $mapfifo) || die $!;
    };

    my $cmd = "${uncomp}vma extract -v -r $mapfifo $readfrom $tmpdir";

    my $oldtimeout;
    my $timeout = 5;

    # devname => { size, dev_id, ... }, filled from the 'DEV:' lines
    # printed by 'vma extract'
    my $devinfo = {};

    my $rpcenv = PVE::RPCEnvironment::get();

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # Note: $oldconf is undef if VM does not exists
    my $oldconf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid));

    # Allocate the target volumes, write the device map to the fifo and
    # write the new VM config to $tmpfn.
    my $print_devmap = sub {
        my $virtdev_hash = {};

        my $cfgfn = "$tmpdir/qemu-server.conf";

        # we can read the config - that is already extracted
        my $fh = IO::File->new($cfgfn, "r") ||
            die "unable to read qemu-server.conf - $!\n";

        while (defined(my $line = <$fh>)) {
            if ($line =~ m/^\#qmdump\#map:(\S+):(\S+):(\S*):(\S*):$/) {
                my ($virtdev, $devname, $storeid, $format) = ($1, $2, $3, $4);
                die "archive does not contain data for drive '$virtdev'\n"
                    if !$devinfo->{$devname};
                if (defined($opts->{storage})) {
                    $storeid = $opts->{storage} || 'local';
                } elsif (!$storeid) {
                    $storeid = 'local';
                }
                $format = 'raw' if !$format;
                $devinfo->{$devname}->{devname} = $devname;
                $devinfo->{$devname}->{virtdev} = $virtdev;
                $devinfo->{$devname}->{format} = $format;
                $devinfo->{$devname}->{storeid} = $storeid;

                # check permission on storage
                my $pool = $opts->{pool}; # todo: do we need that?
                if ($user ne 'root@pam') {
                    $rpcenv->check($user, "/storage/$storeid", ['Datastore.AllocateSpace']);
                }

                $virtdev_hash->{$virtdev} = $devinfo->{$devname};
            }
        }

        foreach my $devname (keys %$devinfo) {
            die "found no device mapping information for device '$devname'\n"
                if !$devinfo->{$devname}->{virtdev};
        }

        my $cfg = cfs_read_file('storage.cfg');

        # create empty/temp config
        if ($oldconf) {
            PVE::Tools::file_set_contents($conffile, "memory: 128\n");
            foreach_drive($oldconf, sub {
                my ($ds, $drive) = @_;

                return if drive_is_cdrom($drive);

                my $volid = $drive->{file};

                return if !$volid || $volid =~ m|^/|;

                my ($path, $owner) = PVE::Storage::path($cfg, $volid);
                return if !$path || !$owner || ($owner != $vmid);

                # Note: only delete disk we want to restore
                # other volumes will become unused
                if ($virtdev_hash->{$ds}) {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
            });
        }

        my $map = {};
        foreach my $virtdev (sort keys %$virtdev_hash) {
            my $d = $virtdev_hash->{$virtdev};
            # round up to a multiple of 1024
            my $alloc_size = int(($d->{size} + 1024 - 1)/1024);
            my $scfg = PVE::Storage::storage_config($cfg, $d->{storeid});

            # test if requested format is supported
            my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($cfg, $d->{storeid});
            my $supported = grep { $_ eq $d->{format} } @$validFormats;
            $d->{format} = $defFormat if !$supported;

            my $volid = PVE::Storage::vdisk_alloc($cfg, $d->{storeid}, $vmid,
                                                  $d->{format}, undef, $alloc_size);
            print STDERR "new volume ID is '$volid'\n";
            $d->{volid} = $volid;
            my $path = PVE::Storage::path($cfg, $volid);

            my $write_zeros = 1;
            # fixme: what other storages types initialize volumes with zero?
            if ($scfg->{type} eq 'dir' || $scfg->{type} eq 'nfs' || $scfg->{type} eq 'glusterfs' ||
                $scfg->{type} eq 'sheepdog' || $scfg->{type} eq 'rbd') {
                $write_zeros = 0;
            }

            print $fifofh "${write_zeros}:$d->{devname}=$path\n";

            print "map '$d->{devname}' to '$path' (write zeros = ${write_zeros})\n";
            $map->{$virtdev} = $volid;
        }

        # second pass over the archived config: write the new config
        $fh->seek(0, 0) || die "seek failed - $!\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined(my $line = <$fh>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $fh->close();
        $outfd->close();
    };

    eval {
        # enable interrupts
        local $SIG{INT} =
            local $SIG{TERM} =
            local $SIG{QUIT} =
            local $SIG{HUP} =
            local $SIG{PIPE} = sub { die "interrupted by signal\n"; };
        local $SIG{ALRM} = sub { die "got timeout\n"; };

        $oldtimeout = alarm($timeout);

        my $parser = sub {
            my $line = shift;

            print "$line\n";

            if ($line =~ m/^DEV:\sdev_id=(\d+)\ssize:\s(\d+)\sdevname:\s(\S+)$/) {
                my ($dev_id, $size, $devname) = ($1, $2, $3);
                $devinfo->{$devname} = { size => $size, dev_id => $dev_id };
            } elsif ($line =~ m/^CTIME: /) {
                # we correctly received the vma config, so we can disable
                # the timeout now for disk allocation (set to 10 minutes, so
                # that we always timeout if something goes wrong)
                alarm(600);
                &$print_devmap();
                print $fifofh "done\n";
                my $tmp = $oldtimeout || 0;
                $oldtimeout = undef;
                alarm($tmp);
                close($fifofh);
            }
        };

        print "restore vma archive: $cmd\n";
        run_command($cmd, input => $input, outfunc => $parser, afterfork => $openfifo);
    };
    my $err = $@;

    alarm($oldtimeout) if $oldtimeout;

    unlink $mapfifo;

    if ($err) {
        rmtree $tmpdir;
        unlink $tmpfn;

        # remove all volumes allocated so far
        my $cfg = cfs_read_file('storage.cfg');
        foreach my $devname (keys %$devinfo) {
            my $volid = $devinfo->{$devname}->{volid};
            next if !$volid;
            eval {
                if ($volid =~ m|^/|) {
                    # parentheses are required: without them '||' binds
                    # to $volid and a failed unlink goes unnoticed
                    unlink($volid) || die "unlink failed - $!\n";
                } else {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
                print STDERR "temporary volume '$volid' sucessfuly removed\n";
            };
            print STDERR "unable to cleanup '$volid' - $@" if $@;
        }
        die $err;
    }

    rmtree $tmpdir;

    rename($tmpfn, $conffile) ||
        die "unable to commit configuration file '$conffile'\n";

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
4470
# Restore a VM from a tar based vzdump archive.
#
# $archive - archive file name, or '-' to read from STDIN
# $vmid    - ID of the VM to restore
# $user    - user on whose behalf the restore runs (exported to the
#            extract command as VZDUMP_USER)
# $opts    - option hash; 'storage', 'pool', 'prealloc', 'info' and
#            'unique' are read here
#
# An existing VM with the same ID is destroyed first (its config file is
# kept). The archive is unpacked through tar's --to-command, which runs
# /usr/lib/qemu-server/qmextract for every member. The new config is
# written to a temporary file and renamed into place at the end. On error
# the volumes listed in the stat file are removed and the error is
# rethrown.
sub restore_tar_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    if ($archive ne '-') {
        my $firstfile = tar_archive_read_firstfile($archive);
        die "ERROR: file '$archive' dos not lock like a QemuServer vzdump backup\n"
            if $firstfile ne 'qemu-server.conf';
    }

    my $storecfg = cfs_read_file('storage.cfg');

    # destroy existing data - keep empty config
    my $vmcfgfn = PVE::QemuServer::config_file($vmid);
    destroy_vm($storecfg, $vmid, 1) if -f $vmcfgfn;

    my $tocmd = "/usr/lib/qemu-server/qmextract";

    $tocmd .= " --storage " . PVE::Tools::shellquote($opts->{storage}) if $opts->{storage};
    $tocmd .= " --pool " . PVE::Tools::shellquote($opts->{pool}) if $opts->{pool};
    $tocmd .= ' --prealloc' if $opts->{prealloc};
    $tocmd .= ' --info' if $opts->{info};

    # tar option "xf" does not autodetect compression when read from STDIN,
    # so we pipe to zcat
    my $cmd = "zcat -f|tar xf " . PVE::Tools::shellquote($archive) . " " .
        PVE::Tools::shellquote("--to-command=$tocmd");

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    mkpath $tmpdir;

    local $ENV{VZDUMP_TMPDIR} = $tmpdir;
    local $ENV{VZDUMP_VMID} = $vmid;
    local $ENV{VZDUMP_USER} = $user;

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # disable interrupts (always do cleanups)
    # Every handler needs its own 'local': in a chained assignment only
    # the first element is localized, the others would stay changed.
    local $SIG{INT} =
        local $SIG{TERM} =
        local $SIG{QUIT} =
        local $SIG{HUP} = sub { print STDERR "got interrupt - ignored\n"; };

    eval {
        # enable interrupts
        local $SIG{INT} =
            local $SIG{TERM} =
            local $SIG{QUIT} =
            local $SIG{HUP} =
            local $SIG{PIPE} = sub { die "interrupted by signal\n"; };

        if ($archive eq '-') {
            print "extracting archive from STDIN\n";
            run_command($cmd, input => "<&STDIN");
        } else {
            print "extracting archive '$archive'\n";
            run_command($cmd);
        }

        # in info mode no configuration is written
        return if $opts->{info};

        # read new mapping
        my $map = {};
        my $statfile = "$tmpdir/qmrestore.stat";
        if (my $fd = IO::File->new($statfile, "r")) {
            while (defined (my $line = <$fd>)) {
                if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                    $map->{$1} = $2 if $1;
                } else {
                    print STDERR "unable to parse line in statfile - $line\n";
                }
            }
            $fd->close();
        }

        my $confsrc = "$tmpdir/qemu-server.conf";

        my $srcfd = IO::File->new($confsrc, "r") ||
            die "unable to open file '$confsrc'\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined (my $line = <$srcfd>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $srcfd->close();
        $outfd->close();
    };
    my $err = $@;

    if ($err) {

        unlink $tmpfn;

        tar_restore_cleanup($storecfg, "$tmpdir/qmrestore.stat") if !$opts->{info};

        # the stat file has been processed, do not leave the directory behind
        rmtree $tmpdir;

        die $err;
    }

    rmtree $tmpdir;

    # In info mode $tmpfn is never written, so there is nothing to commit.
    # The parentheses matter: 'rename $a, $b || die' applies '||' to $b,
    # so a failed rename was never detected.
    if (!$opts->{info}) {
        rename($tmpfn, $conffile) ||
            die "unable to commit configuration file '$conffile'\n";
    }

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
};
4580
0d18dcfc
DM
4581
4582# Internal snapshots
4583
# NOTE: Snapshot create/delete involves several non-atomic
# actions and can take a long time.
# So we try to avoid locking the file and use the 'lock' variable
# inside the config file instead.
4588
ef59d1ca
DM
# Copy all settings from $source to $dest, except for snapshot
# bookkeeping ('snapshots', 'snapstate', 'snaptime', 'vmstate'), 'lock',
# 'digest', 'description' and 'unusedX' entries.
# Keys already present in $dest are overwritten, all others are kept.
my $snapshot_copy_config = sub {
    my ($source, $dest) = @_;

    my %skip = map { $_ => 1 }
        qw(snapshots snapstate snaptime vmstate lock digest description);

    foreach my $key (keys %$source) {
        next if $skip{$key} || $key =~ m/^unused\d+$/;
        $dest->{$key} = $source->{$key};
    }
};
4605
# Build the configuration that results from applying snapshot $snap to
# the current configuration $conf.
#
# The snapshot list, the description and all 'unusedX' entries are taken
# from $conf; everything else comes from $snap (through
# $snapshot_copy_config). Returns a new hash reference.
my $snapshot_apply_config = sub {
    my ($conf, $snap) = @_;

    # copy snapshot list
    my %applied = (snapshots => $conf->{snapshots});

    # keep description and list of unused disks
    my @kept = grep { m/^unused\d+$/ || $_ eq 'description' } keys %$conf;
    $applied{$_} = $conf->{$_} foreach @kept;

    $snapshot_copy_config->($snap, \%applied);

    return \%applied;
};
4624
18bfb361
DM
# Call $func->($storeid) once for every storage that holds a non-CD-ROM
# drive of $conf. The storage IDs are visited in sorted order.
sub foreach_writable_storage {
    my ($conf, $func) = @_;

    my %storage_ids;

    foreach my $ds (keys %$conf) {
        next if !valid_drivename($ds);

        my $drive = parse_drive($ds, $conf->{$ds});
        next if !$drive || drive_is_cdrom($drive);

        # drives that are not storage volumes yield no storage id
        my ($sid, $volname) = PVE::Storage::parse_volume_id($drive->{file}, 1);
        $storage_ids{$sid} = 1 if $sid;
    }

    foreach my $sid (sort keys %storage_ids) {
        $func->($sid);
    }
}
4647
# Allocate the volume that stores the VM state of snapshot $snapname and
# return its volume ID.
#
# The target storage is picked from the storages used by the writable
# drives of $conf: shared storages first, then non-shared ones, and
# 'local' if nothing was found. Within each group a storage that has a
# 'path' is preferred.
my $alloc_vmstate_volid = sub {
    my ($storecfg, $vmid, $conf, $snapname) = @_;

    # Note: we try to be smart when selecting a $target storage

    # pick a storage among those that are shared (1) or not shared (0)
    my $pick_storage = sub {
        my ($want_shared) = @_;

        my $choice;
        foreach_writable_storage($conf, sub {
            my ($sid) = @_;
            my $scfg = PVE::Storage::storage_config($storecfg, $sid);
            return if ($scfg->{shared} ? 1 : 0) != $want_shared;

            $choice = $sid if !$choice || $scfg->{path}; # prefer file based storage
        });
        return $choice;
    };

    # search shared storage first, then local storage
    my $target = $pick_storage->(1) || $pick_storage->(0) || 'local';

    # extra room for the driver state, in the same unit as $conf->{memory}
    my $driver_state_size = 500;
    # we abort live save after $conf->{memory}, so we need at max twice that space
    my $size = $conf->{memory}*2 + $driver_state_size;

    my $name = "vm-$vmid-state-$snapname";
    my $scfg = PVE::Storage::storage_config($storecfg, $target);
    $name .= ".raw" if $scfg->{path}; # add filename extension for file base storage

    return PVE::Storage::vdisk_alloc($storecfg, $target, $vmid, 'raw', $name, $size*1024);
};
4688
# First phase of snapshot creation: lock the VM configuration with
# lock 'snapshot' and add a new snapshot section in state 'prepare'.
#
# $vmid         - VM ID
# $snapname     - name of the new snapshot (must not exist yet)
# $save_vmstate - if true and the VM is running, allocate a volume for
#                 the VM state
# $comment      - optional description stored with the snapshot
#
# Returns the new snapshot section. Dies if the VM is a template, is
# locked, already has a snapshot with that name, or does not support
# snapshots.
my $snapshot_prepare = sub {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap;

    my $add_snapshot = sub {
        my $conf = load_config($vmid);

        if (is_template($conf)) {
            die "you can't take a snapshot if it's a template\n";
        }

        check_lock($conf);

        $conf->{lock} = 'snapshot';

        if (defined($conf->{snapshots}->{$snapname})) {
            die "snapshot name '$snapname' already used\n";
        }

        my $storecfg = PVE::Storage::config();
        die "snapshot feature is not available" if !has_feature('snapshot', $conf, $storecfg);

        $snap = {};
        $conf->{snapshots}->{$snapname} = $snap;

        if ($save_vmstate && check_running($vmid)) {
            $snap->{vmstate} = $alloc_vmstate_volid->($storecfg, $vmid, $conf, $snapname);
        }

        $snapshot_copy_config->($conf, $snap);

        $snap->{snapstate} = "prepare";
        $snap->{snaptime} = time();
        $snap->{description} = $comment if $comment;

        # always overwrite machine if we save vmstate. This makes sure we
        # can restore it later using correct machine type
        if ($snap->{vmstate}) {
            $snap->{machine} = get_current_qemu_machine($vmid);
        }

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $add_snapshot);

    return $snap;
};
4734
# Final phase of snapshot creation: clear the 'prepare' state of the
# snapshot, remove the 'snapshot' lock and make the snapshot the parent
# of the current configuration.
#
# Dies if the config is not locked with 'snapshot', if the snapshot does
# not exist, or if it is not in state 'prepare'.
my $snapshot_commit = sub {
    my ($vmid, $snapname) = @_;

    my $finalize = sub {
        my $conf = load_config($vmid);

        my $lock = $conf->{lock};
        die "missing snapshot lock\n" if !($lock && $lock eq 'snapshot');

        my $snap = $conf->{snapshots}->{$snapname};
        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        my $state = $snap->{snapstate};
        die "wrong snapshot state\n" if !($state && $state eq "prepare");

        delete $snap->{snapstate};
        delete $conf->{lock};

        my $newconf = $snapshot_apply_config->($conf, $snap);
        $newconf->{parent} = $snapname;

        update_config_nolock($vmid, $newconf, 1);
    };

    lock_config($vmid, $finalize);
};
4764
22c377f0
DM
# Roll a VM back to snapshot $snapname.
#
# Works in three steps:
#  1. under the config lock: stop the VM and set lock 'rollback'
#  2. roll back every non-CD-ROM volume of the snapshot
#  3. under the config lock: replace the current config by the snapshot
#     config, drop the lock and, if the snapshot has a saved VM state,
#     start the VM from it
sub snapshot_rollback {
    my ($vmid, $snapname) = @_;

    my $snap;

    my $storecfg = PVE::Storage::config();

    # checks shared by both locked steps; sets $snap and returns the
    # freshly loaded config
    my $load_checked_config = sub {
        my $conf = load_config($vmid);

        die "you can't rollback if vm is a template\n" if is_template($conf);

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        die "unable to rollback to incomplete snapshot (snapstate = $snap->{snapstate})\n"
            if $snap->{snapstate};

        return $conf;
    };

    my $assert_stopped = sub {
        die "unable to rollback vm $vmid: vm is running\n"
            if check_running($vmid);
    };

    # step 1
    my $lock_for_rollback = sub {
        my $conf = $load_checked_config->();

        check_lock($conf);
        vm_stop($storecfg, $vmid, undef, undef, 5, undef, undef);

        $assert_stopped->();

        $conf->{lock} = 'rollback';

        update_config_nolock($vmid, $conf, 1);
    };

    # step 3
    my $apply_snapshot = sub {
        my $conf = $load_checked_config->();

        $assert_stopped->();

        die "got wrong lock\n" if !($conf->{lock} && $conf->{lock} eq 'rollback');
        delete $conf->{lock};

        my $has_machine_config = defined($conf->{machine});

        # copy snapshot config to current config
        $conf = $snapshot_apply_config->($conf, $snap);
        $conf->{parent} = $snapname;

        # Note: old code did not store 'machine', so we try to be smart
        # and guess the snapshot was generated with kvm 1.4 (pc-i440fx-1.4).
        my $forcemachine = $conf->{machine} || 'pc-i440fx-1.4';
        # we remove the 'machine' configuration if not explicitly specified
        # in the original config.
        delete $conf->{machine} if $snap->{vmstate} && !$has_machine_config;

        update_config_nolock($vmid, $conf, 1);

        if ($snap->{vmstate}) {
            my $statefile = PVE::Storage::path($storecfg, $snap->{vmstate});
            vm_start($storecfg, $vmid, $statefile, undef, undef, undef, $forcemachine);
        }
    };

    lock_config($vmid, $lock_for_rollback);

    # step 2
    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        PVE::Storage::volume_snapshot_rollback($storecfg, $drive->{file}, $snapname);
    });

    lock_config($vmid, $apply_snapshot);
}
4843
9dcf4909
DM
# Poll 'query-savevm' once per second until the state save is reported
# as 'completed'. Dies if no status is returned or if the status is
# anything other than 'active' or 'completed'.
my $savevm_wait = sub {
    my ($vmid) = @_;

    while (1) {
        my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");
        my $status = $stat->{status};

        die "savevm not active\n" if !$status;
        last if $status eq 'completed';
        die "query-savevm returned status '$stat->{status}'\n"
            if $status ne 'active';

        # still active - check again later
        sleep(1);
    }
};
4861
# Create snapshot $snapname of a VM.
#
# $vmid         - VM ID
# $snapname     - name of the new snapshot
# $save_vmstate - also save the VM state (only has an effect while the
#                 VM is running)
# $freezefs     - freeze the guest file systems while the volume
#                 snapshots are taken; ignored unless a VM state volume
#                 was allocated
# $comment      - optional description
#
# If any step fails, the partly created snapshot is deleted again and the
# original error is rethrown.
sub snapshot_create {
    my ($vmid, $snapname, $save_vmstate, $freezefs, $comment) = @_;

    my $snap = $snapshot_prepare->($vmid, $snapname, $save_vmstate, $comment);

    # a state volume is only allocated while the VM is running; without
    # it there is no state to save and no file system freeze
    $freezefs = 0 if !$snap->{vmstate};

    # drives that already got a snapshot (needed for cleanup on error)
    my $drivehash = {};

    my $running = check_running($vmid);
    my $use_freeze = $running && $freezefs;

    eval {
        # create internal snapshots of all drives

        my $storecfg = PVE::Storage::config();

        if ($running) {
            if (my $vmstate = $snap->{vmstate}) {
                my $path = PVE::Storage::path($storecfg, $vmstate);
                vm_mon_cmd($vmid, "savevm-start", statefile => $path);
                $savevm_wait->($vmid);
            } else {
                vm_mon_cmd($vmid, "savevm-start");
            }
        }

        qga_freezefs($vmid) if $use_freeze;

        foreach_drive($snap, sub {
            my ($ds, $drive) = @_;

            return if drive_is_cdrom($drive);

            qemu_volume_snapshot($vmid, "drive-$ds", $storecfg, $drive->{file}, $snapname);
            $drivehash->{$ds} = 1;
        });
    };
    my $err = $@;

    # always thaw and end the savevm, even after an error
    eval { qga_unfreezefs($vmid) if $use_freeze; };
    warn $@ if $@;

    eval { vm_mon_cmd($vmid, "savevm-end") if $running; };
    warn $@ if $@;

    if ($err) {
        warn "snapshot create failed: starting cleanup\n";
        eval { snapshot_delete($vmid, $snapname, 0, $drivehash); };
        warn $@ if $@;
        die $err;
    }

    $snapshot_commit->($vmid, $snapname);
}
4919
# Delete snapshot $snapname of VM $vmid.
#
# The work is done in several steps, each config change running under
# lock_config():
#   1. mark the snapshot with snapstate 'delete'
#   2. free the saved vmstate volume (if the snapshot has one)
#   3. delete the internal snapshot of every non-cdrom drive
#   4. remove the snapshot section and re-link snapshots which used it
#      as parent
#
# With $force set, errors while freeing/deleting volumes are only warned
# about, and the intermediate config saves after each volume are skipped.
#
# Note: $drivehash is only set when called from snapshot_create. In that
# case the lock and template checks are skipped, only drives listed in
# $drivehash are deleted, and the config 'lock' is removed at the end.
sub snapshot_delete {
    my ($vmid, $snapname, $force, $drivehash) = @_;

    # shared with the closures below
    my $prepare = 1;   # true until the final cleanup pass
    my $snap;          # snapshot section, refreshed by every config update
    my $unused = [];   # volume ids handed to add_unused_volume() at the end

    # Let $entry point to $new_parent (or to nothing at all) if it
    # currently references the snapshot we are about to delete.
    my $unlink_parent = sub {
        my ($entry, $new_parent) = @_;

        return if !$entry->{parent} || $entry->{parent} ne $snapname;

        if ($new_parent) {
            $entry->{parent} = $new_parent;
        } else {
            delete $entry->{parent};
        }
    };

    # Storage errors are fatal unless $force is set.
    my $handle_error = sub {
        my ($err) = @_;

        die $err if !$force;
        warn $err;
    };

    my $updatefn = sub {
        my ($remove_drive) = @_;

        my $conf = load_config($vmid);

        if (!$drivehash) {
            check_lock($conf);
            die "you can't delete a snapshot if vm is a template\n"
                if is_template($conf);
        }

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        # remove parent refs
        if (!$prepare) {
            my $new_parent = $snap->{parent};

            $unlink_parent->($conf, $new_parent);
            for my $other (grep { $_ ne $snapname } keys %{$conf->{snapshots}}) {
                $unlink_parent->($conf->{snapshots}->{$other}, $new_parent);
            }
        }

        if ($remove_drive) {
            if ($remove_drive eq 'vmstate') {
                delete $snap->{$remove_drive};
            } else {
                my $parsed = parse_drive($remove_drive, $snap->{$remove_drive});
                my $volid = $parsed->{file};
                delete $snap->{$remove_drive};
                add_unused_volume($conf, $volid);
            }
        }

        if ($prepare) {
            $snap->{snapstate} = 'delete';
        } else {
            delete $conf->{snapshots}->{$snapname};
            delete $conf->{lock} if $drivehash;
            for my $volid (@$unused) {
                add_unused_volume($conf, $volid);
            }
        }

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $updatefn);

    my $storecfg = PVE::Storage::config();

    # now remove vmstate file
    if ($snap->{vmstate}) {
        eval { PVE::Storage::vdisk_free($storecfg, $snap->{vmstate}); };
        if (my $err = $@) {
            $handle_error->($err);
        }
        # save changes (remove vmstate from snapshot)
        lock_config($vmid, $updatefn, 'vmstate') if !$force;
    }

    # now remove all internal snapshots
    my $delete_drive_snapshot = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};

        if (!$drivehash || $drivehash->{$ds}) {
            eval { qemu_volume_snapshot_delete($vmid, "drive-$ds", $storecfg, $volid, $snapname); };
            if (my $err = $@) {
                $handle_error->($err);
            }
        }

        # save changes (remove drive from snapshot)
        lock_config($vmid, $updatefn, $ds) if !$force;
        push @$unused, $volid;
    };
    foreach_drive($snap, $delete_drive_snapshot);

    # now cleanup config
    $prepare = 0;
    lock_config($vmid, $updatefn);
}
5031
# Check whether every non-cdrom drive in $conf supports $feature.
#
# $storecfg, $snapname and $running are passed through unchanged to
# PVE::Storage::volume_has_feature(). All drives are checked, even after
# the first one lacking the feature was found.
#
# Returns 1 if all drives support the feature, 0 otherwise.
sub has_feature {
    my ($feature, $conf, $storecfg, $snapname, $running) = @_;

    my $unsupported = 0;

    my $check_drive = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        $unsupported++
            unless PVE::Storage::volume_has_feature($storecfg, $feature, $drive->{file}, $snapname, $running);
    };
    foreach_drive($conf, $check_drive);

    return $unsupported ? 0 : 1;
}
04a69bb4
AD
5046
# Convert the drives of VM $vmid into base volumes.
#
# If $disk is given, only the drive with that name is converted. Cdrom
# drives and volumes whose storage lacks the 'template' feature are
# skipped. The config is written after each converted drive.
sub template_create {
    my ($vmid, $conf, $disk) = @_;

    my $storecfg = PVE::Storage::config();

    my $convert_drive = sub {
        my ($ds, $drive) = @_;

        my $skip = drive_is_cdrom($drive)
            || ($disk && $ds ne $disk)
            || !PVE::Storage::volume_has_feature($storecfg, 'template', $drive->{file});
        return if $skip;

        # replace the volume by its base volume and store the new drive
        # definition right away
        my $base_volid = PVE::Storage::vdisk_create_base($storecfg, $drive->{file});
        $drive->{file} = $base_volid;
        $conf->{$ds} = print_drive($vmid, $drive);
        update_config_nolock($vmid, $conf, 1);
    };

    foreach_drive($conf, $convert_drive);
}
5067
624361b3
AD
# Tell whether the VM configuration $conf describes a template.
#
# Returns 1 if the 'template' option is defined and numerically equal to
# 1, and 0 in every other case. The return is explicit on both paths, so
# callers never receive the leftover value of the failed condition (an
# empty string) which an implicit return would hand back.
sub is_template {
    my ($conf) = @_;

    my $template = $conf->{template};

    return (defined($template) && $template == 1) ? 1 : 0;
}
5073
5133de42
AD
# Copy volume $src_volid (optionally at snapshot $snapname) onto the
# already existing volume $dst_volid using 'qemu-img convert'.
#
# $size is the volume size in bytes; it is only used to print progress
# information. Nothing is done unless both volume ids contain a storage
# id. Dies with "copy failed: ..." if the command fails.
sub qemu_img_convert {
    my ($src_volid, $dst_volid, $size, $snapname) = @_;

    my $storecfg = PVE::Storage::config();
    my ($src_storeid, $src_volname) = PVE::Storage::parse_volume_id($src_volid, 1);
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid, 1);

    if ($src_storeid && $dst_storeid) {
        my $src_scfg = PVE::Storage::storage_config($storecfg, $src_storeid);
        my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

        my $src_format = qemu_img_format($src_scfg, $src_volname);
        my $dst_format = qemu_img_format($dst_scfg, $dst_volname);

        my $src_path = PVE::Storage::path($storecfg, $src_volid, $snapname);
        my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

        my @convert = ('/usr/bin/qemu-img', 'convert', '-t', 'writeback', '-p', '-n');
        # only qcow2 sources get the snapshot selected via '-s'
        if ($snapname && $src_format eq "qcow2") {
            push @convert, '-s', $snapname;
        }
        push @convert, '-f', $src_format, '-O', $dst_format, $src_path, $dst_path;

        # translate the percentage printed by 'qemu-img -p' into byte counts
        my $show_progress = sub {
            my ($line) = @_;

            my ($percent) = $line =~ m/\((\S+)\/100\%\)/
                or return;

            my $transferred = int($size * $percent / 100);
            my $remaining = $size - $transferred;

            print "transferred: $transferred bytes remaining: $remaining bytes total: $size bytes progression: $percent %\n";
        };

        eval { run_command(\@convert, timeout => undef, outfunc => $show_progress); };
        if (my $err = $@) {
            die "copy failed: $err";
        }
    }
}
5113
# Determine the image format name to use with qemu-img for a volume.
#
# If the storage configuration $scfg has a 'path' and $volname ends in
# one of the known suffixes (raw, qcow2, qed, vmdk), that suffix is the
# format. Otherwise volumes on storage type 'iscsi' are "host_device"
# and everything else is "raw".
sub qemu_img_format {
    my ($scfg, $volname) = @_;

    if ($scfg->{path}) {
        my ($suffix) = $volname =~ m/\.(raw|qcow2|qed|vmdk)$/;
        return $suffix if defined($suffix);
    }

    return $scfg->{type} eq 'iscsi' ? "host_device" : "raw";
}
5125
cfad42af
AD
# Mirror drive $drive of the running VM $vmid onto the existing volume
# $dst_volid using the 'drive-mirror' monitor command, printing progress
# once per second until offset and length of the block job are equal.
#
# Parameters:
#   $vmid      - id of the running source VM
#   $drive     - drive name (the device is "drive-$drive")
#   $dst_volid - target volume; nothing is done if it has no storage id
#   $vmiddst   - id of the VM owning the target. If equal to $vmid the VM
#                is switched to the new disk ('block-job-complete'),
#                otherwise the job is cancelled after the copy is done.
#   $maxwait   - optional; after more than this many polls without
#                progress the VM gets suspended
#
# Dies with "mirroring error: ..." (after trying to cancel the job) if
# polling or completing the job fails.
sub qemu_drive_mirror {
    my ($vmid, $drive, $dst_volid, $vmiddst, $maxwait) = @_;

    my $stalled_polls = 1;
    my $last_offset = 0;
    my $frozen;

    my $storecfg = PVE::Storage::config();
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid, 1);

    if ($dst_storeid) {
        # result is not used below - presumably the call is kept to verify
        # that the storage exists (TODO confirm)
        my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

        my ($format) = $dst_volname =~ m/\.(raw|qcow2)$/;

        my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

        my $device = "drive-$drive";

        my @mirror_args = (
            timeout => 10,
            device => $device,
            mode => "existing",
            sync => "full",
            target => $dst_path,
        );
        push @mirror_args, format => $format if $format;

        # FIXME: drive-mirror sometimes runs into the timeout but works
        # fine afterwards (seen with big volumes > 200GB), so errors of
        # this command are ignored on purpose.
        eval { vm_mon_cmd($vmid, "drive-mirror", @mirror_args); };

        eval {
            while (1) {
                my $jobs = vm_mon_cmd($vmid, "query-block-jobs");
                my $job = $jobs->[0];
                die "mirroring job seem to have die. Maybe do you have bad sectors?" if !$job;
                die "error job is not mirroring" if $job->{type} ne "mirror";

                my $transferred = $job->{offset};
                my $total = $job->{len};
                my $remaining = $total - $transferred;
                # NOTE(review): this division dies if the job reports a
                # length of 0 - confirm whether qemu can do that.
                my $percent = sprintf "%.2f", ($transferred * 100 / $total);

                print "transferred: $transferred bytes remaining: $remaining bytes total: $total bytes progression: $percent %\n";

                last if $total == $transferred;

                if ($last_offset != $transferred) {
                    # NOTE(review): $frozen is never cleared again after
                    # the resume - confirm this is intended.
                    if ($frozen) {
                        vm_resume($vmid, 1);
                        $stalled_polls = 0;
                    }
                } elsif ($maxwait && $stalled_polls > $maxwait) {
                    # if writes to disk occurs the disk needs to be freezed
                    # to be able to complete the migration
                    vm_suspend($vmid, 1);
                    $stalled_polls = 0;
                    $frozen = 1;
                } elsif (!$frozen) {
                    $stalled_polls++;
                }

                $last_offset = $transferred;
                sleep 1;
            }

            if ($vmiddst == $vmid) {
                # switch the disk if source and destination are on the same guest
                vm_mon_cmd($vmid, "block-job-complete", device => $device);
            }
        };
        if (my $err = $@) {
            eval { vm_mon_cmd($vmid, "block-job-cancel", device => $device); };
            die "mirroring error: $err";
        }

        if ($vmiddst != $vmid) {
            # if we clone a disk for a new target vm, we don't switch the disk
            vm_mon_cmd($vmid, "block-job-cancel", device => $device);
        }
    }
}
5205
# Clone drive $drivename ($drive) of VM $vmid for VM $newvmid.
#
# Without $full a linked clone is created with
# PVE::Storage::vdisk_clone(). With $full a new volume is allocated on
# $storage (or on the storage of the source volume) and the data is
# copied: with qemu_img_convert() when the VM is not running or a
# snapshot is cloned, with qemu_drive_mirror() otherwise.
#
# The requested $format falls back to the format of the source drive and
# then to the storage default; a format the target storage does not
# support is replaced by the storage default as well.
#
# Each new volume id is appended to @$newvollist.
#
# Returns the drive hash for the new volume. Note that this is the very
# same hash reference as $drive, i.e. the 'format', 'file' and 'size'
# entries of the caller's hash are overwritten.
sub clone_disk {
    my ($storecfg, $vmid, $running, $drivename, $drive, $snapname,
        $newvmid, $storage, $format, $full, $newvollist) = @_;

    my $source_volid = $drive->{file};
    my $newvolid;

    if ($full) {
        my ($storeid, $volname) = PVE::Storage::parse_volume_id($source_volid);
        $storeid = $storage if $storage;

        my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($storecfg, $storeid);
        $format ||= $drive->{format} || $defFormat;

        # test if requested format is supported - else use default
        $format = $defFormat if !grep { $_ eq $format } @$validFormats;

        my ($src_size) = PVE::Storage::volume_size_info($storecfg, $source_volid, 3);

        print "create full clone of drive $drivename ($source_volid)\n";
        $newvolid = PVE::Storage::vdisk_alloc($storecfg, $storeid, $newvmid, $format, undef, ($src_size/1024));
        push @$newvollist, $newvolid;

        if ($running && !$snapname) {
            qemu_drive_mirror($vmid, $drivename, $newvolid, $newvmid);
        } else {
            qemu_img_convert($source_volid, $newvolid, $src_size, $snapname);
        }
    } else {
        print "create linked clone of drive $drivename ($source_volid)\n";
        $newvolid = PVE::Storage::vdisk_clone($storecfg, $source_volid, $newvmid, $snapname);
        push @$newvollist, $newvolid;
    }

    my ($size) = PVE::Storage::volume_size_info($storecfg, $newvolid, 3);

    # re-use the hash of the source drive for the result
    @{$drive}{qw(format file size)} = (undef, $newvolid, $size);

    return $drive;
}
5251
ff556cf2
DM
# Return the name of the machine type reported as current by the
# 'query-machines' QMP command.
#
# Falls back to the machine flagged as default, and finally to 'pc', when
# no entry is flagged as current.
#
# this only works if VM is running
sub get_current_qemu_machine {
    my ($vmid) = @_;

    my $machines = PVE::QemuServer::vm_qmp_command($vmid, {
        execute => 'query-machines',
        arguments => {},
    });

    # remember the name of the last entry carrying each flag
    my %name_for;
    for my $machine (@$machines) {
        for my $flag ('is-default', 'is-current') {
            $name_for{$flag} = $machine->{name} if $machine->{$flag};
        }
    }

    # fallback to the default machine if current is not supported by qemu
    return $name_for{'is-current'} || $name_for{'is-default'} || 'pc';
}
5268
4543ecf0
AD
# List the PCI devices found below "$pcisysfs/devices".
#
# Returns a hash reference mapping the "bus:slot" part of each address to
# a list of { id => "bus:slot", function => N } entries, one per function.
sub lspci {
    my %functions_of;

    my $collect = sub {
        my (undef, $id, $function) = @_;

        push @{$functions_of{$id}}, { id => $id, function => $function };
    };

    dir_glob_foreach("$pcisysfs/devices", '[a-f0-9]{4}:([a-f0-9]{2}:[a-f0-9]{2})\.([0-9])', $collect);

    return \%functions_of;
}
5281
1e3baf05 52821;