]> git.proxmox.com Git - qemu-server.git/blob - PVE/QemuServer.pm
b077d58a4f183c5005dc03dccffcc1bf86120865
[qemu-server.git] / PVE / QemuServer.pm
1 package PVE::QemuServer;
2
3 use strict;
4 use warnings;
5 use POSIX;
6 use IO::Handle;
7 use IO::Select;
8 use IO::File;
9 use IO::Dir;
10 use IO::Socket::UNIX;
11 use File::Basename;
12 use File::Path;
13 use File::stat;
14 use Getopt::Long;
15 use Digest::SHA;
16 use Fcntl ':flock';
17 use Cwd 'abs_path';
18 use IPC::Open3;
19 use JSON;
20 use Fcntl;
21 use PVE::SafeSyslog;
22 use Storable qw(dclone);
23 use PVE::Exception qw(raise raise_param_exc);
24 use PVE::Storage;
25 use PVE::Tools qw(run_command lock_file lock_file_full file_read_firstline dir_glob_foreach);
26 use PVE::JSONSchema qw(get_standard_option);
27 use PVE::Cluster qw(cfs_register_file cfs_read_file cfs_write_file cfs_lock_file);
28 use PVE::INotify;
29 use PVE::ProcFSTools;
30 use PVE::QMPClient;
31 use PVE::RPCEnvironment;
32 use Time::HiRes qw(gettimeofday);
33
34 my $cpuinfo = PVE::ProcFSTools::read_cpuinfo();
35
36 # Note about locking: we use flock on the config file to protect
37 # against concurrent actions.
38 # Additionally, we have a 'lock' setting in the config file. This
39 # can be set to 'migrate', 'backup', 'snapshot' or 'rollback'. Most actions are not
40 # allowed when such a lock is set. But you can ignore this kind of
41 # lock with the --skiplock flag.
42
# Hook the VM configuration parser/writer pair into the cluster file system
# for everything below /qemu-server/.
cfs_register_file('/qemu-server/', \&parse_vm_config, \&write_vm_config);

# Standard JSON schema options provided by this package. They are registered
# in the order listed here.
my @qm_standard_options = (
    [
        'skiplock' => {
            description => "Ignore locks - only root is allowed to use this option.",
            type => 'boolean',
            optional => 1,
        },
    ],
    [
        'pve-qm-stateuri' => {
            description => "Some command save/restore state from this location.",
            type => 'string',
            maxLength => 128,
            optional => 1,
        },
    ],
    [
        'pve-snapshot-name' => {
            description => "The name of the snapshot.",
            type => 'string', format => 'pve-configid',
            maxLength => 40,
        },
    ],
);

foreach my $entry (@qm_standard_options) {
    my ($option_name, $schema) = @$entry;
    PVE::JSONSchema::register_standard_option($option_name, $schema);
}
65
66 #no warnings 'redefine';
67
# Define the fairsched/setluid syscall numbers and the KVM_GET_API_VERSION
# ioctl request as constant subs. Every definition is guarded so that an
# already existing sub of the same name is left untouched.
unless (defined(&_VZSYSCALLS_H_)) {
    eval 'sub _VZSYSCALLS_H_ () {1;}' unless defined(&_VZSYSCALLS_H_);
    require 'sys/syscall.ph';
    if (defined(&__x86_64__)) {
        eval 'sub __NR_fairsched_vcpus () {499;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_fairsched_mknod () {504;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {505;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {506;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {507;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {508;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_setluid () {501;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {502;}' unless defined(&__NR_setublimit);
    }
    elsif (defined(&__i386__)) {
        eval 'sub __NR_fairsched_mknod () {500;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {501;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {502;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {503;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {504;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_fairsched_vcpus () {505;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_setluid () {511;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {512;}' unless defined(&__NR_setublimit);
    } else {
        die("no fairsched syscall for this arch");
    }
    require 'asm/ioctl.ph';
    # The request number used to be written as the digit-less literal '0x'.
    # It is spelled out as 0x00 so the eval'ed definition does not depend on
    # how the running perl treats a hex literal without digits.
    # NOTE(review): newer perls are reported to reject '0x' - confirm.
    eval 'sub KVM_GET_API_VERSION () { &_IO(0xAE, 0x00);}' unless defined(&KVM_GET_API_VERSION);
}
96
# Invoke the fairsched_mknod syscall with ($parent, $weight, $desired), each
# truncated to an integer, and return the raw syscall result.
sub fairsched_mknod {
    my ($parent, $weight, $desired) = @_;

    my @syscall_args = (int($parent), int($weight), int($desired));

    return syscall(&__NR_fairsched_mknod, @syscall_args);
}
102
# Invoke the fairsched_rmnod syscall for node $id (truncated to an integer)
# and return the raw syscall result.
sub fairsched_rmnod {
    my ($id) = @_;

    my $node_id = int($id);

    return syscall(&__NR_fairsched_rmnod, $node_id);
}
108
# Invoke the fairsched_mvpr syscall with ($pid, $newid), both truncated to
# integers, and return the raw syscall result.
sub fairsched_mvpr {
    my ($pid, $newid) = @_;

    my @syscall_args = (int($pid), int($newid));

    return syscall(&__NR_fairsched_mvpr, @syscall_args);
}
114
# Invoke the fairsched_vcpus syscall with ($id, $vcpus), both truncated to
# integers, and return the raw syscall result.
sub fairsched_vcpus {
    my ($id, $vcpus) = @_;

    my @syscall_args = (int($id), int($vcpus));

    return syscall(&__NR_fairsched_vcpus, @syscall_args);
}
120
# Invoke the fairsched_rate syscall with ($id, $op, $rate), each truncated to
# an integer, and return the raw syscall result. $op is one of the
# FAIRSCHED_*_RATE constants.
sub fairsched_rate {
    my ($id, $op, $rate) = @_;

    my @syscall_args = (int($id), int($op), int($rate));

    return syscall(&__NR_fairsched_rate, @syscall_args);
}
126
# Operation codes accepted by fairsched_rate().
use constant FAIRSCHED_SET_RATE => 0;
use constant FAIRSCHED_DROP_RATE => 1;
use constant FAIRSCHED_GET_RATE => 2;

# Apply a CPU limit, given in per cent, to fairsched node $id.
# The percentage is rescaled to units of 1/1024. A rescaled value of zero
# drops the rate limit instead of setting it.
# Returns whatever fairsched_rate() returns.
sub fairsched_cpulimit {
    my ($id, $limit) = @_;

    my $scaled_limit = int($limit * 1024 / 100);

    if ($scaled_limit) {
        return fairsched_rate($id, FAIRSCHED_SET_RATE, $scaled_limit);
    }

    return fairsched_rate($id, FAIRSCHED_DROP_RATE, $scaled_limit);
}
139
# Locations used throughout this package.
my $nodename = PVE::INotify::nodename();
my $node_dir = "/etc/pve/nodes/$nodename";
my $confdir = "/etc/pve/nodes/$nodename/qemu-server";
my $var_run_tmpdir = "/var/run/qemu-server";
my $lock_dir = "/var/lock/qemu-server";
my $pcisysfs = "/sys/bus/pci";

# Create the working directories at load time; mkdir failures are ignored.
foreach my $dir ($node_dir, $confdir, $var_run_tmpdir, $lock_dir) {
    mkdir $dir;
}
153
# JSON schema description of every scalar VM configuration option.
# The indexed options (netN, ideN, usbN, ...) are added to this hash further
# down. The description texts are user visible; several of them contained
# misspellings or named a non-existent VGA type ('cirrur'), which are
# corrected here.
my $confdesc = {
    iothread => {
        optional => 1,
        type => 'boolean',
        description => "Enable iothread dataplane.",
        default => 0,
    },
    onboot => {
        optional => 1,
        type => 'boolean',
        description => "Specifies whether a VM will be started during system bootup.",
        default => 0,
    },
    autostart => {
        optional => 1,
        type => 'boolean',
        description => "Automatic restart after crash (currently ignored).",
        default => 0,
    },
    hotplug => {
        optional => 1,
        type => 'boolean',
        description => "Allow hotplug for disk and network device",
        default => 0,
    },
    reboot => {
        optional => 1,
        type => 'boolean',
        description => "Allow reboot. If set to '0' the VM exits on reboot.",
        default => 1,
    },
    lock => {
        optional => 1,
        type => 'string',
        description => "Lock/unlock the VM.",
        enum => [qw(migrate backup snapshot rollback)],
    },
    cpulimit => {
        optional => 1,
        type => 'integer',
        description => "Limit of CPU usage in per cent. Note if the computer has 2 CPUs, it has total of 200% CPU time. Value '0' indicates no CPU limit.\n\nNOTE: This option is currently ignored.",
        minimum => 0,
        default => 0,
    },
    cpuunits => {
        optional => 1,
        type => 'integer',
        description => "CPU weight for a VM. Argument is used in the kernel fair scheduler. The larger the number is, the more CPU time this VM gets. Number is relative to weights of all the other running VMs.\n\nNOTE: You can disable fair-scheduler configuration by setting this to 0.",
        minimum => 0,
        maximum => 500000,
        default => 1000,
    },
    memory => {
        optional => 1,
        type => 'integer',
        description => "Amount of RAM for the VM in MB. This is the maximum available memory when you use the balloon device.",
        minimum => 16,
        default => 512,
    },
    balloon => {
        optional => 1,
        type => 'integer',
        description => "Amount of target RAM for the VM in MB. Using zero disables the balloon driver.",
        minimum => 0,
    },
    shares => {
        optional => 1,
        type => 'integer',
        description => "Amount of memory shares for auto-ballooning. The larger the number is, the more memory this VM gets. Number is relative to weights of all other running VMs. Using zero disables auto-ballooning",
        minimum => 0,
        maximum => 50000,
        default => 1000,
    },
    keyboard => {
        optional => 1,
        type => 'string',
        description => "Keyboard layout for vnc server. Default is read from the datacenter configuration file.",
        enum => PVE::Tools::kvmkeymaplist(),
        default => 'en-us',
    },
    name => {
        optional => 1,
        type => 'string', format => 'dns-name',
        description => "Set a name for the VM. Only used on the configuration web interface.",
    },
    scsihw => {
        optional => 1,
        type => 'string',
        description => "scsi controller model",
        enum => [qw(lsi lsi53c810 virtio-scsi-pci megasas pvscsi)],
        default => 'lsi',
    },
    description => {
        optional => 1,
        type => 'string',
        description => "Description for the VM. Only used on the configuration web interface. This is saved as comment inside the configuration file.",
    },
    ostype => {
        optional => 1,
        type => 'string',
        enum => [qw(other wxp w2k w2k3 w2k8 wvista win7 win8 l24 l26 solaris)],
        description => <<EODESC,
Used to enable special optimization/features for specific
operating systems:

other => unspecified OS
wxp => Microsoft Windows XP
w2k => Microsoft Windows 2000
w2k3 => Microsoft Windows 2003
w2k8 => Microsoft Windows 2008
wvista => Microsoft Windows Vista
win7 => Microsoft Windows 7
win8 => Microsoft Windows 8/2012
l24 => Linux 2.4 Kernel
l26 => Linux 2.6/3.X Kernel
solaris => solaris/opensolaris/openindiana kernel

other|l24|l26|solaris ... no special behaviour
wxp|w2k|w2k3|w2k8|wvista|win7|win8 ... use --localtime switch
EODESC
    },
    boot => {
        optional => 1,
        type => 'string',
        description => "Boot on floppy (a), hard disk (c), CD-ROM (d), or network (n).",
        pattern => '[acdn]{1,4}',
        default => 'cdn',
    },
    bootdisk => {
        optional => 1,
        type => 'string', format => 'pve-qm-bootdisk',
        description => "Enable booting from specified disk.",
        pattern => '(ide|sata|scsi|virtio)\d+',
    },
    smp => {
        optional => 1,
        type => 'integer',
        description => "The number of CPUs. Please use option -sockets instead.",
        minimum => 1,
        default => 1,
    },
    sockets => {
        optional => 1,
        type => 'integer',
        description => "The number of CPU sockets.",
        minimum => 1,
        default => 1,
    },
    cores => {
        optional => 1,
        type => 'integer',
        description => "The number of cores per socket.",
        minimum => 1,
        default => 1,
    },
    numa => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable Numa.",
        default => 0,
    },
    maxcpus => {
        optional => 1,
        type => 'integer',
        description => "Maximum cpus for hotplug.",
        minimum => 1,
        default => 1,
    },
    acpi => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable ACPI.",
        default => 1,
    },
    agent => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable Qemu GuestAgent.",
        default => 0,
    },
    kvm => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable KVM hardware virtualization.",
        default => 1,
    },
    tdf => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable time drift fix.",
        default => 0,
    },
    localtime => {
        optional => 1,
        type => 'boolean',
        description => "Set the real time clock to local time. This is enabled by default if ostype indicates a Microsoft OS.",
    },
    freeze => {
        optional => 1,
        type => 'boolean',
        description => "Freeze CPU at startup (use 'c' monitor command to start execution).",
    },
    vga => {
        optional => 1,
        type => 'string',
        description => "Select VGA type. If you want to use high resolution modes (>= 1280x1024x16) then you should use option 'std' or 'vmware'. Default is 'std' for win8/win7/w2k8, and 'cirrus' for other OS types. Option 'qxl' enables the SPICE display server. You can also run without any graphic card using a serial device as terminal.",
        enum => [qw(std cirrus vmware qxl serial0 serial1 serial2 serial3 qxl2 qxl3 qxl4)],
    },
    watchdog => {
        optional => 1,
        type => 'string', format => 'pve-qm-watchdog',
        typetext => '[[model=]i6300esb|ib700] [,[action=]reset|shutdown|poweroff|pause|debug|none]',
        description => "Create a virtual hardware watchdog device. Once enabled (by a guest action), the watchdog must be periodically polled by an agent inside the guest or else the guest will be restarted (or execute the action specified)",
    },
    startdate => {
        optional => 1,
        type => 'string',
        typetext => "(now | YYYY-MM-DD | YYYY-MM-DDTHH:MM:SS)",
        description => "Set the initial date of the real time clock. Valid format for date are: 'now' or '2006-06-17T16:01:21' or '2006-06-17'.",
        pattern => '(now|\d{4}-\d{1,2}-\d{1,2}(T\d{1,2}:\d{1,2}:\d{1,2})?)',
        default => 'now',
    },
    startup => {
        optional => 1,
        type => 'string', format => 'pve-qm-startup',
        typetext => '[[order=]\d+] [,up=\d+] [,down=\d+] ',
        description => "Startup and shutdown behavior. Order is a non-negative number defining the general startup order. Shutdown is done with reverse ordering. Additionally you can set the 'up' or 'down' delay in seconds, which specifies a delay to wait before the next VM is started or stopped.",
    },
    template => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable Template.",
        default => 0,
    },
    args => {
        optional => 1,
        type => 'string',
        description => <<EODESCR,
Note: this option is for experts only. It allows you to pass arbitrary arguments to kvm, for example:

args: -no-reboot -no-hpet
EODESCR
    },
    tablet => {
        optional => 1,
        type => 'boolean',
        default => 1,
        description => "Enable/disable the usb tablet device. This device is usually needed to allow absolute mouse positioning with VNC. Else the mouse runs out of sync with normal VNC clients. If you're running lots of console-only guests on one host, you may consider disabling this to save some context switches. This is turned off by default if you use spice (vga=qxl).",
    },
    migrate_speed => {
        optional => 1,
        type => 'integer',
        description => "Set maximum speed (in MB/s) for migrations. Value 0 is no limit.",
        minimum => 0,
        default => 0,
    },
    migrate_downtime => {
        optional => 1,
        type => 'number',
        description => "Set maximum tolerated downtime (in seconds) for migrations.",
        minimum => 0,
        default => 0.1,
    },
    cdrom => {
        optional => 1,
        type => 'string', format => 'pve-qm-drive',
        typetext => 'volume',
        description => "This is an alias for option -ide2",
    },
    cpu => {
        optional => 1,
        description => "Emulated CPU type.",
        type => 'string',
        enum => [ qw(486 athlon pentium pentium2 pentium3 coreduo core2duo kvm32 kvm64 qemu32 qemu64 phenom Conroe Penryn Nehalem Westmere SandyBridge Haswell Broadwell Opteron_G1 Opteron_G2 Opteron_G3 Opteron_G4 Opteron_G5 host) ],
        default => 'kvm64',
    },
    parent => get_standard_option('pve-snapshot-name', {
        optional => 1,
        description => "Parent snapshot name. This is used internally, and should not be modified.",
    }),
    snaptime => {
        optional => 1,
        description => "Timestamp for snapshots.",
        type => 'integer',
        minimum => 0,
    },
    vmstate => {
        optional => 1,
        type => 'string', format => 'pve-volume-id',
        description => "Reference to a volume which stores the VM state. This is used internally for snapshots.",
    },
    machine => {
        description => "Specify the Qemu machine type.",
        type => 'string',
        pattern => '(pc|pc(-i440fx)?-\d+\.\d+|q35|pc-q35-\d+\.\d+)',
        maxLength => 40,
        optional => 1,
    },
    smbios1 => {
        description => "Specify SMBIOS type 1 fields.",
        type => 'string', format => 'pve-qm-smbios1',
        typetext => "[manufacturer=str][,product=str][,version=str][,serial=str] [,uuid=uuid][,sku=str][,family=str]",
        maxLength => 256,
        optional => 1,
    },
};
460
461 # what about other qemu settings ?
462 #cpu => 'string',
463 #machine => 'string',
464 #fda => 'file',
465 #fdb => 'file',
466 #mtdblock => 'file',
467 #sd => 'file',
468 #pflash => 'file',
469 #snapshot => 'bool',
470 #bootp => 'file',
471 ##tftp => 'dir',
472 ##smb => 'dir',
473 #kernel => 'file',
474 #append => 'string',
475 #initrd => 'file',
476 ##soundhw => 'string',
477
# Publish every option described so far as a standard option named
# "pve-qm-<key>".
foreach my $opt_name (keys %$confdesc) {
    my $schema = $confdesc->{$opt_name};
    PVE::JSONSchema::register_standard_option("pve-qm-$opt_name", $schema);
}

# Number of slots available for each indexed option (ideN, scsiN, netN, ...).
my $MAX_IDE_DISKS = 4;
my $MAX_SCSI_DISKS = 14;
my $MAX_VIRTIO_DISKS = 16;
my $MAX_SATA_DISKS = 6;
my $MAX_USB_DEVICES = 5;
my $MAX_NETS = 32;
my $MAX_UNUSED_DISKS = 8;
my $MAX_HOSTPCI_DEVICES = 4;
my $MAX_SERIAL_PORTS = 4;
my $MAX_PARALLEL_PORTS = 3;
my $MAX_NUMA = 8;
493
# Schema shared by all numaN options. The typetext used to read
# "cpus=<id[-id],memory=..." with the closing '>' of the cpus value missing.
my $numadesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-numanode',
    typetext => "cpus=<id[-id]>,memory=<mb>[[,hostnodes=<id[-id]>][,policy=<preferred|bind|interleave>]]",
    description => "numa topology",
};
PVE::JSONSchema::register_standard_option("pve-qm-numanode", $numadesc);

# numa0 .. numa($MAX_NUMA - 1) all share the same schema object.
for (my $i = 0; $i < $MAX_NUMA; $i++) {
    $confdesc->{"numa$i"} = $numadesc;
}
505
# NIC models accepted for the netN options, and the same list sorted and
# space-joined for the help text below.
my $nic_model_list = [
    qw(rtl8139 ne2k_pci e1000 pcnet virtio ne2k_isa i82551 i82557b i82559er vmxnet3)
];
my $nic_model_list_txt = join(' ', sort @$nic_model_list);

# Schema shared by all netN options.
my $netdesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-net',
    typetext => "MODEL=XX:XX:XX:XX:XX:XX [,bridge=<dev>][,queues=<nbqueues>][,rate=<mbps>][,tag=<vlanid>][,firewall=0|1]",
    description => <<EODESCR,
Specify network devices.

MODEL is one of: $nic_model_list_txt

XX:XX:XX:XX:XX:XX should be an unique MAC address. This is
automatically generated if not specified.

The bridge parameter can be used to automatically add the interface to a bridge device. The Proxmox VE standard bridge is called 'vmbr0'.

Option 'rate' is used to limit traffic bandwidth from and to this interface. It is specified as floating point number, unit is 'Megabytes per second'.

If you specify no bridge, we create a kvm 'user' (NATed) network device, which provides DHCP and DNS services. The following addresses are used:

10.0.2.2 Gateway
10.0.2.3 DNS Server
10.0.2.4 SMB Server

The DHCP server assign addresses to the guest starting from 10.0.2.15.

EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-net", $netdesc);

# net0 .. net($MAX_NETS - 1) all share the same schema object.
foreach my $net_index (0 .. $MAX_NETS - 1) {
    $confdesc->{"net$net_index"} = $netdesc;
}
541
# Set of valid drive option names (ide0, scsi3, ...); filled further down.
my $drivename_hash;

# Usage text shared by all drive buses. It used to be repeated four times and
# started with the unbalanced "[volume=]volume,]"; the stray ",]" is removed.
my $drive_typetext = '[volume=]volume [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]';

# Schema for the ideN options.
my $idedesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as IDE hard disk or CD-ROM (n is 0 to " . ($MAX_IDE_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-ide", $idedesc);

# Schema for the scsiN options.
my $scsidesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as SCSI hard disk or CD-ROM (n is 0 to " . ($MAX_SCSI_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-scsi", $scsidesc);

# Schema for the sataN options.
my $satadesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as SATA hard disk or CD-ROM (n is 0 to " . ($MAX_SATA_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-sata", $satadesc);

# Schema for the virtioN options.
my $virtiodesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as VIRTIO hard disk (n is 0 to " . ($MAX_VIRTIO_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-virtio", $virtiodesc);
575
# Schema shared by all usbN options. The highest index in the help text is
# derived from $MAX_USB_DEVICES instead of being hard coded, matching the
# drive descriptions.
my $usbdesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-usb-device',
    typetext => 'host=HOSTUSBDEVICE|spice',
    description => <<EODESCR,
Configure an USB device (n is 0 to @{[ $MAX_USB_DEVICES - 1 ]}). This can be used to
pass-through usb devices to the guest. HOSTUSBDEVICE syntax is:

'bus-port(.port)*' (decimal numbers) or
'vendor_id:product_id' (hexadecimal numbers)

You can use the 'lsusb -t' command to list existing usb devices.

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

The value 'spice' can be used to add a usb redirection device for spice.

EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-usb", $usbdesc);
596
# Schema shared by all hostpciN options (host PCI device pass-through).
my $hostpcidesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-hostpci',
    typetext => "[host=]HOSTPCIDEVICE [,driver=kvm|vfio] [,rombar=on|off] [,pcie=0|1] [,x-vga=on|off]",
    description => <<EODESCR,
Map host pci devices. HOSTPCIDEVICE syntax is:

'bus:dev.func' (hexadecimal numbers)

You can use the 'lspci' command to list existing pci devices.

The 'rombar' option determines whether or not the device's ROM will be visible in the guest's memory map (default is 'on').

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-hostpci", $hostpcidesc);
616
# Schema shared by all serialN options. The value is either a host device
# path below /dev or the literal 'socket'. The highest index in the help text
# is derived from $MAX_SERIAL_PORTS instead of being hard coded.
my $serialdesc = {
    optional => 1,
    type => 'string',
    pattern => '(/dev/.+|socket)',
    description => <<EODESCR,
Create a serial device inside the VM (n is 0 to @{[ $MAX_SERIAL_PORTS - 1 ]}), and pass through a host serial device (i.e. /dev/ttyS0), or create a unix socket on the host side (use 'qm terminal' to open a terminal connection).

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};
629
# Schema shared by all parallelN options.
# The alternation in 'pattern' is wrapped in a group, like every other
# pattern in this file. Without the group, a validator that anchors the
# pattern with ^...$ would bind each anchor to only one alternative.
# NOTE(review): the anchoring happens in PVE::JSONSchema, which is not
# visible here - confirm.
my $paralleldesc = {
    optional => 1,
    type => 'string',
    pattern => '(/dev/parport\d+|/dev/usb/lp\d+)',
    description => <<EODESCR,
Map host parallel devices (n is 0 to @{[ $MAX_PARALLEL_PORTS - 1 ]}).

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};
642
# Add one confdesc entry per slot of each indexed option. All slots of a kind
# share the same schema object.
foreach my $slot (0 .. $MAX_PARALLEL_PORTS - 1) {
    $confdesc->{"parallel$slot"} = $paralleldesc;
}

foreach my $slot (0 .. $MAX_SERIAL_PORTS - 1) {
    $confdesc->{"serial$slot"} = $serialdesc;
}

foreach my $slot (0 .. $MAX_HOSTPCI_DEVICES - 1) {
    $confdesc->{"hostpci$slot"} = $hostpcidesc;
}

# Drive slots are additionally recorded in $drivename_hash so that
# valid_drivename() can recognise them.
foreach my $slot (0 .. $MAX_IDE_DISKS - 1) {
    $drivename_hash->{"ide$slot"} = 1;
    $confdesc->{"ide$slot"} = $idedesc;
}

foreach my $slot (0 .. $MAX_SATA_DISKS - 1) {
    $drivename_hash->{"sata$slot"} = 1;
    $confdesc->{"sata$slot"} = $satadesc;
}

foreach my $slot (0 .. $MAX_SCSI_DISKS - 1) {
    $drivename_hash->{"scsi$slot"} = 1;
    $confdesc->{"scsi$slot"} = $scsidesc;
}

foreach my $slot (0 .. $MAX_VIRTIO_DISKS - 1) {
    $drivename_hash->{"virtio$slot"} = 1;
    $confdesc->{"virtio$slot"} = $virtiodesc;
}

foreach my $slot (0 .. $MAX_USB_DEVICES - 1) {
    $confdesc->{"usb$slot"} = $usbdesc;
}

# Schema shared by all unusedN options.
my $unuseddesc = {
    optional => 1,
    type => 'string', format => 'pve-volume-id',
    description => "Reference to unused volumes.",
};

foreach my $slot (0 .. $MAX_UNUSED_DISKS - 1) {
    $confdesc->{"unused$slot"} = $unuseddesc;
}
688
# Cached result of kvm_version(); 0 means "not determined yet".
my $kvm_api_version = 0;

# Return the KVM API version obtained from /dev/kvm through the
# KVM_GET_API_VERSION ioctl. Returns 0 when /dev/kvm cannot be opened.
# A true result is cached for later calls.
sub kvm_version {

    return $kvm_api_version if $kvm_api_version;

    my $kvm_dev = IO::File->new("</dev/kvm");
    return 0 if !$kvm_dev;

    my $reported = $kvm_dev->ioctl(KVM_GET_API_VERSION(), 0);
    $kvm_api_version = $reported if $reported;

    $kvm_dev->close();

    return $kvm_api_version;
}
706
# Cached result of kvm_user_version().
my $kvm_user_version;

# Return the version number printed in the first line of `kvm -help`, or the
# string 'unknown' when that output does not start with the expected banner.
# The result is cached for later calls.
sub kvm_user_version {

    return $kvm_user_version if $kvm_user_version;

    my $help_text = `kvm -help 2>/dev/null`;

    # The second capture group holds the version number.
    my (undef, $version) =
        $help_text =~ m/^QEMU( PC)? emulator version (\d+\.\d+(\.\d+)?)[,\s]/;

    $kvm_user_version = defined($version) ? $version : 'unknown';

    return $kvm_user_version;

}

# True when the vhost-net character device exists on this host.
my $kernel_has_vhost_net = -c '/dev/vhost-net';
726
# Return the names of all possible drive options: ide*, then scsi*, then
# virtio*, then sata*.
sub disknames {
    # order is important - used to autoselect boot disk
    my @ide = map { "ide$_" } (0 .. ($MAX_IDE_DISKS - 1));
    my @scsi = map { "scsi$_" } (0 .. ($MAX_SCSI_DISKS - 1));
    my @virtio = map { "virtio$_" } (0 .. ($MAX_VIRTIO_DISKS - 1));
    my @sata = map { "sata$_" } (0 .. ($MAX_SATA_DISKS - 1));

    return (@ide, @scsi, @virtio, @sata);
}
734
# Return true when $dev is a known drive option name (an entry of
# $drivename_hash).
sub valid_drivename {
    my ($dev) = @_;

    my $known = $drivename_hash->{$dev};

    return defined($known);
}
740
# Return true when $key is a configuration option described in $confdesc.
sub option_exists {
    my ($key) = @_;

    my $schema = $confdesc->{$key};

    return defined($schema);
}
745
# Return the array reference holding the supported NIC model names.
# This is the shared list itself, not a copy.
sub nic_models {
    my $models = $nic_model_list;

    return $models;
}
749
# Return a hash reference mapping each ostype value to a short display name.
# The 'solaris' ostype accepted by the schema had no entry here and is added;
# the stray comma after "w2k3 =>" is removed.
sub os_list_description {

    return {
        other => 'Other',
        wxp => 'Windows XP',
        w2k => 'Windows 2000',
        w2k3 => 'Windows 2003',
        w2k8 => 'Windows 2008',
        wvista => 'Windows Vista',
        win7 => 'Windows 7',
        win8 => 'Windows 8/2012',
        l24 => 'Linux 2.4',
        l26 => 'Linux 2.6',
        solaris => 'Solaris',
    };
}
765
# Cached result of get_cdrom_path().
my $cdrom_path;

# Return the first of /dev/cdrom, /dev/cdrom1 and /dev/cdrom2 that is a
# symbolic link, caching the answer. Returns undef when none of them is.
# The code used to fall off the end in that case and implicitly return the
# result of the last -l test.
sub get_cdrom_path {

    return $cdrom_path if $cdrom_path;

    foreach my $candidate ("/dev/cdrom", "/dev/cdrom1", "/dev/cdrom2") {
        return $cdrom_path = $candidate if -l $candidate;
    }

    return undef;
}
776
# Resolve the file setting of a CD-ROM drive to a path.
#   'cdrom'          -> result of get_cdrom_path()
#   'none'           -> empty string
#   absolute path    -> returned unchanged
#   anything else    -> resolved as a volume ID via PVE::Storage::path()
# $vmid is accepted but not used.
sub get_iso_path {
    my ($storecfg, $vmid, $cdrom) = @_;

    return get_cdrom_path() if $cdrom eq 'cdrom';
    return '' if $cdrom eq 'none';
    return $cdrom if $cdrom =~ m|^/|;

    return PVE::Storage::path($storecfg, $cdrom);
}
790
# Try to convert an old style file name into a volume ID.
# 'none', 'cdrom', /dev/... paths and values that already look like
# "storage:volume" are returned unchanged. A remaining name containing a
# slash cannot be converted and yields undef. Everything else is placed on
# the 'local' storage: below iso/ for CD-ROM media, below <vmid>/ otherwise.
sub filename_to_volume_id {
    my ($vmid, $file, $media) = @_;

    return $file if $file eq 'none' || $file eq 'cdrom';
    return $file if $file =~ m|^/dev/.+|;
    return $file if $file =~ m/^([^:]+):(.+)$/;

    return undef if $file =~ m|/|;

    return "local:iso/$file" if $media && $media eq 'cdrom';

    return "local:$vmid/$file";
}
809
# Check that the storage content type $vtype fits the drive's media setting:
# 'disk' requires 'images', 'cdrom' requires 'iso'. Nothing is checked when
# $media is not set. Raises a parameter exception for option $opt on a
# mismatch and dies with "internal error" for any other media value.
sub verify_media_type {
    my ($opt, $vtype, $media) = @_;

    return if !$media;

    my %expected_type_for = (
        disk => 'images',
        cdrom => 'iso',
    );

    my $etype = $expected_type_for{$media};
    die "internal error" if !defined($etype);

    return if ($vtype eq $etype);

    raise_param_exc({ $opt => "unexpected media type ($vtype != $etype)" });
}
828
# Normalise the 'file' and 'media' entries of the drive hash $drive in place.
# A file that is not 'cdrom'/'none', not a /dev/ path, not a
# "storage:volume" ID and not a plain number is treated as a filesystem path
# and converted to a volume ID; a parameter exception for $opt is raised when
# no storage matches or the media type does not fit. The media is set to
# 'cdrom' for iso volumes and for 'cdrom'/'none' when not given explicitly.
sub cleanup_drive_path {
    my ($opt, $storecfg, $drive) = @_;

    # try to convert filesystem paths to volume IDs

    my $file = $drive->{file};
    my $needs_no_lookup =
        $file =~ m/^(cdrom|none)$/ ||
        $file =~ m|^/dev/.+| ||
        $file =~ m/^([^:]+):(.+)$/ ||
        $file =~ m/^\d+$/;

    if (!$needs_no_lookup) {
        my ($vtype, $volid) = PVE::Storage::path_to_volume_id($storecfg, $drive->{file});
        if (!$vtype) {
            raise_param_exc({ $opt => "unable to associate path '$drive->{file}' to any storage"});
        }
        if (!$drive->{media} && $vtype eq 'iso') {
            $drive->{media} = 'cdrom';
        }
        verify_media_type($opt, $vtype, $drive->{media});
        $drive->{file} = $volid;
    }

    $drive->{media} = 'cdrom' if !$drive->{media} && $drive->{file} =~ m/^(cdrom|none)$/;
}
847
# Write a new configuration file for VM $vmid from the hash $settings.
# No locking is done here. Dies when the file already exists.
# Missing 'name' and 'memory' settings are filled in (modifying $settings).
# Only options known to $confdesc that have a true value are written, one
# "key: value" line each.
sub create_conf_nolock {
    my ($vmid, $settings) = @_;

    my $filename = config_file($vmid);

    die "configuration file '$filename' already exists\n" if -f $filename;

    my $defaults = load_defaults();

    $settings->{name} = "vm$vmid" if !$settings->{name};
    $settings->{memory} = $defaults->{memory} if !$settings->{memory};

    my @written_opts = grep { $confdesc->{$_} && $settings->{$_} } keys %$settings;

    my $data = join('', map { "$_: $settings->{$_}\n" } @written_opts);

    PVE::Tools::file_set_contents($filename, $data);
}
872
# Convert a size string such as "32", "1.5K", "512M" or "4G" into a whole
# number of bytes (units are powers of 1024). Returns undef when the string
# does not have that form.
my $parse_size = sub {
    my ($value) = @_;

    return undef if $value !~ m/^(\d+(\.\d+)?)([KMG])?$/;
    my ($number, $unit) = ($1, $3);

    my %bytes_per_unit = (
        K => 1024,
        M => 1024 * 1024,
        G => 1024 * 1024 * 1024,
    );

    $number = $number * $bytes_per_unit{$unit} if $unit;

    return int($number);
};
889
# Format a byte count using the largest of the units K, M and G (powers of
# 1024) that divides it evenly. A count that is not a multiple of 1024 is
# returned as a plain integer without a unit.
my $format_size = sub {
    my ($size) = @_;

    my $amount = int($size);
    my $suffix = '';

    foreach my $next_suffix (qw(K M G)) {
        my $scaled = int($amount / 1024);
        last if $scaled * 1024 != $amount;
        ($amount, $suffix) = ($scaled, $next_suffix);
    }

    return $suffix eq '' ? $amount : "${amount}${suffix}";
};
906
# ideX = [volume=]volume-id[,media=d][,cyls=c,heads=h,secs=s[,trans=t]]
#        [,snapshot=on|off][,cache=off|none|writethrough|writeback|unsafe|directsync]
#        [,format=f][,backup=yes|no]
#        [,rerror=ignore|report|stop][,werror=enospc|ignore|report|stop]
#        [,aio=native|threads][,discard=ignore|on]

# Parse the property string $data of the drive option $key (e.g. 'ide0').
#
# Returns a hash reference holding 'interface' and 'index' (taken from $key),
# 'file', and every option given in $data. Returns undef when $key is not of
# the form <name><number> or when $data is invalid in any way.
#
# - 'volume' is an alias for 'file'; a leading value without '=' is the file.
# - bps, bps_rd and bps_wr (bytes/s) are stored as mbps, mbps_rd and mbps_wr
#   with three decimals.
# - a recognised image file extension overrides 'format'.
# - 'size' is converted to bytes with $parse_size.
sub parse_drive {
    my ($key, $data) = @_;

    my $res = {};

    # $key may be undefined - used to verify JSON parameters
    if (!defined($key)) {
        $res->{interface} = 'unknown'; # should not harm when used to verify parameters
        $res->{index} = 0;
    } elsif ($key =~ m/^([^\d]+)(\d+)$/) {
        $res->{interface} = $1;
        $res->{index} = $2;
    } else {
        return undef;
    }

    foreach my $p (split (/,/, $data)) {
        next if $p =~ m/^\s*$/;

        if ($p =~ m/^(file|volume|cyls|heads|secs|trans|media|snapshot|cache|format|rerror|werror|backup|aio|bps|mbps|mbps_max|bps_rd|mbps_rd|mbps_rd_max|bps_wr|mbps_wr|mbps_wr_max|iops|iops_max|iops_rd|iops_rd_max|iops_wr|iops_wr_max|size|discard)=(.+)$/) {
            my ($k, $v) = ($1, $2);

            $k = 'file' if $k eq 'volume';

            if ($k eq 'bps' || $k eq 'bps_rd' || $k eq 'bps_wr') {
                # the whole value must be a positive integer; the check used
                # to be unanchored and accepted things like "12abc"
                return undef if !$v || $v !~ m/^\d+$/;
                $k = "m$k";
                $v = sprintf("%.3f", $v / (1024*1024));
            }

            # Reject duplicates only after the bps -> mbps renaming, so that
            # "mbps=..,bps=.." or a repeated "bps=.." cannot silently
            # overwrite an earlier value.
            return undef if defined $res->{$k};

            $res->{$k} = $v;
        } else {
            if (!$res->{file} && $p !~ m/=/) {
                $res->{file} = $p;
            } else {
                return undef;
            }
        }
    }

    return undef if !$res->{file};

    if($res->{file} =~ m/\.(raw|cow|qcow|qcow2|vmdk|cloop)$/){
        $res->{format} = $1;
    }

    return undef if $res->{cache} &&
        $res->{cache} !~ m/^(off|none|writethrough|writeback|unsafe|directsync)$/;
    return undef if $res->{snapshot} && $res->{snapshot} !~ m/^(on|off)$/;
    return undef if $res->{cyls} && $res->{cyls} !~ m/^\d+$/;
    return undef if $res->{heads} && $res->{heads} !~ m/^\d+$/;
    return undef if $res->{secs} && $res->{secs} !~ m/^\d+$/;
    return undef if $res->{media} && $res->{media} !~ m/^(disk|cdrom)$/;
    return undef if $res->{trans} && $res->{trans} !~ m/^(none|lba|auto)$/;
    return undef if $res->{format} && $res->{format} !~ m/^(raw|cow|qcow|qcow2|vmdk|cloop)$/;
    return undef if $res->{rerror} && $res->{rerror} !~ m/^(ignore|report|stop)$/;
    return undef if $res->{werror} && $res->{werror} !~ m/^(enospc|ignore|report|stop)$/;
    return undef if $res->{backup} && $res->{backup} !~ m/^(yes|no)$/;
    return undef if $res->{aio} && $res->{aio} !~ m/^(native|threads)$/;
    return undef if $res->{discard} && $res->{discard} !~ m/^(ignore|on)$/;

    # a total limit cannot be combined with a read or write limit
    return undef if $res->{mbps_rd} && $res->{mbps};
    return undef if $res->{mbps_wr} && $res->{mbps};

    return undef if $res->{mbps} && $res->{mbps} !~ m/^\d+(\.\d+)?$/;
    return undef if $res->{mbps_max} && $res->{mbps_max} !~ m/^\d+(\.\d+)?$/;
    return undef if $res->{mbps_rd} && $res->{mbps_rd} !~ m/^\d+(\.\d+)?$/;
    return undef if $res->{mbps_rd_max} && $res->{mbps_rd_max} !~ m/^\d+(\.\d+)?$/;
    return undef if $res->{mbps_wr} && $res->{mbps_wr} !~ m/^\d+(\.\d+)?$/;
    return undef if $res->{mbps_wr_max} && $res->{mbps_wr_max} !~ m/^\d+(\.\d+)?$/;

    return undef if $res->{iops_rd} && $res->{iops};
    return undef if $res->{iops_wr} && $res->{iops};

    return undef if $res->{iops} && $res->{iops} !~ m/^\d+$/;
    return undef if $res->{iops_max} && $res->{iops_max} !~ m/^\d+$/;
    return undef if $res->{iops_rd} && $res->{iops_rd} !~ m/^\d+$/;
    return undef if $res->{iops_rd_max} && $res->{iops_rd_max} !~ m/^\d+$/;
    return undef if $res->{iops_wr} && $res->{iops_wr} !~ m/^\d+$/;
    return undef if $res->{iops_wr_max} && $res->{iops_wr_max} !~ m/^\d+$/;

    if ($res->{size}) {
        return undef if !defined($res->{size} = &$parse_size($res->{size}));
    }

    # CD-ROM drives take no geometry, snapshot or format settings and cannot
    # be attached to the virtio bus
    if ($res->{media} && ($res->{media} eq 'cdrom')) {
        return undef if $res->{snapshot} || $res->{trans} || $res->{format};
        return undef if $res->{heads} || $res->{secs} || $res->{cyls};
        return undef if $res->{interface} eq 'virtio';
    }

    # rerror does not work with scsi drives
    if ($res->{rerror}) {
        return undef if $res->{interface} eq 'scsi';
    }

    return $res;
}
1013
# Drive settings that print_drive() and print_drive_full() emit verbatim as
# "name=value" pairs.
my @qemu_drive_options = qw(
    heads secs cyls trans media format cache snapshot rerror werror aio discard
    iops iops_rd iops_wr iops_max iops_rd_max iops_wr_max
);

# Serialize a parsed drive hash into its textual form:
#   "<file>[,<option>=<value>...][,size=<formatted size>]"
# Options whose value is false (unset, 0 or '') are left out.
# $vmid is accepted but not used.
sub print_drive {
    my ($vmid, $drive) = @_;

    my @names = (@qemu_drive_options, 'mbps', 'mbps_rd', 'mbps_wr', 'mbps_max', 'mbps_rd_max', 'mbps_wr_max', 'backup');

    my $text = "$drive->{file}";
    for my $name (@names) {
        next if !$drive->{$name};
        $text .= ",$name=$drive->{$name}";
    }

    $text .= ",size=" . &$format_size($drive->{size}) if $drive->{size};

    return $text;
}
1030
# Send a SCSI inquiry through the sg ioctl interface of the open handle $fh.
#
# Returns a hash reference with the keys vendor, product, revision,
# removable (0/1) and type. On any failure the function dies, unless $noerr
# is true, in which case it returns undef instead.
sub scsi_inquiry {
    my($fh, $noerr) = @_;

    my $SG_IO = 0x2285;
    my $SG_GET_VERSION_NUM = 0x2282;

    # common failure path: raise the error unless the caller wants quiet mode
    my $fail = sub {
        my ($msg) = @_;
        die $msg if !$noerr;
        return undef;
    };

    my $versionbuf = "\x00" x 8;
    ioctl($fh, $SG_GET_VERSION_NUM, $versionbuf)
        or return $fail->("scsi ioctl SG_GET_VERSION_NUM failoed - $!\n");

    my $version = unpack("I", $versionbuf);
    return $fail->("scsi generic interface too old\n") if $version < 30000;

    # the reply buffer and sense buffer are handed to the kernel by pointer
    # (pack 'P'), so these scalars must stay alive and untouched until the
    # ioctl has returned
    my $inquiry_data = "\x00" x 36;
    my $sense_data = "\x00" x 8;
    my $cdb = pack("C x3 C x1", 0x12, 36);

    # see /usr/include/scsi/sg.h
    my $sg_io_hdr_t = "i i C C s I P P P I I i P C C C C S S i I I";

    my @header = (
        ord('S'), -3, length($cdb), length($sense_data), 0,
        length($inquiry_data), $inquiry_data, $cdb, $sense_data, 6000,
    );
    my $packet = pack($sg_io_hdr_t, @header);

    ioctl($fh, $SG_IO, $packet)
        or return $fail->("scsi ioctl SG_IO failed - $!\n");

    my @reply = unpack($sg_io_hdr_t, $packet);
    return $fail->("scsi ioctl SG_IO status error - $!\n")
        if $reply[17] || $reply[18];

    my ($byte0, $byte1, $vendor, $product, $revision) =
        unpack("C C x6 A8 A16 A4", $inquiry_data);

    return {
        vendor => $vendor,
        product => $product,
        revision => $revision,
        removable => ($byte1 & 128) ? 1 : 0,
        type => $byte0 & 31,
    };
}
1081
# Open $path read/write and run scsi_inquiry() on it in quiet mode.
#
# Returns the inquiry result (a hash reference), or undef when the path
# cannot be opened or the inquiry fails.
sub path_is_scsi {
    my ($path) = @_;

    # Pass the mode separately: with a combined "+<$path" string, open would
    # trim whitespace from the name and interpret special characters in it.
    my $fh = IO::File->new($path, '+<') || return undef;
    my $res = scsi_inquiry($fh, 1);
    close($fh);

    return $res;
}
1091
# Return 1 if the 'machine' setting of $conf contains "q35", else 0.
sub machine_type_is_q35 {
    my ($conf) = @_;

    my $machine = $conf->{machine};
    return 0 if !$machine;

    return ($machine =~ m/q35/) ? 1 : 0;
}
1097
# Build the device string for the USB tablet. The tablet is attached to the
# ehci bus on q35 machines and to the uhci bus otherwise.
sub print_tabletdevice_full {
    my ($conf) = @_;

    # we use uhci for old VMs because tablet driver was buggy in older qemu
    my $usbbus = "uhci";
    $usbbus = "ehci" if machine_type_is_q35($conf);

    return "usb-tablet,id=tablet,bus=" . $usbbus . ".0,port=1";
}
1108
# Build the device string for one drive, depending on its interface
# (virtio, scsi, ide or sata). Dies for 'usb' (not implemented) and for any
# other interface. A ",bootindex=N" suffix is added when the drive has a
# bootindex.
sub print_drivedevice_full {
    my ($storecfg, $conf, $vmid, $drive, $bridges) = @_;

    my $iface = $drive->{interface};
    my $index = $drive->{index};

    # every device refers to its drive and carries the same id
    my $devid = "$iface$index";
    my $common = "drive=drive-$devid,id=$devid";

    my $device = '';

    if ($iface eq 'virtio') {
        my $pciaddr = print_pci_addr($devid, $bridges);
        $device = "virtio-blk-pci,$common$pciaddr";
        $device .= ",iothread=iothread0" if $conf->{iothread};
    } elsif ($iface eq 'scsi') {
        # lsi controllers (the default) take 7 devices each, others 256
        my $is_lsi = !$conf->{scsihw} || ($conf->{scsihw} =~ m/^lsi/);
        my $maxdev = $is_lsi ? 7 : 256;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;

        my $devicetype = 'hd';
        if (drive_is_cdrom($drive)) {
            $devicetype = 'cd';
        } else {
            my $file = $drive->{file};
            my $path = ($file =~ m|^/|) ? $file : PVE::Storage::path($storecfg, $file);

            if ($path =~ m/^iscsi\:\/\//) {
                $devicetype = 'generic';
            } elsif (my $info = path_is_scsi($path)) {
                if ($info->{type} == 0) {
                    $devicetype = 'block';
                } elsif ($info->{type} == 1) { # tape
                    $devicetype = 'generic';
                }
            }
        }

        if ($is_lsi) {
            $device = "scsi-$devicetype,bus=scsihw$controller.0,scsi-id=$unit,$common";
        } else {
            $device = "scsi-$devicetype,bus=scsihw$controller.0,channel=0,scsi-id=0,lun=$index,$common";
        }
    } elsif ($iface eq 'ide') {
        my $maxdev = 2;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;
        my $devicetype = ($drive->{media} && $drive->{media} eq 'cdrom') ? "cd" : "hd";

        $device = "ide-$devicetype,bus=ide.$controller,unit=$unit,$common";
    } elsif ($iface eq 'sata') {
        my $controller = int($index / $MAX_SATA_DISKS);
        my $unit = $index % $MAX_SATA_DISKS;

        $device = "ide-drive,bus=ahci$controller.$unit,$common";
    } elsif ($iface eq 'usb') {
        die "implement me";
        # -device ide-drive,bus=ide.1,unit=0,drive=drive-ide0-1-0,id=ide0-1-0
    } else {
        die "unsupported interface type";
    }

    if ($drive->{bootindex}) {
        $device .= ",bootindex=$drive->{bootindex}";
    }

    return $device;
}
1175
# Read the first "InitiatorName=<name>" entry from
# /etc/iscsi/initiatorname.iscsi. Returns undef if the file cannot be opened
# or contains no such entry.
sub get_initiator_name {
    my $fh = IO::File->new('/etc/iscsi/initiatorname.iscsi') || return undef;

    my $initiator;
    while (defined(my $line = <$fh>)) {
        if ($line =~ m/^\s*InitiatorName\s*=\s*([\.\-:\w]+)/) {
            $initiator = $1;
            last;
        }
    }
    $fh->close();

    return $initiator;
}
1189
# Build the drive description string ("[file=<path>,]if=none,id=drive-<id>...")
# for one parsed drive.
#
# Besides the pass-through options, bandwidth limits stored in MB/s are
# converted to bytes/s, and defaults are added for aio (native), cache
# (none, disks only) and detect-zeroes (disks only).
sub print_drive_full {
    my ($storecfg, $vmid, $drive) = @_;

    my $is_cdrom = drive_is_cdrom($drive);

    my @settings;
    foreach my $name (@qemu_drive_options) {
        next if $name eq 'bootindex';
        push @settings, "$name=$drive->{$name}" if $drive->{$name};
    }

    # limits are kept as mbps* in the drive hash but passed on as bps*
    foreach my $name (qw(bps bps_rd bps_wr)) {
        my $mbytes = $drive->{"m$name"};
        push @settings, "$name=" . int($mbytes*1024*1024) if $mbytes;
    }

    # use linux-aio by default (qemu default is threads)
    push @settings, "aio=native" if !$drive->{aio};

    my $volid = $drive->{file};
    my $path;
    if ($is_cdrom) {
        $path = get_iso_path($storecfg, $vmid, $volid);
    } elsif ($volid =~ m|^/|) {
        $path = $volid;
    } else {
        $path = PVE::Storage::path($storecfg, $volid);
    }

    if (!$is_cdrom) {
        push @settings, "cache=none" if !$drive->{cache};
        push @settings, "detect-zeroes=" . ($drive->{discard} ? "unmap" : "on");
    }

    my $pathinfo = $path ? "file=$path," : '';
    my $opts = join('', map { ",$_" } @settings);

    return "${pathinfo}if=none,id=drive-$drive->{interface}$drive->{index}$opts";
}
1228
# Build the device string for network card $netid. The 'virtio' model is
# mapped to 'virtio-net-pci'; all other models are used as given.
sub print_netdevice_full {
    my ($vmid, $conf, $net, $netid, $bridges) = @_;

    my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};

    my $is_virtio = $net->{model} eq 'virtio';
    my $device = $is_virtio ? 'virtio-net-pci' : $net->{model};

    # qemu > 0.15 always try to boot from network - we disable that by
    # not loading the pxe rom file
    my $extra = ($bootorder !~ m/n/) ? "romfile=," : '';
    my $pciaddr = print_pci_addr("$netid", $bridges);

    my @parts = ("$device,${extra}mac=$net->{macaddr},netdev=$netid$pciaddr,id=$netid");

    if ($net->{queues} && $net->{queues} > 1 && $is_virtio) {
        #Consider we have N queues, the number of vectors needed is 2*N + 2 (plus one config interrupt and control vq)
        my $vectors = $net->{queues} * 2 + 2;
        push @parts, ",vectors=$vectors,mq=on";
    }

    push @parts, ",bootindex=$net->{bootindex}" if $net->{bootindex};

    return join('', @parts);
}
1252
# Build the netdev description string for network device $netid.
#
# $netid must have the form "net<N>" with N below $MAX_NETS, otherwise the
# function dies. Devices with a bridge become tap devices named
# "tap<vmid>i<N>"; devices without a bridge use user-mode networking. Dies
# as well when the resulting interface name is too long.
sub print_netdev_full {
    my ($vmid, $conf, $net, $netid) = @_;

    # An ID without a numeric index must not slip through: it would produce
    # an interface name without index ("tap<vmid>i").
    my $shown_id = defined($netid) ? $netid : '';
    my ($i) = $shown_id =~ m/^net(\d+)$/;
    die "got strange net id '$shown_id'\n" if !defined($i);

    $i = int($i);
    die "got strange net id '$i'\n" if $i >= ${MAX_NETS};

    my $ifname = "tap${vmid}i$i";

    # kvm uses TUNSETIFF ioctl, and that limits ifname length
    die "interface name '$ifname' is too long (max 15 character)\n"
        if length($ifname) >= 16;

    my $vhostparam = '';
    $vhostparam = ',vhost=on' if $kernel_has_vhost_net && $net->{model} eq 'virtio';

    my $vmname = $conf->{name} || "vm$vmid";

    my $netdev = "";

    if ($net->{bridge}) {
        $netdev = "type=tap,id=$netid,ifname=${ifname},script=/var/lib/qemu-server/pve-bridge,downscript=/var/lib/qemu-server/pve-bridgedown$vhostparam";
    } else {
        $netdev = "type=user,id=$netid,hostname=$vmname";
    }

    # multiqueue is only passed on for virtio cards
    $netdev .= ",queues=$net->{queues}" if ($net->{queues} && $net->{model} eq 'virtio');

    return $netdev;
}
1286
# Return a true value if $drive is defined and its media is 'cdrom',
# a false value otherwise.
sub drive_is_cdrom {
    my ($drive) = @_;

    return $drive if !$drive;

    my $media = $drive->{media};
    return $media if !$media;

    return $media eq 'cdrom';
}
1293
# Parse a comma separated numa setting. Known entries are
#   memory=<value>, policy=(preferred|bind|interleave),
#   cpus=<start>[-<end>] and hostnodes=<start>[-<end>].
# Returns a hash reference, or undef as soon as an entry is not understood.
# For cpus and hostnodes the result holds a {start, end} hash; 'end' is
# undef when no range end was given.
sub parse_numa {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        if ($kvp =~ m/^memory=(\S+)$/) {
            $res->{memory} = $1;
            next;
        }
        if ($kvp =~ m/^policy=(preferred|bind|interleave)$/) {
            $res->{policy} = $1;
            next;
        }
        if ($kvp =~ m/^cpus=(\d+)(-(\d+))?$/) {
            my ($start, $end) = ($1, $3);
            $res->{cpus}->{start} = $start;
            $res->{cpus}->{end} = $end;
            next;
        }
        if ($kvp =~ m/^hostnodes=(\d+)(-(\d+))?$/) {
            my ($start, $end) = ($1, $3);
            $res->{hostnodes}->{start} = $start;
            $res->{hostnodes}->{end} = $end;
            next;
        }

        return undef;
    }

    return $res;
}
1318
# Parse a comma separated hostpci setting.
#
# A PCI address ("[host=]bb:dd[.f]") is mandatory. With a function number
# the address is appended to the 'pciid' list; without one the 'pciid' list
# is taken from lspci() for that device. Further entries: driver=(kvm|vfio),
# rombar=(on|off), x-vga=(on|off) and pcie=<n> (only pcie=1 is recorded).
# Unknown entries only produce a warning.
# Returns a hash reference, or undef if $value is empty or has no address.
sub parse_hostpci {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};
    my $found;

    foreach my $kv (split(/,/, $value)) {
        if ($kv =~ m/^(host=)?([a-f0-9]{2}:[a-f0-9]{2})(\.([a-f0-9]))?$/) {
            my ($id, $function) = ($2, $4);
            $found = 1;
            if (defined($function)) {
                push @{$res->{pciid}}, { id => $id , function => $function };
            } else {
                my $pcidevices = lspci($id);
                $res->{pciid} = $pcidevices->{$id};
            }
            next;
        }

        if ($kv =~ m/^driver=(kvm|vfio)$/) {
            $res->{driver} = $1;
        } elsif ($kv =~ m/^rombar=(on|off)$/) {
            $res->{rombar} = $1;
        } elsif ($kv =~ m/^x-vga=(on|off)$/) {
            $res->{'x-vga'} = $1;
        } elsif ($kv =~ m/^pcie=(\d+)$/) {
            $res->{pcie} = 1 if $1 == 1;
        } else {
            warn "unknown hostpci setting '$kv'\n";
        }
    }

    return $found ? $res : undef;
}
1357
# netX: e1000=XX:XX:XX:XX:XX:XX,bridge=vmbr0,rate=<mbps>
#
# Parse a network device setting into a hash with the keys model, macaddr
# and, when present, bridge, queues, rate, tag and firewall. The model is
# lower-cased and the MAC address upper-cased; a random MAC address is
# generated when none is given. Returns undef for an unknown entry or when
# no model is specified.
sub parse_net {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        if ($kvp =~ m/^(ne2k_pci|e1000|rtl8139|pcnet|virtio|ne2k_isa|i82551|i82557b|i82559er|vmxnet3)(=([0-9a-f]{2}(:[0-9a-f]{2}){5}))?$/i) {
            my ($model, $mac) = ($1, $3);
            $res->{model} = lc($model);
            $res->{macaddr} = defined($mac) ? uc($mac) : PVE::Tools::random_ether_addr();
            next;
        }
        if ($kvp =~ m/^bridge=(\S+)$/) {
            $res->{bridge} = $1;
            next;
        }
        if ($kvp =~ m/^queues=(\d+)$/) {
            $res->{queues} = $1;
            next;
        }
        if ($kvp =~ m/^rate=(\d+(\.\d+)?)$/) {
            $res->{rate} = $1;
            next;
        }
        if ($kvp =~ m/^tag=(\d+)$/) {
            $res->{tag} = $1;
            next;
        }
        if ($kvp =~ m/^firewall=(\d+)$/) {
            $res->{firewall} = $1;
            next;
        }

        return undef;
    }

    return $res->{model} ? $res : undef;
}
1391
# Serialize a parsed network device hash (see parse_net) back into its
# textual form: "<model>[=<mac>][,bridge=..][,rate=..][,tag=..][,firewall=..][,queues=..]".
# Settings with a false value are left out.
sub print_net {
    my $net = shift;

    my $res = "$net->{model}";
    $res .= "=$net->{macaddr}" if $net->{macaddr};
    $res .= ",bridge=$net->{bridge}" if $net->{bridge};
    $res .= ",rate=$net->{rate}" if $net->{rate};
    $res .= ",tag=$net->{tag}" if $net->{tag};
    $res .= ",firewall=$net->{firewall}" if $net->{firewall};
    # parse_net() accepts 'queues', so it has to survive a parse/print cycle
    $res .= ",queues=$net->{queues}" if $net->{queues};

    return $res;
}
1404
# Rewrite every parsable "net<N>" entry of $settings in place by running it
# through parse_net() and print_net(). Entries that fail to parse are left
# untouched.
sub add_random_macs {
    my ($settings) = @_;

    foreach my $opt (grep { $_ =~ m/^net(\d+)$/ } keys %$settings) {
        if (my $net = parse_net($settings->{$opt})) {
            $settings->{$opt} = print_net($net);
        }
    }
}
1415
# Record $volid in the lowest free "unused<N>" slot of $config and return
# the name of that slot. Returns nothing if the volume is already listed as
# unused; dies if all slots are taken.
sub add_unused_volume {
    my ($config, $volid) = @_;

    # walk the slots downwards so that the last free one seen is the lowest
    my $key;
    foreach my $ind (reverse(0 .. $MAX_UNUSED_DISKS - 1)) {
        my $slot = "unused$ind";
        my $vid = $config->{$slot};
        if (!$vid) {
            $key = $slot;
            next;
        }
        return if $vid eq $volid; # do not add duplicates
    }

    die "To many unused volume - please delete them first.\n" if !$key;

    $config->{$key} = $volid;

    return $key;
}
1435
# Return 1 if the storage layer reports $vmid as owner of volume $volid,
# undef otherwise. Absolute paths are never owned, and errors from the
# storage lookup are ignored.
sub vm_is_volid_owner {
    my ($storecfg, $vmid, $volid) = @_;

    return undef if $volid =~ m|^/|;

    my ($path, $owner);
    eval { ($path, $owner) = PVE::Storage::path($storecfg, $volid); };

    return 1 if $owner && ($owner == $vmid);

    return undef;
}
1449
# Mark $key for deletion: drop any pending value for it and add it to the
# comma separated 'delete' list of the pending section (without duplicates).
sub vmconfig_delete_pending_option {
    my ($conf, $key) = @_;

    delete $conf->{pending}->{$key};

    my %marked = (
        $key => 1,
        map { $_ => 1 } PVE::Tools::split_list($conf->{pending}->{delete}),
    );

    $conf->{pending}->{delete} = join(',', keys %marked);
}
1460
# Remove $key from the pending 'delete' list. The list entry itself is
# removed when it becomes empty.
sub vmconfig_undelete_pending_option {
    my ($conf, $key) = @_;

    my %marked = map { $_ => 1 } PVE::Tools::split_list($conf->{pending}->{delete});
    delete $marked{$key};

    my @remaining = keys %marked;
    if (!scalar(@remaining)) {
        delete $conf->{pending}->{delete};
    } else {
        $conf->{pending}->{delete} = join(',', @remaining);
    }
}
1477
# Add the volume of $drive to the unused volumes of $conf, provided the
# drive is not a cdrom and the volume is owned by VM $vmid.
sub vmconfig_register_unused_drive {
    my ($storecfg, $vmid, $conf, $drive) = @_;

    if (!drive_is_cdrom($drive)) {
        my $volid = $drive->{file};
        add_unused_volume($conf, $volid, $vmid)
            if vm_is_volid_owner($storecfg, $vmid, $volid);
    }
}
1488
# Drop pending entries that would not change anything:
#  - pending values equal to the current value of the option
#  - pending deletions of options that are not set
# Returns 1 if something was dropped, undef otherwise.
sub vmconfig_cleanup_pending {
    my ($conf) = @_;

    my $changes;

    # remove pending changes when nothing changed
    foreach my $opt (keys %{$conf->{pending}}) {
        next if !defined($conf->{$opt});
        next if !($conf->{pending}->{$opt} eq $conf->{$opt});
        $changes = 1;
        delete $conf->{pending}->{$opt};
    }

    # remove delete if option is not set
    my %still_marked;
    foreach my $opt (PVE::Tools::split_list($conf->{pending}->{delete})) {
        if (!defined($conf->{$opt})) {
            $changes = 1;
            next;
        }
        $still_marked{$opt} = 1;
    }

    my @remaining = keys %still_marked;
    if (!scalar(@remaining)) {
        delete $conf->{pending}->{delete};
    } else {
        $conf->{pending}->{delete} = join(',', @remaining);
    }

    return $changes;
}
1520
# Known smbios type 1 options, each with the regular expression its value
# has to match completely.
my $valid_smbios1_options = {
    manufacturer => '\S+',
    product => '\S+',
    version => '\S+',
    serial => '\S+',
    uuid => '[a-fA-F0-9]{8}(?:-[a-fA-F0-9]{4}){3}-[a-fA-F0-9]{12}',
    sku => '\S+',
    family => '\S+',
};

# smbios: [manufacturer=str][,product=str][,version=str][,serial=str][,uuid=uuid][,sku=str][,family=str]
#
# Parse a comma separated smbios type 1 setting into a hash of option name
# to value. Returns undef if an entry is not of the form "key=value", names
# an unknown option, or has a value that does not match the pattern of the
# option.
sub parse_smbios1 {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        return undef if $kvp !~ m/^(\S+)=(.+)$/;
        # split at the first '=' only, so that a value containing '=' is
        # kept complete instead of being cut off
        my ($k, $v) = split(/=/, $kvp, 2);
        return undef if !defined($k) || !defined($v);
        return undef if !$valid_smbios1_options->{$k};
        return undef if $v !~ m/^$valid_smbios1_options->{$k}$/;
        $res->{$k} = $v;
    }

    return $res;
}
1548
# Serialize a smbios type 1 hash into "key=value[,key=value...]". Entries
# with an undefined value or an unknown option name are left out.
sub print_smbios1 {
    my ($smbios1) = @_;

    my @pairs;
    foreach my $k (keys %$smbios1) {
        next if !defined($smbios1->{$k});
        next if !$valid_smbios1_options->{$k};
        push @pairs, "$k=$smbios1->{$k}";
    }

    return join(',', @pairs);
}
1561
# Format check 'pve-qm-smbios1': returns $value if parse_smbios1() accepts
# it. Otherwise returns undef when $noerr is set, and dies when it is not.
PVE::JSONSchema::register_format('pve-qm-smbios1', \&verify_smbios1);
sub verify_smbios1 {
    my ($value, $noerr) = @_;

    if (!parse_smbios1($value)) {
        die "unable to parse smbios (type 1) options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1572
# Format check 'pve-qm-bootdisk': returns $value if valid_drivename()
# accepts it. Otherwise returns undef when $noerr is set, and dies when it
# is not.
PVE::JSONSchema::register_format('pve-qm-bootdisk', \&verify_bootdisk);
sub verify_bootdisk {
    my ($value, $noerr) = @_;

    if (!valid_drivename($value)) {
        die "invalid boot disk '$value'\n" if !$noerr;
        return undef;
    }

    return $value;
}
1583
# Format check 'pve-qm-numanode': returns $value if parse_numa() accepts
# it. Otherwise returns undef when $noerr is set, and dies when it is not.
PVE::JSONSchema::register_format('pve-qm-numanode', \&verify_numa);
sub verify_numa {
    my ($value, $noerr) = @_;

    if (!parse_numa($value)) {
        die "unable to parse numa options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1594
# Format check 'pve-qm-net': returns $value if parse_net() accepts it.
# Otherwise returns undef when $noerr is set, and dies when it is not.
PVE::JSONSchema::register_format('pve-qm-net', \&verify_net);
sub verify_net {
    my ($value, $noerr) = @_;

    if (!parse_net($value)) {
        die "unable to parse network options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1605
# Format check 'pve-qm-drive': returns $value if parse_drive() accepts it
# (called without a drive key). Otherwise returns undef when $noerr is set,
# and dies when it is not.
PVE::JSONSchema::register_format('pve-qm-drive', \&verify_drive);
sub verify_drive {
    my ($value, $noerr) = @_;

    if (!parse_drive(undef, $value)) {
        die "unable to parse drive options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1616
# Format check 'pve-qm-hostpci': returns $value if parse_hostpci() accepts
# it. Otherwise returns undef when $noerr is set, and dies when it is not.
PVE::JSONSchema::register_format('pve-qm-hostpci', \&verify_hostpci);
sub verify_hostpci {
    my ($value, $noerr) = @_;

    if (!parse_hostpci($value)) {
        die "unable to parse pci id\n" if !$noerr;
        return undef;
    }

    return $value;
}
1627
# Format check 'pve-qm-watchdog': returns $value if parse_watchdog()
# accepts it. Otherwise returns undef when $noerr is set, and dies when it
# is not.
PVE::JSONSchema::register_format('pve-qm-watchdog', \&verify_watchdog);
sub verify_watchdog {
    my ($value, $noerr) = @_;

    if (!parse_watchdog($value)) {
        die "unable to parse watchdog options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1638
# Parse a comma separated watchdog setting into a hash with the optional
# keys 'model' and 'action'. The "model=" and "action=" prefixes may be
# omitted. Blank entries are skipped. Returns undef for an empty value or
# an entry that is not understood.
sub parse_watchdog {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};

    foreach my $p (split(/,/, $value)) {
        next if $p =~ m/^\s*$/;

        if ($p =~ m/^(model=)?(i6300esb|ib700)$/) {
            $res->{model} = $2;
            next;
        }
        if ($p =~ m/^(action=)?(reset|shutdown|poweroff|pause|debug|none)$/) {
            $res->{action} = $2;
            next;
        }

        return undef;
    }

    return $res;
}
1660
# Format check 'pve-qm-startup': returns $value if parse_startup() accepts
# it. Otherwise returns undef when $noerr is set, and dies when it is not.
PVE::JSONSchema::register_format('pve-qm-startup', \&verify_startup);
sub verify_startup {
    my ($value, $noerr) = @_;

    if (!parse_startup($value)) {
        die "unable to parse startup options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1671
# Parse a comma separated startup setting into a hash with the optional
# keys 'order', 'up' and 'down' (all unsigned integers). The "order="
# prefix may be omitted. Blank entries are skipped. Returns undef for an
# empty value or an entry that is not understood.
sub parse_startup {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};

    foreach my $p (split(/,/, $value)) {
        next if $p =~ m/^\s*$/;

        if ($p =~ m/^(order=)?(\d+)$/) {
            $res->{order} = $2;
            next;
        }
        if ($p =~ m/^up=(\d+)$/) {
            $res->{up} = $1;
            next;
        }
        if ($p =~ m/^down=(\d+)$/) {
            $res->{down} = $1;
            next;
        }

        return undef;
    }

    return $res;
}
1695
# Parse a comma separated usb device setting. Accepted entries are
#   host=[0x]<vendor>:[0x]<product>  -> vendorid, productid
#   host=<bus>-<port>[.<port>...]    -> hostbus, hostport
#   spice                            -> spice = 1
# Returns a hash reference, or undef if the value is empty, contains no
# entry at all, or contains an entry that is not understood.
sub parse_usb_device {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};
    my $found;

    foreach my $v (split(/,/, $value)) {
        if ($v =~ m/^host=(0x)?([0-9A-Fa-f]{4}):(0x)?([0-9A-Fa-f]{4})$/) {
            @$res{qw(vendorid productid)} = ($2, $4);
        } elsif ($v =~ m/^host=(\d+)\-(\d+(\.\d+)*)$/) {
            @$res{qw(hostbus hostport)} = ($1, $2);
        } elsif ($v =~ m/^spice$/) {
            $res->{spice} = 1;
        } else {
            return undef;
        }
        $found = 1;
    }

    return $found ? $res : undef;
}
1725
# Format check 'pve-qm-usb-device': returns $value if parse_usb_device()
# accepts it. Otherwise returns undef when $noerr is set, and dies when it
# is not.
PVE::JSONSchema::register_format('pve-qm-usb-device', \&verify_usb_device);
sub verify_usb_device {
    my ($value, $noerr) = @_;

    if (!parse_usb_device($value)) {
        die "unable to parse usb device\n" if !$noerr;
        return undef;
    }

    return $value;
}
1736
# add JSON properties for create and set function
#
# Copies every option description from $confdesc into $prop, except for
# 'parent', 'snaptime' and 'vmstate', and returns $prop.
sub json_config_properties {
    my $prop = shift;

    my %skip = map { $_ => 1 } ('parent', 'snaptime', 'vmstate');

    foreach my $opt (grep { !$skip{$_} } keys %$confdesc) {
        $prop->{$opt} = $confdesc->{$opt};
    }

    return $prop;
}
1748
# Check $value against the type that $confdesc declares for setting $key
# and return the normalized value:
#   boolean - 1 or 0 (accepts 1/on/yes/true and 0/off/no/false)
#   integer - the value as integer
#   number  - the value unchanged
#   string  - the value unchanged if a format is declared (and the format
#             check passes), otherwise with one pair of enclosing double
#             quotes removed
# Dies for unknown settings, undefined values, values containing a line
# break, and values that do not match the declared type.
sub check_type {
    my ($key, $value) = @_;

    my $desc = $confdesc->{$key};
    die "unknown setting '$key'\n" if !$desc;

    my $type = $desc->{type};

    die "got undefined value\n" if !defined($value);
    die "property contains a line feed\n" if $value =~ m/[\n\r]/;

    if ($type eq 'boolean') {
        return 1 if ($value eq '1') || ($value =~ m/^(on|yes|true)$/i);
        return 0 if ($value eq '0') || ($value =~ m/^(off|no|false)$/i);
        die "type check ('boolean') failed - got '$value'\n";
    }

    if ($type eq 'integer') {
        return int($1) if $value =~ m/^(\d+)$/;
        die "type check ('integer') failed - got '$value'\n";
    }

    if ($type eq 'number') {
        return $value if $value =~ m/^(\d+)(\.\d+)?$/;
        die "type check ('number') failed - got '$value'\n";
    }

    die "internal error" if $type ne 'string';

    my $fmt = $desc->{format};
    if (!$fmt) {
        $value =~ s/^\"(.*)\"$/$1/;
        return $value;
    }

    if ($fmt eq 'pve-qm-drive') {
        # special case - we need to pass $key to parse_drive()
        return $value if parse_drive($key, $value);
        die "unable to parse drive options\n";
    }

    PVE::JSONSchema::check_format($fmt, $value);
    return $value;
}
1791
# Run $code(@param) via lock_file() on the lock file of VM $vmid, using
# the given $timeout. Re-raises any error left in $@ and returns the result
# of lock_file() otherwise.
sub lock_config_full {
    my ($vmid, $timeout, $code, @param) = @_;

    my $res = lock_file(config_file_lock($vmid), $timeout, $code, @param);

    die $@ if $@;

    return $res;
}
1803
# Like lock_config_full(), but goes through lock_file_full() and passes the
# $shared flag on to it.
sub lock_config_mode {
    my ($vmid, $timeout, $shared, $code, @param) = @_;

    my $res = lock_file_full(config_file_lock($vmid), $timeout, $shared, $code, @param);

    die $@ if $@;

    return $res;
}
1815
# Shortcut for lock_config_full() with a timeout value of 10.
sub lock_config {
    my ($vmid, $code, @param) = @_;

    my $timeout = 10;

    return lock_config_full($vmid, $timeout, $code, @param);
}
1821
# Return the relative path "nodes/<node>/qemu-server/<vmid>.conf" of a VM
# configuration. $node defaults to $nodename.
sub cfs_config_path {
    my ($vmid, $node) = @_;

    $node ||= $nodename;

    return "nodes/$node/qemu-server/$vmid.conf";
}
1828
# Placeholder for an IOMMU check; always returns 1 for now.
sub check_iommu_support{
    #fixme : need to check IOMMU support
    #http://www.linux-kvm.org/page/How_to_assign_devices_with_VT-d_in_KVM

    return 1;
}
1837
# Return the absolute path below /etc/pve of the configuration file of VM
# $vmid on $node (see cfs_config_path for the relative part).
sub config_file {
    my ($vmid, $node) = @_;

    return "/etc/pve/" . cfs_config_path($vmid, $node);
}
1844
# Return the path of the lock file for VM $vmid inside $lock_dir.
sub config_file_lock {
    my ($vmid) = @_;

    return $lock_dir . "/lock-$vmid.conf";
}
1850
# Set access and modification time of the configuration file of VM $vmid
# to the current time.
sub touch_config {
    my ($vmid) = @_;

    my $conffile = config_file($vmid);
    utime(undef, undef, $conffile);
}
1857
# Remove VM $vmid: free the disks it owns, then remove its configuration
# file (or replace it with a minimal one if $keep_empty_config is set), and
# finally free all remaining volumes listed for this VM. Errors during that
# last step are only reported as warnings. Dies if the configuration cannot
# be loaded or check_lock() objects.
sub destroy_vm {
    my ($storecfg, $vmid, $keep_empty_config) = @_;

    my $conffile = config_file($vmid);

    my $conf = load_config($vmid);

    check_lock($conf);

    # only remove disks owned by this VM
    my $free_owned_disk = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};

        return if !$volid || $volid =~ m|^/|;

        my ($path, $owner) = PVE::Storage::path($storecfg, $volid);
        return if !$path || !$owner || ($owner != $vmid);

        PVE::Storage::vdisk_free($storecfg, $volid);
    };
    foreach_drive($conf, $free_owned_disk);

    if (!$keep_empty_config) {
        unlink $conffile;
    } else {
        PVE::Tools::file_set_contents($conffile, "memory: 128\n");
    }

    # also remove unused disk
    my $free_listed_volume = sub {
        my ($volid, $sid, $volname, $d) = @_;
        PVE::Storage::vdisk_free($storecfg, $volid);
    };
    eval {
        my $dl = PVE::Storage::vdisk_list($storecfg, undef, $vmid);

        eval {
            PVE::Storage::foreach_volid($dl, $free_listed_volume);
        };
        warn $@ if $@;

    };
    warn $@ if $@;
}
1904
# Read and return the parsed configuration of VM $vmid (optionally from
# another $node). Dies if no configuration is found.
sub load_config {
    my ($vmid, $node) = @_;

    my $conf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid, $node));

    die "no such VM ('$vmid')\n" if !defined($conf);

    return $conf;
}
1916
# Parse the raw text of a VM configuration file into a hash.
#
# Returns undef when $raw is undefined. Otherwise the result holds the
# top-level settings plus:
#   digest    - SHA1 hex digest of $raw
#   snapshots - one settings hash per "[<name>]" section
#   pending   - the settings of the "[PENDING]" section
# Lines starting with '#' and the 'description' setting are collected into
# the 'description' of the section they appear in. A 'cdrom' setting is
# stored as 'ide2'. Settings that fail check_type() are skipped with a
# warning. Dies if the VM ID cannot be extracted from $filename.
sub parse_vm_config {
    my ($filename, $raw) = @_;

    return undef if !defined($raw);

    my $res = {
        digest => Digest::SHA::sha1_hex($raw),
        snapshots => {},
        pending => {},
    };

    $filename =~ m|/qemu-server/(\d+)\.conf$|
        || die "got strange filename '$filename'";

    my $vmid = $1;

    # $conf always points to the hash of the section currently being read
    my $conf = $res;
    my $descr = '';
    my $section = '';

    my @lines = split(/\n/, $raw);
    foreach my $line (@lines) {
        next if $line =~ m/^\s*$/;

        if ($line =~ m/^\[PENDING\]\s*$/i) {
            $section = 'pending';
            # the description collected so far belongs to the previous section
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{$section} = {};
            next;

        } elsif ($line =~ m/^\[([a-z][a-z0-9_\-]+)\]\s*$/i) {
            $section = $1;
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{snapshots}->{$section} = {};
            next;
        }

        if ($line =~ m/^\#(.*)\s*$/) {
            $descr .= PVE::Tools::decode_text($1) . "\n";
            next;
        }

        if ($line =~ m/^(description):\s*(.*\S)\s*$/) {
            $descr .= PVE::Tools::decode_text($2);
        } elsif ($line =~ m/^snapstate:\s*(prepare|delete)\s*$/) {
            # anchored at the line start, so that e.g. an 'args' line that
            # merely ends in "snapstate: delete" is not taken for it
            $conf->{snapstate} = $1;
        } elsif ($line =~ m/^(args):\s*(.*\S)\s*$/) {
            # 'args' may contain whitespace and is stored without type check
            my $key = $1;
            my $value = $2;
            $conf->{$key} = $value;
        } elsif ($line =~ m/^delete:\s*(.*\S)\s*$/) {
            my $value = $1;
            if ($section eq 'pending') {
                $conf->{delete} = $value; # we parse this later
            } else {
                warn "vm $vmid - propertry 'delete' is only allowed in [PENDING]\n";
            }
        } elsif ($line =~ m/^([a-z][a-z_]*\d*):\s*(\S+)\s*$/) {
            my $key = $1;
            my $value = $2;
            eval { $value = check_type($key, $value); };
            if ($@) {
                warn "vm $vmid - unable to parse value of '$key' - $@";
            } else {
                my $fmt = $confdesc->{$key}->{format};
                if ($fmt && $fmt eq 'pve-qm-drive') {
                    # store drives in normalized form, with the file
                    # replaced by its volume ID
                    my $v = parse_drive($key, $value);
                    if (my $volid = filename_to_volume_id($vmid, $v->{file}, $v->{media})) {
                        $v->{file} = $volid;
                        $value = print_drive($vmid, $v);
                    } else {
                        warn "vm $vmid - unable to parse value of '$key'\n";
                        next;
                    }
                }

                if ($key eq 'cdrom') {
                    $conf->{ide2} = $value;
                } else {
                    $conf->{$key} = $value;
                }
            }
        }
    }

    $conf->{description} = $descr if $descr;

    delete $res->{snapstate}; # just to be sure

    return $res;
}
2010
# Serialize the configuration hash $conf into the raw text of a VM
# configuration file and return that text.
#
# $conf is normalized in place on the way: 'cdrom' becomes 'ide2', 'smp' is
# converted to 'sockets', all values are passed through check_type(), and
# 'unused<N>' entries whose volume is in use by a drive again are removed.
# Dies on conflicting or unparsable settings. $filename is not used.
sub write_vm_config {
    my ($filename, $conf) = @_;

    delete $conf->{snapstate}; # just to be sure

    if ($conf->{cdrom}) {
        die "option ide2 conflicts with cdrom\n" if $conf->{ide2};
        $conf->{ide2} = delete $conf->{cdrom};
    }

    # we do not use 'smp' any longer
    if (!$conf->{sockets} && $conf->{smp}) {
        $conf->{sockets} = $conf->{smp};
        delete $conf->{cores};
    }
    delete $conf->{smp} if $conf->{sockets};

    delete $conf->{sockets} if $conf->{maxcpus} && $conf->{sockets};

    # volumes referenced by a drive of the current or pending configuration
    my $used_volids = {};

    # keys that are not plain settings and therefore not type checked
    my %meta_key = map { $_ => 1 } ('digest', 'description', 'snapshots', 'snapstate', 'pending');

    my $cleanup_config = sub {
        my ($cref, $pending, $snapname) = @_;

        foreach my $key (keys %$cref) {
            next if $meta_key{$key};

            if ($key eq 'delete') {
                die "propertry 'delete' is only allowed in [PENDING]\n"
                    if !$pending;
                # fixme: check syntax?
                next;
            }

            my $value = $cref->{$key};
            eval { $value = check_type($key, $value); };
            die "unable to parse value of '$key' - $@" if $@;

            $cref->{$key} = $value;

            next if $snapname || !valid_drivename($key);

            my $drive = parse_drive($key, $value);
            $used_volids->{$drive->{file}} = 1 if $drive && $drive->{file};
        }
    };

    $cleanup_config->($conf);

    $cleanup_config->($conf->{pending}, 1);

    foreach my $snapname (keys %{$conf->{snapshots}}) {
        die "internal error" if $snapname eq 'pending';
        $cleanup_config->($conf->{snapshots}->{$snapname}, undef, $snapname);
    }

    # remove 'unusedX' settings if we re-add a volume
    foreach my $key (grep { $_ =~ m/^unused/ } keys %$conf) {
        delete $conf->{$key} if $used_volids->{$conf->{$key}};
    }

    # keys that are never written as "key: value" lines
    my %not_written = map { $_ => 1 } ('digest', 'description', 'pending', 'snapshots');

    my $generate_raw_config = sub {
        my ($section) = @_;

        my $text = '';

        # add description as comment to top of file
        my $descr = $section->{description} || '';
        foreach my $cl (split(/\n/, $descr)) {
            $text .= '#' . PVE::Tools::encode_text($cl) . "\n";
        }

        foreach my $key (sort keys %$section) {
            next if $not_written{$key};
            $text .= "$key: $section->{$key}\n";
        }

        return $text;
    };

    my $raw = $generate_raw_config->($conf);

    if (scalar(keys %{$conf->{pending}})){
        $raw .= "\n[PENDING]\n";
        $raw .= $generate_raw_config->($conf->{pending});
    }

    foreach my $snapname (sort keys %{$conf->{snapshots}}) {
        $raw .= "\n[$snapname]\n";
        $raw .= $generate_raw_config->($conf->{snapshots}->{$snapname});
    }

    return $raw;
}
2111
# Write $conf as configuration of VM $vmid without taking the config lock.
# Unless $skiplock is set, check_lock() is consulted first.
sub update_config_nolock {
    my ($vmid, $conf, $skiplock) = @_;

    if (!$skiplock) {
        check_lock($conf);
    }

    PVE::Cluster::cfs_write_file(cfs_config_path($vmid), $conf);
}
2121
# Write $conf as configuration of VM $vmid while holding the config lock
# (see update_config_nolock for the meaning of $skiplock).
sub update_config {
    my ($vmid, $conf, $skiplock) = @_;

    # Pass a code reference plus its arguments: a bare &update_config_nolock
    # would run the function right here, before the lock is taken, and hand
    # its return value to lock_config() as the callback.
    lock_config($vmid, \&update_config_nolock, $vmid, $conf, $skiplock);
}
2127
# Return a hash with the default value of every option that declares one
# in $confdesc. The 'keyboard' default is replaced by the setting from
# datacenter.cfg, if there is one.
sub load_defaults {

    my $res = {};

    # we use static defaults from our JSON schema configuration
    foreach my $key (keys %$confdesc) {
        my $default = $confdesc->{$key}->{default};
        next if !defined($default);
        $res->{$key} = $default;
    }

    my $conf = PVE::Cluster::cfs_read_file('datacenter.cfg');
    if ($conf->{keyboard}) {
        $res->{keyboard} = $conf->{keyboard};
    }

    return $res;
}
2144
# Return a hash ref { $vmid => { exists => 1 } } for every entry of the
# cluster VM list which is of type 'qemu' and located on node $nodename.
sub config_list {
    my $vmlist = PVE::Cluster::get_vmlist();

    my $found = {};
    return $found unless $vmlist && $vmlist->{ids};

    my $ids = $vmlist->{ids};
    for my $vmid (keys %$ids) {
        my $entry = $ids->{$vmid};

        my $node = $entry->{node};
        next unless $node && $node eq $nodename;

        my $type = $entry->{type};
        next unless $type && $type eq 'qemu';

        $found->{$vmid}->{exists} = 1;
    }

    return $found;
}
2159
# Test if a VM uses local resources (to prevent migration).
# Looks for usbN, hostpciN, serialN and parallelN entries (and the old
# un-indexed 'hostusb'/'hostpci' keys) in $conf; usb entries with the
# value 'spice' are not counted.
# Returns 1 if such a resource is configured, else 0. Dies instead of
# returning 1 unless $noerr is set.
sub check_local_resources {
    my ($conf, $noerr) = @_;

    # old syntax
    my $found = ($conf->{hostusb} || $conf->{hostpci}) ? 1 : 0;

    for my $key (keys %$conf) {
        next if $key =~ m/^usb/ && $conf->{$key} eq 'spice';
        next if $key !~ m/^(usb|hostpci|serial|parallel)\d+$/;
        $found = 1;
    }

    die "VM uses local resources\n" if $found && !$noerr;

    return $found;
}
2178
# check if used storages are available on all nodes (used by migrate)
# Runs PVE::Storage::storage_check_node() for the storage of every drive
# volume in $conf, once without a node argument and once for $node.
# Drives without a volume, or whose volume ID has no storage part, are
# skipped.
sub check_storage_availability {
    my ($storecfg, $conf, $node) = @_;

    my $check_drive = sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($storeid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        # check if storage is available on both nodes
        PVE::Storage::storage_check_node($storecfg, $storeid);
        PVE::Storage::storage_check_node($storecfg, $storeid, $node);
    };

    foreach_drive($conf, $check_drive);
}
2197
# list nodes where all VM images are available (used by has_feature API)
# Starts with all cluster nodes and narrows the set down for each drive
# volume that belongs to a storage:
#  - disabled storage: no node is left
#  - storage with a 'nodes' restriction: only those nodes are kept
#  - storage that is not shared: only the local node is kept
# Returns a hash ref { $node => 1 }.
sub shared_nodes {
    my ($conf, $storecfg) = @_;

    my $nodelist = PVE::Cluster::get_nodelist();
    my $candidates = {};
    $candidates->{$_} = 1 for @$nodelist;
    my $localnode = PVE::INotify::nodename();

    my $restrict = sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($storeid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        my $scfg = PVE::Storage::storage_config($storecfg, $storeid);
        if ($scfg->{disable}) {
            $candidates = {};
        } elsif (my $avail = $scfg->{nodes}) {
            my @gone = grep { !$avail->{$_} } keys %$candidates;
            delete $candidates->{$_} for @gone;
        } elsif (!$scfg->{shared}) {
            my @gone = grep { $_ ne $localnode } keys %$candidates;
            delete $candidates->{$_} for @gone;
        }
        return;
    };

    foreach_drive($conf, $restrict);

    return $candidates;
}
2231
# Die with "VM is locked (<lock>)" if $conf has a true 'lock' entry.
sub check_lock {
    my ($conf) = @_;

    if (my $lock = $conf->{lock}) {
        die "VM is locked ($lock)\n";
    }
}
2237
# Check the command line of process $pid (read from /proc/$pid/cmdline):
# returns 1 if the command ends in 'kvm' or 'qemu-system-x86_64' and the
# value following its first -pidfile/--pidfile option equals $pidfile.
# Returns a false value in any other case.
sub check_cmdline {
    my ($pidfile, $pid) = @_;

    my $fh = IO::File->new("/proc/$pid/cmdline", "r");
    return undef if !defined($fh);

    my $line = <$fh>;
    $fh->close;
    return undef if !$line;

    # arguments are separated by NUL bytes
    my @argv = split(/\0/, $line);

    my $binary = $argv[0];
    return unless $binary && ($binary =~ m|kvm$| || $binary =~ m|qemu-system-x86_64$|);

    for my $idx (0 .. $#argv) {
        my $arg = $argv[$idx];
        next if !$arg;
        next if $arg ne '-pidfile' && $arg ne '--pidfile';

        # only the first pidfile option is considered
        my $value = $argv[$idx + 1];
        return 1 if $value && ($value eq $pidfile);
        return undef;
    }

    return undef;
}
2263
# Check if VM $vmid is running.
# Dies if the config file of the VM (on $node) does not exist, unless
# $nocheck is set.
# Returns the pid from the pid file if check_cmdline() accepts that process
# for this pid file and PVE::ProcFSTools::check_process_running() confirms
# it; returns undef otherwise.
sub check_running {
    my ($vmid, $nocheck, $node) = @_;

    my $filename = config_file($vmid, $node);

    die "unable to find configuration file for VM $vmid - no such machine\n"
        if !$nocheck && ! -f $filename;

    my $pidfile = pidfile_name($vmid);

    # explicit read mode, so the file name is never parsed for a mode prefix
    my $fd = IO::File->new($pidfile, "r");
    return undef if !$fd;

    my $st = stat($fd);
    my $line = <$fd>;
    close($fd);

    # the time stamp is the one of the pid file, so report that file
    if ($st && $st->mtime > time()) {
        warn "file '$pidfile' modified in future\n";
    }

    # $line is undef when the pid file is empty
    my ($pid) = defined($line) ? $line =~ m/^(\d+)$/ : ();
    return undef if !defined($pid);

    return undef if !check_cmdline($pidfile, $pid);
    return undef if !PVE::ProcFSTools::check_process_running($pid);

    return $pid;
}
2296
# Return the hash ref from config_list(), with a 'pid' entry added for
# every listed VM that has a <vmid>.pid file in $var_run_tmpdir and for
# which check_running() returns a pid.
sub vzlist {

    my $vms = config_list();

    my $dir = IO::Dir->new($var_run_tmpdir);
    return $vms if !$dir;

    while (defined(my $entry = $dir->read)) {
        my ($vmid) = $entry =~ m/^(\d+)\.pid$/;
        next if !defined($vmid);
        next if !defined($vms->{$vmid});

        my $pid = check_running($vmid);
        $vms->{$vmid}->{pid} = $pid if $pid;
    }

    return $vms;
}
2314
# Return the 'size' property of the boot disk configured in $conf.
# Returns undef if there is no valid boot disk entry, if it cannot be
# parsed, if it is a cdrom or if it has no volume.
# $storecfg is not used.
sub disksize {
    my ($storecfg, $conf) = @_;

    my $bootdisk = $conf->{bootdisk};
    return undef unless $bootdisk && valid_drivename($bootdisk);

    my $value = $conf->{$bootdisk};
    return undef if !$value;

    my $drive = parse_drive($bootdisk, $value);
    return undef if !defined($drive) || drive_is_cdrom($drive);

    return undef if !$drive->{file};

    return $drive->{size};
}
2334
# cpu accounting data of previous vmstatus() calls, indexed by pid
my $last_proc_pid_stat;

# get VM status information
# This must be fast and should not block ($full == false)
# We only query KVM using QMP if $full == true (this can be slow)
#
# Returns a hash ref indexed by vmid (restricted to $opt_vmid if given).
sub vmstatus {
    my ($opt_vmid, $full) = @_;

    my $res = {};

    my $storecfg = PVE::Storage::config();

    my $list = vzlist();
    my ($uptime) = PVE::ProcFSTools::read_proc_uptime(1);

    my $cpucount = $cpuinfo->{cpus} || 1;
    my $mib = 1024*1024;

    # pass 1: static values from the configuration
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);

        my $conf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid)) || {};

        my $pid = $list->{$vmid}->{pid};

        my $d = {
            pid => $pid,
            # fixme: better status?
            status => $pid ? 'running' : 'stopped',
        };

        my $size = disksize($storecfg, $conf);
        $d->{disk} = 0; # no info available
        $d->{maxdisk} = defined($size) ? $size : 0;

        # never report more cpus than the host has
        my $cpus = ($conf->{sockets} || 1) * ($conf->{cores} || 1);
        $d->{cpus} = $cpus > $cpucount ? $cpucount : $cpus;

        $d->{name} = $conf->{name} || "VM $vmid";
        $d->{maxmem} = $conf->{memory} ? $conf->{memory}*$mib : 0;

        if (my $balloon = $conf->{balloon}) {
            $d->{balloon_min} = $balloon*$mib;
            $d->{shares} = defined($conf->{shares}) ? $conf->{shares} : 1000;
        }

        # dynamic values, filled in below
        $d->{$_} = 0 for qw(uptime cpu mem netout netin diskread diskwrite);

        $d->{template} = is_template($conf);

        $res->{$vmid} = $d;
    }

    # pass 2: network counters of the tap devices
    my $netdev = PVE::ProcFSTools::read_proc_net_dev();
    foreach my $dev (keys %$netdev) {
        my ($vmid) = $dev =~ m/^tap([1-9]\d*)i/;
        next if !defined($vmid);

        my $d = $res->{$vmid};
        next if !$d;

        # 'receive' of the tap device is accounted as output of the VM,
        # and 'transmit' as its input
        $d->{netout} += $netdev->{$dev}->{receive};
        $d->{netin} += $netdev->{$dev}->{transmit};
    }

    # pass 3: uptime, memory and cpu usage from /proc/<pid>/stat
    my $ctime = gettimeofday;

    foreach my $vmid (keys %$list) {

        my $d = $res->{$vmid};
        my $pid = $d->{pid};
        next if !$pid;

        my $pstat = PVE::ProcFSTools::read_proc_pid_stat($pid);
        next if !$pstat; # not running

        my $used = $pstat->{utime} + $pstat->{stime};

        $d->{uptime} = int(($uptime - $pstat->{starttime})/$cpuinfo->{user_hz});

        if ($pstat->{vsize}) {
            $d->{mem} = int(($pstat->{rss}/$pstat->{vsize})*$d->{maxmem});
        }

        my $old = $last_proc_pid_stat->{$pid};
        if (!$old) {
            # first sample for this pid, nothing to compare with
            $last_proc_pid_stat->{$pid} = {
                time => $ctime,
                used => $used,
                cpu => 0,
            };
            next;
        }

        my $dtime = ($ctime - $old->{time}) * $cpucount * $cpuinfo->{user_hz};

        if ($dtime <= 1000) {
            # interval too small, keep the last computed value
            $d->{cpu} = $old->{cpu};
            next;
        }

        my $dutime = $used - $old->{used};

        $d->{cpu} = (($dutime/$dtime)* $cpucount) / $d->{cpus};
        $last_proc_pid_stat->{$pid} = {
            time => $ctime,
            used => $used,
            cpu => $d->{cpu},
        };
    }

    return $res if !$full;

    # pass 4: ask the running VMs using QMP
    my $qmpclient = PVE::QMPClient->new();

    my $ballooncb = sub {
        my ($vmid, $resp) = @_;

        my $info = $resp->{'return'};
        return if !$info->{max_mem};

        my $d = $res->{$vmid};

        # use memory assigned to VM
        $d->{maxmem} = $info->{max_mem};
        $d->{balloon} = $info->{actual};

        if (defined($info->{total_mem}) && defined($info->{free_mem})) {
            $d->{mem} = $info->{total_mem} - $info->{free_mem};
            $d->{freemem} = $info->{free_mem};
        }
    };

    my $blockstatscb = sub {
        my ($vmid, $resp) = @_;

        my $data = $resp->{'return'} || [];

        # sum up the counters of all block devices
        my ($rdbytes, $wrbytes) = (0, 0);
        foreach my $blockstat (@$data) {
            $rdbytes += $blockstat->{stats}->{rd_bytes};
            $wrbytes += $blockstat->{stats}->{wr_bytes};
        }

        $res->{$vmid}->{diskread} = $rdbytes;
        $res->{$vmid}->{diskwrite} = $wrbytes;
    };

    my $statuscb = sub {
        my ($vmid, $resp) = @_;

        $qmpclient->queue_cmd($vmid, $blockstatscb, 'query-blockstats');
        # this fails if the balloon driver is not loaded, so this must be
        # the last command (following commands are aborted if this fails).
        $qmpclient->queue_cmd($vmid, $ballooncb, 'query-balloon');

        my $status = $resp->{'return'}->{status};
        if (!defined($status)) {
            warn "unable to get VM status\n";
            return;
        }

        $res->{$vmid}->{qmpstatus} = $status;
    };

    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        next if !$res->{$vmid}->{pid}; # not running
        $qmpclient->queue_cmd($vmid, $statuscb, 'query-status');
    }

    $qmpclient->queue_execute(undef, 1);

    # fall back to the plain status if QMP gave no answer
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        my $d = $res->{$vmid};
        $d->{qmpstatus} = $d->{status} if !$d->{qmpstatus};
    }

    return $res;
}
2523
# Call $func->($ds, $drive) for each key $ds of $conf which is a valid
# drive name and whose value can be parsed by parse_drive().
sub foreach_drive {
    my ($conf, $func) = @_;

    for my $key (keys %$conf) {
        next unless valid_drivename($key);

        my $drive = parse_drive($key, $conf->{$key});
        $func->($key, $drive) if $drive;
    }
}
2536
# Call $func->($volid, $is_cdrom) once for each distinct volume referenced
# by the drives of $conf, by the drives of its snapshots and by the
# 'vmstate' entries of the snapshots. If a volume is referenced more than
# once, the flag recorded last is the one that gets passed.
sub foreach_volid {
    my ($conf, $func) = @_;

    my $seen = {};

    my $remember = sub {
        my ($volid, $is_cdrom) = @_;

        return if !$volid;

        $seen->{$volid} = $is_cdrom || 0;
    };

    my $remember_drive = sub {
        my ($ds, $drive) = @_;
        $remember->($drive->{file}, drive_is_cdrom($drive));
    };

    foreach_drive($conf, $remember_drive);

    for my $snapname (keys %{$conf->{snapshots}}) {
        my $snap = $conf->{snapshots}->{$snapname};
        $remember->($snap->{vmstate}, 0);
        foreach_drive($snap, $remember_drive);
    }

    for my $volid (keys %$seen) {
        $func->($volid, $seen->{$volid});
    }
}
2568
# Returns 0 unless $vga is 'qxl', 'qxl2', 'qxl3' or 'qxl4'. For those it
# returns the trailing digit, or 1 for plain 'qxl'.
sub vga_conf_has_spice {
    my ($vga) = @_;

    if ($vga && $vga =~ m/^qxl([234])?$/) {
        return $1 || 1;
    }

    return 0;
}
2576
# Build the kvm command line for VM $vmid from its configuration.
#
# Parameters:
#   $storecfg     - storage configuration, passed on to the drive helpers
#   $vmid         - ID of the VM
#   $conf         - VM configuration hash
#   $defaults     - default values, used where $conf has no setting
#   $forcemachine - optional machine type, overrides $conf->{machine}
#
# Returns the command as array ref in scalar context. In list context it
# returns ($cmd, $vollist, $spice_port), where $vollist lists the drive
# volumes that belong to a storage and $spice_port is only set when a qxl
# display is configured.
#
# Dies on unusable settings (qemu binary too old, too many cores, missing
# host devices, inconsistent NUMA setup, ...).
sub config_to_command {
    my ($storecfg, $vmid, $conf, $defaults, $forcemachine) = @_;

    my $cmd = [];
    my $globalFlags = [];
    my $machineFlags = [];
    my $rtcFlags = [];
    my $cpuFlags = [];
    my $devices = [];
    my $pciaddr = '';
    my $bridges = {};
    my $kvmver = kvm_user_version();
    my $vernum = 0; # unknown
    if ($kvmver =~ m/^(\d+)\.(\d+)$/) {
        $vernum = $1*1000000+$2*1000;
    } elsif ($kvmver =~ m/^(\d+)\.(\d+)\.(\d+)$/) {
        $vernum = $1*1000000+$2*1000+$3;
    }

    die "detected old qemu-kvm binary ($kvmver)\n" if $vernum < 15000;

    my $have_ovz = -f '/proc/vz/vestat';

    my $q35 = machine_type_is_q35($conf);

    push @$cmd, '/usr/bin/kvm';

    push @$cmd, '-id', $vmid;

    my $use_virtio = 0;

    my $qmpsocket = qmp_socket($vmid);
    push @$cmd, '-chardev', "socket,id=qmp,path=$qmpsocket,server,nowait";
    push @$cmd, '-mon', "chardev=qmp,mode=control";

    my $socket = vnc_socket($vmid);
    push @$cmd, '-vnc', "unix:$socket,x509,password";

    push @$cmd, '-pidfile' , pidfile_name($vmid);

    push @$cmd, '-daemonize';

    if ($conf->{smbios1}) {
        push @$cmd, '-smbios', "type=1,$conf->{smbios1}";
    }

    push @$cmd, '-object', "iothread,id=iothread0" if $conf->{iothread};

    if ($q35) {
        # the q35 chipset supports native usb2, so we enable the usb
        # controller by default for this machine type
        push @$devices, '-readconfig', '/usr/share/qemu-server/pve-q35.cfg';
    } else {
        $pciaddr = print_pci_addr("piix3", $bridges);
        push @$devices, '-device', "piix3-usb-uhci,id=uhci$pciaddr.0x2";

        my $use_usb2 = 0;
        for (my $i = 0; $i < $MAX_USB_DEVICES; $i++)  {
            next if !$conf->{"usb$i"};
            $use_usb2 = 1;
        }
        # include usb device config
        push @$devices, '-readconfig', '/usr/share/qemu-server/pve-usb.cfg' if $use_usb2;
    }

    my $vga = $conf->{vga};

    my $qxlnum = vga_conf_has_spice($vga);
    $vga = 'qxl' if $qxlnum;

    if (!$vga) {
        if ($conf->{ostype} && ($conf->{ostype} eq 'win8' ||
                                $conf->{ostype} eq 'win7' ||
                                $conf->{ostype} eq 'w2k8')) {
            $vga = 'std';
        } else {
            $vga = 'cirrus';
        }
    }

    # enable absolute mouse coordinates (needed by vnc)
    my $tablet;
    if (defined($conf->{tablet})) {
        $tablet = $conf->{tablet};
    } else {
        $tablet = $defaults->{tablet};
        $tablet = 0 if $qxlnum; # disable for spice because it is not needed
        $tablet = 0 if $vga =~ m/^serial\d+$/; # disable if we use serial terminal (no vga card)
    }

    push @$devices, '-device', print_tabletdevice_full($conf) if $tablet;

    # host pci devices
    for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++)  {
        my $d = parse_hostpci($conf->{"hostpci$i"});
        next if !$d;

        my $pcie = $d->{pcie};
        if ($pcie) {
            die "q35 machine model is not enabled" if !$q35;
            $pciaddr = print_pcie_addr("hostpci$i");
        } else {
            $pciaddr = print_pci_addr("hostpci$i", $bridges);
        }

        my $rombar = $d->{rombar} && $d->{rombar} eq 'off' ? ",rombar=0" : "";
        my $driver = $d->{driver} && $d->{driver} eq 'vfio' ? "vfio-pci" : "pci-assign";
        my $xvga = $d->{'x-vga'} && $d->{'x-vga'} eq 'on' ? ",x-vga=on" : "";
        if ($xvga) {
            # x-vga: the passed through card is the display and always
            # uses the vfio driver
            push @$cpuFlags, 'kvm=off';
            $vga = 'none';
            $driver = "vfio-pci";
        }
        my $pcidevices = $d->{pciid};
        # do not use 'my $x = ... if COND' here, its behaviour is undefined
        my $multifunction = @$pcidevices > 1 ? 1 : 0;

        my $j=0;
        foreach my $pcidevice (@$pcidevices) {

            my $id = "hostpci$i";
            $id .= ".$j" if $multifunction;
            my $addr = $pciaddr;
            $addr .= ".$j" if $multifunction;
            my $devicestr = "$driver,host=$pcidevice->{id}.$pcidevice->{function},id=$id$addr";

            # these options are only set on the first function
            if ($j == 0) {
                $devicestr .= "$rombar$xvga";
                $devicestr .= ",multifunction=on" if $multifunction;
            }

            push @$devices, '-device', $devicestr;
            $j++;
        }
    }

    # usb devices
    for (my $i = 0; $i < $MAX_USB_DEVICES; $i++)  {
        my $d = parse_usb_device($conf->{"usb$i"});
        next if !$d;
        if ($d->{vendorid} && $d->{productid}) {
            push @$devices, '-device', "usb-host,vendorid=0x$d->{vendorid},productid=0x$d->{productid}";
        } elsif (defined($d->{hostbus}) && defined($d->{hostport})) {
            push @$devices, '-device', "usb-host,hostbus=$d->{hostbus},hostport=$d->{hostport}";
        } elsif ($d->{spice}) {
            # usb redir support for spice
            push @$devices, '-chardev', "spicevmc,id=usbredirchardev$i,name=usbredir";
            push @$devices, '-device', "usb-redir,chardev=usbredirchardev$i,id=usbredirdev$i,bus=ehci.0";
        }
    }

    # serial devices
    for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++)  {
        if (my $path = $conf->{"serial$i"}) {
            if ($path eq 'socket') {
                my $socket = "/var/run/qemu-server/${vmid}.serial$i";
                push @$devices, '-chardev', "socket,id=serial$i,path=$socket,server,nowait";
                push @$devices, '-device', "isa-serial,chardev=serial$i";
            } else {
                die "no such serial device\n" if ! -c $path;
                push @$devices, '-chardev', "tty,id=serial$i,path=$path";
                push @$devices, '-device', "isa-serial,chardev=serial$i";
            }
        }
    }

    # parallel devices
    for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++)  {
        if (my $path = $conf->{"parallel$i"}) {
            die "no such parallel device\n" if ! -c $path;
            my $devtype = $path =~ m!^/dev/usb/lp! ? 'tty' : 'parport';
            push @$devices, '-chardev', "$devtype,id=parallel$i,path=$path";
            push @$devices, '-device', "isa-parallel,chardev=parallel$i";
        }
    }

    my $vmname = $conf->{name} || "vm$vmid";

    push @$cmd, '-name', $vmname;

    my $sockets = 1;
    $sockets = $conf->{smp} if $conf->{smp}; # old style - no longer used
    $sockets = $conf->{sockets} if $conf->{sockets};

    my $cores = $conf->{cores} || 1;
    my $maxcpus = $conf->{maxcpus};

    my $total_cores = $sockets * $cores;
    my $allowed_cores = $cpuinfo->{cpus};

    die "MAX $allowed_cores cores allowed per VM on this node\n"
        if ($allowed_cores < $total_cores);

    if ($maxcpus) {
        push @$cmd, '-smp', "cpus=$cores,maxcpus=$maxcpus";
    } else {
        push @$cmd, '-smp', "sockets=$sockets,cores=$cores";
    }

    push @$cmd, '-nodefaults';

    my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};

    # each letter of the boot order gets its own range of boot indexes
    my $bootindex_hash = {};
    my $bootpos = 1;
    foreach my $o (split(//, $bootorder)) {
        $bootindex_hash->{$o} = $bootpos*100;
        $bootpos++;
    }

    push @$cmd, '-boot', "menu=on";

    push @$cmd, '-no-acpi' if defined($conf->{acpi}) && $conf->{acpi} == 0;

    push @$cmd, '-no-reboot' if defined($conf->{reboot}) && $conf->{reboot} == 0;

    push @$cmd, '-vga', $vga if $vga && $vga !~ m/^serial\d+$/; # for kvm 77 and later

    # time drift fix
    my $tdf = defined($conf->{tdf}) ? $conf->{tdf} : $defaults->{tdf};

    my $nokvm = defined($conf->{kvm}) && $conf->{kvm} == 0 ? 1 : 0;
    my $useLocaltime = $conf->{localtime};

    if (my $ost = $conf->{ostype}) {
        # other, wxp, w2k, w2k3, w2k8, wvista, win7, win8, l24, l26, solaris

        if ($ost =~ m/^w/) { # windows
            $useLocaltime = 1 if !defined($conf->{localtime});

            # use time drift fix when acpi is enabled
            if (!(defined($conf->{acpi}) && $conf->{acpi} == 0)) {
                $tdf = 1 if !defined($conf->{tdf});
            }
        }

        if ($ost eq 'win7' || $ost eq 'win8' || $ost eq 'w2k8' ||
            $ost eq 'wvista') {
            push @$globalFlags, 'kvm-pit.lost_tick_policy=discard';
            push @$cmd, '-no-hpet';
            #push @$cpuFlags , 'hv_vapic" if !$nokvm;  #fixme, my win2008R2 hang at boot with this
            push @$cpuFlags , 'hv_spinlocks=0xffff' if !$nokvm;
        }

        if ($ost eq 'win7' || $ost eq 'win8') {
            push @$cpuFlags , 'hv_relaxed' if !$nokvm;
        }
    }

    push @$rtcFlags, 'driftfix=slew' if $tdf;

    if ($nokvm) {
        push @$machineFlags, 'accel=tcg';
    } else {
        die "No accelerator found!\n" if !$cpuinfo->{hvm};
    }

    my $machine_type = $forcemachine || $conf->{machine};
    if ($machine_type) {
        push @$machineFlags, "type=${machine_type}";
    }

    if ($conf->{startdate}) {
        push @$rtcFlags, "base=$conf->{startdate}";
    } elsif ($useLocaltime) {
        push @$rtcFlags, 'base=localtime';
    }

    my $cpu = $nokvm ? "qemu64" : "kvm64";
    $cpu = $conf->{cpu} if $conf->{cpu};

    push @$cpuFlags , '+lahf_lm' if $cpu eq 'kvm64';

    # ostype is optional, avoid string compares against undef
    my $ostype = defined($conf->{ostype}) ? $conf->{ostype} : '';

    push @$cpuFlags , '+x2apic' if !$nokvm && $ostype ne 'solaris';

    push @$cpuFlags , '-x2apic' if $ostype eq 'solaris';

    push @$cpuFlags, '+sep' if $cpu eq 'kvm64' || $cpu eq 'kvm32';

    $cpu .= "," . join(',', @$cpuFlags) if scalar(@$cpuFlags);

    # Note: enforce needs kernel 3.10, so we do not use it for now
    # push @$cmd, '-cpu', "$cpu,enforce";
    push @$cmd, '-cpu', $cpu;

    my $memory = $conf->{memory} || $defaults->{memory};
    push @$cmd, '-m', $memory;

    if ($conf->{numa}) {

        my $numa_totalmemory = undef;
        for (my $i = 0; $i < $MAX_NUMA; $i++) {
            next if !$conf->{"numa$i"};
            my $numa = parse_numa($conf->{"numa$i"});
            next if !$numa;
            # memory
            die "missing numa node$i memory value\n" if !$numa->{memory};
            my $numa_memory = $numa->{memory};
            $numa_totalmemory += $numa_memory;
            my $numa_object = "memory-backend-ram,id=ram-node$i,size=$numa_memory"."M";

            # cpus
            my $cpus_start = $numa->{cpus}->{start};
            die "missing numa node$i cpus\n" if !defined($cpus_start);
            my $cpus_end = $numa->{cpus}->{end};
            my $cpus = $cpus_start;
            if (defined($cpus_end)) {
                $cpus .= "-$cpus_end";
                die "numa node$i : cpu range $cpus is incorrect\n" if $cpus_end <= $cpus_start;
            }

            # hostnodes
            my $hostnodes_start = $numa->{hostnodes}->{start};
            if (defined($hostnodes_start)) {
                my $hostnodes_end = $numa->{hostnodes}->{end};
                my $hostnodes = $hostnodes_start;
                if (defined($hostnodes_end)) {
                    $hostnodes .= "-$hostnodes_end";
                    die "host node $hostnodes range is incorrect\n" if $hostnodes_end <= $hostnodes_start;
                }

                # every host node of the range has to exist
                my $hostnodes_end_range = defined($hostnodes_end) ? $hostnodes_end : $hostnodes_start;
                for (my $node = $hostnodes_start; $node <= $hostnodes_end_range; $node++ ) {
                    die "host numa node$node don't exist\n" if ! -d "/sys/devices/system/node/node$node/";
                }

                # policy
                my $policy = $numa->{policy};
                die "you need to define a policy for hostnode $hostnodes\n" if !$policy;
                $numa_object .= ",host-nodes=$hostnodes,policy=$policy";
            }

            push @$cmd, '-object', $numa_object;
            push @$cmd, '-numa', "node,nodeid=$i,cpus=$cpus,memdev=ram-node$i";
        }

        die "total memory for NUMA nodes must be equal to vm memory\n"
            if $numa_totalmemory && $numa_totalmemory != $memory;

        # if there is no custom topology, we split memory and cores
        # across numa nodes
        if (!$numa_totalmemory) {

            my $numa_memory = ($memory / $sockets) . "M";

            for (my $i = 0; $i < $sockets; $i++)  {

                my $cpustart = ($cores * $i);
                my $cpuend = $cores > 1 ? ($cpustart + $cores - 1) : undef;
                my $cpus = $cpustart;
                $cpus .= "-$cpuend" if $cpuend;

                push @$cmd, '-object', "memory-backend-ram,size=$numa_memory,id=ram-node$i";
                push @$cmd, '-numa', "node,nodeid=$i,cpus=$cpus,memdev=ram-node$i";
            }
        }
    }

    push @$cmd, '-S' if $conf->{freeze};

    # set keyboard layout
    my $kb = $conf->{keyboard} || $defaults->{keyboard};
    push @$cmd, '-k', $kb if $kb;

    # enable sound
    #my $soundhw = $conf->{soundhw} || $defaults->{soundhw};
    #push @$cmd, '-soundhw', 'es1370';
    #push @$cmd, '-soundhw', $soundhw if $soundhw;

    if ($conf->{agent}) {
        my $qgasocket = qmp_socket($vmid, 1);
        my $pciaddr = print_pci_addr("qga0", $bridges);
        push @$devices, '-chardev', "socket,path=$qgasocket,server,nowait,id=qga0";
        push @$devices, '-device', "virtio-serial,id=qga0$pciaddr";
        push @$devices, '-device', 'virtserialport,chardev=qga0,name=org.qemu.guest_agent.0';
    }

    my $spice_port;

    if ($qxlnum) {
        if ($qxlnum > 1) {
            if ($conf->{ostype} && $conf->{ostype} =~ m/^w/){
                for (my $i = 1; $i < $qxlnum; $i++) {
                    my $pciaddr = print_pci_addr("vga$i", $bridges);
                    push @$cmd, '-device', "qxl,id=vga$i,ram_size=67108864,vram_size=33554432$pciaddr";
                }
            } else {
                # assume other OS works like Linux
                push @$cmd, '-global', 'qxl-vga.ram_size=134217728';
                push @$cmd, '-global', 'qxl-vga.vram_size=67108864';
            }
        }

        my $pciaddr = print_pci_addr("spice", $bridges);

        $spice_port = PVE::Tools::next_spice_port();

        push @$devices, '-spice', "tls-port=${spice_port},addr=127.0.0.1,tls-ciphers=DES-CBC3-SHA,seamless-migration=on";

        push @$devices, '-device', "virtio-serial,id=spice$pciaddr";
        push @$devices, '-chardev', "spicevmc,id=vdagent,name=vdagent";
        push @$devices, '-device', "virtserialport,chardev=vdagent,name=com.redhat.spice.0";
    }

    # enable balloon by default, unless explicitly disabled
    if (!defined($conf->{balloon}) || $conf->{balloon}) {
        $pciaddr = print_pci_addr("balloon0", $bridges);
        push @$devices, '-device', "virtio-balloon-pci,id=balloon0$pciaddr";
    }

    if ($conf->{watchdog}) {
        my $wdopts = parse_watchdog($conf->{watchdog});
        $pciaddr = print_pci_addr("watchdog", $bridges);
        my $watchdog = $wdopts->{model} || 'i6300esb';
        push @$devices, '-device', "$watchdog$pciaddr";
        push @$devices, '-watchdog-action', $wdopts->{action} if $wdopts->{action};
    }

    my $vollist = [];
    my $scsicontroller = {};
    my $ahcicontroller = {};
    my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : $defaults->{scsihw};

    # Add iscsi initiator name if available
    if (my $initiator = get_initiator_name()) {
        push @$devices, '-iscsi', "initiator-name=$initiator";
    }

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        if (PVE::Storage::parse_volume_id($drive->{file}, 1)) {
            push @$vollist, $drive->{file};
        }

        $use_virtio = 1 if $ds =~ m/^virtio/;

        if (drive_is_cdrom ($drive)) {
            if ($bootindex_hash->{d}) {
                $drive->{bootindex} = $bootindex_hash->{d};
                $bootindex_hash->{d} += 1;
            }
        } else {
            if ($bootindex_hash->{c}) {
                $drive->{bootindex} = $bootindex_hash->{c} if $conf->{bootdisk} && ($conf->{bootdisk} eq $ds);
                $bootindex_hash->{c} += 1;
            }
        }

        # controllers are added once, with the first drive that needs them
        if ($drive->{interface} eq 'scsi') {

            my $maxdev = ($scsihw !~ m/^lsi/) ? 256 : 7;
            my $controller = int($drive->{index} / $maxdev);
            $pciaddr = print_pci_addr("scsihw$controller", $bridges);
            push @$devices, '-device', "$scsihw,id=scsihw$controller$pciaddr" if !$scsicontroller->{$controller};
            $scsicontroller->{$controller}=1;
        }

        if ($drive->{interface} eq 'sata') {
            my $controller = int($drive->{index} / $MAX_SATA_DISKS);
            $pciaddr = print_pci_addr("ahci$controller", $bridges);
            push @$devices, '-device', "ahci,id=ahci$controller,multifunction=on$pciaddr" if !$ahcicontroller->{$controller};
            $ahcicontroller->{$controller}=1;
        }

        my $drive_cmd = print_drive_full($storecfg, $vmid, $drive);
        push @$devices, '-drive',$drive_cmd;
        push @$devices, '-device', print_drivedevice_full($storecfg, $conf, $vmid, $drive, $bridges);
    });

    for (my $i = 0; $i < $MAX_NETS; $i++) {
        next if !$conf->{"net$i"};
        my $d = parse_net($conf->{"net$i"});
        next if !$d;

        $use_virtio = 1 if $d->{model} eq 'virtio';

        if ($bootindex_hash->{n}) {
            $d->{bootindex} = $bootindex_hash->{n};
            $bootindex_hash->{n} += 1;
        }

        my $netdevfull = print_netdev_full($vmid,$conf,$d,"net$i");
        push @$devices, '-netdev', $netdevfull;

        my $netdevicefull = print_netdevice_full($vmid,$conf,$d,"net$i",$bridges);
        push @$devices, '-device', $netdevicefull;
    }

    if (!$q35) {
        # add pci bridges (in front of the devices collected so far)
        while (my ($k, $v) = each %$bridges) {
            $pciaddr = print_pci_addr("pci.$k");
            unshift @$devices, '-device', "pci-bridge,id=pci.$k,chassis_nr=$k$pciaddr" if $k > 0;
        }
    }

    # hack: virtio with fairsched is unreliable, so we do not use fairsched
    # when the VM uses virtio devices.
    if (!$use_virtio && $have_ovz) {

        my $cpuunits = defined($conf->{cpuunits}) ?
            $conf->{cpuunits} : $defaults->{cpuunits};

        push @$cmd, '-cpuunits', $cpuunits if $cpuunits;

        # fixme: cpulimit is currently ignored
        #push @$cmd, '-cpulimit', $conf->{cpulimit} if $conf->{cpulimit};
    }

    # add custom args
    if ($conf->{args}) {
        my $aa = PVE::Tools::split_args($conf->{args});
        push @$cmd, @$aa;
    }

    push @$cmd, @$devices;
    push @$cmd, '-rtc', join(',', @$rtcFlags)
        if scalar(@$rtcFlags);
    push @$cmd, '-machine', join(',', @$machineFlags)
        if scalar(@$machineFlags);
    push @$cmd, '-global', join(',', @$globalFlags)
        if scalar(@$globalFlags);

    return wantarray ? ($cmd, $vollist, $spice_port) : $cmd;
}
3101
# Return the path "<$var_run_tmpdir>/<vmid>.vnc".
sub vnc_socket {
    my ($vmid) = @_;
    return $var_run_tmpdir . "/$vmid.vnc";
}
3106
# Ask VM $vmid for its spice settings ('query-spice') and return the
# 'tls-port', or else the 'port'. Dies if neither is set.
sub spice_port {
    my ($vmid) = @_;

    my $info = vm_mon_cmd($vmid, 'query-spice');

    my $port = $info->{'tls-port'} || $info->{'port'};
    die "no spice port\n" if !$port;

    return $port;
}
3114
# Return the path "<$var_run_tmpdir>/<vmid>.qmp", or with the suffix
# '.qga' instead if $qga is true.
sub qmp_socket {
    my ($vmid, $qga) = @_;

    my $suffix = 'qmp';
    $suffix = 'qga' if $qga;

    return "$var_run_tmpdir/$vmid.$suffix";
}
3120
# Return the path "<$var_run_tmpdir>/<vmid>.pid".
sub pidfile_name {
    my ($vmid) = @_;
    return join('/', $var_run_tmpdir, "$vmid.pid");
}
3125
# Query the running VM $vmid for its devices. Returns a hash ref whose
# keys are
#  - the 'qdev_id' of the devices reported by 'query-pci'
#  - the names of the 'query-block' devices, without the 'drive-' prefix
#  - 'tablet', if 'query-mice' lists a 'QEMU HID Tablet'
sub vm_devices_list {
    my ($vmid) = @_;

    my $devices = {};

    my $pcibuses = vm_mon_cmd($vmid, 'query-pci');
    foreach my $bus (@$pcibuses) {
        foreach my $dev (@{$bus->{devices}}) {
            my $id = $dev->{'qdev_id'};
            $devices->{$id} = 1 if $id;
        }
    }

    my $blocks = vm_mon_cmd($vmid, 'query-block');
    foreach my $block (@$blocks) {
        my ($driveid) = $block->{device} =~ m/^drive-(\S+)/;
        $devices->{$driveid} = 1 if defined($driveid);
    }

    my $mice = vm_mon_cmd($vmid, 'query-mice');
    foreach my $mouse (@$mice) {
        next if $mouse->{name} ne 'QEMU HID Tablet';
        $devices->{tablet} = 1;
        last;
    }

    return $devices;
}
3155
# Hotplug device $deviceid (tablet, virtioN, scsihwN, scsiN, netN or
# pci.N) into VM $vmid. $device is the parsed drive or network setting
# that is passed on to the helpers.
# Returns 1 on success and also if there is nothing to do (VM not
# running, hotplug not enabled in $conf, device already present).
# Returns undef if plugging the device failed.
sub vm_deviceplug {
    my ($storecfg, $conf, $vmid, $deviceid, $device) = @_;

    return 1 if !check_running($vmid);

    my $q35 = machine_type_is_q35($conf);

    return 1 if !$conf->{hotplug};

    my $devices_list = vm_devices_list($vmid);
    return 1 if defined($devices_list->{$deviceid});

    if ($deviceid eq 'tablet') {
        qemu_deviceadd($vmid, print_tabletdevice_full($conf));
        return 1;
    }

    qemu_bridgeadd($storecfg, $conf, $vmid, $deviceid); #add bridge if we need it for the device

    # the device id patterns below exclude each other
    if ($deviceid =~ m/^(virtio)(\d+)$/) {

        return undef if !qemu_driveadd($storecfg, $vmid, $device);
        qemu_deviceadd($vmid, print_drivedevice_full($storecfg, $conf, $vmid, $device));
        if (!qemu_deviceaddverify($vmid, $deviceid)) {
            # remove the drive again
            qemu_drivedel($vmid, $deviceid);
            return undef;
        }

    } elsif ($deviceid =~ m/^(scsihw)(\d+)$/) {

        my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : "lsi";
        my $pciaddr = print_pci_addr($deviceid);
        qemu_deviceadd($vmid, "$scsihw,id=$deviceid$pciaddr");
        return undef if !qemu_deviceaddverify($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        return undef if !qemu_findorcreatescsihw($storecfg,$conf, $vmid, $device);
        return undef if !qemu_driveadd($storecfg, $vmid, $device);
        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);
        if (!qemu_deviceadd($vmid, $devicefull)) {
            # remove the drive again
            qemu_drivedel($vmid, $deviceid);
            return undef;
        }

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        return undef if !qemu_netdevadd($vmid, $conf, $device, $deviceid);
        qemu_deviceadd($vmid, print_netdevice_full($vmid, $conf, $device, $deviceid));
        if (!qemu_deviceaddverify($vmid, $deviceid)) {
            # remove the netdev again
            qemu_netdevdel($vmid, $deviceid);
            return undef;
        }

    } elsif (!$q35 && $deviceid =~ m/^(pci\.)(\d+)$/) {

        my $bridgeid = $2;
        my $pciaddr = print_pci_addr($deviceid);
        qemu_deviceadd($vmid, "pci-bridge,id=pci.$bridgeid,chassis_nr=$bridgeid$pciaddr");
        return undef if !qemu_deviceaddverify($vmid, $deviceid);

    }

    return 1;
}
3224
# Hot-unplug the device $deviceid from the running VM $vmid.
#
# Returns 1 when the device was removed or when there is nothing to do (VM
# not running, hotplug disabled, device not listed), undef when a removal
# step reports failure. Dies when asked to unplug the configured boot disk.
#
# NOTE(review): controllers are matched as "lsiN" here while vm_deviceplug
# creates them as "scsihwN" - confirm whether that is intended.
sub vm_deviceunplug {
    my ($vmid, $conf, $deviceid) = @_;

    return 1 if !check_running ($vmid);
    return 1 if !$conf->{hotplug};

    my $present = vm_devices_list($vmid);
    return 1 if !defined($present->{$deviceid});

    if ($deviceid eq 'tablet') {
        qemu_devicedel($vmid, $deviceid);
        return 1;
    }

    die "can't unplug bootdisk" if $conf->{bootdisk} && $conf->{bootdisk} eq $deviceid;

    # the patterns below are anchored and mutually exclusive
    if ($deviceid =~ m/^(virtio)(\d+)$/) {
        qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_devicedelverify($vmid, $deviceid);
        return undef if !qemu_drivedel($vmid, $deviceid);
    } elsif ($deviceid =~ m/^(lsi)(\d+)$/) {
        return undef if !qemu_devicedel($vmid, $deviceid);
    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {
        return undef if !qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_drivedel($vmid, $deviceid);
    } elsif ($deviceid =~ m/^(net)(\d+)$/) {
        qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_devicedelverify($vmid, $deviceid);
        return undef if !qemu_netdevdel($vmid, $deviceid);
    }

    return 1;
}
3265
# Issue a "device_add" monitor command for VM $vmid.
#
# $devicefull is a "driver,key=value,..." string; it is prefixed with
# "driver=" and split on '=' and ',' into the command arguments.
# Always returns 1; errors from vm_mon_cmd propagate.
sub qemu_deviceadd {
    my ($vmid, $devicefull) = @_;

    my %options = split(/[=,]/, "driver=" . $devicefull);
    vm_mon_cmd($vmid, "device_add", %options);

    return 1;
}
3275
# Issue a "device_del" monitor command for device $deviceid of VM $vmid.
# Always returns 1; errors from vm_mon_cmd propagate.
sub qemu_devicedel {
    my ($vmid, $deviceid) = @_;

    vm_mon_cmd($vmid, "device_del", id => $deviceid);

    return 1;
}
3281
# Add the drive backend for $device to VM $vmid with the human monitor
# command "drive_add auto ...".
#
# Returns 1 when the monitor reply contains "OK"; otherwise logs the reply
# to syslog and returns undef.
sub qemu_driveadd {
    my ($storecfg, $vmid, $device) = @_;

    my $drive = print_drive_full($storecfg, $vmid, $device);
    my $reply = vm_human_monitor_command($vmid, "drive_add auto $drive");

    # If the command succeeds qemu prints: "OK"
    return 1 if $reply =~ m/OK/s;

    syslog("err", "adding drive failed: $reply");
    return undef;
}
3294
# Remove the drive backend "drive-$deviceid" from VM $vmid with the human
# monitor command "drive_del".
#
# Returns 1 when the reply is empty or says the device was not found;
# any other reply is logged to syslog and undef is returned.
sub qemu_drivedel {
    my ($vmid, $deviceid) = @_;

    my $reply = vm_human_monitor_command($vmid, "drive_del drive-$deviceid");
    $reply =~ s/^\s+//;

    # NB: device not found errors mean the drive was auto-deleted and we ignore the error
    return 1 if $reply =~ m/Device \'.*?\' not found/s;
    return 1 if $reply eq "";

    syslog("err", "deleting drive $deviceid failed : $reply");
    return undef;
}
3309
# Poll vm_devices_list() until $deviceid shows up.
#
# Checks up to six times, sleeping one second after every unsuccessful
# check. Returns 1 once the device is listed; otherwise logs an error to
# syslog and returns undef.
sub qemu_deviceaddverify {
    my ($vmid, $deviceid) = @_;

    foreach my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if defined($present->{$deviceid});
        sleep 1;
    }

    syslog("err", "error on hotplug device $deviceid");
    return undef;
}
3321
3322
# Poll vm_devices_list() until $deviceid has disappeared.
#
# device_del is asynchronous and its empty reply is not a reliable success
# indicator, so the device list is checked up to six times with a one second
# sleep after every unsuccessful check. Returns 1 once the device is gone;
# otherwise logs an error to syslog and returns undef.
sub qemu_devicedelverify {
    my ($vmid, $deviceid) = @_;

    foreach my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if !defined($present->{$deviceid});
        sleep 1;
    }

    syslog("err", "error on hot-unplugging device $deviceid");
    return undef;
}
3335
# Make sure the SCSI controller that serves $device exists in VM $vmid.
#
# The controller number is int($device->{index} / $maxdev), where $maxdev is
# 256 when $conf->{scsihw} is set and does not start with "lsi", else 7.
# Returns 1 if the controller "scsihwN" is already listed or was plugged
# successfully, undef if plugging it failed.
sub qemu_findorcreatescsihw {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $non_lsi = $conf->{scsihw} && ($conf->{scsihw} !~ m/^lsi/);
    my $maxdev = $non_lsi ? 256 : 7;
    my $scsihwid = "scsihw" . int($device->{index} / $maxdev);

    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$scsihwid});

    return undef if !vm_deviceplug($storecfg, $conf, $vmid, $scsihwid);
    return 1;
}
3349
# Plug the PCI bridge that the device id $device is attached to, if needed.
#
# print_pci_addr() records the bus number of $device in a scratch hash.
# Nothing is done (empty return) when no bus was recorded or the bus number
# is below 1. Otherwise bridge "pci.N" is plugged unless it is already
# listed. Returns 1 on success, undef if plugging the bridge failed.
sub qemu_bridgeadd {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $bridges = {};
    print_pci_addr($device, $bridges);

    # keep the last bus number found
    my $bridgeid = undef;
    foreach my $busnr (keys %$bridges) {
        $bridgeid = $busnr;
    }
    return if !$bridgeid || $bridgeid < 1;

    my $bridge = "pci.$bridgeid";
    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$bridge});

    return undef if !vm_deviceplug($storecfg, $conf, $vmid, $bridge);
    return 1;
}
3369
# Issue a "netdev_add" monitor command for network device $deviceid.
#
# The "key=value,..." string from print_netdev_full() is split on '=' and
# ',' into the command arguments. Always returns 1; errors from vm_mon_cmd
# propagate.
sub qemu_netdevadd {
    my ($vmid, $conf, $device, $deviceid) = @_;

    my %options = split(/[=,]/, print_netdev_full($vmid, $conf, $device, $deviceid));
    vm_mon_cmd($vmid, "netdev_add", %options);

    return 1;
}
3379
# Issue a "netdev_del" monitor command for network backend $deviceid.
# Always returns 1; errors from vm_mon_cmd propagate.
sub qemu_netdevdel {
    my ($vmid, $deviceid) = @_;

    vm_mon_cmd($vmid, "netdev_del", id => $deviceid);

    return 1;
}
3386
# Hot-add CPUs to the running VM $vmid until it has $cores of them.
#
# Parameters:
#   $vmid  - VM identifier
#   $conf  - VM configuration hash (reads {cores} and {maxcpus})
#   $cores - requested number of cores
#
# Dies when $cores is not set, exceeds {maxcpus}, or when {cores} or
# {maxcpus} are missing from the configuration. Raises a parameter
# exception when $cores is lower than the configured value, or when the
# number of CPUs reported by "query-cpus" differs from the configuration.
# Does nothing when the VM is not running.
sub qemu_cpu_hotplug {
    my ($vmid, $conf, $cores) = @_;

    die "new cores config is not defined" if !$cores;
    die "you can't add more cores than maxcpus"
        if $conf->{maxcpus} && ($cores > $conf->{maxcpus});
    return if !check_running($vmid);

    # plain assignment: "my $x = ... if COND" has undefined behaviour and can
    # keep the value of a previous call when COND is false
    my $currentcores = $conf->{cores};
    die "current cores is not defined" if !$currentcores;
    die "maxcpus is not defined" if !$conf->{maxcpus};
    raise_param_exc({ 'cores' => "online cpu unplug is not yet possible" })
        if ($cores < $currentcores);

    my $currentrunningcores = vm_mon_cmd($vmid, "query-cpus");
    raise_param_exc({ 'cores' => "cores number if running vm is different than configuration" })
        if scalar(@{$currentrunningcores}) != $currentcores;

    for (my $i = $currentcores; $i < $cores; $i++) {
        vm_mon_cmd($vmid, "cpu-add", id => int($i));
    }
}
3409
# Apply I/O throttling limits to block device $deviceid of VM $vmid.
#
# All six limits are passed to the "block_set_io_throttle" monitor command
# after conversion with int(). Does nothing when the VM is not running.
sub qemu_block_set_io_throttle {
    my ($vmid, $deviceid, $bps, $bps_rd, $bps_wr, $iops, $iops_rd, $iops_wr) = @_;

    return if !check_running($vmid);

    vm_mon_cmd(
        $vmid, "block_set_io_throttle",
        device  => $deviceid,
        bps     => int($bps),
        bps_rd  => int($bps_rd),
        bps_wr  => int($bps_wr),
        iops    => int($iops),
        iops_rd => int($iops_rd),
        iops_wr => int($iops_wr),
    );
}
3418
# old code, only used to shutdown old VM after update
#
# Read from $fh until a chunk ends with the "(qemu) " prompt or EOF is hit.
#
# Every wait for readable data is limited to $timeout seconds. Returns the
# collected text without the trailing prompt. Dies with "monitor read
# timeout" when a wait expires, or with the system error text when
# sysread fails.
sub __read_avail {
    my ($fh, $timeout) = @_;

    my $sel = IO::Select->new();
    $sel->add($fh);

    my $res = '';
    my $buf;
    my @ready;

    while (scalar(@ready = $sel->can_read($timeout))) {
        my $count = $fh->sysread($buf, 8192);

        if (!$count) {
            die "$!\n" if !defined($count); # read error
            last;                           # EOF
        }

        if ($buf =~ /^(.*)\(qemu\) $/s) {
            # prompt seen - the reply is complete
            $res .= $1;
            last;
        }

        $res .= $buf;
    }

    # @ready is only empty when the last can_read() timed out
    die "monitor read timeout\n" if !scalar(@ready);

    return $res;
}
3451
# old code, only used to shutdown old VM after update
#
# Send $cmdstr to the human monitor socket "<var_run_tmpdir>/<vmid>.mon" and
# return the reply text with the echoed command line removed. Nothing is
# read back for 'q' and 'quit'. Any failure is logged to syslog and
# re-thrown.
sub vm_monitor_command {
    my ($vmid, $cmdstr, $nocheck) = @_;

    my $res;

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);

        my $sname = "${var_run_tmpdir}/$vmid.mon";

        my $sock = IO::Socket::UNIX->new( Peer => $sname ) ||
            die "unable to connect to VM $vmid socket - $!\n";

        # hack: migrate sometime blocks the monitor (when migrate_downtime
        # is set)
        my $is_migrate = $cmdstr =~ m/^(info\s+migrate|migrate\s)/;

        my $timeout = $is_migrate ? 60*60 : 3; # 1 hour for migrate

        # read banner;
        my $banner = __read_avail($sock, $timeout);
        if ($banner !~ m/^QEMU\s+(\S+)\s+monitor\s/) {
            die "got unexpected qemu monitor banner\n";
        }

        my $sel = IO::Select->new();
        $sel->add($sock);

        if (!scalar(my @ready = $sel->can_write($timeout))) {
            die "monitor write error - timeout";
        }

        my $fullcmd = "$cmdstr\r";

        # syslog('info', "VM $vmid monitor command: $cmdstr");

        my $written = $sock->syswrite($fullcmd);
        if (!$written || ($written != length($fullcmd))) {
            die "monitor write error - $!";
        }

        # leaves the eval only - there is no reply to wait for
        return if ($cmdstr eq 'q') || ($cmdstr eq 'quit');

        if ($is_migrate) {
            $timeout = 60*60; # 1 hour
        } elsif ($cmdstr =~ m/^(eject|change)/) {
            $timeout = 60; # note: cdrom mount command is slow
        } else {
            $timeout = 20;
        }

        if ($res = __read_avail($sock, $timeout)) {
            my @lines = split("\r?\n", $res);

            shift @lines if $lines[0] !~ m/^unknown command/; # skip echo

            $res = join("\n", @lines);
            $res .= "\n";
        }
    };

    if (my $err = $@) {
        syslog("err", "VM $vmid monitor command failed - $err");
        die $err;
    }

    return $res;
}
3526
# Resize volume $volid to $size and, when the VM is running, tell qemu
# about the new size of block device $deviceid.
#
# Stops early when PVE::Storage::volume_resize returns false, and skips the
# "block_resize" monitor command when the VM is not running.
sub qemu_block_resize {
    my ($vmid, $deviceid, $storecfg, $volid, $size) = @_;

    my $running = check_running($vmid);

    my $resized = PVE::Storage::volume_resize($storecfg, $volid, $size, $running);
    return if !$resized;
    return if !$running;

    vm_mon_cmd($vmid, "block_resize", device => $deviceid, size => int($size));
}
3539
# Create snapshot $snap of volume $volid.
#
# The storage layer is asked first; the "snapshot-drive" monitor command for
# $deviceid is only sent when PVE::Storage::volume_snapshot returned true
# and the VM is running.
sub qemu_volume_snapshot {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $running = check_running($vmid);

    my $storage_res = PVE::Storage::volume_snapshot($storecfg, $volid, $snap, $running);
    return if !$storage_res;
    return if !$running;

    vm_mon_cmd($vmid, "snapshot-drive", device => $deviceid, name => $snap);
}
3552
# Delete snapshot $snap of volume $volid.
#
# The storage layer is asked first; the "delete-drive-snapshot" monitor
# command for $deviceid is only sent when
# PVE::Storage::volume_snapshot_delete returned true and the VM is running.
sub qemu_volume_snapshot_delete {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $running = check_running($vmid);

    my $storage_res = PVE::Storage::volume_snapshot_delete($storecfg, $volid, $snap, $running);
    return if !$storage_res;
    return if !$running;

    vm_mon_cmd($vmid, "delete-drive-snapshot", device => $deviceid, name => $snap);
}
3564
# Set the migration capabilities of VM $vmid.
#
# Every capability reported by "query-migrate-capabilities" is sent back via
# "migrate-set-capabilities"; it is switched on only when it has a true
# value in the table below (currently just "auto-converge").
sub set_migration_caps {
    my ($vmid) = @_;

    my $enabled_cap = {
        "auto-converge" => 1,
        "xbzrle" => 0,
        "x-rdma-pin-all" => 0,
        "zero-blocks" => 0,
    };

    my $supported = vm_mon_cmd_nocheck($vmid, "query-migrate-capabilities");

    my $cap_ref = [
        map {
            +{
                capability => $_->{capability},
                state => $enabled_cap->{$_->{capability}} ? JSON::true : JSON::false,
            }
        } @$supported
    ];

    vm_mon_cmd_nocheck($vmid, "migrate-set-capabilities", capabilities => $cap_ref);
}
3588
# Apply pending configuration changes to a running VM where possible.
#
# Steps, each followed by a config write and reload when something changed:
#   1. commit pending options without impact on the running VM
#      (name, hotplug, onboot, shares)
#   2. apply a pending balloon value if shares is defined and zero
#   3. if hotplug is enabled: process pending deletes and pending values of
#      hot-pluggable options (currently only 'tablet')
# Options that are not hot-pluggable stay pending.
sub vmconfig_hotplug_pending {
    my ($vmid, $conf, $storecfg) = @_;

    my $defaults = load_defaults();

    # commit values which do not have any impact on running VM first
    my %no_impact = map { $_ => 1 } qw(name hotplug onboot shares);

    my $changes = 0;
    foreach my $opt (keys %{$conf->{pending}}) { # add/change
        next if !$no_impact{$opt};
        $conf->{$opt} = $conf->{pending}->{$opt};
        delete $conf->{pending}->{$opt};
        $changes = 1;
    }

    if ($changes) {
        update_config_nolock($vmid, $conf, 1);
        $conf = load_config($vmid); # update/reload
    }

    # allow manual ballooning if shares is set to zero
    if (defined($conf->{pending}->{balloon}) && defined($conf->{shares}) && ($conf->{shares} == 0)) {
        my $balloon = $conf->{pending}->{balloon} || $conf->{memory} || $defaults->{memory};
        vm_mon_cmd($vmid, "balloon", value => $balloon*1024*1024);
        $conf->{balloon} = $conf->{pending}->{balloon};
        delete $conf->{pending}->{balloon};

        update_config_nolock($vmid, $conf, 1);
        $conf = load_config($vmid); # update/reload
    }

    return if !$conf->{hotplug};

    foreach my $opt (PVE::Tools::split_list($conf->{pending}->{delete})) {
        # skip non-hot-pluggable options
        next if $opt ne 'tablet';

        # deleting the option means falling back to the default
        if ($defaults->{tablet}) {
            vm_deviceplug($storecfg, $conf, $vmid, $opt);
        } else {
            vm_deviceunplug($vmid, $conf, $opt);
        }

        # save new config if hotplug was successful
        delete $conf->{$opt};
        vmconfig_undelete_pending_option($conf, $opt);
        update_config_nolock($vmid, $conf, 1);

        $conf = load_config($vmid); # update/reload
    }

    foreach my $opt (keys %{$conf->{pending}}) {
        # skip non-hot-pluggable options
        next if $opt ne 'tablet';

        my $value = $conf->{pending}->{$opt};

        if ($value == 1) {
            vm_deviceplug($storecfg, $conf, $vmid, $opt);
        } elsif ($value == 0) {
            vm_deviceunplug($vmid, $conf, $opt);
        }

        # save new config if hotplug was successful
        $conf->{$opt} = $value;
        delete $conf->{pending}->{$opt};
        update_config_nolock($vmid, $conf, 1);

        $conf = load_config($vmid); # update/reload
    }
}
3672
# Apply all pending configuration changes of VM $vmid.
#
# For a running VM this delegates to vmconfig_hotplug_pending(). Otherwise
# (cold plug) pending deletes are executed first, then pending values are
# copied into the configuration. A drive that gets removed or replaced is
# handed to vmconfig_register_unused_drive() first. The configuration is
# written after every processed option.
sub vmconfig_apply_pending {
    my ($vmid, $conf, $storecfg, $running) = @_;

    return vmconfig_hotplug_pending($vmid, $conf, $storecfg) if $running;

    # cold plug

    foreach my $opt (PVE::Tools::split_list($conf->{pending}->{delete})) { # delete
        die "internal error" if $opt =~ m/^unused/;
        $conf = load_config($vmid); # update/reload

        if (defined($conf->{$opt})) {
            vmconfig_register_unused_drive($storecfg, $vmid, $conf, parse_drive($opt, $conf->{$opt}))
                if valid_drivename($opt);
            vmconfig_undelete_pending_option($conf, $opt);
            delete $conf->{$opt};
        } else {
            # option is already gone - only clear the pending delete
            vmconfig_undelete_pending_option($conf, $opt);
        }

        update_config_nolock($vmid, $conf, 1);
    }

    $conf = load_config($vmid); # update/reload

    foreach my $opt (keys %{$conf->{pending}}) { # add/change
        $conf = load_config($vmid); # update/reload

        my $unchanged = defined($conf->{$opt}) && ($conf->{$opt} eq $conf->{pending}->{$opt});

        if (!$unchanged) {
            vmconfig_register_unused_drive($storecfg, $vmid, $conf, parse_drive($opt, $conf->{$opt}))
                if valid_drivename($opt) && defined($conf->{$opt});
            $conf->{$opt} = $conf->{pending}->{$opt};
        }

        delete $conf->{pending}->{$opt};
        update_config_nolock($vmid, $conf, 1);
    }
}
3718
# Start VM $vmid while holding its config lock.
#
# Parameters:
#   $storecfg     - storage configuration
#   $vmid         - VM identifier
#   $statefile    - 'tcp' to wait for an incoming migration, any other true
#                   value is passed to qemu as -loadstate
#   $skiplock     - skip the config 'lock' check
#   $migratedfrom - passed to load_config/check_running and exported as
#                   PVE_MIGRATED_FROM for the network script
#   $paused       - start with -S when no state file is given
#   $forcemachine - passed through to config_to_command
#   $spice_ticket - SPICE password to set after an incoming migration
#
# Dies when the VM is a template, is already running, a host PCI device can
# not be prepared, or the qemu command fails.
sub vm_start {
    my ($storecfg, $vmid, $statefile, $skiplock, $migratedfrom, $paused, $forcemachine, $spice_ticket) = @_;

    lock_config($vmid, sub {
        my $conf = load_config($vmid, $migratedfrom);

        die "you can't start a vm if it's a template\n" if is_template($conf);

        check_lock($conf) if !$skiplock;

        die "VM $vmid already running\n" if check_running($vmid, undef, $migratedfrom);

        # cold-apply pending changes, but not when resuming from a state
        if (!$statefile && scalar(keys %{$conf->{pending}})) {
            vmconfig_apply_pending($vmid, $conf, $storecfg, 0);
            $conf = load_config($vmid); # update/reload
        }

        my $defaults = load_defaults();

        # set environment variable useful inside network script
        $ENV{PVE_MIGRATED_FROM} = $migratedfrom if $migratedfrom;

        my ($cmd, $vollist, $spice_port) = config_to_command($storecfg, $vmid, $conf, $defaults, $forcemachine);

        my $migrate_port = 0;
        my $migrate_uri;
        if ($statefile && $statefile eq 'tcp') {
            my $localip = "localhost";
            my $datacenterconf = PVE::Cluster::cfs_read_file('datacenter.cfg');
            if ($datacenterconf->{migration_unsecure}) {
                my $nodename = PVE::INotify::nodename();
                $localip = PVE::Cluster::remote_node_ip($nodename, 1);
            }
            $migrate_port = PVE::Tools::next_migrate_port();
            $migrate_uri = "tcp:${localip}:${migrate_port}";
            push @$cmd, '-incoming', $migrate_uri;
            push @$cmd, '-S';
        } elsif ($statefile) {
            push @$cmd, '-loadstate', $statefile;
        } elsif ($paused) {
            push @$cmd, '-S';
        }

        # host pci devices
        foreach my $i (0 .. $MAX_HOSTPCI_DEVICES - 1) {
            my $d = parse_hostpci($conf->{"hostpci$i"});
            next if !$d;

            foreach my $pcidevice (@{$d->{pciid}}) {
                my $pciid = $pcidevice->{id}.".".$pcidevice->{function};

                my $info = pci_device_info("0000:$pciid");
                die "IOMMU not present\n" if !check_iommu_support();
                die "no pci device info for device '$pciid'\n" if !$info;

                if ($d->{driver} && $d->{driver} eq "vfio") {
                    die "can't unbind/bind pci group to vfio '$pciid'\n" if !pci_dev_group_bind_to_vfio($pciid);
                } else {
                    die "can't unbind/bind to stub pci device '$pciid'\n" if !pci_dev_bind_to_stub($info);
                }

                die "can't reset pci device '$pciid'\n" if $info->{has_fl_reset} and !pci_dev_reset($info);
            }
        }

        PVE::Storage::activate_volumes($storecfg, $vollist);

        # no timeout when a state file is given
        eval {
            run_command($cmd, timeout => $statefile ? undef : 30, umask => 0077);
        };
        if (my $err = $@) {
            die "start failed: $err";
        }

        print "migration listens on $migrate_uri\n" if $migrate_uri;

        if ($statefile && $statefile ne 'tcp') {
            eval { vm_mon_cmd_nocheck($vmid, "cont"); };
            warn $@ if $@;
        }

        if ($migratedfrom) {

            eval { set_migration_caps($vmid); };
            warn $@ if $@;

            if ($spice_port) {
                print "spice listens on port $spice_port\n";
                if ($spice_ticket) {
                    vm_mon_cmd_nocheck($vmid, "set_password", protocol => 'spice', password => $spice_ticket);
                    vm_mon_cmd_nocheck($vmid, "expire_password", protocol => 'spice', time => "+30");
                }
            }

        } else {

            # balloon is in use unless it is explicitly configured as 0
            if (!$statefile && (!defined($conf->{balloon}) || $conf->{balloon})) {
                vm_mon_cmd_nocheck($vmid, "balloon", value => $conf->{balloon}*1024*1024)
                    if $conf->{balloon};
                vm_mon_cmd_nocheck($vmid, 'qom-set',
                                   path => "machine/peripheral/balloon0",
                                   property => "guest-stats-polling-interval",
                                   value => 2);
            }
        }
    });
}
3828
# Run QMP command $execute with the named arguments %params on VM $vmid and
# return the result of vm_qmp_command().
sub vm_mon_cmd {
    my ($vmid, $execute, %params) = @_;

    vm_qmp_command($vmid, { execute => $execute, arguments => \%params });
}
3835
# Same as vm_mon_cmd(), but passes a true $nocheck flag to vm_qmp_command().
sub vm_mon_cmd_nocheck {
    my ($vmid, $execute, %params) = @_;

    vm_qmp_command($vmid, { execute => $execute, arguments => \%params }, 1);
}
3842
# Execute the QMP command $cmd on VM $vmid.
#
# Parameters:
#   $vmid    - VM identifier
#   $cmd     - hash with {execute} and optional {arguments}; a true
#              {arguments}->{timeout} is removed from the arguments and used
#              as the client timeout
#   $nocheck - passed through to check_running() and vm_monitor_command()
#
# Returns the QMP client result. VMs that only have the old human monitor
# socket can run argument-less commands; nothing is returned for those.
# Any failure is logged to syslog and re-thrown.
sub vm_qmp_command {
    my ($vmid, $cmd, $nocheck) = @_;

    my $res;

    my $timeout;
    if ($cmd->{arguments} && $cmd->{arguments}->{timeout}) {
        $timeout = $cmd->{arguments}->{timeout};
        delete $cmd->{arguments}->{timeout};
    }

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);
        my $sname = qmp_socket($vmid);
        if (-e $sname) { # test if VM is reasonably new and supports qmp/qga
            my $qmpclient = PVE::QMPClient->new();

            $res = $qmpclient->cmd($vmid, $cmd, $timeout);
        } elsif (-e "${var_run_tmpdir}/$vmid.mon") {
            # {arguments} may be missing altogether (e.g. { execute => "quit" });
            # dereferencing undef would die under strict refs
            die "can't execute complex command on old monitor - stop/start your vm to fix the problem\n"
                if $cmd->{arguments} && scalar(%{$cmd->{arguments}});
            vm_monitor_command($vmid, $cmd->{execute}, $nocheck);
        } else {
            die "unable to open monitor socket\n";
        }
    };
    if (my $err = $@) {
        syslog("err", "VM $vmid qmp command failed - $err");
        die $err;
    }

    return $res;
}
3876
# Run the human monitor command line $cmdline on VM $vmid through the QMP
# command "human-monitor-command" and return its result.
sub vm_human_monitor_command {
    my ($vmid, $cmdline) = @_;

    return vm_qmp_command($vmid, {
        execute => 'human-monitor-command',
        arguments => { 'command-line' => $cmdline },
    });
}
3889
# Return the command line built by config_to_command() for VM $vmid as a
# single string, with the arguments joined by spaces.
sub vm_commandline {
    my ($storecfg, $vmid) = @_;

    my $conf = load_config($vmid);
    my $defaults = load_defaults();

    # scalar assignment as in the original call
    my $cmd = config_to_command($storecfg, $vmid, $conf, $defaults);

    return join(' ', @$cmd);
}
3901
# Reset VM $vmid with the "system_reset" monitor command while holding the
# config lock. The config 'lock' setting is checked unless $skiplock is set.
sub vm_reset {
    my ($vmid, $skiplock) = @_;

    my $code = sub {
        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        vm_mon_cmd($vmid, "system_reset");
    };

    lock_config($vmid, $code);
}
3914
# Collect the volume ids used by the VM configuration $conf.
#
# Absolute paths and ids for which PVE::Storage::parse_volume_id() yields no
# storage id are left out. Returns an array reference.
sub get_vm_volumes {
    my ($conf) = @_;

    my @volids;

    foreach_volid($conf, sub {
        my ($volid, $is_cdrom) = @_;

        return if $volid =~ m|^/|; # plain path, not a storage volume

        my ($sid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        push @volids, $volid;
    });

    return \@volids;
}
3932
# Clean up after VM $vmid has stopped.
#
# Calls fairsched_rmnod(), deactivates the VM volumes unless $keepActive is
# set, and removes the mon/qmp/pid/vnc/qga files below
# /var/run/qemu-server. Errors are only reported as warnings.
sub vm_stop_cleanup {
    my ($storecfg, $vmid, $conf, $keepActive) = @_;

    eval {
        fairsched_rmnod($vmid); # try to destroy group

        if (!$keepActive) {
            PVE::Storage::deactivate_volumes($storecfg, get_vm_volumes($conf));
        }

        unlink map { "/var/run/qemu-server/${vmid}.$_" } qw(mon qmp pid vnc qga);
    };
    warn $@ if $@; # avoid errors - just warn
}
3950
# Stop or shut down VM $vmid.
#
# Note: use $nocheck to skip tests if VM configuration file exists.
# We need that when migrating VMs to other nodes (files already moved)
# Note: we set $keepActive in vzdump stop mode - volumes need to stay active
#
# With $shutdown a guest shutdown is requested (through the guest agent if
# one is configured, else "system_powerdown"); otherwise "quit" is sent.
# $timeout defaults to the 'down' value of the startup option (shutdown
# only) or 60 seconds. When the request fails or times out the VM gets
# SIGTERM if $force is set (default when $shutdown is not set), and SIGKILL
# if it is still running 10 seconds later; without $force this dies.
# With $migratedfrom the process is just sent SIGTERM and cleaned up.
sub vm_stop {
    my ($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive, $migratedfrom) = @_;

    $force = 1 if !defined($force) && !$shutdown;

    if ($migratedfrom) {
        my $pid = check_running($vmid, $nocheck, $migratedfrom);
        kill 15, $pid if $pid;
        my $conf = load_config($vmid, $migratedfrom);
        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive);
        return;
    }

    # poll once per second; true if the VM outlived $limit seconds
    my $wait_timed_out = sub {
        my ($limit) = @_;

        my $count = 0;
        while (($count < $limit) && check_running($vmid, $nocheck)) {
            $count++;
            sleep 1;
        }
        return $count >= $limit;
    };

    lock_config($vmid, sub {

        my $pid = check_running($vmid, $nocheck);
        return if !$pid;

        my $conf;
        if (!$nocheck) {
            $conf = load_config($vmid);
            check_lock($conf) if !$skiplock;
            if (!defined($timeout) && $shutdown && $conf->{startup}) {
                my $opts = parse_startup($conf->{startup});
                $timeout = $opts->{down} if $opts->{down};
            }
        }

        $timeout = 60 if !defined($timeout);

        eval {
            my $execute = "quit";
            if ($shutdown) {
                $execute = (!$nocheck && $conf->{agent}) ? "guest-shutdown" : "system_powerdown";
            }
            vm_qmp_command($vmid, { execute => $execute }, $nocheck);
        };
        my $err = $@;

        if ($err) {
            die "VM quit/powerdown failed\n" if !$force;
            warn "VM quit/powerdown failed - terminating now with SIGTERM\n";
            kill 15, $pid;
        } elsif ($wait_timed_out->($timeout)) {
            die "VM quit/powerdown failed - got timeout\n" if !$force;
            warn "VM still running - terminating now with SIGTERM\n";
            kill 15, $pid;
        } else {
            # stopped in time
            vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
            return;
        }

        # wait again
        $timeout = 10;

        if ($wait_timed_out->($timeout)) {
            warn "VM still running - terminating now with SIGKILL\n";
            kill 9, $pid;
            sleep 1;
        }

        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
    });
}
4042
# Pause VM $vmid with the "stop" monitor command while holding the config
# lock. The config 'lock' check is skipped when $skiplock is set or the
# lock is 'backup'.
sub vm_suspend {
    my ($vmid, $skiplock) = @_;

    lock_config($vmid, sub {

        my $conf = load_config($vmid);

        my $backup_lock = $conf->{lock} && $conf->{lock} eq 'backup';
        check_lock($conf) if !($skiplock || $backup_lock);

        vm_mon_cmd($vmid, "stop");
    });
}
4055
# Resume VM $vmid with the "cont" monitor command while holding the config
# lock. The config 'lock' check is skipped when $skiplock is set or the
# lock is 'backup'.
sub vm_resume {
    my ($vmid, $skiplock) = @_;

    lock_config($vmid, sub {

        my $conf = load_config($vmid);

        my $backup_lock = $conf->{lock} && $conf->{lock} eq 'backup';
        check_lock($conf) if !($skiplock || $backup_lock);

        vm_mon_cmd($vmid, "cont");
    });
}
4068
# Send key $key to VM $vmid while holding the config lock.
#
# $skiplock is accepted but not evaluated here. The configuration is loaded
# although its content is not used.
sub vm_sendkey {
    my ($vmid, $skiplock, $key) = @_;

    my $code = sub {
        my $conf = load_config($vmid);

        # there is no qmp command, so we use the human monitor command
        vm_human_monitor_command($vmid, "sendkey $key");
    };

    lock_config($vmid, $code);
}
4080
# Destroy VM $vmid while holding the config lock.
#
# The config 'lock' setting is checked unless $skiplock is set. Dies when
# the VM is still running.
sub vm_destroy {
    my ($storecfg, $vmid, $skiplock) = @_;

    lock_config($vmid, sub {

        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        die "VM $vmid is running - destroy failed\n" if check_running($vmid);

        fairsched_rmnod($vmid); # try to destroy group
        destroy_vm($storecfg, $vmid);
    });
}
4098
4099 # pci helpers
4100
# Write $buf to $filename, opened in "w" mode.
#
# Returns undef when the file can not be opened, otherwise the result of
# print. The result of close is not checked.
sub file_write {
    my ($filename, $buf) = @_;

    my $fh = IO::File->new($filename, "w") or return undef;

    my $res = print $fh $buf;
    $fh->close();

    return $res;
}
4113
# Read basic information about PCI device $name from sysfs.
#
# $name must have the form "dddd:bb:ss.f" with lower-case hex digits.
# Returns undef when the name does not match, the irq file holds no number,
# or the vendor/device files do not start with "0x". Otherwise returns a
# hash with name, vendor, product (both without the "0x" prefix), domain,
# bus, slot, func, irq and has_fl_reset (whether a 'reset' file exists).
sub pci_device_info {
    my ($name) = @_;

    return undef if $name !~ m/^([a-f0-9]{4}):([a-f0-9]{2}):([a-f0-9]{2})\.([a-f0-9])$/;
    my ($domain, $bus, $slot, $func) = ($1, $2, $3, $4);

    my $devdir = "$pcisysfs/devices/$name";

    my $irq = file_read_firstline("$devdir/irq");
    return undef if !defined($irq) || $irq !~ m/^\d+$/;

    # the substitution also strips the "0x" prefix
    my $vendor = file_read_firstline("$devdir/vendor");
    return undef if !defined($vendor) || $vendor !~ s/^0x//;

    my $product = file_read_firstline("$devdir/device");
    return undef if !defined($product) || $product !~ s/^0x//;

    return {
        name => $name,
        vendor => $vendor,
        product => $product,
        domain => $domain,
        bus => $bus,
        slot => $slot,
        func => $func,
        irq => $irq,
        has_fl_reset => -f "$devdir/reset" || 0,
    };
}
4145
# Write "1" to the sysfs 'reset' file of PCI device $dev (a hash as returned
# by pci_device_info) and return the result of file_write().
sub pci_dev_reset {
    my ($dev) = @_;

    my $name = $dev->{name};

    return file_write("$pcisysfs/devices/$name/reset", "1");
}
4155
# Bind PCI device $dev (a hash as returned by pci_device_info) to the
# pci-stub driver.
#
# Returns 1 when the device is already bound. Otherwise registers the
# vendor/product id with pci-stub, unbinds the current driver, binds to
# pci-stub and returns whether the device directory exists below the
# pci-stub driver afterwards. Returns undef when a required sysfs write
# fails.
sub pci_dev_bind_to_stub {
    my ($dev) = @_;

    my $name = $dev->{name};
    my $stubdir = "$pcisysfs/drivers/pci-stub";

    my $testdir = "$stubdir/$name";
    return 1 if -d $testdir;

    my $data = "$dev->{vendor} $dev->{product}";
    return undef if !file_write("$stubdir/new_id", $data);

    # a failed unbind only counts when an unbind file exists at all
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    if (!(-d $testdir) && !file_write("$stubdir/bind", $name)) {
        return undef;
    }

    return -d $testdir;
}
4179
# Bind PCI device $dev (a hash as returned by pci_device_info) to the
# vfio-pci driver.
#
# Runs modprobe for vfio-pci when the driver directory is missing, and dies
# if it is still missing afterwards. Returns 1 when the device is already
# bound. Otherwise registers the vendor/product id with vfio-pci, unbinds
# the current driver, binds to vfio-pci and returns whether the device
# directory exists below the vfio-pci driver afterwards. Returns undef when
# a required sysfs write fails.
sub pci_dev_bind_to_vfio {
    my ($dev) = @_;

    my $name = $dev->{name};

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null") if !-d $vfio_basedir;
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    my $testdir = "$vfio_basedir/$name";
    return 1 if -d $testdir;

    my $data = "$dev->{vendor} $dev->{product}";
    return undef if !file_write("$vfio_basedir/new_id", $data);

    # a failed unbind only counts when an unbind file exists at all
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    if (!(-d $testdir) && !file_write("$vfio_basedir/bind", $name)) {
        return undef;
    }

    return -d $testdir;
}
4210
# Bind every device in the IOMMU group of PCI device "0000:$pciid" to the
# vfio-pci driver.
#
# Runs modprobe for vfio-pci when the driver directory is missing. Dies
# when the driver directory is still missing, the iommu_group directory can
# not be opened, a group member name contains unexpected characters, or a
# member can not be bound. Returns 1 otherwise.
sub pci_dev_group_bind_to_vfio {
    my ($pciid) = @_;

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null") if !-d $vfio_basedir;
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    # get IOMMU group devices
    my $groupdir = "$pcisysfs/devices/0000:$pciid/iommu_group/devices/";
    opendir(my $D, $groupdir) || die "Cannot open iommu_group: $!\n";
    my @devs = grep /^0000:/, readdir($D);
    closedir($D);

    foreach my $member (@devs) {
        $member =~ m/^([:\.\da-f]+)$/ or die "PCI ID $member not valid!\n";
        my $info = pci_device_info($1);
        pci_dev_bind_to_vfio($info) || die "Cannot bind $member to vfio\n";
    }

    return 1;
}
4234
# Return the ",bus=pci.N,addr=0x.." option suffix for the device id $id.
#
# The slot of every known device id is fixed by the table below. Unknown
# ids yield an empty string. When the hash reference $bridges is passed,
# the bus number of a known device is recorded in it as a key.
sub print_pci_addr {
    my ($id, $bridges) = @_;

    my $devices = {
        piix3 => { bus => 0, addr => 1 },
        #addr2 : first videocard
        balloon0 => { bus => 0, addr => 3 },
        watchdog => { bus => 0, addr => 4 },
        scsihw0 => { bus => 0, addr => 5 },
        scsihw1 => { bus => 0, addr => 6 },
        ahci0 => { bus => 0, addr => 7 },
        qga0 => { bus => 0, addr => 8 },
        spice => { bus => 0, addr => 9 },
        virtio0 => { bus => 0, addr => 10 },
        virtio1 => { bus => 0, addr => 11 },
        virtio2 => { bus => 0, addr => 12 },
        virtio3 => { bus => 0, addr => 13 },
        virtio4 => { bus => 0, addr => 14 },
        virtio5 => { bus => 0, addr => 15 },
        hostpci0 => { bus => 0, addr => 16 },
        hostpci1 => { bus => 0, addr => 17 },
        net0 => { bus => 0, addr => 18 },
        net1 => { bus => 0, addr => 19 },
        net2 => { bus => 0, addr => 20 },
        net3 => { bus => 0, addr => 21 },
        net4 => { bus => 0, addr => 22 },
        net5 => { bus => 0, addr => 23 },
        vga1 => { bus => 0, addr => 24 },
        vga2 => { bus => 0, addr => 25 },
        vga3 => { bus => 0, addr => 26 },
        hostpci2 => { bus => 0, addr => 27 },
        hostpci3 => { bus => 0, addr => 28 },
        #addr29 : usb-host (pve-usb.cfg)
        'pci.1' => { bus => 0, addr => 30 },
        'pci.2' => { bus => 0, addr => 31 },
        # net6 .. net31 use addr 1 .. 26 on bus 1
        (map { ("net$_" => { bus => 1, addr => $_ - 5 }) } 6 .. 31),
        # virtio6 .. virtio15 use addr 1 .. 10 on bus 2
        (map { ("virtio$_" => { bus => 2, addr => $_ - 5 }) } 6 .. 15),
    };

    my $entry = $devices->{$id};
    return '' if !(defined($entry) && defined($entry->{bus}) && defined($entry->{addr}));

    $bridges->{$entry->{bus}} = 1 if $bridges;

    return sprintf(",bus=pci.%s,addr=0x%x", $entry->{bus}, $entry->{addr});
}
4318
# Return the ",bus=...,addr=0x.." device option suffix for a PCIe
# passthrough device id, or an empty string for ids that have no fixed
# slot in the table below.
sub print_pcie_addr {
    my ($id) = @_;

    # fixed PCIe root port assignment for passthrough devices
    my %slot_for = (
        hostpci0 => { bus => "ich9-pcie-port-1", addr => 0 },
        hostpci1 => { bus => "ich9-pcie-port-2", addr => 0 },
        hostpci2 => { bus => "ich9-pcie-port-3", addr => 0 },
        hostpci3 => { bus => "ich9-pcie-port-4", addr => 0 },
    );

    my $slot = $slot_for{$id} || {};

    # unknown device id: nothing to append
    return '' if !defined($slot->{bus}) || !defined($slot->{addr});

    return sprintf(",bus=%s,addr=0x%x", $slot->{bus}, $slot->{addr});
}
4338
# vzdump restore implementation
4340
# Return the name of the first member listed by "tar tf" for $archive.
#
# Dies if $archive is not a plain file, if tar cannot be started, or if
# the listing produces no output.
sub tar_archive_read_firstfile {
    my $archive = shift;

    die "ERROR: file '$archive' does not exist\n" if ! -f $archive;

    # try to detect archive type first
    #
    # List-form pipe open: tar is executed directly, without a shell, so
    # quotes or other shell metacharacters in the archive name cannot
    # break (or inject into) the command line.
    my $pid = open(my $tarfh, '-|', 'tar', 'tf', $archive) ||
        die "unable to open file '$archive'\n";
    my $firstfile = <$tarfh>;

    # we only need the first line - stop tar instead of listing everything
    kill 15, $pid;
    close $tarfh;

    die "ERROR: archive contaions no data\n" if !$firstfile;
    chomp $firstfile;

    return $firstfile;
}
4358
# Remove the volumes recorded in the restore stat file $statfile.
#
# Each line is expected to end in "vzdump:<name>:<volid>". A <volid>
# starting with '/' is unlinked as a plain file; anything else is
# released with PVE::Storage::vdisk_free() using $storecfg.
# Failures are reported on STDERR and do not abort the cleanup; a stat
# file that cannot be opened is silently ignored.
sub tar_restore_cleanup {
    my ($storecfg, $statfile) = @_;

    print STDERR "starting cleanup\n";

    if (my $fd = IO::File->new($statfile, "r")) {
        while (defined(my $line = <$fd>)) {
            if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                my $volid = $2;
                eval {
                    if ($volid =~ m|^/|) {
                        # parentheses are required: "unlink $volid || die"
                        # parses as unlink($volid || die ...) and would
                        # never report a failed unlink
                        unlink($volid) || die "unlink failed - $!\n";
                    } else {
                        PVE::Storage::vdisk_free($storecfg, $volid);
                    }
                    print STDERR "temporary volume '$volid' sucessfuly removed\n";
                };
                print STDERR "unable to cleanup '$volid' - $@" if $@;
            } else {
                print STDERR "unable to parse line in statfile - $line";
            }
        }
        $fd->close();
    }
}
4384
# Restore a backup archive, dispatching on the archive format.
#
# The format ('tar' or 'vma') is taken from $opts->{format} if set,
# otherwise it is derived from the file name suffix; the compression
# method is always derived from the suffix. Archives with an unknown
# suffix default to 'vma'. Returns whatever the selected restore
# function returns.
sub restore_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    my $format = $opts->{format};
    my $comp;

    # try to detect archive format and compression from the file name
    if ($archive =~ m/\.tgz$/ || $archive =~ m/\.tar\.gz$/) {
        $format = 'tar' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.tar$/) {
        $format = 'tar' if !$format;
    } elsif ($archive =~ m/\.tar\.lzo$/) {
        # dots are escaped so that only a literal ".tar.lzo" suffix matches
        $format = 'tar' if !$format;
        $comp = 'lzop';
    } elsif ($archive =~ m/\.vma$/) {
        $format = 'vma' if !$format;
    } elsif ($archive =~ m/\.vma\.gz$/) {
        $format = 'vma' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.vma\.lzo$/) {
        $format = 'vma' if !$format;
        $comp = 'lzop';
    } else {
        $format = 'vma' if !$format; # default
    }

    if ($format eq 'tar') {
        # $comp is not passed on here
        return restore_tar_archive($archive, $vmid, $user, $opts);
    } else {
        return restore_vma_archive($archive, $vmid, $user, $opts, $comp);
    }
}
4418
# Rewrite one line of an archived VM configuration and print the result
# to $outfd.
#
# - backup markers, lock, unused disks, parent and template lines are
#   dropped
# - old style "vlanN" lines are converted to "netN" lines, numbered by
#   $cookie->{netcount}
# - with $unique set, "netN" lines get a new random MAC address (only
#   if they had one)
# - drive lines containing "backup=no" are commented out; drives listed
#   in $map are pointed at the mapped volume
# - everything else is copied unchanged
sub restore_update_config_line {
    my ($outfd, $cookie, $vmid, $map, $line, $unique) = @_;

    # lines that must never end up in the restored configuration
    # (template: a restored VM is never a template)
    my @dropped = (
        qr/^\#qmdump\#/,
        qr/^\#vzdump\#/,
        qr/^lock:/,
        qr/^unused\d+:/,
        qr/^parent:/,
        qr/^template:/,
    );
    foreach my $re (@dropped) {
        return if $line =~ $re;
    }

    if (my (undef, $ind, $ethcfg) = $line =~ m/^(vlan(\d+)):\s*(\S+)\s*$/) {
        # try to convert old 1.X settings
        foreach my $devconfig (PVE::Tools::split_list($ethcfg)) {
            my ($model, $macaddr) = split(/\=/, $devconfig);
            $macaddr = PVE::Tools::random_ether_addr() if !$macaddr || $unique;

            my $netstr = print_net({
                model => $model,
                bridge => "vmbr$ind",
                macaddr => $macaddr,
            });

            my $netid = "net" . $cookie->{netcount}++;
            print {$outfd} "$netid: $netstr\n";
        }
    } elsif (($line =~ m/^(net\d+):\s*(\S+)\s*$/) && $unique) {
        my $id = $1;
        my $net = parse_net($2);
        $net->{macaddr} = PVE::Tools::random_ether_addr() if $net->{macaddr};
        print {$outfd} "$id: " . print_net($net) . "\n";
    } elsif (my ($virtdev, undef, $value) = $line =~ m/^((ide|scsi|virtio|sata)\d+):\s*(\S+)\s*$/) {
        if ($line =~ m/backup=no/) {
            # drive was excluded from the backup - keep it as a comment
            print {$outfd} "#$line";
        } elsif ($virtdev && $map->{$virtdev}) {
            my $di = parse_drive($virtdev, $value);
            delete $di->{format}; # format can change on restore
            $di->{file} = $map->{$virtdev};
            print {$outfd} "$virtdev: " . print_drive($vmid, $di) . "\n";
        } else {
            print {$outfd} $line;
        }
    } else {
        print {$outfd} $line;
    }
}
4469
# List the volumes PVE::Storage::vdisk_list() reports for $vmid and
# return them as a hash reference keyed by volume ID.
#
# Entries without a volid or with a false size are skipped. Each
# returned entry is the original list item, extended with a 'path' key.
sub scan_volids {
    my ($cfg, $vmid) = @_;

    my $listing = PVE::Storage::vdisk_list($cfg, undef, $vmid);

    my %by_volid;
    for my $volumes (values %$listing) {
        for my $vol (@$volumes) {
            next unless $vol->{volid} && $vol->{size};

            $vol->{path} = PVE::Storage::path($cfg, $vol->{volid});
            $by_volid{$vol->{volid}} = $vol;
        }
    }

    return \%by_volid;
}
4486
# Count how often each disk path is referenced by the configuration
# $conf and, if $scan_snapshots is set, by its snapshot sections.
#
# Returns a hash reference mapping path => number of references.
# CD-ROM drives and drives without a file are ignored. $skip_drive
# names a drive key to leave out; it only applies to the current
# configuration, never to the snapshot sections.
sub get_used_paths {
    my ($vmid, $storecfg, $conf, $scan_snapshots, $skip_drive) = @_;

    my %refcount;

    my $collect = sub {
        my ($section, $snapname, $skip) = @_;

        for my $key (keys %$section) {
            next unless valid_drivename($key);
            next if $skip && $key eq $skip;

            my $drive = parse_drive($key, $section->{$key});
            next if !$drive || !$drive->{file} || drive_is_cdrom($drive);

            my $file = $drive->{file};
            if ($file =~ m!^/!) {
                # absolute path - use as is
                $refcount{$file}++;
                next;
            }

            # volume ID - only counted if the storage is known
            my ($storeid) = PVE::Storage::parse_volume_id($file, 1);
            next unless $storeid;
            next unless PVE::Storage::storage_config($storecfg, $storeid, 1);

            my $path = PVE::Storage::path($storecfg, $file, $snapname);
            $refcount{$path}++;
        }
    };

    $collect->($conf, undef, $skip_drive);

    if ($scan_snapshots) {
        for my $snapname (keys %{$conf->{snapshots}}) {
            $collect->($conf->{snapshots}->{$snapname}, $snapname);
        }
    }

    return \%refcount;
}
4527
# Synchronize the drive entries of $conf with the volumes in $volid_hash
# (volid => info hash with at least 'size' and 'path', as built by
# scan_volids).
#
# - refreshes the size of every configured non-cdrom drive found in
#   $volid_hash
# - removes 'unusedN' entries whose volume is referenced by a drive
# - adds volumes not referenced at all as unused volumes (VM state
#   volumes are skipped)
#
# $conf is modified in place. Returns a true value if anything changed,
# undef otherwise.
sub update_disksize {
    my ($vmid, $conf, $volid_hash) = @_;

    my $changes;

    my $used = {};

    # Note: it is allowed to define multiple storages with same path (alias), so
    # we need to check both 'volid' and real 'path' (two different volid can point
    # to the same path).

    my $usedpath = {};

    # update size info
    foreach my $opt (keys %$conf) {
        if (valid_drivename($opt)) {
            my $drive = parse_drive($opt, $conf->{$opt});
            my $volid = $drive->{file};
            next if !$volid;

            $used->{$volid} = 1;
            if ($volid_hash->{$volid} &&
                (my $path = $volid_hash->{$volid}->{path})) {
                $usedpath->{$path} = 1;
            }

            next if drive_is_cdrom($drive);
            next if !$volid_hash->{$volid};

            $drive->{size} = $volid_hash->{$volid}->{size};
            my $new = print_drive($vmid, $drive);
            if ($new ne $conf->{$opt}) {
                $changes = 1;
                $conf->{$opt} = $new;
            }
        }
    }

    # remove 'unusedX' entry if volume is used
    foreach my $opt (keys %$conf) {
        next if $opt !~ m/^unused\d+$/;
        my $volid = $conf->{$opt};

        # Do not write "my $path = ... if COND": the behaviour of a
        # conditionally executed 'my' is undefined (perlsyn), and the
        # variable may keep the value from a previous loop iteration.
        my $path = $volid_hash->{$volid} ? $volid_hash->{$volid}->{path} : undef;

        if ($used->{$volid} || ($path && $usedpath->{$path})) {
            $changes = 1;
            delete $conf->{$opt};
        }
    }

    # register volumes which are not referenced at all as unused
    foreach my $volid (sort keys %$volid_hash) {
        next if $volid =~ m/vm-$vmid-state-/;
        next if $used->{$volid};
        my $path = $volid_hash->{$volid}->{path};
        next if !$path; # just to be sure
        next if $usedpath->{$path};
        $changes = 1;
        add_unused_volume($conf, $volid);
        $usedpath->{$path} = 1; # avoid to add more than once (aliases)
    }

    return $changes;
}
4590
# Rescan the storages and update the disk information in the
# configuration of VM $vmid, or of every VM returned by config_list()
# if $vmid is undefined.
#
# Unless $nolock is set, each configuration is updated while holding
# its config lock.
sub rescan {
    my ($vmid, $nolock) = @_;

    my $cfg = PVE::Cluster::cfs_read_file("storage.cfg");

    my $volid_hash = scan_volids($cfg, $vmid);

    my $update_one = sub {
        my ($id) = @_;

        my $conf = load_config($id);

        check_lock($conf);

        # only consider volumes owned by this VM
        my %owned;
        while (my ($volid, $info) = each %$volid_hash) {
            next unless $info->{vmid} && $info->{vmid} == $id;
            $owned{$volid} = $info;
        }

        if (update_disksize($id, $conf, \%owned)) {
            update_config_nolock($id, $conf, 1);
        }
    };

    my @targets;
    if (defined($vmid)) {
        @targets = ($vmid);
    } else {
        my $vmlist = config_list();
        @targets = keys %$vmlist;
    }

    foreach my $id (@targets) {
        if ($nolock) {
            $update_one->($id);
        } else {
            lock_config($id, $update_one, $id);
        }
    }
}
4633
# Restore VM $vmid from a vma archive.
#
# $archive - archive file name, or '-' to read from STDIN
# $user    - user the restore runs as; everybody except 'root@pam'
#            needs 'Datastore.AllocateSpace' on the target storages
# $opts    - hash with the optional keys 'storage', 'pool', 'unique'
# $comp    - compression method: undef/empty, 'gzip' or 'lzop'
#
# "vma extract" is started with a fifo for the device map. Once it has
# printed the archive's device list and extracted the config, the
# target volumes are allocated, the map is written to the fifo and the
# new configuration is written to a temporary file. On success that
# file is renamed over the VM configuration; on error the newly
# allocated volumes are removed again and the error is re-thrown.
sub restore_vma_archive {
    my ($archive, $vmid, $user, $opts, $comp) = @_;

    my $input = $archive eq '-' ? "<&STDIN" : undef;
    my $readfrom = $archive;

    my $uncomp = '';
    if ($comp) {
        $readfrom = '-';
        my $qarchive = PVE::Tools::shellquote($archive);
        if ($comp eq 'gzip') {
            $uncomp = "zcat $qarchive|";
        } elsif ($comp eq 'lzop') {
            $uncomp = "lzop -d -c $qarchive|";
        } else {
            die "unknown compression method '$comp'\n";
        }

    }

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    rmtree $tmpdir;

    # disable interrupts (always do cleanups)
    # Note: every handler needs its own 'local' - a chained assignment
    # behind a single 'local' would only localize the first one.
    local $SIG{INT} =
        local $SIG{TERM} =
        local $SIG{QUIT} =
        local $SIG{HUP} = sub {
            warn "got interrupt - ignored\n";
        };

    my $mapfifo = "/var/tmp/vzdumptmp$$.fifo";
    POSIX::mkfifo($mapfifo, 0600);
    my $fifofh;

    my $openfifo = sub {
        open($fifofh, '>', $mapfifo) || die $!;
    };

    # the command is a shell pipeline, so the archive name must be quoted
    my $cmd = "${uncomp}vma extract -v -r $mapfifo " .
        PVE::Tools::shellquote($readfrom) . " $tmpdir";

    my $oldtimeout;
    my $timeout = 5;

    my $devinfo = {};

    my $rpcenv = PVE::RPCEnvironment::get();

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # Note: $oldconf is undef if VM does not exists
    my $oldconf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid));

    # allocate the target volumes, send the device map through the fifo
    # and write the updated configuration to $tmpfn
    my $print_devmap = sub {
        my $virtdev_hash = {};

        my $cfgfn = "$tmpdir/qemu-server.conf";

        # we can read the config - that is already extracted
        my $fh = IO::File->new($cfgfn, "r") ||
            die "unable to read qemu-server.conf - $!\n";

        while (defined(my $line = <$fh>)) {
            if ($line =~ m/^\#qmdump\#map:(\S+):(\S+):(\S*):(\S*):$/) {
                my ($virtdev, $devname, $storeid, $format) = ($1, $2, $3, $4);
                die "archive does not contain data for drive '$virtdev'\n"
                    if !$devinfo->{$devname};
                if (defined($opts->{storage})) {
                    $storeid = $opts->{storage} || 'local';
                } elsif (!$storeid) {
                    $storeid = 'local';
                }
                $format = 'raw' if !$format;
                $devinfo->{$devname}->{devname} = $devname;
                $devinfo->{$devname}->{virtdev} = $virtdev;
                $devinfo->{$devname}->{format} = $format;
                $devinfo->{$devname}->{storeid} = $storeid;

                # check permission on storage
                my $pool = $opts->{pool}; # todo: do we need that?
                if ($user ne 'root@pam') {
                    $rpcenv->check($user, "/storage/$storeid", ['Datastore.AllocateSpace']);
                }

                $virtdev_hash->{$virtdev} = $devinfo->{$devname};
            }
        }

        foreach my $devname (keys %$devinfo) {
            die "found no device mapping information for device '$devname'\n"
                if !$devinfo->{$devname}->{virtdev};
        }

        my $cfg = cfs_read_file('storage.cfg');

        # create empty/temp config
        if ($oldconf) {
            PVE::Tools::file_set_contents($conffile, "memory: 128\n");
            foreach_drive($oldconf, sub {
                my ($ds, $drive) = @_;

                return if drive_is_cdrom($drive);

                my $volid = $drive->{file};

                return if !$volid || $volid =~ m|^/|;

                my ($path, $owner) = PVE::Storage::path($cfg, $volid);
                return if !$path || !$owner || ($owner != $vmid);

                # Note: only delete disk we want to restore
                # other volumes will become unused
                if ($virtdev_hash->{$ds}) {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
            });
        }

        my $map = {};
        foreach my $virtdev (sort keys %$virtdev_hash) {
            my $d = $virtdev_hash->{$virtdev};
            # round the size up to a multiple of 1024
            my $alloc_size = int(($d->{size} + 1024 - 1)/1024);
            my $scfg = PVE::Storage::storage_config($cfg, $d->{storeid});

            # test if requested format is supported
            my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($cfg, $d->{storeid});
            my $supported = grep { $_ eq $d->{format} } @$validFormats;
            $d->{format} = $defFormat if !$supported;

            my $volid = PVE::Storage::vdisk_alloc($cfg, $d->{storeid}, $vmid,
                                                  $d->{format}, undef, $alloc_size);
            print STDERR "new volume ID is '$volid'\n";
            $d->{volid} = $volid;
            my $path = PVE::Storage::path($cfg, $volid);

            my $write_zeros = 1;
            # fixme: what other storages types initialize volumes with zero?
            if ($scfg->{type} eq 'dir' || $scfg->{type} eq 'nfs' || $scfg->{type} eq 'glusterfs' ||
                $scfg->{type} eq 'sheepdog' || $scfg->{type} eq 'rbd') {
                $write_zeros = 0;
            }

            print $fifofh "${write_zeros}:$d->{devname}=$path\n";

            print "map '$d->{devname}' to '$path' (write zeros = ${write_zeros})\n";
            $map->{$virtdev} = $volid;
        }

        $fh->seek(0, 0) || die "seek failed - $!\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined(my $line = <$fh>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $fh->close();
        $outfd->close();
    };

    eval {
        # enable interrupts
        local $SIG{INT} =
            local $SIG{TERM} =
            local $SIG{QUIT} =
            local $SIG{HUP} =
            local $SIG{PIPE} = sub {
                die "interrupted by signal\n";
            };
        local $SIG{ALRM} = sub { die "got timeout\n"; };

        $oldtimeout = alarm($timeout);

        my $parser = sub {
            my $line = shift;

            print "$line\n";

            if ($line =~ m/^DEV:\sdev_id=(\d+)\ssize:\s(\d+)\sdevname:\s(\S+)$/) {
                my ($dev_id, $size, $devname) = ($1, $2, $3);
                $devinfo->{$devname} = { size => $size, dev_id => $dev_id };
            } elsif ($line =~ m/^CTIME: /) {
                # we correctly received the vma config, so we can disable
                # the timeout now for disk allocation (set to 10 minutes, so
                # that we always timeout if something goes wrong)
                alarm(600);
                &$print_devmap();
                print $fifofh "done\n";
                my $tmp = $oldtimeout || 0;
                $oldtimeout = undef;
                alarm($tmp);
                close($fifofh);
            }
        };

        print "restore vma archive: $cmd\n";
        run_command($cmd, input => $input, outfunc => $parser, afterfork => $openfifo);
    };
    my $err = $@;

    alarm($oldtimeout) if $oldtimeout;

    unlink $mapfifo;

    if ($err) {
        rmtree $tmpdir;
        unlink $tmpfn;

        # remove the volumes allocated so far
        my $cfg = cfs_read_file('storage.cfg');
        foreach my $devname (keys %$devinfo) {
            my $volid = $devinfo->{$devname}->{volid};
            next if !$volid;
            eval {
                if ($volid =~ m|^/|) {
                    # parentheses are required, else '||' binds to $volid
                    unlink($volid) || die "unlink failed - $!\n";
                } else {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
                print STDERR "temporary volume '$volid' sucessfuly removed\n";
            };
            print STDERR "unable to cleanup '$volid' - $@" if $@;
        }
        die $err;
    }

    rmtree $tmpdir;

    rename($tmpfn, $conffile) ||
        die "unable to commit configuration file '$conffile'\n";

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
4865
# Restore VM $vmid from a tar based vzdump archive.
#
# $archive - archive file name, or '-' to read from STDIN
# $user    - exported to the extract helper as VZDUMP_USER
# $opts    - hash with the optional keys 'storage', 'pool', 'prealloc',
#            'info' and 'unique'
#
# The archive is unpacked with tar, piping each member to
# /usr/lib/qemu-server/qmextract. Afterwards the volume mapping is read
# from the helper's stat file and the archived configuration is
# rewritten into a temporary file, which is finally renamed over the VM
# configuration. On error the volumes listed in the stat file are
# removed again (unless 'info' is set) and the error is re-thrown.
sub restore_tar_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    if ($archive ne '-') {
        my $firstfile = tar_archive_read_firstfile($archive);
        die "ERROR: file '$archive' dos not lock like a QemuServer vzdump backup\n"
            if $firstfile ne 'qemu-server.conf';
    }

    my $storecfg = cfs_read_file('storage.cfg');

    # destroy existing data - keep empty config
    my $vmcfgfn = config_file($vmid);
    destroy_vm($storecfg, $vmid, 1) if -f $vmcfgfn;

    my $tocmd = "/usr/lib/qemu-server/qmextract";

    $tocmd .= " --storage " . PVE::Tools::shellquote($opts->{storage}) if $opts->{storage};
    $tocmd .= " --pool " . PVE::Tools::shellquote($opts->{pool}) if $opts->{pool};
    $tocmd .= ' --prealloc' if $opts->{prealloc};
    $tocmd .= ' --info' if $opts->{info};

    # tar option "xf" does not autodetect compression when read from STDIN,
    # so we pipe to zcat
    my $cmd = "zcat -f|tar xf " . PVE::Tools::shellquote($archive) . " " .
        PVE::Tools::shellquote("--to-command=$tocmd");

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    mkpath $tmpdir;

    local $ENV{VZDUMP_TMPDIR} = $tmpdir;
    local $ENV{VZDUMP_VMID} = $vmid;
    local $ENV{VZDUMP_USER} = $user;

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # disable interrupts (always do cleanups)
    # Note: every handler needs its own 'local' - a chained assignment
    # behind a single 'local' would only localize the first one.
    local $SIG{INT} =
        local $SIG{TERM} =
        local $SIG{QUIT} =
        local $SIG{HUP} = sub {
            print STDERR "got interrupt - ignored\n";
        };

    eval {
        # enable interrupts
        local $SIG{INT} =
            local $SIG{TERM} =
            local $SIG{QUIT} =
            local $SIG{HUP} =
            local $SIG{PIPE} = sub {
                die "interrupted by signal\n";
            };

        if ($archive eq '-') {
            print "extracting archive from STDIN\n";
            run_command($cmd, input => "<&STDIN");
        } else {
            print "extracting archive '$archive'\n";
            run_command($cmd);
        }

        # Note: this only leaves the eval block
        return if $opts->{info};

        # read new mapping
        my $map = {};
        my $statfile = "$tmpdir/qmrestore.stat";
        if (my $fd = IO::File->new($statfile, "r")) {
            while (defined (my $line = <$fd>)) {
                if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                    $map->{$1} = $2 if $1;
                } else {
                    print STDERR "unable to parse line in statfile - $line\n";
                }
            }
            $fd->close();
        }

        my $confsrc = "$tmpdir/qemu-server.conf";

        my $srcfd = IO::File->new($confsrc, "r") ||
            die "unable to open file '$confsrc'\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined (my $line = <$srcfd>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $srcfd->close();
        $outfd->close();
    };
    my $err = $@;

    if ($err) {

        unlink $tmpfn;

        tar_restore_cleanup($storecfg, "$tmpdir/qmrestore.stat") if !$opts->{info};

        # the stat file is not needed any longer - do not leave the
        # temporary directory behind
        rmtree $tmpdir;

        die $err;
    }

    rmtree $tmpdir;

    # In 'info' mode no new configuration was written, so there is
    # nothing to commit. Parentheses are required for the error check:
    # "rename $a, $b || die" parses as rename($a, ($b || die ...)) and
    # never reports a failed rename.
    if (!$opts->{info}) {
        rename($tmpfn, $conffile) ||
            die "unable to commit configuration file '$conffile'\n";
    }

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
4975
4976
4977 # Internal snapshots
4978
# NOTE: Snapshot create/delete involves several non-atomic
# actions, and can take a long time.
# So we try to avoid locking the file and use the 'lock' variable
# inside the config file instead.
4983
# Copy all settings from $source to $dest, except snapshot bookkeeping
# keys, the lock, the digest, the description and unused disk entries.
my $snapshot_copy_config = sub {
    my ($source, $dest) = @_;

    # keys that are never copied
    my %excluded = map { $_ => 1 }
        ('snapshots', 'snapstate', 'snaptime', 'vmstate', 'lock', 'digest', 'description');

    for my $key (keys %$source) {
        next if $excluded{$key} || $key =~ m/^unused\d+$/;

        $dest->{$key} = $source->{$key};
    }
};
5000
# Build and return a new configuration hash from the snapshot section
# $snap. The snapshot list, the description and the unused disk entries
# are taken from the current configuration $conf; everything else comes
# from $snap (via $snapshot_copy_config).
my $snapshot_apply_config = sub {
    my ($conf, $snap) = @_;

    # copy snapshot list
    my $newconf = { snapshots => $conf->{snapshots} };

    # keep description and list of unused disks
    my @kept = grep { $_ =~ m/^unused\d+$/ || $_ eq 'description' } keys %$conf;
    $newconf->{$_} = $conf->{$_} for @kept;

    $snapshot_copy_config->($snap, $newconf);

    return $newconf;
};
5019
# Call $func->($storeid) once for every storage that holds a non-cdrom
# drive of $conf, in sorted storage ID order. Drives whose file does
# not parse as a volume ID are ignored.
sub foreach_writable_storage {
    my ($conf, $func) = @_;

    my %storage_ids;

    for my $ds (keys %$conf) {
        next unless valid_drivename($ds);

        my $drive = parse_drive($ds, $conf->{$ds});
        next unless $drive;
        next if drive_is_cdrom($drive);

        my ($sid) = PVE::Storage::parse_volume_id($drive->{file}, 1);
        $storage_ids{$sid} = $sid if $sid;
    }

    for my $sid (sort keys %storage_ids) {
        $func->($sid);
    }
}
5042
# Allocate a raw volume named "vm-$vmid-state-$snapname" for saving the
# VM state of a snapshot and return its volume ID.
#
# The target storage is selected among the storages used by the VM's
# disks: shared storages are searched first, then non-shared ones; in
# each pass a storage with a 'path' setting wins over the others.
# 'local' is used if nothing was found.
my $alloc_vmstate_volid = sub {
    my ($storecfg, $vmid, $conf, $snapname) = @_;

    # Note: we try to be smart when selecting a $target storage

    my $pick_storage = sub {
        my ($want_shared) = @_;

        my $choice;
        foreach_writable_storage($conf, sub {
            my ($sid) = @_;
            my $scfg = PVE::Storage::storage_config($storecfg, $sid);
            return if ($scfg->{shared} ? 1 : 0) != $want_shared;

            $choice = $sid if !$choice || $scfg->{path}; # prefer file based storage
        });
        return $choice;
    };

    # search shared storage first, then local storage
    my $target = $pick_storage->(1) || $pick_storage->(0) || 'local';

    # extra space reserved for the driver state
    # NOTE(review): the previous comment spoke of 32MB while the value
    # is 500 - the unit is presumably MB like $conf->{memory}; confirm
    my $driver_state_size = 500;

    # we abort live save after $conf->{memory}, so we need at max twice that space
    my $size = $conf->{memory}*2 + $driver_state_size;

    my $name = "vm-$vmid-state-$snapname";
    my $target_scfg = PVE::Storage::storage_config($storecfg, $target);
    $name .= ".raw" if $target_scfg->{path}; # add filename extension for file base storage

    my $volid = PVE::Storage::vdisk_alloc($storecfg, $target, $vmid, 'raw', $name, $size*1024);

    return $volid;
};
5083
# First step of snapshot creation: under the config lock, set the
# 'snapshot' lock and add a new snapshot section in state "prepare"
# that holds a copy of the current settings.
#
# If $save_vmstate is set and the VM is running, a volume for the VM
# state is allocated as well. Returns the new snapshot section.
# Dies for templates, for locked configurations, if the snapshot name
# is already used or if the snapshot feature is not available.
my $snapshot_prepare = sub {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap;

    my $prepare_locked = sub {

        my $conf = load_config($vmid);

        if (is_template($conf)) {
            die "you can't take a snapshot if it's a template\n";
        }

        check_lock($conf);

        $conf->{lock} = 'snapshot';

        if (defined($conf->{snapshots}->{$snapname})) {
            die "snapshot name '$snapname' already used\n";
        }

        my $storecfg = PVE::Storage::config();
        if (!has_feature('snapshot', $conf, $storecfg)) {
            die "snapshot feature is not available";
        }

        $snap = $conf->{snapshots}->{$snapname} = {};

        if ($save_vmstate && check_running($vmid)) {
            $snap->{vmstate} = $alloc_vmstate_volid->($storecfg, $vmid, $conf, $snapname);
        }

        $snapshot_copy_config->($conf, $snap);

        $snap->{snapstate} = "prepare";
        $snap->{snaptime} = time();
        $snap->{description} = $comment if $comment;

        # always overwrite machine if we save vmstate. This makes sure we
        # can restore it later using correct machine type
        if ($snap->{vmstate}) {
            $snap->{machine} = get_current_qemu_machine($vmid);
        }

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $prepare_locked);

    return $snap;
};
5129
# Final step of snapshot creation: under the config lock, verify the
# 'snapshot' lock and the "prepare" state, clear both, and write the
# configuration rebuilt from the snapshot section with 'parent' set to
# $snapname.
my $snapshot_commit = sub {
    my ($vmid, $snapname) = @_;

    my $commit_locked = sub {

        my $conf = load_config($vmid);

        my $lock = $conf->{lock};
        die "missing snapshot lock\n" unless $lock && $lock eq 'snapshot';

        # remember whether 'machine' was configured explicitly
        my $had_machine = defined($conf->{machine});

        my $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        my $state = $snap->{snapstate};
        die "wrong snapshot state\n" unless $state && $state eq "prepare";

        delete $snap->{snapstate};
        delete $conf->{lock};

        my $newconf = $snapshot_apply_config->($conf, $snap);

        # do not keep a 'machine' entry that only came from the snapshot
        delete $newconf->{machine} if !$had_machine;

        $newconf->{parent} = $snapname;

        update_config_nolock($vmid, $newconf, 1);
    };

    lock_config($vmid, $commit_locked);
};
5163
# Roll VM $vmid back to snapshot $snapname.
#
# Runs in two locked phases with the volume rollback in between:
#  1. prepare: check the config lock, stop the VM and set the
#     'rollback' lock
#  2. roll back all non-cdrom drives of the snapshot
#  3. commit: verify and remove the 'rollback' lock, replace the
#     current settings with the snapshot settings and, if the snapshot
#     has a saved VM state, start the VM from it
sub snapshot_rollback {
    my ($vmid, $snapname) = @_;

    my $snap;

    # true during the first phase, false during the commit phase
    my $preparing = 1;

    my $storecfg = PVE::Storage::config();

    my $phase_fn = sub {

        my $conf = load_config($vmid);

        die "you can't rollback if vm is a template\n" if is_template($conf);

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        die "unable to rollback to incomplete snapshot (snapstate = $snap->{snapstate})\n"
            if $snap->{snapstate};

        if ($preparing) {
            check_lock($conf);
            vm_stop($storecfg, $vmid, undef, undef, 5, undef, undef);
        }

        die "unable to rollback vm $vmid: vm is running\n"
            if check_running($vmid);

        my $forcemachine;

        if ($preparing) {
            $conf->{lock} = 'rollback';
        } else {
            die "got wrong lock\n" if !($conf->{lock} && $conf->{lock} eq 'rollback');
            delete $conf->{lock};

            my $had_machine = defined($conf->{machine});

            # copy snapshot config to current config
            $conf = $snapshot_apply_config->($conf, $snap);
            $conf->{parent} = $snapname;

            # Note: old code did not store 'machine', so we try to be smart
            # and guess the snapshot was generated with kvm 1.4 (pc-i440fx-1.4).
            $forcemachine = $conf->{machine} || 'pc-i440fx-1.4';
            # we remove the 'machine' configuration if not explicitly specified
            # in the original config.
            delete $conf->{machine} if $snap->{vmstate} && !$had_machine;
        }

        update_config_nolock($vmid, $conf, 1);

        if (!$preparing && $snap->{vmstate}) {
            my $statefile = PVE::Storage::path($storecfg, $snap->{vmstate});
            vm_start($storecfg, $vmid, $statefile, undef, undef, undef, $forcemachine);
        }
    };

    lock_config($vmid, $phase_fn);

    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        PVE::Storage::volume_snapshot_rollback($storecfg, $drive->{file}, $snapname);
    });

    $preparing = 0;
    lock_config($vmid, $phase_fn);
}
5242
# Poll "query-savevm" once per second until it reports the status
# 'completed'. Dies if no status is reported or if the status is
# anything other than 'active' or 'completed'.
my $savevm_wait = sub {
    my ($vmid) = @_;

    while (1) {
        my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");

        die "savevm not active\n" if !$stat->{status};

        last if $stat->{status} eq 'completed';

        die "query-savevm returned status '$stat->{status}'\n"
            if $stat->{status} ne 'active';

        # still active - try again
        sleep(1);
    }
};
5260
# Create snapshot $snapname of VM $vmid.
#
# Prepares the snapshot section, optionally freezes the guest file
# systems (VM running, agent configured, no VM state saved), saves the
# VM state if one was allocated, snapshots all non-cdrom drives and
# finally commits the configuration. If anything fails, the snapshot
# is removed again and the original error is re-thrown.
sub snapshot_create {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap = $snapshot_prepare->($vmid, $snapname, $save_vmstate, $comment);

    my $config = load_config($vmid);

    my $running = check_running($vmid);

    # freezing is not needed if we save RAM
    my $freezefs = $snap->{vmstate} ? 0 : ($running && $config->{agent});

    # drives which already got a snapshot (needed for cleanup)
    my $done_drives = {};

    if ($freezefs) {
        eval { vm_mon_cmd($vmid, "guest-fsfreeze-freeze"); };
        warn "guest-fsfreeze-freeze problems - $@" if $@;
    }

    eval {
        # create internal snapshots of all drives

        my $storecfg = PVE::Storage::config();

        if ($running && $snap->{vmstate}) {
            my $path = PVE::Storage::path($storecfg, $snap->{vmstate});
            vm_mon_cmd($vmid, "savevm-start", statefile => $path);
            $savevm_wait->($vmid);
        } elsif ($running) {
            vm_mon_cmd($vmid, "savevm-start");
        }

        foreach_drive($snap, sub {
            my ($ds, $drive) = @_;

            return if drive_is_cdrom($drive);

            qemu_volume_snapshot($vmid, "drive-$ds", $storecfg, $drive->{file}, $snapname);
            $done_drives->{$ds} = 1;
        });
    };
    my $err = $@;

    if ($running) {
        eval { vm_mon_cmd($vmid, "savevm-end") };
        warn $@ if $@;

        if ($freezefs) {
            eval { vm_mon_cmd($vmid, "guest-fsfreeze-thaw"); };
            warn "guest-fsfreeze-thaw problems - $@" if $@;
        }

        # savevm-end is async, we need to wait
        while (1) {
            my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");
            last if !$stat->{bytes};

            print "savevm not yet finished\n";
            sleep(1);
        }
    }

    if ($err) {
        warn "snapshot create failed: starting cleanup\n";
        eval { snapshot_delete($vmid, $snapname, 0, $done_drives); };
        warn $@ if $@;
        die $err;
    }

    $snapshot_commit->($vmid, $snapname);
}
5342
5343 # Note: $drivehash is only set when called from snapshot_create.
# Delete snapshot $snapname of VM $vmid.
#
# $force     - warn about storage errors instead of dying; the
#              intermediate config updates are skipped in that case
# $drivehash - hash of drive names which actually got a snapshot. If
#              set, the lock and template checks are skipped, only the
#              listed drives are touched and the config lock entry is
#              removed at the end.
#
# Steps: mark the snapshot with snapstate 'delete', free the VM state
# volume, delete the volume snapshots, and finally drop the snapshot
# section and fix up the 'parent' references pointing to it.
sub snapshot_delete {
    my ($vmid, $snapname, $force, $drivehash) = @_;

    # true until the final cleanup step
    my $preparing = 1;

    my $snap;
    my $unused = [];

    # re-point (or drop) a 'parent' entry referring to the deleted snapshot
    my $relink_parent = sub {
        my ($section, $new_parent) = @_;

        return unless $section->{parent} && $section->{parent} eq $snapname;

        if ($new_parent) {
            $section->{parent} = $new_parent;
        } else {
            delete $section->{parent};
        }
    };

    my $update_locked = sub {
        my ($remove_drive) = @_;

        my $conf = load_config($vmid);

        if (!$drivehash) {
            check_lock($conf);
            die "you can't delete a snapshot if vm is a template\n"
                if is_template($conf);
        }

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        # remove parent refs
        if (!$preparing) {
            $relink_parent->($conf, $snap->{parent});
            for my $other (keys %{$conf->{snapshots}}) {
                next if $other eq $snapname;
                $relink_parent->($conf->{snapshots}->{$other}, $snap->{parent});
            }
        }

        if ($remove_drive) {
            if ($remove_drive eq 'vmstate') {
                delete $snap->{$remove_drive};
            } else {
                my $drive = parse_drive($remove_drive, $snap->{$remove_drive});
                my $volid = $drive->{file};
                delete $snap->{$remove_drive};
                add_unused_volume($conf, $volid);
            }
        }

        if ($preparing) {
            $snap->{snapstate} = 'delete';
        } else {
            delete $conf->{snapshots}->{$snapname};
            delete $conf->{lock} if $drivehash;
            add_unused_volume($conf, $_) for @$unused;
        }

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $update_locked);

    # now remove vmstate file

    my $storecfg = PVE::Storage::config();

    if ($snap->{vmstate}) {
        eval { PVE::Storage::vdisk_free($storecfg, $snap->{vmstate}); };
        if (my $err = $@) {
            die $err if !$force;
            warn $err;
        }
        # save changes (remove vmstate from snapshot)
        lock_config($vmid, $update_locked, 'vmstate') if !$force;
    }

    # now remove all internal snapshots
    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};

        if (!$drivehash || $drivehash->{$ds}) {
            eval { qemu_volume_snapshot_delete($vmid, "drive-$ds", $storecfg, $volid, $snapname); };
            if (my $err = $@) {
                die $err if !$force;
                warn $err;
            }
        }

        # save changes (remove drive from snapshot)
        lock_config($vmid, $update_locked, $ds) if !$force;
        push @$unused, $volid;
    });

    # now cleanup config
    $preparing = 0;
    lock_config($vmid, $update_locked);
}
5454
# Check whether all non-cdrom drives of a VM config support a storage feature.
#
# $feature, $snapname and $running are handed unchanged to
# PVE::Storage::volume_has_feature(), together with $storecfg and the volume
# ID of each drive found in $conf.
#
# Returns 1 if that call was true for every checked drive (also when no
# drive was checked at all), 0 as soon as one of them was false.
sub has_feature {
    my ($feature, $conf, $storecfg, $snapname, $running) = @_;

    my $unsupported = 0;

    my $check_drive = sub {
        my ($ds, $drive) = @_;

        # cdrom drives do not take part in the check
        return if drive_is_cdrom($drive);

        my $supported = PVE::Storage::volume_has_feature(
            $storecfg, $feature, $drive->{file}, $snapname, $running);
        $unsupported = 1 if !$supported;
    };

    foreach_drive($conf, $check_drive);

    return $unsupported ? 0 : 1;
}
5469
# Turn the disks of a VM into base volumes.
#
# Visits every drive of $conf, ignoring cdrom drives and - when $disk is
# given - every drive whose name differs from $disk. For each remaining
# drive whose volume reports the 'template' storage feature, the volume ID
# returned by PVE::Storage::vdisk_create_base() replaces the drive's file,
# the drive entry in $conf is regenerated and the config is written.
sub template_create {
    my ($vmid, $conf, $disk) = @_;

    my $storecfg = PVE::Storage::config();

    my $convert_drive = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);
        return if $disk && $disk ne $ds;

        my $volid = $drive->{file};
        my $can_template = PVE::Storage::volume_has_feature($storecfg, 'template', $volid);
        return if !$can_template;

        $drive->{file} = PVE::Storage::vdisk_create_base($storecfg, $volid);
        $conf->{$ds} = print_drive($vmid, $drive);

        # the config is written once per converted drive, not once at the end
        update_config_nolock($vmid, $conf, 1);
    };

    foreach_drive($conf, $convert_drive);
}
5490
# Tell whether a VM configuration describes a template.
#
# $conf is the VM configuration hash. Returns 1 if its 'template' entry is
# defined and numerically equal to 1, and 0 in every other case.
sub is_template {
    my ($conf) = @_;

    # Return an explicit value on both paths; previously the "not a template"
    # case fell off the end of the sub and leaked the result of the condition.
    return (defined($conf->{template}) && $conf->{template} == 1) ? 1 : 0;
}
5496
# Copy the content of one volume into another one using 'qemu-img convert'.
#
# Parameters:
#   $src_volid - volume ID to read from
#   $dst_volid - volume ID to write to ('-n' is passed, so qemu-img is told
#                not to create the target)
#   $size      - total size, only used to compute the progress output
#   $snapname  - optional snapshot name; it is used when resolving the source
#                path and, for qcow2 sources, additionally passed via '-s'
#
# Nothing is copied unless both volume IDs contain a storage ID.
# Dies with "copy failed: ..." if the qemu-img run fails.
sub qemu_img_convert {
    my ($src_volid, $dst_volid, $size, $snapname) = @_;

    my $storecfg = PVE::Storage::config();
    my ($src_storeid, $src_volname) = PVE::Storage::parse_volume_id($src_volid, 1);
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid, 1);

    if ($src_storeid && $dst_storeid) {
        my $source_scfg = PVE::Storage::storage_config($storecfg, $src_storeid);
        my $target_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

        my $src_format = qemu_img_format($source_scfg, $src_volname);
        my $dst_format = qemu_img_format($target_scfg, $dst_volname);

        my $src_path = PVE::Storage::path($storecfg, $src_volid, $snapname);
        my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

        # only qcow2 sources get the snapshot selected through '-s'
        my @snapshot_opts = ($snapname && $src_format eq "qcow2") ? ('-s', $snapname) : ();

        my $cmd = [
            '/usr/bin/qemu-img', 'convert', '-t', 'writeback', '-p', '-n',
            @snapshot_opts,
            '-f', $src_format, '-O', $dst_format, $src_path, $dst_path,
        ];

        # translate the "(NN/100%)" progress lines of qemu-img into byte counts
        my $report_progress = sub {
            my ($line) = @_;

            if (my ($percent) = $line =~ m/\((\S+)\/100\%\)/) {
                my $transferred = int($size * $percent / 100);
                my $remaining = $size - $transferred;

                print "transferred: $transferred bytes remaining: $remaining bytes total: $size bytes progression: $percent %\n";
            }
        };

        eval { run_command($cmd, timeout => undef, outfunc => $report_progress); };
        my $err = $@;
        die "copy failed: $err" if $err;
    }
}
5536
# Determine the image format name to use with qemu-img for a volume.
#
# $scfg is the storage configuration hash, $volname the volume name.
# Returns
#   - the file extension (raw, qcow2, qed or vmdk) if the storage has a
#     'path' and the volume name ends in one of these extensions,
#   - "host_device" if the storage type is 'iscsi',
#   - "raw" in all remaining cases.
sub qemu_img_format {
    my ($scfg, $volname) = @_;

    # the extension only counts on storages that have a 'path'
    if ($scfg->{path}) {
        my ($extension) = $volname =~ m/\.(raw|qcow2|qed|vmdk)$/;
        return $extension if defined $extension;
    }

    return ($scfg->{type} eq 'iscsi') ? "host_device" : "raw";
}
5548
# Mirror a drive of a running VM onto another volume with the QMP
# 'drive-mirror' block job and wait until source and target are in sync.
#
# Parameters:
#   $vmid      - ID of the VM the monitor commands are sent to
#   $drive     - drive name; the QMP device id is "drive-$drive"
#   $dst_volid - target volume ID (mode 'existing' is passed to
#                drive-mirror, so presumably the volume must already exist)
#   $vmiddst   - ID of the VM the copy is meant for
#
# If $vmiddst equals $vmid, the job is finished with 'block-job-complete'.
# Otherwise the job is cancelled once it is in sync.
#
# If the job does not settle within $maxwait polls after reaching the end,
# the guest is suspended so that it stops writing. It is resumed again
# before this sub returns or dies.
#
# Dies with "mirroring error: ..." on failure, after trying to cancel the job.
sub qemu_drive_mirror {
    my ($vmid, $drive, $dst_volid, $vmiddst) = @_;

    my $count = 0;
    my $frozen = undef;
    my $maxwait = 120;

    my $storecfg = PVE::Storage::config();
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid);

    # The result is not needed here. The call is kept so that any error it
    # raises for $dst_storeid still surfaces before the job is started.
    PVE::Storage::storage_config($storecfg, $dst_storeid);

    my $format;
    if ($dst_volname =~ m/\.(raw|qcow2)$/){
        $format = $1;
    }

    my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

    my $opts = { timeout => 10, device => "drive-$drive", mode => "existing", sync => "full", target => $dst_path };
    $opts->{format} = $format if $format;

    #fixme : sometime drive-mirror timeout, but works fine after.
    # (I have see the problem with big volume > 200GB), so we need to eval
    eval { vm_mon_cmd($vmid, "drive-mirror", %$opts); };
    # ignore errors here

    eval {
        while (1) {
            my $stats = vm_mon_cmd($vmid, "query-block-jobs");
            my $stat = @$stats[0];
            die "mirroring job seem to have die. Maybe do you have bad sectors?" if !$stat;
            die "error job is not mirroring" if $stat->{type} ne "mirror";

            my $busy = $stat->{busy};

            if (my $total = $stat->{len}) {
                my $transferred = $stat->{offset} || 0;
                my $remaining = $total - $transferred;
                my $percent = sprintf "%.2f", ($transferred * 100 / $total);

                print "transferred: $transferred bytes remaining: $remaining bytes total: $total bytes progression: $percent % busy: $busy\n";
            }

            if ($stat->{len} == $stat->{offset}) {
                if ($busy eq 'false') {

                    last if $vmiddst != $vmid;

                    # try to switch the disk if source and destination are on the same guest
                    eval { vm_mon_cmd($vmid, "block-job-complete", device => "drive-$drive") };
                    last if !$@;
                    die $@ if $@ !~ m/cannot be completed/;
                }

                # if too much writes to disk occurs at the end of migration
                # the disk needs to be freezed to be able to complete the migration
                # (suspend only once, not again on every following poll)
                if ($count > $maxwait && !$frozen) {
                    vm_suspend($vmid, 1);
                    $frozen = 1;
                }
                $count++;
            }
            sleep 1;
        }
    };
    my $err = $@;

    # Resume the guest whenever we froze it - also when the loop above died.
    # Otherwise a failed mirror would leave the VM suspended.
    if ($frozen) {
        eval { vm_resume($vmid, 1); };
        if (my $resume_err = $@) {
            if ($err) {
                # keep the original failure as the reported error
                warn $resume_err;
            } else {
                $err = $resume_err;
            }
        }
    }

    # cancel the block job and wait until it is gone from query-block-jobs
    my $cancel_job = sub {
        vm_mon_cmd($vmid, "block-job-cancel", device => "drive-$drive");
        while (1) {
            my $stats = vm_mon_cmd($vmid, "query-block-jobs");
            my $stat = @$stats[0];
            last if !$stat;
            sleep 1;
        }
    };

    if ($err) {
        # best effort cleanup, the mirroring error is what gets reported
        eval { &$cancel_job(); };
        die "mirroring error: $err";
    }

    if ($vmiddst != $vmid) {
        # if we clone a disk for a new target vm, we don't switch the disk
        &$cancel_job(); # so we call block-job-cancel
    }
}
5642
# Create a copy of a single VM drive for the VM $newvmid.
#
# Without $full, a linked clone is created with PVE::Storage::vdisk_clone().
# With $full, a new volume is allocated and filled with the source data:
#   - on storage $storage if given, else on the storage of the source volume
#   - in format $format if given, else the drive's format, else the storage
#     default; the storage default is also used when the chosen format is
#     not among the formats the storage reports as valid
#   - copied with qemu_drive_mirror() when the VM is $running and no
#     $snapname is given, with qemu_img_convert() otherwise
#
# Every newly created volume ID is pushed onto @$newvollist.
#
# Returns the drive hash for the new volume. Note that this is the very
# hash passed in as $drive: its 'file', 'size' and 'format' entries are
# overwritten in place.
sub clone_disk {
    my ($storecfg, $vmid, $running, $drivename, $drive, $snapname,
        $newvmid, $storage, $format, $full, $newvollist) = @_;

    my $src_volid = $drive->{file};
    my $newvolid;

    if ($full) {
        my ($storeid, $volname) = PVE::Storage::parse_volume_id($src_volid);
        $storeid = $storage if $storage;

        my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($storecfg, $storeid);
        $format ||= $drive->{format} || $defFormat;

        # test if requested format is supported - else use default
        unless (grep { $format eq $_ } @$validFormats) {
            $format = $defFormat;
        }

        my ($src_size) = PVE::Storage::volume_size_info($storecfg, $src_volid, 3);

        print "create full clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_alloc($storecfg, $storeid, $newvmid, $format, undef, ($src_size/1024));
        push @$newvollist, $newvolid;

        if ($running && !$snapname) {
            qemu_drive_mirror($vmid, $drivename, $newvolid, $newvmid);
        } else {
            qemu_img_convert($src_volid, $newvolid, $src_size, $snapname);
        }
    } else {
        print "create linked clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_clone($storecfg, $src_volid, $newvmid, $snapname);
        push @$newvollist, $newvolid;
    }

    my ($new_size) = PVE::Storage::volume_size_info($storecfg, $newvolid, 3);

    # the caller's drive hash is reused for the result
    $drive->{format} = undef;
    $drive->{file} = $newvolid;
    $drive->{size} = $new_size;

    return $drive;
}
5688
# this only works if VM is running
#
# Query the machine types of VM $vmid with the QMP command 'query-machines'
# and return the name of the entry flagged 'is-current'. If there is none,
# the name of the entry flagged 'is-default' is returned, and 'pc' if that
# is missing as well.
sub get_current_qemu_machine {
    my ($vmid) = @_;

    my $machines = vm_qmp_command($vmid, { execute => 'query-machines', arguments => {} });

    my %name_of;
    foreach my $machine (@$machines) {
        foreach my $flag ('is-default', 'is-current') {
            $name_of{$flag} = $machine->{name} if $machine->{$flag};
        }
    }

    # fallback to the default machine if current is not supported by qemu
    return $name_of{'is-current'} || $name_of{'is-default'} || 'pc';
}
5705
# Collect the PCI devices listed below "$pcisysfs/devices".
#
# Entry names are matched against "<4 hex>:<2 hex>:<2 hex>.<digit>". The
# "<2 hex>:<2 hex>" part is used as device id, the trailing digit as
# function.
#
# Returns a hash ref mapping each id to an array ref holding one
# { id => ..., function => ... } hash per matching entry.
sub lspci {

    my %functions_of;

    my $collect = sub {
        my (undef, $id, $function) = @_;
        push @{ $functions_of{$id} }, { id => $id, function => $function };
    };

    dir_glob_foreach("$pcisysfs/devices", '[a-f0-9]{4}:([a-f0-9]{2}:[a-f0-9]{2})\.([0-9])', $collect);

    return \%functions_of;
}
5718
5719 1;