]> git.proxmox.com Git - qemu-server.git/blob - PVE/QemuServer.pm
vm_deviceplug: always raise exception on error
[qemu-server.git] / PVE / QemuServer.pm
1 package PVE::QemuServer;
2
3 use strict;
4 use warnings;
5 use POSIX;
6 use IO::Handle;
7 use IO::Select;
8 use IO::File;
9 use IO::Dir;
10 use IO::Socket::UNIX;
11 use File::Basename;
12 use File::Path;
13 use File::stat;
14 use Getopt::Long;
15 use Digest::SHA;
16 use Fcntl ':flock';
17 use Cwd 'abs_path';
18 use IPC::Open3;
19 use JSON;
20 use Fcntl;
21 use PVE::SafeSyslog;
22 use Storable qw(dclone);
23 use PVE::Exception qw(raise raise_param_exc);
24 use PVE::Storage;
25 use PVE::Tools qw(run_command lock_file lock_file_full file_read_firstline dir_glob_foreach);
26 use PVE::JSONSchema qw(get_standard_option);
27 use PVE::Cluster qw(cfs_register_file cfs_read_file cfs_write_file cfs_lock_file);
28 use PVE::INotify;
29 use PVE::ProcFSTools;
30 use PVE::QMPClient;
31 use PVE::RPCEnvironment;
32 use Time::HiRes qw(gettimeofday);
33
# Result of PVE::ProcFSTools::read_cpuinfo(), fetched once when the module is loaded.
my $cpuinfo = PVE::ProcFSTools::read_cpuinfo();

# Note about locking: we use flock on the config file to protect
# against concurrent actions.
# Additionally, we have a 'lock' setting in the config file. This
# can be set to 'migrate', 'backup', 'snapshot' or 'rollback'. Most actions are not
# allowed when such a lock is set. But you can ignore this kind of
# lock with the --skiplock flag.

# Register the parser/writer pair for files below '/qemu-server/'.
cfs_register_file('/qemu-server/', \&parse_vm_config, \&write_vm_config);

# Standard options shared by several API calls.
PVE::JSONSchema::register_standard_option(
    'skiplock',
    {
        type => 'boolean',
        optional => 1,
        description => "Ignore locks - only root is allowed to use this option.",
    },
);

PVE::JSONSchema::register_standard_option(
    'pve-qm-stateuri',
    {
        type => 'string',
        maxLength => 128,
        optional => 1,
        description => "Some command save/restore state from this location.",
    },
);

PVE::JSONSchema::register_standard_option(
    'pve-snapshot-name',
    {
        type => 'string',
        format => 'pve-configid',
        maxLength => 40,
        description => "The name of the snapshot.",
    },
);
65
66 #no warnings 'redefine';
67
# Define the fairsched syscall numbers and the KVM_GET_API_VERSION ioctl
# request code. The whole section is skipped when _VZSYSCALLS_H_ is already
# defined, and every individual constant is only defined when missing.
#
# The constants are created with string eval so that they exist as
# prototyped constant subs only on the architecture that matches.
unless (defined(&_VZSYSCALLS_H_)) {
    eval 'sub _VZSYSCALLS_H_ () {1;}' unless defined(&_VZSYSCALLS_H_);
    require 'sys/syscall.ph';
    if (defined(&__x86_64__)) {
        eval 'sub __NR_fairsched_vcpus () {499;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_fairsched_mknod () {504;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {505;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {506;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {507;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {508;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_setluid () {501;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {502;}' unless defined(&__NR_setublimit);
    } elsif (defined(&__i386__)) {
        eval 'sub __NR_fairsched_mknod () {500;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {501;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {502;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {503;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {504;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_fairsched_vcpus () {505;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_setluid () {511;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {512;}' unless defined(&__NR_setublimit);
    } else {
        die("no fairsched syscall for this arch");
    }
    require 'asm/ioctl.ph';
    # The request number is written out in full as 0x00; a bare '0x' is not a
    # well-formed hexadecimal literal and a failure inside this string eval
    # would go unnoticed.
    eval 'sub KVM_GET_API_VERSION () { &_IO(0xAE, 0x00);}' unless defined(&KVM_GET_API_VERSION);
}
96
# Invoke the fairsched_mknod syscall. All three arguments are coerced to
# integers before the call; the syscall() result is returned unchanged.
sub fairsched_mknod {
    my ($parent, $weight, $desired) = @_;

    my @int_args = (int($parent), int($weight), int($desired));

    return syscall(&__NR_fairsched_mknod, @int_args);
}
102
# Invoke the fairsched_rmnod syscall with the integer value of $id and
# return the syscall() result.
sub fairsched_rmnod {
    my ($id) = @_;

    my $node_id = int($id);

    return syscall(&__NR_fairsched_rmnod, $node_id);
}
108
# Invoke the fairsched_mvpr syscall with the integer values of $pid and
# $newid and return the syscall() result.
sub fairsched_mvpr {
    my ($pid, $newid) = @_;

    my @int_args = (int($pid), int($newid));

    return syscall(&__NR_fairsched_mvpr, @int_args);
}
114
# Invoke the fairsched_vcpus syscall with the integer values of $id and
# $vcpus and return the syscall() result.
sub fairsched_vcpus {
    my ($id, $vcpus) = @_;

    my @int_args = (int($id), int($vcpus));

    return syscall(&__NR_fairsched_vcpus, @int_args);
}
120
# Invoke the fairsched_rate syscall. $op is one of the FAIRSCHED_*_RATE
# constants; all arguments are coerced to integers. Returns the syscall()
# result.
sub fairsched_rate {
    my ($id, $op, $rate) = @_;

    my @int_args = (int($id), int($op), int($rate));

    return syscall(&__NR_fairsched_rate, @int_args);
}
126
# Operation codes passed as $op to fairsched_rate().
use constant {
    FAIRSCHED_SET_RATE  => 0,
    FAIRSCHED_DROP_RATE => 1,
    FAIRSCHED_GET_RATE  => 2,
};

# Apply a CPU limit to fairsched node $id.
#
# $limit is scaled by 1024/100 and truncated to an integer. A non-zero
# result is set as the rate; a zero result drops the rate instead.
# Returns the result of fairsched_rate().
sub fairsched_cpulimit {
    my ($id, $limit) = @_;

    my $rate = int($limit * 1024 / 100);

    if ($rate) {
        return fairsched_rate($id, FAIRSCHED_SET_RATE, $rate);
    }

    return fairsched_rate($id, FAIRSCHED_DROP_RATE, $rate);
}
139
# Paths used throughout this module.
my $nodename = PVE::INotify::nodename();
my $confdir = "/etc/pve/nodes/$nodename/qemu-server";
my $var_run_tmpdir = "/var/run/qemu-server";
my $lock_dir = "/var/lock/qemu-server";
my $pcisysfs = "/sys/bus/pci";

# Create the directories at load time. The node directory comes first because
# $confdir lives below it. mkdir results are deliberately not checked.
mkdir $_ foreach ("/etc/pve/nodes/$nodename", $confdir, $var_run_tmpdir, $lock_dir);
153
# Schema of the VM configuration options: option name => JSON schema fragment.
# Indexed options (netN, ideN, ...) are added to this hash further down.
# The description strings are user-facing documentation.
my $confdesc = {
    iothread => {
        optional => 1,
        type => 'boolean',
        description => "Enable iothread dataplane.",
        default => 0,
    },
    onboot => {
        optional => 1,
        type => 'boolean',
        description => "Specifies whether a VM will be started during system bootup.",
        default => 0,
    },
    autostart => {
        optional => 1,
        type => 'boolean',
        description => "Automatic restart after crash (currently ignored).",
        default => 0,
    },
    hotplug => {
        optional => 1,
        type => 'boolean',
        description => "Allow hotplug for disk and network device",
        default => 0,
    },
    reboot => {
        optional => 1,
        type => 'boolean',
        description => "Allow reboot. If set to '0' the VM exit on reboot.",
        default => 1,
    },
    lock => {
        optional => 1,
        type => 'string',
        description => "Lock/unlock the VM.",
        enum => [qw(migrate backup snapshot rollback)],
    },
    cpulimit => {
        optional => 1,
        type => 'integer',
        description => "Limit of CPU usage in per cent. Note if the computer has 2 CPUs, it has total of 200% CPU time. Value '0' indicates no CPU limit.\n\nNOTE: This option is currently ignored.",
        minimum => 0,
        default => 0,
    },
    cpuunits => {
        optional => 1,
        type => 'integer',
        description => "CPU weight for a VM. Argument is used in the kernel fair scheduler. The larger the number is, the more CPU time this VM gets. Number is relative to weights of all the other running VMs.\n\nNOTE: You can disable fair-scheduler configuration by setting this to 0.",
        minimum => 0,
        maximum => 500000,
        default => 1000,
    },
    memory => {
        optional => 1,
        type => 'integer',
        description => "Amount of RAM for the VM in MB. This is the maximum available memory when you use the balloon device.",
        minimum => 16,
        default => 512,
    },
    balloon => {
        optional => 1,
        type => 'integer',
        description => "Amount of target RAM for the VM in MB. Using zero disables the balloon driver.",
        minimum => 0,
    },
    shares => {
        optional => 1,
        type => 'integer',
        description => "Amount of memory shares for auto-ballooning. The larger the number is, the more memory this VM gets. Number is relative to weights of all other running VMs. Using zero disables auto-ballooning",
        minimum => 0,
        maximum => 50000,
        default => 1000,
    },
    keyboard => {
        optional => 1,
        type => 'string',
        description => "Keyboard layout for vnc server. Default is read from the datacenter configuration file.",
        enum => PVE::Tools::kvmkeymaplist(),
        default => 'en-us',
    },
    name => {
        optional => 1,
        type => 'string', format => 'dns-name',
        description => "Set a name for the VM. Only used on the configuration web interface.",
    },
    scsihw => {
        optional => 1,
        type => 'string',
        description => "scsi controller model",
        enum => [qw(lsi lsi53c810 virtio-scsi-pci megasas pvscsi)],
        default => 'lsi',
    },
    description => {
        optional => 1,
        type => 'string',
        description => "Description for the VM. Only used on the configuration web interface. This is saved as comment inside the configuration file.",
    },
    ostype => {
        optional => 1,
        type => 'string',
        enum => [qw(other wxp w2k w2k3 w2k8 wvista win7 win8 l24 l26 solaris)],
        description => <<EODESC,
Used to enable special optimization/features for specific
operating systems:

other => unspecified OS
wxp => Microsoft Windows XP
w2k => Microsoft Windows 2000
w2k3 => Microsoft Windows 2003
w2k8 => Microsoft Windows 2008
wvista => Microsoft Windows Vista
win7 => Microsoft Windows 7
win8 => Microsoft Windows 8/2012
l24 => Linux 2.4 Kernel
l26 => Linux 2.6/3.X Kernel
solaris => solaris/opensolaris/openindiana kernel

other|l24|l26|solaris ... no special behaviour
wxp|w2k|w2k3|w2k8|wvista|win7|win8 ... use --localtime switch
EODESC
    },
    boot => {
        optional => 1,
        type => 'string',
        description => "Boot on floppy (a), hard disk (c), CD-ROM (d), or network (n).",
        pattern => '[acdn]{1,4}',
        default => 'cdn',
    },
    bootdisk => {
        optional => 1,
        type => 'string', format => 'pve-qm-bootdisk',
        description => "Enable booting from specified disk.",
        pattern => '(ide|sata|scsi|virtio)\d+',
    },
    smp => {
        optional => 1,
        type => 'integer',
        description => "The number of CPUs. Please use option -sockets instead.",
        minimum => 1,
        default => 1,
    },
    sockets => {
        optional => 1,
        type => 'integer',
        description => "The number of CPU sockets.",
        minimum => 1,
        default => 1,
    },
    cores => {
        optional => 1,
        type => 'integer',
        description => "The number of cores per socket.",
        minimum => 1,
        default => 1,
    },
    numa => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable Numa.",
        default => 0,
    },
    maxcpus => {
        optional => 1,
        type => 'integer',
        description => "Maximum cpus for hotplug.",
        minimum => 1,
        default => 1,
    },
    acpi => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable ACPI.",
        default => 1,
    },
    agent => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable Qemu GuestAgent.",
        default => 0,
    },
    kvm => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable KVM hardware virtualization.",
        default => 1,
    },
    tdf => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable time drift fix.",
        default => 0,
    },
    localtime => {
        optional => 1,
        type => 'boolean',
        description => "Set the real time clock to local time. This is enabled by default if ostype indicates a Microsoft OS.",
    },
    freeze => {
        optional => 1,
        type => 'boolean',
        description => "Freeze CPU at startup (use 'c' monitor command to start execution).",
    },
    vga => {
        optional => 1,
        type => 'string',
        description => "Select VGA type. If you want to use high resolution modes (>= 1280x1024x16) then you should use option 'std' or 'vmware'. Default is 'std' for win8/win7/w2k8, and 'cirrus' for other OS types. Option 'qxl' enables the SPICE display server. You can also run without any graphic card using a serial device as terminal.",
        enum => [qw(std cirrus vmware qxl serial0 serial1 serial2 serial3 qxl2 qxl3 qxl4)],
    },
    watchdog => {
        optional => 1,
        type => 'string', format => 'pve-qm-watchdog',
        typetext => '[[model=]i6300esb|ib700] [,[action=]reset|shutdown|poweroff|pause|debug|none]',
        description => "Create a virtual hardware watchdog device. Once enabled (by a guest action), the watchdog must be periodically polled by an agent inside the guest or else the guest will be restarted (or execute the action specified)",
    },
    startdate => {
        optional => 1,
        type => 'string',
        typetext => "(now | YYYY-MM-DD | YYYY-MM-DDTHH:MM:SS)",
        description => "Set the initial date of the real time clock. Valid format for date are: 'now' or '2006-06-17T16:01:21' or '2006-06-17'.",
        pattern => '(now|\d{4}-\d{1,2}-\d{1,2}(T\d{1,2}:\d{1,2}:\d{1,2})?)',
        default => 'now',
    },
    startup => {
        optional => 1,
        type => 'string', format => 'pve-qm-startup',
        typetext => '[[order=]\d+] [,up=\d+] [,down=\d+] ',
        description => "Startup and shutdown behavior. Order is a non-negative number defining the general startup order. Shutdown is done with reverse ordering. Additionally you can set the 'up' or 'down' delay in seconds, which specifies a delay to wait before the next VM is started or stopped.",
    },
    template => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable Template.",
        default => 0,
    },
    args => {
        optional => 1,
        type => 'string',
        description => <<EODESCR,
Note: this option is for experts only. It allows you to pass arbitrary arguments to kvm, for example:

args: -no-reboot -no-hpet
EODESCR
    },
    tablet => {
        optional => 1,
        type => 'boolean',
        default => 1,
        description => "Enable/disable the usb tablet device. This device is usually needed to allow absolute mouse positioning with VNC. Else the mouse runs out of sync with normal VNC clients. If you're running lots of console-only guests on one host, you may consider disabling this to save some context switches. This is turned off by default if you use spice (vga=qxl).",
    },
    migrate_speed => {
        optional => 1,
        type => 'integer',
        description => "Set maximum speed (in MB/s) for migrations. Value 0 is no limit.",
        minimum => 0,
        default => 0,
    },
    migrate_downtime => {
        optional => 1,
        type => 'number',
        description => "Set maximum tolerated downtime (in seconds) for migrations.",
        minimum => 0,
        default => 0.1,
    },
    cdrom => {
        optional => 1,
        type => 'string', format => 'pve-qm-drive',
        typetext => 'volume',
        description => "This is an alias for option -ide2",
    },
    cpu => {
        optional => 1,
        description => "Emulated CPU type.",
        type => 'string',
        enum => [ qw(486 athlon pentium pentium2 pentium3 coreduo core2duo kvm32 kvm64 qemu32 qemu64 phenom Conroe Penryn Nehalem Westmere SandyBridge Haswell Broadwell Opteron_G1 Opteron_G2 Opteron_G3 Opteron_G4 Opteron_G5 host) ],
        default => 'kvm64',
    },
    parent => get_standard_option('pve-snapshot-name', {
        optional => 1,
        description => "Parent snapshot name. This is used internally, and should not be modified.",
    }),
    snaptime => {
        optional => 1,
        description => "Timestamp for snapshots.",
        type => 'integer',
        minimum => 0,
    },
    vmstate => {
        optional => 1,
        type => 'string', format => 'pve-volume-id',
        description => "Reference to a volume which stores the VM state. This is used internally for snapshots.",
    },
    machine => {
        description => "Specify the Qemu machine type.",
        type => 'string',
        pattern => '(pc|pc(-i440fx)?-\d+\.\d+|q35|pc-q35-\d+\.\d+)',
        maxLength => 40,
        optional => 1,
    },
    smbios1 => {
        description => "Specify SMBIOS type 1 fields.",
        type => 'string', format => 'pve-qm-smbios1',
        typetext => "[manufacturer=str][,product=str][,version=str][,serial=str] [,uuid=uuid][,sku=str][,family=str]",
        maxLength => 256,
        optional => 1,
    },
};
460
461 # what about other qemu settings ?
462 #cpu => 'string',
463 #machine => 'string',
464 #fda => 'file',
465 #fdb => 'file',
466 #mtdblock => 'file',
467 #sd => 'file',
468 #pflash => 'file',
469 #snapshot => 'bool',
470 #bootp => 'file',
471 ##tftp => 'dir',
472 ##smb => 'dir',
473 #kernel => 'file',
474 #append => 'string',
475 #initrd => 'file',
476 ##soundhw => 'string',
477
# Publish every option defined in $confdesc so far as standard option
# "pve-qm-<name>". Options added to $confdesc later are not covered.
foreach my $opt (keys %$confdesc) {
    PVE::JSONSchema::register_standard_option("pve-qm-$opt", $confdesc->{$opt});
}
481
# Upper bounds for the indexed configuration options (indices run 0 .. MAX-1).
my $MAX_IDE_DISKS = 4;
my $MAX_SCSI_DISKS = 14;
my $MAX_VIRTIO_DISKS = 16;
my $MAX_SATA_DISKS = 6;
my $MAX_USB_DEVICES = 5;
my $MAX_NETS = 32;
my $MAX_UNUSED_DISKS = 8;
my $MAX_HOSTPCI_DEVICES = 4;
my $MAX_SERIAL_PORTS = 4;
my $MAX_PARALLEL_PORTS = 3;
my $MAX_NUMA = 8;

# Schema shared by all numaN options.
my $numadesc = {
    optional => 1,
    type => 'string',
    format => 'pve-qm-numanode',
    typetext => "cpus=<id[-id],memory=<mb>[[,hostnodes=<id[-id]>][,policy=<preferred|bind|interleave>]]",
    description => "numa topology",
};
PVE::JSONSchema::register_standard_option("pve-qm-numanode", $numadesc);

$confdesc->{"numa$_"} = $numadesc foreach (0 .. $MAX_NUMA - 1);
505
# Supported NIC models; the sorted list is interpolated into the help text below.
my $nic_model_list = [
    qw(rtl8139 ne2k_pci e1000 pcnet virtio ne2k_isa i82551 i82557b i82559er vmxnet3)
];
my $nic_model_list_txt = join(' ', sort @$nic_model_list);

# Schema shared by all netN options.
my $netdesc = {
    optional => 1,
    type => 'string',
    format => 'pve-qm-net',
    typetext => "MODEL=XX:XX:XX:XX:XX:XX [,bridge=<dev>][,queues=<nbqueues>][,rate=<mbps>][,tag=<vlanid>][,firewall=0|1]",
    description => <<EODESCR,
Specify network devices.

MODEL is one of: $nic_model_list_txt

XX:XX:XX:XX:XX:XX should be an unique MAC address. This is
automatically generated if not specified.

The bridge parameter can be used to automatically add the interface to a bridge device. The Proxmox VE standard bridge is called 'vmbr0'.

Option 'rate' is used to limit traffic bandwidth from and to this interface. It is specified as floating point number, unit is 'Megabytes per second'.

If you specify no bridge, we create a kvm 'user' (NATed) network device, which provides DHCP and DNS services. The following addresses are used:

10.0.2.2 Gateway
10.0.2.3 DNS Server
10.0.2.4 SMB Server

The DHCP server assign addresses to the guest starting from 10.0.2.15.

EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-net", $netdesc);

$confdesc->{"net$_"} = $netdesc foreach (0 .. $MAX_NETS - 1);
541
# Set of valid drive option names ("ide0", "scsi3", ...), filled in below
# when the indexed options are registered.
my $drivename_hash;

# Property-string synopsis shared verbatim by the ide/scsi/sata/virtio options.
my $drive_option_typetext = '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads] [,discard=ignore|on]';

my $idedesc = {
    optional => 1,
    type => 'string',
    format => 'pve-qm-drive',
    typetext => $drive_option_typetext,
    description => sprintf("Use volume as IDE hard disk or CD-ROM (n is 0 to %d).", $MAX_IDE_DISKS - 1),
};
PVE::JSONSchema::register_standard_option("pve-qm-ide", $idedesc);

my $scsidesc = {
    optional => 1,
    type => 'string',
    format => 'pve-qm-drive',
    typetext => $drive_option_typetext,
    description => sprintf("Use volume as SCSI hard disk or CD-ROM (n is 0 to %d).", $MAX_SCSI_DISKS - 1),
};
PVE::JSONSchema::register_standard_option("pve-qm-scsi", $scsidesc);

my $satadesc = {
    optional => 1,
    type => 'string',
    format => 'pve-qm-drive',
    typetext => $drive_option_typetext,
    description => sprintf("Use volume as SATA hard disk or CD-ROM (n is 0 to %d).", $MAX_SATA_DISKS - 1),
};
PVE::JSONSchema::register_standard_option("pve-qm-sata", $satadesc);

my $virtiodesc = {
    optional => 1,
    type => 'string',
    format => 'pve-qm-drive',
    typetext => $drive_option_typetext,
    description => sprintf("Use volume as VIRTIO hard disk (n is 0 to %d).", $MAX_VIRTIO_DISKS - 1),
};
PVE::JSONSchema::register_standard_option("pve-qm-virtio", $virtiodesc);
575
# Schema shared by all usbN options.
my $usbdesc = {
    optional => 1,
    type => 'string',
    format => 'pve-qm-usb-device',
    typetext => 'host=HOSTUSBDEVICE|spice',
    description => <<EODESCR,
Configure an USB device (n is 0 to 4). This can be used to
pass-through usb devices to the guest. HOSTUSBDEVICE syntax is:

'bus-port(.port)*' (decimal numbers) or
'vendor_id:product_id' (hexadeciaml numbers)

You can use the 'lsusb -t' command to list existing usb devices.

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

The value 'spice' can be used to add a usb redirection devices for spice.

EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-usb", $usbdesc);
596
# Schema shared by all hostpciN options.
my $hostpcidesc = {
    optional => 1,
    type => 'string',
    format => 'pve-qm-hostpci',
    typetext => "[host=]HOSTPCIDEVICE [,driver=kvm|vfio] [,rombar=on|off] [,pcie=0|1] [,x-vga=on|off]",
    description => <<EODESCR,
Map host pci devices. HOSTPCIDEVICE syntax is:

'bus:dev.func' (hexadecimal numbers)

You can us the 'lspci' command to list existing pci devices.

The 'rombar' option determines whether or not the device's ROM will be visible in the guest's memory map (default is 'on').

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-hostpci", $hostpcidesc);
616
# Schema shared by all serialN options: either a host device path below
# /dev/ or the literal word 'socket'.
my $serialdesc = {
    optional => 1,
    type => 'string',
    pattern => '(/dev/.+|socket)',
    description => <<EODESCR,
Create a serial device inside the VM (n is 0 to 3), and pass through a host serial device (i.e. /dev/ttyS0), or create a unix socket on the host side (use 'qm terminal' to open a terminal connection).

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};
629
# Schema shared by all parallelN options: a host parport or USB printer device.
my $paralleldesc = {
    optional => 1,
    type => 'string',
    pattern => '/dev/parport\d+|/dev/usb/lp\d+',
    description => <<EODESCR,
Map host parallel devices (n is 0 to 2).

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};
642
# Add the indexed options (parallel0.., serial0.., hostpci0.., ...) to
# $confdesc. All indices of one family share the same schema hash.
$confdesc->{"parallel$_"} = $paralleldesc foreach (0 .. $MAX_PARALLEL_PORTS - 1);

$confdesc->{"serial$_"} = $serialdesc foreach (0 .. $MAX_SERIAL_PORTS - 1);

$confdesc->{"hostpci$_"} = $hostpcidesc foreach (0 .. $MAX_HOSTPCI_DEVICES - 1);

# Drive options are additionally recorded in $drivename_hash.
foreach my $i (0 .. $MAX_IDE_DISKS - 1) {
    $drivename_hash->{"ide$i"} = 1;
    $confdesc->{"ide$i"} = $idedesc;
}

foreach my $i (0 .. $MAX_SATA_DISKS - 1) {
    $drivename_hash->{"sata$i"} = 1;
    $confdesc->{"sata$i"} = $satadesc;
}

foreach my $i (0 .. $MAX_SCSI_DISKS - 1) {
    $drivename_hash->{"scsi$i"} = 1;
    $confdesc->{"scsi$i"} = $scsidesc;
}

foreach my $i (0 .. $MAX_VIRTIO_DISKS - 1) {
    $drivename_hash->{"virtio$i"} = 1;
    $confdesc->{"virtio$i"} = $virtiodesc;
}

$confdesc->{"usb$_"} = $usbdesc foreach (0 .. $MAX_USB_DEVICES - 1);
678
# Schema shared by all unusedN options.
my $unuseddesc = {
    optional => 1,
    type => 'string',
    format => 'pve-volume-id',
    description => "Reference to unused volumes.",
};

$confdesc->{"unused$_"} = $unuseddesc foreach (0 .. $MAX_UNUSED_DISKS - 1);
688
# Cached result of kvm_version(); 0 means "not determined yet".
my $kvm_api_version = 0;

# Return the KVM API version reported by the KVM_GET_API_VERSION ioctl on
# /dev/kvm. Returns 0 when /dev/kvm cannot be opened. A non-zero result is
# cached, so the device is only queried until the first success.
sub kvm_version {
    return $kvm_api_version if $kvm_api_version;

    my $fh = IO::File->new("</dev/kvm");
    return 0 if !$fh;

    my $version = $fh->ioctl(KVM_GET_API_VERSION(), 0);
    $kvm_api_version = $version if $version;

    $fh->close();

    return $kvm_api_version;
}
706
# Cached result of kvm_user_version().
my $kvm_user_version;

# Return the version string printed in the first line of `kvm -help`
# (for example "2.1" or "2.1.3"), or 'unknown' when that line does not match.
# The result is cached after the first call.
sub kvm_user_version {
    return $kvm_user_version if $kvm_user_version;

    my $help_text = `kvm -help 2>/dev/null`;

    $kvm_user_version =
        ($help_text =~ m/^QEMU( PC)? emulator version (\d+\.\d+(\.\d+)?)[,\s]/)
        ? $2
        : 'unknown';

    return $kvm_user_version;
}
724
725 my $kernel_has_vhost_net = -c '/dev/vhost-net';
726
# Return the list of all drive option names: ide*, then scsi*, then virtio*,
# then sata*.
sub disknames {
    my ($ide_last, $scsi_last, $virtio_last, $sata_last) =
        map { $_ - 1 } ($MAX_IDE_DISKS, $MAX_SCSI_DISKS, $MAX_VIRTIO_DISKS, $MAX_SATA_DISKS);

    # order is important - used to autoselect boot disk
    return (
        (map { "ide$_" } (0 .. $ide_last)),
        (map { "scsi$_" } (0 .. $scsi_last)),
        (map { "virtio$_" } (0 .. $virtio_last)),
        (map { "sata$_" } (0 .. $sata_last)),
    );
}
734
# True when $dev is one of the registered drive option names (ideN, sataN,
# scsiN, virtioN).
sub valid_drivename {
    my ($dev) = @_;

    return defined($drivename_hash->{$dev});
}
740
# True when $key is a known configuration option, i.e. has an entry in $confdesc.
sub option_exists {
    my ($key) = @_;

    return defined($confdesc->{$key});
}
745
# Return the array reference holding the supported NIC model names.
# The reference itself is returned, not a copy.
sub nic_models {
    my $models = $nic_model_list;

    return $models;
}
749
# Return a hash reference mapping ostype identifiers to human-readable
# operating system names. A fresh hash is built on every call.
#
# NOTE(review): the 'ostype' option also accepts 'solaris', which has no
# entry here - confirm whether callers expect one.
sub os_list_description {

    return {
        other => 'Other',
        wxp => 'Windows XP',
        w2k => 'Windows 2000',
        w2k3 => 'Windows 2003',
        w2k8 => 'Windows 2008',
        wvista => 'Windows Vista',
        win7 => 'Windows 7',
        win8 => 'Windows 8/2012',
        l24 => 'Linux 2.4',
        l26 => 'Linux 2.6',
    };
}
765
# Cached result of get_cdrom_path().
my $cdrom_path;

# Return the first of /dev/cdrom, /dev/cdrom1, /dev/cdrom2 that is a
# symbolic link, caching a successful lookup. Returns undef when none of
# them is a symlink (previously the result of the last failed file test
# leaked out as the return value).
sub get_cdrom_path {

    return $cdrom_path if $cdrom_path;

    foreach my $candidate (qw(/dev/cdrom /dev/cdrom1 /dev/cdrom2)) {
        return $cdrom_path = $candidate if -l $candidate;
    }

    return undef;
}
776
# Resolve the 'file' value of a CD-ROM drive to a path:
#   'cdrom'        -> result of get_cdrom_path()
#   'none'         -> empty string
#   absolute path  -> returned unchanged
#   anything else  -> treated as volume ID and resolved via PVE::Storage::path()
# $vmid is accepted but not used here.
sub get_iso_path {
    my ($storecfg, $vmid, $cdrom) = @_;

    return get_cdrom_path() if $cdrom eq 'cdrom';
    return '' if $cdrom eq 'none';
    return $cdrom if $cdrom =~ m|^/|;

    return PVE::Storage::path($storecfg, $cdrom);
}
790
# Try to convert old style file names to volume IDs.
#
# 'none', 'cdrom', /dev/ paths and values that already look like
# "storage:volume" are returned unchanged. Any other value containing a
# slash yields undef. A plain file name becomes "local:iso/<file>" for
# media 'cdrom' and "local:<vmid>/<file>" otherwise.
sub filename_to_volume_id {
    my ($vmid, $file, $media) = @_;

    return $file if $file eq 'none' || $file eq 'cdrom';
    return $file if $file =~ m|^/dev/.+| || $file =~ m/^([^:]+):(.+)$/;

    return undef if $file =~ m|/|;

    return "local:iso/$file" if $media && $media eq 'cdrom';

    return "local:$vmid/$file";
}
809
# Check that storage content type $vtype fits the drive's media type.
#
# Media 'disk' expects 'images', media 'cdrom' expects 'iso'. Nothing is
# checked when $media is false. Dies with "internal error" for any other
# media value and raises a parameter exception keyed by $opt on mismatch.
sub verify_media_type {
    my ($opt, $vtype, $media) = @_;

    return if !$media;

    my %expected_type_for = (
        disk => 'images',
        cdrom => 'iso',
    );

    my $etype = $expected_type_for{$media};
    die "internal error" if !defined($etype);

    return if ($vtype eq $etype);

    raise_param_exc({ $opt => "unexpected media type ($vtype != $etype)" });
}
828
# Normalize $drive->{file} in place.
#
# A value that is not 'cdrom'/'none', not a /dev/ path, not already a
# "storage:volume" ID and not purely numeric is treated as a filesystem
# path and converted to a volume ID via PVE::Storage::path_to_volume_id();
# a parameter exception keyed by $opt is raised when no storage matches.
# Media defaults to 'cdrom' for iso volumes and for 'cdrom'/'none'.
sub cleanup_drive_path {
    my ($opt, $storecfg, $drive) = @_;

    my $file = $drive->{file};

    # try to convert filesystem paths to volume IDs
    my $already_normalized =
        $file =~ m/^(cdrom|none)$/ ||
        $file =~ m|^/dev/.+| ||
        $file =~ m/^([^:]+):(.+)$/ ||
        $file =~ m/^\d+$/;

    if (!$already_normalized) {
        my ($vtype, $volid) = PVE::Storage::path_to_volume_id($storecfg, $file);
        raise_param_exc({ $opt => "unable to associate path '$file' to any storage"}) if !$vtype;
        $drive->{media} = 'cdrom' if !$drive->{media} && $vtype eq 'iso';
        verify_media_type($opt, $vtype, $drive->{media});
        $drive->{file} = $volid;
    }

    $drive->{media} = 'cdrom' if !$drive->{media} && $drive->{file} =~ m/^(cdrom|none)$/;
}
847
# Write a new configuration file for $vmid from the $settings hash
# (no locking is done here).
#
# Dies if the configuration file already exists. Missing 'name' and
# 'memory' settings are filled in ("vm<vmid>" and the default memory);
# note that this modifies the caller's $settings hash. Keys that are not
# known options are skipped, as are undefined or empty values.
sub create_conf_nolock {
    my ($vmid, $settings) = @_;

    my $filename = config_file($vmid);

    die "configuration file '$filename' already exists\n" if -f $filename;

    my $defaults = load_defaults();

    $settings->{name} = "vm$vmid" if !$settings->{name};
    $settings->{memory} = $defaults->{memory} if !$settings->{memory};

    my $data = '';
    foreach my $opt (keys %$settings) {
        next if !$confdesc->{$opt};

        my $value = $settings->{$opt};
        # Only skip unset values. An explicit 0 (e.g. kvm => 0, acpi => 0,
        # balloon => 0) is a real setting and must reach the config file.
        next if !defined($value) || $value eq '';

        $data .= "$opt: $value\n";
    }

    PVE::Tools::file_set_contents($filename, $data);
}
872
# Parse a size such as "512", "1.5M" or "32G" into an integer number of
# bytes. The optional suffix K/M/G multiplies by 1024, 1024^2 or 1024^3.
# Returns undef when the value does not have that form.
my $parse_size = sub {
    my ($value) = @_;

    return undef if $value !~ m/^(\d+(\.\d+)?)([KMG])?$/;
    my ($size, $unit) = ($1, $3);

    my %factor_for = (
        K => 1024,
        M => 1024 * 1024,
        G => 1024 * 1024 * 1024,
    );

    $size = $size * $factor_for{$unit} if $unit;

    return int($size);
};
889
# Format a byte count using the largest of the units K, M, G (powers of
# 1024) that divides it exactly. A value that is not a multiple of 1024 is
# returned as a plain integer; a multiple of 1024^3 (including 0) gets the
# 'G' suffix.
my $format_size = sub {
    my ($size) = @_;

    my $amount = int($size);
    my $suffix = '';

    foreach my $next_suffix (qw(K M G)) {
        my $scaled = int($amount / 1024);
        last if $scaled * 1024 != $amount;
        ($amount, $suffix) = ($scaled, $next_suffix);
    }

    return $amount if $suffix eq '';

    return "${amount}${suffix}";
};
906
# ideX = [volume=]volume-id[,media=d][,cyls=c,heads=h,secs=s[,trans=t]]
#        [,snapshot=on|off][,cache=on|off][,format=f][,backup=yes|no]
#        [,rerror=ignore|report|stop][,werror=enospc|ignore|report|stop]
#        [,aio=native|threads][,discard=ignore|on]

# Parse a drive property string into a hash reference.
#
# $key is the option name (e.g. "ide0"); it supplies 'interface' and
# 'index'. $key may be undefined, which is used to verify JSON parameters.
# $data is the comma separated property string. A single property without
# '=' is taken as the file/volume. bps* values are converted to mbps*
# (three decimals). The 'format' entry is overwritten from a known file
# extension, and 'size' is converted to bytes.
#
# Returns undef when the key or any property is invalid. Note that most
# value checks only apply to true values, so e.g. "cyls=0" passes.
sub parse_drive {
    my ($key, $data) = @_;

    my $res = {};

    # $key may be undefined - used to verify JSON parameters
    if (!defined($key)) {
        # should not harm when used to verify parameters
        @$res{qw(interface index)} = ('unknown', 0);
    } elsif ($key =~ m/^([^\d]+)(\d+)$/) {
        @$res{qw(interface index)} = ($1, $2);
    } else {
        return undef;
    }

    foreach my $part (split(/,/, $data)) {
        next if $part =~ m/^\s*$/;

        if ($part =~ m/^(file|volume|cyls|heads|secs|trans|media|snapshot|cache|format|rerror|werror|backup|aio|bps|mbps|mbps_max|bps_rd|mbps_rd|mbps_rd_max|bps_wr|mbps_wr|mbps_wr_max|iops|iops_max|iops_rd|iops_rd_max|iops_wr|iops_wr_max|size|discard)=(.+)$/) {
            my ($name, $value) = ($1, $2);

            $name = 'file' if $name eq 'volume';

            return undef if defined $res->{$name};

            # bytes per second are stored as megabytes per second
            if ($name eq 'bps' || $name eq 'bps_rd' || $name eq 'bps_wr') {
                return undef if !$value || $value !~ m/^\d+/;
                $name = "m$name";
                $value = sprintf("%.3f", $value / (1024*1024));
            }
            $res->{$name} = $value;
        } elsif (!$res->{file} && $part !~ m/=/) {
            # a bare value is the file/volume, but only once
            $res->{file} = $part;
        } else {
            return undef;
        }
    }

    return undef if !$res->{file};

    if ($res->{file} =~ m/\.(raw|cow|qcow|qcow2|vmdk|cloop)$/) {
        $res->{format} = $1;
    }

    # Each entry: pattern, followed by the properties whose (true) value
    # has to match it.
    my @value_checks = (
        [ qr/^(off|none|writethrough|writeback|unsafe|directsync)$/, qw(cache) ],
        [ qr/^(on|off)$/, qw(snapshot) ],
        [ qr/^\d+$/, qw(cyls heads secs) ],
        [ qr/^(disk|cdrom)$/, qw(media) ],
        [ qr/^(none|lba|auto)$/, qw(trans) ],
        [ qr/^(raw|cow|qcow|qcow2|vmdk|cloop)$/, qw(format) ],
        [ qr/^(ignore|report|stop)$/, qw(rerror) ],
        [ qr/^(enospc|ignore|report|stop)$/, qw(werror) ],
        [ qr/^(yes|no)$/, qw(backup) ],
        [ qr/^(native|threads)$/, qw(aio) ],
        [ qr/^(ignore|on)$/, qw(discard) ],
        [ qr/^\d+(\.\d+)?$/, qw(mbps mbps_max mbps_rd mbps_rd_max mbps_wr mbps_wr_max) ],
        [ qr/^\d+$/, qw(iops iops_max iops_rd iops_rd_max iops_wr iops_wr_max) ],
    );

    foreach my $check (@value_checks) {
        my ($pattern, @names) = @$check;
        foreach my $name (@names) {
            return undef if $res->{$name} && $res->{$name} !~ $pattern;
        }
    }

    # a combined limit excludes the separate read/write limits
    foreach my $total (qw(mbps iops)) {
        next if !$res->{$total};
        return undef if $res->{"${total}_rd"} || $res->{"${total}_wr"};
    }

    if ($res->{size}) {
        $res->{size} = $parse_size->($res->{size});
        return undef if !defined($res->{size});
    }

    if ($res->{media} && ($res->{media} eq 'cdrom')) {
        foreach my $name (qw(snapshot trans format heads secs cyls)) {
            return undef if $res->{$name};
        }
        return undef if $res->{interface} eq 'virtio';
    }

    # rerror does not work with scsi drives
    return undef if $res->{rerror} && $res->{interface} eq 'scsi';

    return $res;
}
1013
# Drive options emitted verbatim as "key=value" by print_drive() and
# print_drive_full().
my @qemu_drive_options = qw(
    heads secs cyls trans media format cache snapshot rerror werror aio discard
    iops iops_rd iops_wr iops_max iops_rd_max iops_wr_max
);

# Serialize a parsed drive hash into its config-file form: the file/volume
# first, followed by ",key=value" for every option that has a true value.
sub print_drive {
    my ($vmid, $drive) = @_;

    # options written to the config in addition to @qemu_drive_options
    my @config_only = qw(mbps mbps_rd mbps_wr mbps_max mbps_rd_max mbps_wr_max backup);

    my @parts = map { "$_=$drive->{$_}" }
        grep { $drive->{$_} } (@qemu_drive_options, @config_only);

    push @parts, "size=" . $format_size->($drive->{size}) if $drive->{size};

    return join(',', $drive->{file}, @parts);
}
1030
# Issue a SCSI INQUIRY on an open file handle through the SG_IO ioctl.
#
# $fh    - open handle of the device to query
# $noerr - when true, return undef on any failure instead of dying
#
# Returns a hash ref with the keys vendor, product, revision, removable (0/1)
# and type (low 5 bits of the first inquiry byte), or undef on failure when
# $noerr is set.
sub scsi_inquiry {
    my($fh, $noerr) = @_;

    my $SG_IO = 0x2285;
    my $SG_GET_VERSION_NUM = 0x2282;

    # refuse to talk to devices that do not offer a recent enough sg interface
    my $versionbuf = "\x00" x 8;
    my $ret = ioctl($fh, $SG_GET_VERSION_NUM, $versionbuf);
    if (!$ret) {
        die "scsi ioctl SG_GET_VERSION_NUM failed - $!\n" if !$noerr;
        return undef;
    }
    my $version = unpack("I", $versionbuf);
    if ($version < 30000) {
        die "scsi generic interface too old\n" if !$noerr;
        return undef;
    }

    my $buf = "\x00" x 36;
    my $sensebuf = "\x00" x 8;
    # 6 byte command: opcode 0x12, allocation length 36 (size of $buf)
    my $cmd = pack("C x3 C x1", 0x12, 36);

    # see /usr/include/scsi/sg.h
    my $sg_io_hdr_t = "i i C C s I P P P I I i P C C C C S S i I I";

    # NOTE(review): -3 and 6000 are presumably the transfer direction
    # (device to host) and the timeout in ms of sg_io_hdr - confirm in sg.h
    my $packet = pack($sg_io_hdr_t, ord('S'), -3, length($cmd),
                      length($sensebuf), 0, length($buf), $buf,
                      $cmd, $sensebuf, 6000);

    $ret = ioctl($fh, $SG_IO, $packet);
    if (!$ret) {
        die "scsi ioctl SG_IO failed - $!\n" if !$noerr;
        return undef;
    }

    # fields 17 and 18 of the header must both be zero on success
    # (presumably host_status and driver_status - see sg.h)
    my @res = unpack($sg_io_hdr_t, $packet);
    if ($res[17] || $res[18]) {
        die "scsi ioctl SG_IO status error - $!\n" if !$noerr;
        return undef;
    }

    my $res = {};
    (my $byte0, my $byte1, $res->{vendor},
     $res->{product}, $res->{revision}) = unpack("C C x6 A8 A16 A4", $buf);

    $res->{removable} = $byte1 & 128 ? 1 : 0;
    $res->{type} = $byte0 & 31;

    return $res;
}
1081
# Open $path read/write and run a SCSI INQUIRY on it.
#
# Returns the hash ref produced by scsi_inquiry(), or undef when the path
# cannot be opened or the inquiry fails.
sub path_is_scsi {
    my ($path) = @_;

    # pass the mode as a separate argument, so that $path is never parsed as
    # part of a two-argument open() specification
    my $fh = IO::File->new($path, '+<') || return undef;
    my $res = scsi_inquiry($fh, 1);
    close($fh);

    return $res;
}
1091
# Returns 1 if the configured machine type contains 'q35', else 0.
sub machine_type_is_q35 {
    my ($conf) = @_;

    my $machine = $conf->{machine};
    return 0 if !$machine;

    return ($machine =~ m/q35/) ? 1 : 0;
}
1097
# Build the qemu -device string for the usb tablet.
sub print_tabletdevice_full {
    my ($conf) = @_;

    # we use uhci for old VMs because tablet driver was buggy in older qemu
    my $usbbus = 'uhci';
    $usbbus = 'ehci' if machine_type_is_q35($conf);

    return "usb-tablet,id=tablet,bus=$usbbus.0,port=1";
}
1108
# Build the qemu -device string for a parsed drive.
#
# The device model depends on $drive->{interface} (virtio, scsi, ide, sata);
# 'usb' and unknown interfaces die. ",bootindex=N" is appended when set.
sub print_drivedevice_full {
    my ($storecfg, $conf, $vmid, $drive, $bridges) = @_;

    my $interface = $drive->{interface};
    my $index = $drive->{index};
    my $drive_id = "$interface$index"; # used for both drive= and id=

    my $device = '';

    if ($interface eq 'virtio') {
        my $pciaddr = print_pci_addr($drive_id, $bridges);
        $device = "virtio-blk-pci,drive=drive-$drive_id,id=$drive_id$pciaddr";
        $device .= ",iothread=iothread0" if $conf->{iothread};
    } elsif ($interface eq 'scsi') {
        # no scsihw setting, or one starting with 'lsi': 7 units per controller
        my $is_lsi = !$conf->{scsihw} || ($conf->{scsihw} =~ m/^lsi/);
        my $maxdev = $is_lsi ? 7 : 256;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;

        my $devicetype = 'hd';
        if (drive_is_cdrom($drive)) {
            $devicetype = 'cd';
        } else {
            my $path = '';
            if ($drive->{file} =~ m|^/|) {
                $path = $drive->{file};
            } else {
                $path = PVE::Storage::path($storecfg, $drive->{file});
            }

            if ($path =~ m/^iscsi\:\/\//) {
                $devicetype = 'generic';
            } elsif (my $info = path_is_scsi($path)) {
                if ($info->{type} == 0) {
                    $devicetype = 'block';
                } elsif ($info->{type} == 1) { # tape
                    $devicetype = 'generic';
                }
            }
        }

        if ($is_lsi) {
            $device = "scsi-$devicetype,bus=scsihw$controller.0,scsi-id=$unit,drive=drive-$drive_id,id=$drive_id";
        } else {
            $device = "scsi-$devicetype,bus=scsihw$controller.0,channel=0,scsi-id=0,lun=$index,drive=drive-$drive_id,id=$drive_id";
        }
    } elsif ($interface eq 'ide') {
        my $maxdev = 2;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;
        my $devicetype = ($drive->{media} && $drive->{media} eq 'cdrom') ? "cd" : "hd";

        $device = "ide-$devicetype,bus=ide.$controller,unit=$unit,drive=drive-$drive_id,id=$drive_id";
    } elsif ($interface eq 'sata') {
        my $controller = int($index / $MAX_SATA_DISKS);
        my $unit = $index % $MAX_SATA_DISKS;
        $device = "ide-drive,bus=ahci$controller.$unit,drive=drive-$drive_id,id=$drive_id";
    } elsif ($interface eq 'usb') {
        die "implement me";
        # -device ide-drive,bus=ide.1,unit=0,drive=drive-ide0-1-0,id=ide0-1-0
    } else {
        die "unsupported interface type";
    }

    $device .= ",bootindex=$drive->{bootindex}" if $drive->{bootindex};

    return $device;
}
1175
# Read the first 'InitiatorName = ...' entry from
# /etc/iscsi/initiatorname.iscsi. Returns undef if the file cannot be opened
# or contains no such entry.
sub get_initiator_name {
    my $fh = IO::File->new('/etc/iscsi/initiatorname.iscsi') || return undef;

    my $initiator;
    while (defined(my $line = <$fh>)) {
        if ($line =~ m/^\s*InitiatorName\s*=\s*([\.\-:\w]+)/) {
            $initiator = $1;
            last;
        }
    }
    $fh->close();

    return $initiator;
}
1189
# Build the qemu -drive string ("file=...,if=none,id=drive-<iface><index>,...")
# for a parsed drive.
sub print_drive_full {
    my ($storecfg, $vmid, $drive) = @_;

    my $is_cdrom = drive_is_cdrom($drive);

    my @opts = map { "$_=$drive->{$_}" }
        grep { $_ ne 'bootindex' && $drive->{$_} } @qemu_drive_options;

    # throughput limits are kept as mbps* in the drive hash and are handed
    # over as bps* values (multiplied by 1024*1024)
    foreach my $o (qw(bps bps_rd bps_wr)) {
        my $mbps = $drive->{"m$o"};
        push @opts, "$o=" . int($mbps*1024*1024) if $mbps;
    }

    # use linux-aio by default (qemu default is threads)
    push @opts, "aio=native" if !$drive->{aio};

    my $volid = $drive->{file};
    my $path;
    if ($is_cdrom) {
        $path = get_iso_path($storecfg, $vmid, $volid);
    } elsif ($volid =~ m|^/|) {
        $path = $volid;
    } else {
        $path = PVE::Storage::path($storecfg, $volid);
    }

    if (!$is_cdrom) {
        push @opts, "cache=none" if !$drive->{cache};
        push @opts, "detect-zeroes=" . ($drive->{discard} ? "unmap" : "on");
    }

    my $pathinfo = $path ? "file=$path," : '';

    return join(',', "${pathinfo}if=none",
                "id=drive-$drive->{interface}$drive->{index}", @opts);
}
1228
# Build the qemu -device string for a network card.
sub print_netdevice_full {
    my ($vmid, $conf, $net, $netid, $bridges) = @_;

    my $is_virtio = $net->{model} eq 'virtio';
    my $device = $is_virtio ? 'virtio-net-pci' : $net->{model};

    my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};

    # qemu > 0.15 always try to boot from network - we disable that by
    # not loading the pxe rom file
    my $extra = ($bootorder =~ m/n/) ? '' : "romfile=,";

    my $pciaddr = print_pci_addr("$netid", $bridges);

    my $tmpstr = "$device,${extra}mac=$net->{macaddr},netdev=$netid$pciaddr,id=$netid";

    if ($net->{queues} && $net->{queues} > 1 && $is_virtio) {
        #Consider we have N queues, the number of vectors needed is 2*N + 2 (plus one config interrupt and control vq)
        my $vectors = $net->{queues} * 2 + 2;
        $tmpstr .= ",vectors=$vectors,mq=on";
    }

    if ($net->{bootindex}) {
        $tmpstr .= ",bootindex=$net->{bootindex}";
    }

    return $tmpstr;
}
1252
# Build the qemu -netdev string for network device $netid ('net<N>').
#
# Dies if $netid is not of the form 'net<N>', if N is not below $MAX_NETS,
# or if the resulting tap interface name would be too long.
sub print_netdev_full {
    my ($vmid, $conf, $net, $netid) = @_;

    # a malformed id previously slipped through the range check below (the
    # empty index compared as 0) and produced an interface name without index
    my ($i) = $netid =~ m/^net(\d+)$/
        or die "got strange net id '$netid'\n";
    $i = int($i);

    die "got strange net id '$i'\n" if $i >= ${MAX_NETS};

    my $ifname = "tap${vmid}i$i";

    # kvm uses TUNSETIFF ioctl, and that limits ifname length
    die "interface name '$ifname' is too long (max 15 character)\n"
        if length($ifname) >= 16;

    my $vhostparam = '';
    $vhostparam = ',vhost=on' if $kernel_has_vhost_net && $net->{model} eq 'virtio';

    my $vmname = $conf->{name} || "vm$vmid";

    my $netdev = "";

    if ($net->{bridge}) {
        $netdev = "type=tap,id=$netid,ifname=${ifname},script=/var/lib/qemu-server/pve-bridge,downscript=/var/lib/qemu-server/pve-bridgedown$vhostparam";
    } else {
        $netdev = "type=user,id=$netid,hostname=$vmname";
    }

    $netdev .= ",queues=$net->{queues}" if ($net->{queues} && $net->{model} eq 'virtio');

    return $netdev;
}
1286
# True if $drive is set and its media type is 'cdrom'.
sub drive_is_cdrom {
    my ($drive) = @_;

    return $drive if !$drive;

    my $media = $drive->{media};
    return $media if !$media;

    return ($media eq 'cdrom');
}
1293
# Parse a comma separated numa property string
# (memory=, policy=, cpus=<start>[-<end>], hostnodes=<start>[-<end>]).
# Returns a hash ref, or undef as soon as an unknown setting is found.
sub parse_numa {
    my ($data) = @_;

    my $res = {};

    for my $kvp (split(/,/, $data)) {
        if ($kvp =~ m/^memory=(\S+)$/) {
            $res->{memory} = $1;
            next;
        }
        if ($kvp =~ m/^policy=(preferred|bind|interleave)$/) {
            $res->{policy} = $1;
            next;
        }
        if ($kvp =~ m/^cpus=(\d+)(-(\d+))?$/) {
            # end stays undef when only a single value is given
            $res->{cpus} = { start => $1, end => $3 };
            next;
        }
        if ($kvp =~ m/^hostnodes=(\d+)(-(\d+))?$/) {
            $res->{hostnodes} = { start => $1, end => $3 };
            next;
        }

        return undef;
    }

    return $res;
}
1318
# Parse a hostpci property string.
#
# Accepts '[host=]bb:dd[.f]' plus the optional settings driver=, rombar=,
# x-vga= and pcie=. Unknown settings only produce a warning. Returns undef
# for an empty value or when no pci id was found.
sub parse_hostpci {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};
    my $found;

    foreach my $kv (split(/,/, $value)) {
        if ($kv =~ m/^(host=)?([a-f0-9]{2}:[a-f0-9]{2})(\.([a-f0-9]))?$/) {
            my ($id, $function) = ($2, $4);
            $found = 1;
            if (defined($function)) {
                push @{$res->{pciid}}, { id => $id , function => $function };
            } else {
                # no function given - take whatever lspci() lists for this id
                my $pcidevices = lspci($id);
                $res->{pciid} = $pcidevices->{$id};
            }
        } elsif ($kv =~ m/^driver=(kvm|vfio)$/) {
            $res->{driver} = $1;
        } elsif ($kv =~ m/^rombar=(on|off)$/) {
            $res->{rombar} = $1;
        } elsif ($kv =~ m/^x-vga=(on|off)$/) {
            $res->{'x-vga'} = $1;
        } elsif ($kv =~ m/^pcie=(\d+)$/) {
            $res->{pcie} = 1 if $1 == 1;
        } else {
            warn "unknown hostpci setting '$kv'\n";
        }
    }

    return undef if !$found;

    return $res;
}
1357
# netX: e1000=XX:XX:XX:XX:XX:XX,bridge=vmbr0,rate=<mbps>
#
# Parse a network property string into a hash ref. A random MAC address is
# generated when the model is given without one. Returns undef on unknown
# settings or when no model is present.
sub parse_net {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        if ($kvp =~ m/^(ne2k_pci|e1000|rtl8139|pcnet|virtio|ne2k_isa|i82551|i82557b|i82559er|vmxnet3)(=([0-9a-f]{2}(:[0-9a-f]{2}){5}))?$/i) {
            my ($model, $mac) = ($1, $3);
            $res->{model} = lc($model);
            $res->{macaddr} = defined($mac) ? uc($mac) : PVE::Tools::random_ether_addr();
            next;
        }

        if ($kvp =~ m/^bridge=(\S+)$/) {
            $res->{bridge} = $1;
        } elsif ($kvp =~ m/^queues=(\d+)$/) {
            $res->{queues} = $1;
        } elsif ($kvp =~ m/^rate=(\d+(\.\d+)?)$/) {
            $res->{rate} = $1;
        } elsif ($kvp =~ m/^tag=(\d+)$/) {
            $res->{tag} = $1;
        } elsif ($kvp =~ m/^firewall=(\d+)$/) {
            $res->{firewall} = $1;
        } else {
            return undef;
        }
    }

    return undef if !$res->{model};

    return $res;
}
1391
# Serialize a parsed network hash (see parse_net) back into its property
# string form. Only settings with a true value are written.
sub print_net {
    my $net = shift;

    my $res = "$net->{model}";
    $res .= "=$net->{macaddr}" if $net->{macaddr};
    $res .= ",bridge=$net->{bridge}" if $net->{bridge};
    $res .= ",rate=$net->{rate}" if $net->{rate};
    $res .= ",tag=$net->{tag}" if $net->{tag};
    $res .= ",firewall=$net->{firewall}" if $net->{firewall};
    # parse_net() accepts 'queues', so it has to survive a parse/print
    # round trip (as done by add_random_macs)
    $res .= ",queues=$net->{queues}" if $net->{queues};

    return $res;
}
1404
# Re-write every parsable 'netN' entry of $settings through
# parse_net()/print_net(), which fills in a MAC address where none was given.
sub add_random_macs {
    my ($settings) = @_;

    for my $opt (grep { m/^net(\d+)$/ } keys %$settings) {
        my $net = parse_net($settings->{$opt});
        $settings->{$opt} = print_net($net) if $net;
    }
}
1415
# Record $volid under the lowest free 'unusedN' key of $config.
#
# Returns the key used, or nothing if the volume is already listed (as far
# as the downward scan got). Dies when no free slot is left.
sub add_unused_volume {
    my ($config, $volid) = @_;

    my $key;
    # scan downwards, so that $key ends up as the lowest free slot
    foreach my $ind (reverse(0 .. $MAX_UNUSED_DISKS - 1)) {
        my $test = "unused$ind";
        my $vid = $config->{$test};
        if (!$vid) {
            $key = $test;
            next;
        }
        return if $vid eq $volid; # do not add duplicates
    }

    die "To many unused volume - please delete them first.\n" if !$key;

    $config->{$key} = $volid;

    return $key;
}
1435
# Returns 1 if the storage layer reports $vmid as owner of $volid, undef
# otherwise (absolute paths and lookup errors count as "not owned").
sub vm_is_volid_owner {
    my ($storecfg, $vmid, $volid) = @_;

    return undef if $volid =~ m|^/|;

    my ($path, $owner);
    eval { ($path, $owner) = PVE::Storage::path($storecfg, $volid); };

    return 1 if $owner && ($owner == $vmid);

    return undef;
}
1449
# Drop any pending value for $key and add $key to the pending 'delete' list.
sub vmconfig_delete_pending_option {
    my ($conf, $key) = @_;

    delete $conf->{pending}->{$key};

    # use a hash, so that every option is listed only once
    my %to_delete = map { $_ => 1 } PVE::Tools::split_list($conf->{pending}->{delete});
    $to_delete{$key} = 1;

    $conf->{pending}->{delete} = join(',', keys %to_delete);
}
1460
# Remove $key from the pending 'delete' list; the list itself is removed
# once it becomes empty.
sub vmconfig_undelete_pending_option {
    my ($conf, $key) = @_;

    my %to_delete = map { $_ => 1 } PVE::Tools::split_list($conf->{pending}->{delete});
    delete $to_delete{$key};

    my @remaining = keys %to_delete;
    if (!scalar(@remaining)) {
        delete $conf->{pending}->{delete};
    } else {
        $conf->{pending}->{delete} = join(',', @remaining);
    }
}
1477
# Register the volume of a (non cdrom) drive as 'unusedN' entry of $conf,
# but only if the volume is owned by this VM.
sub vmconfig_register_unused_drive {
    my ($storecfg, $vmid, $conf, $drive) = @_;

    return if drive_is_cdrom($drive);

    my $volid = $drive->{file};
    return if !vm_is_volid_owner($storecfg, $vmid, $volid);

    add_unused_volume($conf, $volid, $vmid);
}
1488
# Drop pending entries that would not change anything.
# Returns 1 if something was removed, undef otherwise.
sub vmconfig_cleanup_pending {
    my ($conf) = @_;

    my $changes;

    # remove pending changes when nothing changed
    foreach my $opt (keys %{$conf->{pending}}) {
        next if !defined($conf->{$opt});
        next if !($conf->{pending}->{$opt} eq $conf->{$opt});
        $changes = 1;
        delete $conf->{pending}->{$opt};
    }

    # remove delete if option is not set
    my %still_set;
    foreach my $opt (PVE::Tools::split_list($conf->{pending}->{delete})) {
        if (!defined($conf->{$opt})) {
            $changes = 1;
        } else {
            $still_set{$opt} = 1;
        }
    }

    my @keylist = keys %still_set;
    if (!scalar(@keylist)) {
        delete $conf->{pending}->{delete};
    } else {
        $conf->{pending}->{delete} = join(',', @keylist);
    }

    return $changes;
}
1520
# Allowed smbios (type 1) settings, each mapped to the regular expression
# its value has to match completely.
my $valid_smbios1_options = {
    manufacturer => '\S+',
    product => '\S+',
    version => '\S+',
    serial => '\S+',
    uuid => '[a-fA-F0-9]{8}(?:-[a-fA-F0-9]{4}){3}-[a-fA-F0-9]{12}',
    sku => '\S+',
    family => '\S+',
};

# smbios: [manufacturer=str][,product=str][,version=str][,serial=str][,uuid=uuid][,sku=str][,family=str]
#
# Parse an smbios1 property string into a hash ref. Returns undef on unknown
# settings or values that do not match $valid_smbios1_options.
sub parse_smbios1 {
    my ($data) = @_;

    my $res = {};

    foreach my $kvp (split(/,/, $data)) {
        return undef if $kvp !~ m/^(\S+)=(.+)$/;
        # split at the first '=' only - otherwise a value containing '='
        # would be silently truncated
        my ($k, $v) = split(/=/, $kvp, 2);
        return undef if !defined($k) || !defined($v);
        return undef if !$valid_smbios1_options->{$k};
        return undef if $v !~ m/^$valid_smbios1_options->{$k}$/;
        $res->{$k} = $v;
    }

    return $res;
}
1548
# Serialize an smbios1 hash into 'key=value,...' form. Undefined values and
# keys not listed in $valid_smbios1_options are skipped.
sub print_smbios1 {
    my ($smbios1) = @_;

    my @pairs;
    foreach my $k (keys %$smbios1) {
        next if !defined($smbios1->{$k}) || !$valid_smbios1_options->{$k};
        push @pairs, "$k=$smbios1->{$k}";
    }

    return join(',', @pairs);
}
1561
PVE::JSONSchema::register_format('pve-qm-smbios1', \&verify_smbios1);
# Format check for 'pve-qm-smbios1': returns $value if parse_smbios1()
# accepts it; otherwise returns undef when $noerr is set, or dies.
sub verify_smbios1 {
    my ($value, $noerr) = @_;

    if (!parse_smbios1($value)) {
        return undef if $noerr;
        die "unable to parse smbios (type 1) options\n";
    }

    return $value;
}
1572
PVE::JSONSchema::register_format('pve-qm-bootdisk', \&verify_bootdisk);
# Format check for 'pve-qm-bootdisk': returns $value if valid_drivename()
# accepts it; otherwise returns undef when $noerr is set, or dies.
sub verify_bootdisk {
    my ($value, $noerr) = @_;

    if (!valid_drivename($value)) {
        return undef if $noerr;
        die "invalid boot disk '$value'\n";
    }

    return $value;
}
1583
PVE::JSONSchema::register_format('pve-qm-numanode', \&verify_numa);
# Format check for 'pve-qm-numanode': returns $value if parse_numa()
# accepts it; otherwise returns undef when $noerr is set, or dies.
sub verify_numa {
    my ($value, $noerr) = @_;

    if (!parse_numa($value)) {
        return undef if $noerr;
        die "unable to parse numa options\n";
    }

    return $value;
}
1594
PVE::JSONSchema::register_format('pve-qm-net', \&verify_net);
# Format check for 'pve-qm-net': returns $value if parse_net() accepts it;
# otherwise returns undef when $noerr is set, or dies.
sub verify_net {
    my ($value, $noerr) = @_;

    if (!parse_net($value)) {
        return undef if $noerr;
        die "unable to parse network options\n";
    }

    return $value;
}
1605
PVE::JSONSchema::register_format('pve-qm-drive', \&verify_drive);
# Format check for 'pve-qm-drive': returns $value if parse_drive() accepts
# it (called without a drive key); otherwise returns undef when $noerr is
# set, or dies.
sub verify_drive {
    my ($value, $noerr) = @_;

    if (!parse_drive(undef, $value)) {
        return undef if $noerr;
        die "unable to parse drive options\n";
    }

    return $value;
}
1616
PVE::JSONSchema::register_format('pve-qm-hostpci', \&verify_hostpci);
# Format check for 'pve-qm-hostpci': returns $value if parse_hostpci()
# accepts it; otherwise returns undef when $noerr is set, or dies.
sub verify_hostpci {
    my ($value, $noerr) = @_;

    if (!parse_hostpci($value)) {
        return undef if $noerr;
        die "unable to parse pci id\n";
    }

    return $value;
}
1627
PVE::JSONSchema::register_format('pve-qm-watchdog', \&verify_watchdog);
# Format check for 'pve-qm-watchdog': returns $value if parse_watchdog()
# accepts it; otherwise returns undef when $noerr is set, or dies.
sub verify_watchdog {
    my ($value, $noerr) = @_;

    if (!parse_watchdog($value)) {
        return undef if $noerr;
        die "unable to parse watchdog options\n";
    }

    return $value;
}
1638
# Parse a watchdog property string ('[model=]<model>[,[action=]<action>]').
# Returns a hash ref with the keys found, or undef for an empty value or an
# unknown setting.
sub parse_watchdog {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};

    # empty list entries are ignored
    foreach my $p (grep { $_ !~ m/^\s*$/ } split(/,/, $value)) {
        if ($p =~ m/^(model=)?(i6300esb|ib700)$/) {
            $res->{model} = $2;
            next;
        }
        if ($p =~ m/^(action=)?(reset|shutdown|poweroff|pause|debug|none)$/) {
            $res->{action} = $2;
            next;
        }

        return undef;
    }

    return $res;
}
1660
PVE::JSONSchema::register_format('pve-qm-startup', \&verify_startup);
# Format check for 'pve-qm-startup': returns $value if parse_startup()
# accepts it; otherwise returns undef when $noerr is set, or dies.
sub verify_startup {
    my ($value, $noerr) = @_;

    if (!parse_startup($value)) {
        return undef if $noerr;
        die "unable to parse startup options\n";
    }

    return $value;
}
1671
# Parse a startup property string ('[order=]N[,up=N][,down=N]').
# Returns a hash ref with the keys found, or undef for an empty value or an
# unknown setting.
sub parse_startup {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};

    # empty list entries are ignored
    foreach my $p (grep { $_ !~ m/^\s*$/ } split(/,/, $value)) {
        if ($p =~ m/^(order=)?(\d+)$/) {
            $res->{order} = $2;
            next;
        }
        if ($p =~ m/^up=(\d+)$/) {
            $res->{up} = $1;
            next;
        }
        if ($p =~ m/^down=(\d+)$/) {
            $res->{down} = $1;
            next;
        }

        return undef;
    }

    return $res;
}
1695
# Parse a usb device property string. Supported entries are
# 'host=<vendorid>:<productid>' (hex, optional 0x prefix),
# 'host=<bus>-<port>[.<port>...]' and 'spice'.
# Returns a hash ref, or undef for an empty value, an unknown entry, or
# when no device entry was found.
sub parse_usb_device {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};
    my $found;

    foreach my $v (split(/,/, $value)) {
        if ($v =~ m/^host=(0x)?([0-9A-Fa-f]{4}):(0x)?([0-9A-Fa-f]{4})$/) {
            ($res->{vendorid}, $res->{productid}) = ($2, $4);
        } elsif ($v =~ m/^host=(\d+)\-(\d+(\.\d+)*)$/) {
            ($res->{hostbus}, $res->{hostport}) = ($1, $2);
        } elsif ($v =~ m/^spice$/) {
            $res->{spice} = 1;
        } else {
            return undef;
        }
        $found = 1;
    }

    return undef if !$found;

    return $res;
}
1725
PVE::JSONSchema::register_format('pve-qm-usb-device', \&verify_usb_device);
# Format check for 'pve-qm-usb-device': returns $value if parse_usb_device()
# accepts it; otherwise returns undef when $noerr is set, or dies.
sub verify_usb_device {
    my ($value, $noerr) = @_;

    if (!parse_usb_device($value)) {
        return undef if $noerr;
        die "unable to parse usb device\n";
    }

    return $value;
}
1736
# add JSON properties for create and set function
#
# Copies every $confdesc entry except 'parent', 'snaptime' and 'vmstate'
# into $prop and returns $prop.
sub json_config_properties {
    my $prop = shift;

    my %skip = map { $_ => 1 } qw(parent snaptime vmstate);

    foreach my $opt (grep { !$skip{$_} } keys %$confdesc) {
        $prop->{$opt} = $confdesc->{$opt};
    }

    return $prop;
}
1748
# Check $value against the type (and format) registered for $key in
# $confdesc and return the normalized value. Dies on unknown keys, undefined
# values, embedded line breaks and type mismatches.
sub check_type {
    my ($key, $value) = @_;

    my $desc = $confdesc->{$key};
    die "unknown setting '$key'\n" if !$desc;

    my $type = $desc->{type};

    die "got undefined value\n" if !defined($value);

    die "property contains a line feed\n" if $value =~ m/[\n\r]/;

    if ($type eq 'boolean') {
        return 1 if ($value eq '1') || ($value =~ m/^(on|yes|true)$/i);
        return 0 if ($value eq '0') || ($value =~ m/^(off|no|false)$/i);
        die "type check ('boolean') failed - got '$value'\n";
    }

    if ($type eq 'integer') {
        return int($1) if $value =~ m/^(\d+)$/;
        die "type check ('integer') failed - got '$value'\n";
    }

    if ($type eq 'number') {
        return $value if $value =~ m/^(\d+)(\.\d+)?$/;
        die "type check ('number') failed - got '$value'\n";
    }

    die "internal error" if $type ne 'string';

    my $fmt = $desc->{format};
    if (!$fmt) {
        # plain strings: strip one pair of surrounding double quotes
        $value =~ s/^\"(.*)\"$/$1/;
        return $value;
    }

    if ($fmt eq 'pve-qm-drive') {
        # special case - we need to pass $key to parse_drive()
        return $value if parse_drive($key, $value);
        die "unable to parse drive options\n";
    }

    PVE::JSONSchema::check_format($fmt, $value);

    return $value;
}
1791
# Run $code(@param) via lock_file() on the lock file of VM $vmid, using the
# given $timeout. Re-throws the error left in $@ and returns the result of
# lock_file() otherwise.
sub lock_config_full {
    my ($vmid, $timeout, $code, @param) = @_;

    my $res = lock_file(config_file_lock($vmid), $timeout, $code, @param);
    die $@ if $@;

    return $res;
}
1803
# Same as lock_config_full(), but goes through lock_file_full() and passes
# the $shared flag on to it.
sub lock_config_mode {
    my ($vmid, $timeout, $shared, $code, @param) = @_;

    my $res = lock_file_full(config_file_lock($vmid), $timeout, $shared, $code, @param);
    die $@ if $@;

    return $res;
}
1815
# Convenience wrapper around lock_config_full() with a fixed timeout of 10.
sub lock_config {
    my ($vmid, $code, @param) = @_;

    my $default_timeout = 10;

    return lock_config_full($vmid, $default_timeout, $code, @param);
}
1821
# Returns the config path of VM $vmid relative to the cluster file system
# root; $node defaults to $nodename.
sub cfs_config_path {
    my ($vmid, $node) = @_;

    $node ||= $nodename;

    return "nodes/$node/qemu-server/$vmid.conf";
}
1828
# Placeholder: no real check is done yet, IOMMU support is always reported.
sub check_iommu_support {
    #fixme : need to check IOMMU support
    #http://www.linux-kvm.org/page/How_to_assign_devices_with_VT-d_in_KVM

    return 1;
}
1837
# Returns the path of the VM config file below /etc/pve.
sub config_file {
    my ($vmid, $node) = @_;

    return "/etc/pve/" . cfs_config_path($vmid, $node);
}
1844
# Returns the path of the lock file used for VM $vmid (inside $lock_dir).
sub config_file_lock {
    my ($vmid) = @_;

    return join('/', $lock_dir, "lock-$vmid.conf");
}
1850
# Set access and modification time of the VM config file to the current time.
sub touch_config {
    my ($vmid) = @_;

    my $conffile = config_file($vmid);

    return utime(undef, undef, $conffile);
}
1857
# Remove VM $vmid: free all volumes owned by it, then remove its config file
# (or replace it by a minimal one when $keep_empty_config is set) and finally
# free whatever volumes the storage layer still lists for this VM.
# Errors of the final cleanup step are only reported as warnings.
sub destroy_vm {
    my ($storecfg, $vmid, $keep_empty_config) = @_;

    my $conffile = config_file($vmid);
    my $conf = load_config($vmid);

    check_lock($conf);

    # only remove disks owned by this VM
    my $free_owned_volume = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};
        return if !$volid || $volid =~ m|^/|;

        my ($path, $owner) = PVE::Storage::path($storecfg, $volid);
        return if !$path || !$owner || ($owner != $vmid);

        PVE::Storage::vdisk_free($storecfg, $volid);
    };
    foreach_drive($conf, $free_owned_volume);

    if (!$keep_empty_config) {
        unlink $conffile;
    } else {
        PVE::Tools::file_set_contents($conffile, "memory: 128\n");
    }

    # also remove unused disk
    eval {
        my $dl = PVE::Storage::vdisk_list($storecfg, undef, $vmid);

        eval {
            PVE::Storage::foreach_volid($dl, sub {
                my ($volid) = @_;
                PVE::Storage::vdisk_free($storecfg, $volid);
            });
        };
        warn $@ if $@;
    };
    warn $@ if $@;
}
1904
# Read the config of VM $vmid (optionally from another $node) through the
# cluster file system. Dies if no config is returned.
sub load_config {
    my ($vmid, $node) = @_;

    my $conf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid, $node));
    die "no such VM ('$vmid')\n" if !defined($conf);

    return $conf;
}
1916
# Parse the raw content of a VM config file.
#
# $filename - has to end in '/qemu-server/<vmid>.conf', dies otherwise
# $raw      - file content; undef results in an undef return value
#
# Returns a hash ref with the current settings at top level plus the keys
# 'digest' (SHA1 of $raw), 'pending' (settings of the [PENDING] section) and
# 'snapshots' (one settings hash per '[name]' section). Values that fail
# check_type() are skipped with a warning.
sub parse_vm_config {
    my ($filename, $raw) = @_;

    return undef if !defined($raw);

    my $res = {
        digest => Digest::SHA::sha1_hex($raw),
        snapshots => {},
        pending => {},
    };

    $filename =~ m|/qemu-server/(\d+)\.conf$|
        || die "got strange filename '$filename'";

    my $vmid = $1;

    # $conf always points to the hash of the section currently being parsed
    my $conf = $res;
    my $descr = '';
    my $section = '';

    my @lines = split(/\n/, $raw);
    foreach my $line (@lines) {
        next if $line =~ m/^\s*$/;

        # a section header ends the previous section, so store the
        # description collected so far there
        if ($line =~ m/^\[PENDING\]\s*$/i) {
            $section = 'pending';
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{$section} = {};
            next;

        } elsif ($line =~ m/^\[([a-z][a-z0-9_\-]+)\]\s*$/i) {
            $section = $1;
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{snapshots}->{$section} = {};
            next;
        }

        # comment lines make up the description
        if ($line =~ m/^\#(.*)\s*$/) {
            $descr .= PVE::Tools::decode_text($1) . "\n";
            next;
        }

        if ($line =~ m/^(description):\s*(.*\S)\s*$/) {
            $descr .= PVE::Tools::decode_text($2);
        } elsif ($line =~ m/^snapstate:\s*(prepare|delete)\s*$/) {
            # anchored at the start of the line - otherwise any other
            # setting whose value ends in 'snapstate: prepare' (e.g. args)
            # would be taken for a snapstate entry
            $conf->{snapstate} = $1;
        } elsif ($line =~ m/^(args):\s*(.*\S)\s*$/) {
            my $key = $1;
            my $value = $2;
            $conf->{$key} = $value;
        } elsif ($line =~ m/^delete:\s*(.*\S)\s*$/) {
            my $value = $1;
            if ($section eq 'pending') {
                $conf->{delete} = $value; # we parse this later
            } else {
                warn "vm $vmid - propertry 'delete' is only allowed in [PENDING]\n";
            }
        } elsif ($line =~ m/^([a-z][a-z_]*\d*):\s*(\S+)\s*$/) {
            my $key = $1;
            my $value = $2;
            eval { $value = check_type($key, $value); };
            if ($@) {
                warn "vm $vmid - unable to parse value of '$key' - $@";
            } else {
                my $fmt = $confdesc->{$key}->{format};
                if ($fmt && $fmt eq 'pve-qm-drive') {
                    # normalize drives: map the file name to a volume id
                    # and re-print the drive
                    my $v = parse_drive($key, $value);
                    if (my $volid = filename_to_volume_id($vmid, $v->{file}, $v->{media})) {
                        $v->{file} = $volid;
                        $value = print_drive($vmid, $v);
                    } else {
                        warn "vm $vmid - unable to parse value of '$key'\n";
                        next;
                    }
                }

                # 'cdrom' is stored as ide2
                if ($key eq 'cdrom') {
                    $conf->{ide2} = $value;
                } else {
                    $conf->{$key} = $value;
                }
            }
        }
    }

    $conf->{description} = $descr if $descr;

    delete $res->{snapstate}; # just to be sure

    return $res;
}
2010
# Generate the raw config file content for $conf.
#
# Normalizes legacy settings (cdrom, smp), type-checks every value of the
# current config, the pending section and all snapshots (dies on errors),
# drops 'unusedN' entries for volumes that are in use again, and returns the
# text: current settings first, then [PENDING], then one section per
# snapshot.
sub write_vm_config {
    my ($filename, $conf) = @_;

    delete $conf->{snapstate}; # just to be sure

    # 'cdrom' is stored as ide2
    if ($conf->{cdrom}) {
        die "option ide2 conflicts with cdrom\n" if $conf->{ide2};
        $conf->{ide2} = delete $conf->{cdrom};
    }

    # we do not use 'smp' any longer
    if ($conf->{sockets}) {
        delete $conf->{smp};
    } elsif ($conf->{smp}) {
        $conf->{sockets} = delete $conf->{smp};
        delete $conf->{cores};
    }

    delete $conf->{sockets} if $conf->{maxcpus} && $conf->{sockets};

    my $used_volids = {};

    # keys that are not settings, and therefore never type-checked
    my %meta_key = map { $_ => 1 } qw(digest description snapshots snapstate pending);

    my $cleanup_config = sub {
        my ($cref, $pending, $snapname) = @_;

        foreach my $key (keys %$cref) {
            next if $meta_key{$key};

            if ($key eq 'delete') {
                die "propertry 'delete' is only allowed in [PENDING]\n"
                    if !$pending;
                # fixme: check syntax?
                next;
            }

            my $value = $cref->{$key};
            eval { $value = check_type($key, $value); };
            die "unable to parse value of '$key' - $@" if $@;

            $cref->{$key} = $value;

            # remember volumes in use (snapshots do not count)
            next if $snapname || !valid_drivename($key);
            my $drive = parse_drive($key, $value);
            $used_volids->{$drive->{file}} = 1 if $drive && $drive->{file};
        }
    };

    $cleanup_config->($conf);

    $cleanup_config->($conf->{pending}, 1);

    foreach my $snapname (keys %{$conf->{snapshots}}) {
        die "internal error" if $snapname eq 'pending';
        $cleanup_config->($conf->{snapshots}->{$snapname}, undef, $snapname);
    }

    # remove 'unusedX' settings if we re-add a volume
    foreach my $key (keys %$conf) {
        my $value = $conf->{$key};
        delete $conf->{$key} if $key =~ m/^unused/ && $used_volids->{$value};
    }

    my $generate_raw_config = sub {
        my ($section) = @_;

        my $text = '';

        # add description as comment to top of file
        my $descr = $section->{description} || '';
        foreach my $cl (split(/\n/, $descr)) {
            $text .= '#' . PVE::Tools::encode_text($cl) . "\n";
        }

        foreach my $key (sort keys %$section) {
            next if $key eq 'digest' || $key eq 'description' || $key eq 'pending' || $key eq 'snapshots';
            $text .= "$key: $section->{$key}\n";
        }

        return $text;
    };

    my $raw = $generate_raw_config->($conf);

    if (scalar(keys %{$conf->{pending}})) {
        $raw .= "\n[PENDING]\n";
        $raw .= $generate_raw_config->($conf->{pending});
    }

    foreach my $snapname (sort keys %{$conf->{snapshots}}) {
        $raw .= "\n[$snapname]\n";
        $raw .= $generate_raw_config->($conf->{snapshots}->{$snapname});
    }

    return $raw;
}
2111
# Write $conf as config of VM $vmid without taking the config file lock.
# Unless $skiplock is set, check_lock() is called on $conf first.
sub update_config_nolock {
    my ($vmid, $conf, $skiplock) = @_;

    check_lock($conf) unless $skiplock;

    PVE::Cluster::cfs_write_file(cfs_config_path($vmid), $conf);
}
2121
# Write $conf as config of VM $vmid while holding the config file lock
# (see update_config_nolock for the meaning of $skiplock).
sub update_config {
    my ($vmid, $conf, $skiplock) = @_;

    # Pass a code reference: a bare '&update_config_nolock' would call the
    # function right here - with the current @_ and without holding the
    # lock - and hand its return value over as callback. The callback also
    # needs $vmid as its first parameter.
    lock_config($vmid, \&update_config_nolock, $vmid, $conf, $skiplock);
}
2127
# Returns a hash ref with the default value of every $confdesc entry that
# defines one; 'keyboard' is overridden by datacenter.cfg if set there.
sub load_defaults {

    my $res = {};

    # we use static defaults from our JSON schema configuration
    foreach my $key (keys %$confdesc) {
        my $default = $confdesc->{$key}->{default};
        $res->{$key} = $default if defined($default);
    }

    my $dccfg = PVE::Cluster::cfs_read_file('datacenter.cfg');
    if ($dccfg->{keyboard}) {
        $res->{keyboard} = $dccfg->{keyboard};
    }

    return $res;
}
2144
# Return a hash reference { $vmid => { exists => 1 } } for every entry of
# the cluster VM list that belongs to this node ($nodename) and has the
# type 'qemu'. An empty hash is returned when no VM list is available.
sub config_list {
    my $res = {};

    my $vmlist = PVE::Cluster::get_vmlist();
    return $res if !($vmlist && $vmlist->{ids});

    my $ids = $vmlist->{ids};

    foreach my $vmid (keys %$ids) {
        my $entry = $ids->{$vmid};

        # skip entries of other nodes and of other guest types
        next unless $entry->{node} && $entry->{node} eq $nodename;
        next unless $entry->{type} && $entry->{type} eq 'qemu';

        $res->{$vmid}->{exists} = 1;
    }

    return $res;
}
2159
# test if VM uses local resources (to prevent migration)
#
# Returns 1 if $conf contains a host usb/pci device or a serial/parallel
# port entry, 0 otherwise. Dies with "VM uses local resources\n" instead
# of returning 1 unless $noerr is true.
sub check_local_resources {
    my ($conf, $noerr) = @_;

    # old syntax (keys without an index)
    my $uses_local = ($conf->{hostusb} || $conf->{hostpci}) ? 1 : 0;

    foreach my $key (keys %$conf) {
        # usbN entries set to 'spice' are not counted
        next if $key =~ m/^usb/ && ($conf->{$key} eq 'spice');
        next if $key !~ m/^(usb|hostpci|serial|parallel)\d+$/;
        $uses_local = 1;
    }

    if ($uses_local && !$noerr) {
        die "VM uses local resources\n";
    }

    return $uses_local;
}
2178
# check if used storages are available on all nodes (used by migrate)
#
# For every drive of $conf whose volume ID names a storage,
# PVE::Storage::storage_check_node() is called once without a node
# argument and once for $node.
sub check_storage_availability {
    my ($storecfg, $conf, $node) = @_;

    my $check_drive = sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        # volumes that do not parse to a storage ID are skipped
        my ($sid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        # check if storage is available on both nodes
        PVE::Storage::storage_check_node($storecfg, $sid);
        PVE::Storage::storage_check_node($storecfg, $sid, $node);
    };

    foreach_drive($conf, $check_drive);
}
2197
# list nodes where all VM images are available (used by has_feature API)
#
# Starts with all cluster nodes and, drive by drive, removes the nodes the
# drive's storage rules out. Returns a hash reference { $node => 1 }.
sub shared_nodes {
    my ($conf, $storecfg) = @_;

    my $nodehash = {};
    $nodehash->{$_} = 1 foreach @{PVE::Cluster::get_nodelist()};

    my $local_node = PVE::INotify::nodename();

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($storeid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$storeid;

        my $scfg = PVE::Storage::storage_config($storecfg, $storeid);

        # a disabled storage is available nowhere
        if ($scfg->{disable}) {
            $nodehash = {};
            return;
        }

        my @unavailable;
        if (my $avail = $scfg->{nodes}) {
            # storage restricted to an explicit node list
            @unavailable = grep { !$avail->{$_} } keys %$nodehash;
        } elsif (!$scfg->{shared}) {
            # non-shared storage: only the local node remains
            @unavailable = grep { $_ ne $local_node } keys %$nodehash;
        }

        delete $nodehash->{$_} foreach @unavailable;
    });

    return $nodehash;
}
2231
# Die with "VM is locked (<lock>)\n" if $conf carries a true 'lock' value.
sub check_lock {
    my ($conf) = @_;

    my $lock = $conf->{lock};
    die "VM is locked ($lock)\n" if $lock;
}
2237
# Inspect /proc/$pid/cmdline and return 1 if the process is a kvm /
# qemu-system-x86_64 binary that was started with '-pidfile $pidfile'
# (or '--pidfile'). Any other outcome yields a false value.
sub check_cmdline {
    my ($pidfile, $pid) = @_;

    my $fh = IO::File->new("/proc/$pid/cmdline", "r");
    return undef if !defined($fh);

    my $line = <$fh>;
    $fh->close;
    return undef if !$line;

    # the arguments are separated by NUL bytes
    my @argv = split(/\0/, $line);

    my $binary = $argv[0];
    return if !$binary;
    return if $binary !~ m|kvm$| && $binary !~ m|qemu-system-x86_64$|;

    foreach my $idx (0 .. $#argv) {
        my $arg = $argv[$idx];
        next if !$arg;
        next if ($arg ne '-pidfile') && ($arg ne '--pidfile');

        # only the first pidfile option is considered
        my $value = $argv[$idx + 1];
        return 1 if $value && ($value eq $pidfile);
        return undef;
    }

    return undef;
}
2263
# Return the PID of the running kvm process of VM $vmid, or undef when
# the VM is not running.
#
# Dies if the configuration file of the VM (as located by config_file()
# for $node) does not exist, unless $nocheck is true.
#
# The PID is read from the pid file and only trusted when check_cmdline()
# confirms that the process was started with that pid file and
# PVE::ProcFSTools::check_process_running() reports the process.
sub check_running {
    my ($vmid, $nocheck, $node) = @_;

    my $filename = config_file($vmid, $node);

    die "unable to find configuration file for VM $vmid - no such machine\n"
        if !$nocheck && ! -f $filename;

    my $pidfile = pidfile_name($vmid);

    my $fd = IO::File->new($pidfile, "r");
    return undef if !$fd;

    my $st = stat($fd);
    my $line = <$fd>;
    close($fd);

    # The timestamp inspected here is the one of the pid file, so that is
    # the file the warning has to name (it used to name the config file).
    # stat() can fail, so guard the method call.
    if ($st && $st->mtime > time()) {
        warn "file '$pidfile' modified in future\n";
    }

    # an empty pid file yields no line at all
    return undef if !defined($line);

    if ($line =~ m/^(\d+)$/) {
        my $pid = $1;
        if (check_cmdline($pidfile, $pid)) {
            if (my $pinfo = PVE::ProcFSTools::check_process_running($pid)) {
                return $pid;
            }
        }
    }

    return undef;
}
2296
# Return the result of config_list(), extended by a 'pid' entry for every
# listed VM that has a '<vmid>.pid' file in $var_run_tmpdir and for which
# check_running() returns a PID.
sub vzlist {

    my $vzlist = config_list();

    my $dir = IO::Dir->new($var_run_tmpdir);
    return $vzlist if !$dir;

    while (defined(my $entry = $dir->read)) {
        my ($vmid) = $entry =~ m/^(\d+)\.pid$/;
        next if !defined($vmid);

        # ignore pid files of VMs that are not in our list
        next if !defined($vzlist->{$vmid});

        my $pid = check_running($vmid);
        $vzlist->{$vmid}->{pid} = $pid if $pid;
    }

    return $vzlist;
}
2314
# Return the 'size' property of the boot disk configured in $conf.
#
# Returns undef when no valid boot disk is configured, when its drive
# entry is missing or cannot be parsed, when it is a cdrom or when it has
# no volume. $storecfg is accepted but not used.
sub disksize {
    my ($storecfg, $conf) = @_;

    my $bootdisk = $conf->{bootdisk};
    return undef if !($bootdisk && valid_drivename($bootdisk));

    my $value = $conf->{$bootdisk};
    return undef if !$value;

    my $drive = parse_drive($bootdisk, $value);
    return undef if !defined($drive) || drive_is_cdrom($drive);

    return undef if !$drive->{file};

    return $drive->{size};
}
2334
# Per-PID cache { time, used, cpu } of the previous vmstatus() sample,
# needed to turn the cumulative CPU counters into a usage ratio.
my $last_proc_pid_stat;

# get VM status information
# This must be fast and should not block ($full == false)
# We only query KVM using QMP if $full == true (this can be slow)
#
# Returns a hash reference { $vmid => { ...status fields... } }. With
# $opt_vmid set, only that VM is included.
sub vmstatus {
    my ($opt_vmid, $full) = @_;

    my $res = {};

    my $storecfg = PVE::Storage::config();

    my $list = vzlist();
    my ($uptime) = PVE::ProcFSTools::read_proc_uptime(1);

    my $cpucount = $cpuinfo->{cpus} || 1;

    # memory and balloon settings are multiplied by this factor
    my $mib = 1024*1024;

    # pass 1: static information from the configuration
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);

        my $conf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid)) || {};

        my $pid = $list->{$vmid}->{pid};
        my $size = disksize($storecfg, $conf);

        # never report more cpus than the host has
        my $cpus = ($conf->{sockets} || 1) * ($conf->{cores} || 1);
        $cpus = $cpucount if $cpus > $cpucount;

        my $d = {
            pid => $pid,
            # fixme: better status?
            status => $pid ? 'running' : 'stopped',
            disk => 0, # no info available
            maxdisk => defined($size) ? $size : 0,
            cpus => $cpus,
            name => $conf->{name} || "VM $vmid",
            maxmem => $conf->{memory} ? $conf->{memory}*$mib : 0,
            uptime => 0,
            cpu => 0,
            mem => 0,
            netout => 0,
            netin => 0,
            diskread => 0,
            diskwrite => 0,
        };

        if ($conf->{balloon}) {
            $d->{balloon_min} = $conf->{balloon}*$mib;
            $d->{shares} = defined($conf->{shares}) ? $conf->{shares} : 1000;
        }

        $d->{template} = is_template($conf);

        $res->{$vmid} = $d;
    }

    # pass 2: network counters of the tap<vmid>i<N> devices
    # NOTE(review): 'receive' feeds netout and 'transmit' feeds netin -
    # presumably because the counters are taken on the host side of the
    # tap device; confirm.
    my $netdev = PVE::ProcFSTools::read_proc_net_dev();
    foreach my $dev (keys %$netdev) {
        next if $dev !~ m/^tap([1-9]\d*)i/;
        my $d = $res->{$1};
        next if !$d;

        my $counters = $netdev->{$dev};
        $d->{netout} += $counters->{receive};
        $d->{netin} += $counters->{transmit};
    }

    my $ctime = gettimeofday;

    # pass 3: uptime, memory and cpu usage from /proc/<pid>/stat
    foreach my $vmid (keys %$list) {

        my $d = $res->{$vmid};
        my $pid = $d->{pid};
        next if !$pid;

        my $pstat = PVE::ProcFSTools::read_proc_pid_stat($pid);
        next if !$pstat; # not running

        my $used = $pstat->{utime} + $pstat->{stime};

        $d->{uptime} = int(($uptime - $pstat->{starttime})/$cpuinfo->{user_hz});

        if ($pstat->{vsize}) {
            $d->{mem} = int(($pstat->{rss}/$pstat->{vsize})*$d->{maxmem});
        }

        my $old = $last_proc_pid_stat->{$pid};
        if (!$old) {
            # first sample for this pid, no usage can be computed yet
            $last_proc_pid_stat->{$pid} = {
                time => $ctime,
                used => $used,
                cpu => 0,
            };
            next;
        }

        my $dtime = ($ctime - $old->{time}) * $cpucount * $cpuinfo->{user_hz};

        if ($dtime <= 1000) {
            # interval too short, reuse the previous value
            $d->{cpu} = $old->{cpu};
            next;
        }

        my $dutime = $used - $old->{used};

        $d->{cpu} = (($dutime/$dtime)* $cpucount) / $d->{cpus};
        $last_proc_pid_stat->{$pid} = {
            time => $ctime,
            used => $used,
            cpu => $d->{cpu},
        };
    }

    return $res if !$full;

    my $qmpclient = PVE::QMPClient->new();

    my $ballooncb = sub {
        my ($vmid, $resp) = @_;

        my $info = $resp->{'return'};
        return if !$info->{max_mem};

        my $d = $res->{$vmid};

        # use memory assigned to VM
        $d->{maxmem} = $info->{max_mem};
        $d->{balloon} = $info->{actual};

        if (defined($info->{total_mem}) && defined($info->{free_mem})) {
            $d->{mem} = $info->{total_mem} - $info->{free_mem};
            $d->{freemem} = $info->{free_mem};
        }
    };

    my $blockstatscb = sub {
        my ($vmid, $resp) = @_;

        my $data = $resp->{'return'} || [];

        # sum up the counters of all block devices
        my ($rd_total, $wr_total) = (0, 0);
        foreach my $blockstat (@$data) {
            $rd_total += $blockstat->{stats}->{rd_bytes};
            $wr_total += $blockstat->{stats}->{wr_bytes};
        }

        $res->{$vmid}->{diskread} = $rd_total;
        $res->{$vmid}->{diskwrite} = $wr_total;
    };

    my $statuscb = sub {
        my ($vmid, $resp) = @_;

        $qmpclient->queue_cmd($vmid, $blockstatscb, 'query-blockstats');
        # this fails if the balloon driver is not loaded, so this must be
        # the last command (following commands are aborted if this fails).
        $qmpclient->queue_cmd($vmid, $ballooncb, 'query-balloon');

        my $status = $resp->{'return'}->{status};
        if (!defined($status)) {
            warn "unable to get VM status\n";
            return;
        }

        $res->{$vmid}->{qmpstatus} = $status;
    };

    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        next if !$res->{$vmid}->{pid}; # not running
        $qmpclient->queue_cmd($vmid, $statuscb, 'query-status');
    }

    $qmpclient->queue_execute(undef, 1);

    # fall back to the process based status where QMP gave no answer
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        my $d = $res->{$vmid};
        $d->{qmpstatus} = $d->{status} if !$d->{qmpstatus};
    }

    return $res;
}
2523
# Call $func->($ds, $drive) for every key $ds of $conf that is a valid
# drive name and whose value parse_drive() accepts; $drive is the parsed
# drive.
sub foreach_drive {
    my ($conf, $func) = @_;

    foreach my $ds (keys %$conf) {
        if (valid_drivename($ds)) {
            my $drive = parse_drive($ds, $conf->{$ds});
            $func->($ds, $drive) if $drive;
        }
    }
}
2536
# Call $func->($volid, $is_cdrom) once for every volume referenced by the
# drives of $conf, by the drives of its snapshots and by the snapshots'
# 'vmstate' entries. When a volume is seen more than once, the cdrom flag
# of the last occurrence wins.
sub foreach_volid {
    my ($conf, $func) = @_;

    my $volhash = {};

    # remember a volume together with its cdrom flag
    my $remember = sub {
        my ($volid, $is_cdrom) = @_;

        return if !$volid;

        $volhash->{$volid} = $is_cdrom || 0;
    };

    # remember the volumes of all drives of one config section
    my $scan_drives = sub {
        my ($section) = @_;

        foreach_drive($section, sub {
            my ($ds, $drive) = @_;
            $remember->($drive->{file}, drive_is_cdrom($drive));
        });
    };

    $scan_drives->($conf);

    foreach my $snapname (keys %{$conf->{snapshots}}) {
        my $snap = $conf->{snapshots}->{$snapname};
        $remember->($snap->{vmstate}, 0);
        $scan_drives->($snap);
    }

    foreach my $volid (keys %$volhash) {
        $func->($volid, $volhash->{$volid});
    }
}
2568
# Return 0 unless $vga is 'qxl', 'qxl2', 'qxl3' or 'qxl4'. For those
# values return the trailing digit, or 1 for plain 'qxl'.
sub vga_conf_has_spice {
    my ($vga) = @_;

    if ($vga && $vga =~ m/^qxl([234])?$/) {
        return $1 || 1;
    }

    return 0;
}
2576
# Translate the VM configuration $conf of VM $vmid into the kvm command
# line.
#
# Parameters:
#   $storecfg     - storage configuration, passed on to the drive helpers
#   $vmid         - ID of the VM
#   $conf         - VM configuration hash
#   $defaults     - default settings, consulted for options $conf leaves
#                   unset
#   $forcemachine - optional machine type, takes precedence over
#                   $conf->{machine}
#
# Returns the command as array reference. In list context the list
# ($cmd, $vollist, $spice_port) is returned: $vollist holds the drive
# files that PVE::Storage::parse_volume_id() accepts, $spice_port is the
# port allocated for spice (undef without a qxl display).
#
# Dies on configuration errors, e.g. a too old kvm binary, more cores than
# the host has, missing serial/parallel devices or an inconsistent NUMA
# layout.
sub config_to_command {
    my ($storecfg, $vmid, $conf, $defaults, $forcemachine) = @_;

    my $cmd = [];
    my $globalFlags = [];
    my $machineFlags = [];
    my $rtcFlags = [];
    my $cpuFlags = [];
    my $devices = [];
    my $pciaddr = '';
    my $bridges = {};
    my $kvmver = kvm_user_version();
    my $vernum = 0; # unknown
    if ($kvmver =~ m/^(\d+)\.(\d+)$/) {
        $vernum = $1*1000000+$2*1000;
    } elsif ($kvmver =~ m/^(\d+)\.(\d+)\.(\d+)$/) {
        $vernum = $1*1000000+$2*1000+$3;
    }

    die "detected old qemu-kvm binary ($kvmver)\n" if $vernum < 15000;

    my $have_ovz = -f '/proc/vz/vestat';

    my $q35 = machine_type_is_q35($conf);

    push @$cmd, '/usr/bin/kvm';

    push @$cmd, '-id', $vmid;

    my $use_virtio = 0;

    my $qmpsocket = qmp_socket($vmid);
    push @$cmd, '-chardev', "socket,id=qmp,path=$qmpsocket,server,nowait";
    push @$cmd, '-mon', "chardev=qmp,mode=control";

    my $socket = vnc_socket($vmid);
    push @$cmd, '-vnc', "unix:$socket,x509,password";

    push @$cmd, '-pidfile' , pidfile_name($vmid);

    push @$cmd, '-daemonize';

    if ($conf->{smbios1}) {
        push @$cmd, '-smbios', "type=1,$conf->{smbios1}";
    }

    push @$cmd, '-object', "iothread,id=iothread0" if $conf->{iothread};

    if ($q35) {
        # the q35 chipset support native usb2, so we enable usb controller
        # by default for this machine type
        push @$devices, '-readconfig', '/usr/share/qemu-server/pve-q35.cfg';
    } else {
        $pciaddr = print_pci_addr("piix3", $bridges);
        push @$devices, '-device', "piix3-usb-uhci,id=uhci$pciaddr.0x2";

        my $use_usb2 = 0;
        for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
            next if !$conf->{"usb$i"};
            $use_usb2 = 1;
        }
        # include usb device config
        push @$devices, '-readconfig', '/usr/share/qemu-server/pve-usb.cfg' if $use_usb2;
    }

    my $vga = $conf->{vga};

    my $qxlnum = vga_conf_has_spice($vga);
    $vga = 'qxl' if $qxlnum;

    if (!$vga) {
        if ($conf->{ostype} && ($conf->{ostype} eq 'win8' ||
                                $conf->{ostype} eq 'win7' ||
                                $conf->{ostype} eq 'w2k8')) {
            $vga = 'std';
        } else {
            $vga = 'cirrus';
        }
    }

    # enable absolute mouse coordinates (needed by vnc)
    my $tablet;
    if (defined($conf->{tablet})) {
        $tablet = $conf->{tablet};
    } else {
        $tablet = $defaults->{tablet};
        $tablet = 0 if $qxlnum; # disable for spice because it is not needed
        $tablet = 0 if $vga =~ m/^serial\d+$/; # disable if we use serial terminal (no vga card)
    }

    push @$devices, '-device', print_tabletdevice_full($conf) if $tablet;

    # host pci devices
    for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
        my $d = parse_hostpci($conf->{"hostpci$i"});
        next if !$d;

        my $pcie = $d->{pcie};
        if ($pcie) {
            die "q35 machine model is not enabled" if !$q35;
            $pciaddr = print_pcie_addr("hostpci$i");
        } else {
            $pciaddr = print_pci_addr("hostpci$i", $bridges);
        }

        my $rombar = $d->{rombar} && $d->{rombar} eq 'off' ? ",rombar=0" : "";
        my $driver = $d->{driver} && $d->{driver} eq 'vfio' ? "vfio-pci" : "pci-assign";
        my $xvga = $d->{'x-vga'} && $d->{'x-vga'} eq 'on' ? ",x-vga=on" : "";
        if ($xvga) {
            # x-vga hides kvm from the guest, disables the emulated vga
            # card and always uses the vfio driver
            push @$cpuFlags, 'kvm=off';
            $vga = 'none';
            $driver = "vfio-pci";
        }
        my $pcidevices = $d->{pciid};
        # plain assignment: 'my $x = ... if COND' has undefined behaviour
        # (perlsyn), which matters even more inside a loop
        my $multifunction = (@$pcidevices > 1) ? 1 : 0;

        my $j=0;
        foreach my $pcidevice (@$pcidevices) {

            my $id = "hostpci$i";
            $id .= ".$j" if $multifunction;
            my $addr = $pciaddr;
            $addr .= ".$j" if $multifunction;
            my $devicestr = "$driver,host=$pcidevice->{id}.$pcidevice->{function},id=$id$addr";

            # per-device options go to the first function only
            if ($j == 0) {
                $devicestr .= "$rombar$xvga";
                $devicestr .= ",multifunction=on" if $multifunction;
            }

            push @$devices, '-device', $devicestr;
            $j++;
        }
    }

    # usb devices
    for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
        my $d = parse_usb_device($conf->{"usb$i"});
        next if !$d;
        if ($d->{vendorid} && $d->{productid}) {
            push @$devices, '-device', "usb-host,vendorid=0x$d->{vendorid},productid=0x$d->{productid}";
        } elsif (defined($d->{hostbus}) && defined($d->{hostport})) {
            push @$devices, '-device', "usb-host,hostbus=$d->{hostbus},hostport=$d->{hostport}";
        } elsif ($d->{spice}) {
            # usb redir support for spice
            push @$devices, '-chardev', "spicevmc,id=usbredirchardev$i,name=usbredir";
            push @$devices, '-device', "usb-redir,chardev=usbredirchardev$i,id=usbredirdev$i,bus=ehci.0";
        }
    }

    # serial devices
    for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
        if (my $path = $conf->{"serial$i"}) {
            if ($path eq 'socket') {
                my $socket = "/var/run/qemu-server/${vmid}.serial$i";
                push @$devices, '-chardev', "socket,id=serial$i,path=$socket,server,nowait";
                push @$devices, '-device', "isa-serial,chardev=serial$i";
            } else {
                die "no such serial device\n" if ! -c $path;
                push @$devices, '-chardev', "tty,id=serial$i,path=$path";
                push @$devices, '-device', "isa-serial,chardev=serial$i";
            }
        }
    }

    # parallel devices
    for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
        if (my $path = $conf->{"parallel$i"}) {
            die "no such parallel device\n" if ! -c $path;
            my $devtype = $path =~ m!^/dev/usb/lp! ? 'tty' : 'parport';
            push @$devices, '-chardev', "$devtype,id=parallel$i,path=$path";
            push @$devices, '-device', "isa-parallel,chardev=parallel$i";
        }
    }

    my $vmname = $conf->{name} || "vm$vmid";

    push @$cmd, '-name', $vmname;

    my $sockets = 1;
    $sockets = $conf->{smp} if $conf->{smp}; # old style - no longer used
    $sockets = $conf->{sockets} if $conf->{sockets};

    my $cores = $conf->{cores} || 1;
    my $maxcpus = $conf->{maxcpus};

    my $total_cores = $sockets * $cores;
    my $allowed_cores = $cpuinfo->{cpus};

    die "MAX $allowed_cores cores allowed per VM on this node\n"
        if ($allowed_cores < $total_cores);

    if ($maxcpus) {
        push @$cmd, '-smp', "cpus=$cores,maxcpus=$maxcpus";
    } else {
        push @$cmd, '-smp', "sockets=$sockets,cores=$cores";
    }

    push @$cmd, '-nodefaults';

    my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};

    # every letter of the boot order gets its own bootindex range
    my $bootindex_hash = {};
    my $i = 1;
    foreach my $o (split(//, $bootorder)) {
        $bootindex_hash->{$o} = $i*100;
        $i++;
    }

    push @$cmd, '-boot', "menu=on";

    push @$cmd, '-no-acpi' if defined($conf->{acpi}) && $conf->{acpi} == 0;

    push @$cmd, '-no-reboot' if defined($conf->{reboot}) && $conf->{reboot} == 0;

    push @$cmd, '-vga', $vga if $vga && $vga !~ m/^serial\d+$/; # for kvm 77 and later

    # time drift fix
    my $tdf = defined($conf->{tdf}) ? $conf->{tdf} : $defaults->{tdf};

    my $nokvm = defined($conf->{kvm}) && $conf->{kvm} == 0 ? 1 : 0;
    my $useLocaltime = $conf->{localtime};

    if (my $ost = $conf->{ostype}) {
        # other, wxp, w2k, w2k3, w2k8, wvista, win7, win8, l24, l26, solaris

        if ($ost =~ m/^w/) { # windows
            $useLocaltime = 1 if !defined($conf->{localtime});

            # use time drift fix when acpi is enabled
            if (!(defined($conf->{acpi}) && $conf->{acpi} == 0)) {
                $tdf = 1 if !defined($conf->{tdf});
            }
        }

        if ($ost eq 'win7' || $ost eq 'win8' || $ost eq 'w2k8' ||
            $ost eq 'wvista') {
            push @$globalFlags, 'kvm-pit.lost_tick_policy=discard';
            push @$cmd, '-no-hpet';
            #push @$cpuFlags , 'hv_vapic" if !$nokvm; #fixme, my win2008R2 hang at boot with this
            push @$cpuFlags , 'hv_spinlocks=0xffff' if !$nokvm;
        }

        if ($ost eq 'win7' || $ost eq 'win8') {
            push @$cpuFlags , 'hv_relaxed' if !$nokvm;
        }
    }

    push @$rtcFlags, 'driftfix=slew' if $tdf;

    if ($nokvm) {
        push @$machineFlags, 'accel=tcg';
    } else {
        die "No accelerator found!\n" if !$cpuinfo->{hvm};
    }

    my $machine_type = $forcemachine || $conf->{machine};
    if ($machine_type) {
        push @$machineFlags, "type=${machine_type}";
    }

    if ($conf->{startdate}) {
        push @$rtcFlags, "base=$conf->{startdate}";
    } elsif ($useLocaltime) {
        push @$rtcFlags, 'base=localtime';
    }

    my $cpu = $nokvm ? "qemu64" : "kvm64";
    $cpu = $conf->{cpu} if $conf->{cpu};

    # ostype is optional; compare against a defined value so that no
    # 'uninitialized value' warning is raised
    my $ostype = defined($conf->{ostype}) ? $conf->{ostype} : '';

    push @$cpuFlags , '+lahf_lm' if $cpu eq 'kvm64';

    push @$cpuFlags , '+x2apic' if !$nokvm && $ostype ne 'solaris';

    push @$cpuFlags , '-x2apic' if $ostype eq 'solaris';

    push @$cpuFlags, '+sep' if $cpu eq 'kvm64' || $cpu eq 'kvm32';

    $cpu .= "," . join(',', @$cpuFlags) if scalar(@$cpuFlags);

    # Note: enforce needs kernel 3.10, so we do not use it for now
    # push @$cmd, '-cpu', "$cpu,enforce";
    push @$cmd, '-cpu', $cpu;

    my $memory = $conf->{memory} || $defaults->{memory};
    push @$cmd, '-m', $memory;

    if ($conf->{numa}) {

        my $numa_totalmemory = undef;
        for (my $i = 0; $i < $MAX_NUMA; $i++) {
            next if !$conf->{"numa$i"};
            my $numa = parse_numa($conf->{"numa$i"});
            next if !$numa;
            # memory
            die "missing numa node$i memory value\n" if !$numa->{memory};
            my $numa_memory = $numa->{memory};
            $numa_totalmemory += $numa_memory;
            my $numa_object = "memory-backend-ram,id=ram-node$i,size=$numa_memory"."M";

            # cpus
            my $cpus_start = $numa->{cpus}->{start};
            die "missing numa node$i cpus\n" if !defined($cpus_start);
            my $cpus_end = $numa->{cpus}->{end};
            my $cpus = $cpus_start;
            if (defined($cpus_end)) {
                $cpus .= "-$cpus_end";
                die "numa node$i : cpu range $cpus is incorrect\n" if $cpus_end <= $cpus_start;
            }

            # hostnodes
            my $hostnodes_start = $numa->{hostnodes}->{start};
            if (defined($hostnodes_start)) {
                my $hostnodes_end = $numa->{hostnodes}->{end};
                my $hostnodes = $hostnodes_start;
                if (defined($hostnodes_end)) {
                    $hostnodes .= "-$hostnodes_end";
                    die "host node $hostnodes range is incorrect\n" if $hostnodes_end <= $hostnodes_start;
                }

                # every host node of the range has to exist
                my $hostnodes_end_range = defined($hostnodes_end) ? $hostnodes_end : $hostnodes_start;
                for (my $hn = $hostnodes_start; $hn <= $hostnodes_end_range; $hn++ ) {
                    die "host numa node$hn don't exist\n" if ! -d "/sys/devices/system/node/node$hn/";
                }

                # policy
                my $policy = $numa->{policy};
                die "you need to define a policy for hostnode $hostnodes\n" if !$policy;
                $numa_object .= ",host-nodes=$hostnodes,policy=$policy";
            }

            push @$cmd, '-object', $numa_object;
            push @$cmd, '-numa', "node,nodeid=$i,cpus=$cpus,memdev=ram-node$i";
        }

        die "total memory for NUMA nodes must be equal to vm memory\n"
            if $numa_totalmemory && $numa_totalmemory != $memory;

        # if no custom topology, we split memory and cores across numa nodes
        if (!$numa_totalmemory) {

            my $numa_memory = ($memory / $sockets) . "M";

            for (my $i = 0; $i < $sockets; $i++) {

                my $cpustart = ($cores * $i);
                # a single core per socket needs no range
                my $cpuend = ($cores && $cores > 1) ? ($cpustart + $cores - 1) : undef;
                my $cpus = $cpustart;
                $cpus .= "-$cpuend" if defined($cpuend);

                push @$cmd, '-object', "memory-backend-ram,size=$numa_memory,id=ram-node$i";
                push @$cmd, '-numa', "node,nodeid=$i,cpus=$cpus,memdev=ram-node$i";
            }
        }
    }

    push @$cmd, '-S' if $conf->{freeze};

    # set keyboard layout
    my $kb = $conf->{keyboard} || $defaults->{keyboard};
    push @$cmd, '-k', $kb if $kb;

    # enable sound
    #my $soundhw = $conf->{soundhw} || $defaults->{soundhw};
    #push @$cmd, '-soundhw', 'es1370';
    #push @$cmd, '-soundhw', $soundhw if $soundhw;

    if ($conf->{agent}) {
        my $qgasocket = qmp_socket($vmid, 1);
        my $pciaddr = print_pci_addr("qga0", $bridges);
        push @$devices, '-chardev', "socket,path=$qgasocket,server,nowait,id=qga0";
        push @$devices, '-device', "virtio-serial,id=qga0$pciaddr";
        push @$devices, '-device', 'virtserialport,chardev=qga0,name=org.qemu.guest_agent.0';
    }

    my $spice_port;

    if ($qxlnum) {
        if ($qxlnum > 1) {
            if ($conf->{ostype} && $conf->{ostype} =~ m/^w/) {
                # windows: one additional qxl device per extra monitor
                for (my $i = 1; $i < $qxlnum; $i++) {
                    my $pciaddr = print_pci_addr("vga$i", $bridges);
                    push @$cmd, '-device', "qxl,id=vga$i,ram_size=67108864,vram_size=33554432$pciaddr";
                }
            } else {
                # assume other OS works like Linux
                push @$cmd, '-global', 'qxl-vga.ram_size=134217728';
                push @$cmd, '-global', 'qxl-vga.vram_size=67108864';
            }
        }

        my $pciaddr = print_pci_addr("spice", $bridges);

        $spice_port = PVE::Tools::next_spice_port();

        push @$devices, '-spice', "tls-port=${spice_port},addr=127.0.0.1,tls-ciphers=DES-CBC3-SHA,seamless-migration=on";

        push @$devices, '-device', "virtio-serial,id=spice$pciaddr";
        push @$devices, '-chardev', "spicevmc,id=vdagent,name=vdagent";
        push @$devices, '-device', "virtserialport,chardev=vdagent,name=com.redhat.spice.0";
    }

    # enable balloon by default, unless explicitly disabled
    if (!defined($conf->{balloon}) || $conf->{balloon}) {
        $pciaddr = print_pci_addr("balloon0", $bridges);
        push @$devices, '-device', "virtio-balloon-pci,id=balloon0$pciaddr";
    }

    if ($conf->{watchdog}) {
        my $wdopts = parse_watchdog($conf->{watchdog});
        $pciaddr = print_pci_addr("watchdog", $bridges);
        my $watchdog = $wdopts->{model} || 'i6300esb';
        push @$devices, '-device', "$watchdog$pciaddr";
        push @$devices, '-watchdog-action', $wdopts->{action} if $wdopts->{action};
    }

    my $vollist = [];
    my $scsicontroller = {};
    my $ahcicontroller = {};
    my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : $defaults->{scsihw};

    # Add iscsi initiator name if available
    if (my $initiator = get_initiator_name()) {
        push @$devices, '-iscsi', "initiator-name=$initiator";
    }

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        if (PVE::Storage::parse_volume_id($drive->{file}, 1)) {
            push @$vollist, $drive->{file};
        }

        $use_virtio = 1 if $ds =~ m/^virtio/;

        if (drive_is_cdrom ($drive)) {
            if ($bootindex_hash->{d}) {
                $drive->{bootindex} = $bootindex_hash->{d};
                $bootindex_hash->{d} += 1;
            }
        } else {
            if ($bootindex_hash->{c}) {
                # only the configured boot disk gets a bootindex
                $drive->{bootindex} = $bootindex_hash->{c} if $conf->{bootdisk} && ($conf->{bootdisk} eq $ds);
                $bootindex_hash->{c} += 1;
            }
        }

        if ($drive->{interface} eq 'scsi') {

            # add the controller for this drive once
            my $maxdev = ($scsihw !~ m/^lsi/) ? 256 : 7;
            my $controller = int($drive->{index} / $maxdev);
            $pciaddr = print_pci_addr("scsihw$controller", $bridges);
            push @$devices, '-device', "$scsihw,id=scsihw$controller$pciaddr" if !$scsicontroller->{$controller};
            $scsicontroller->{$controller}=1;
        }

        if ($drive->{interface} eq 'sata') {
            my $controller = int($drive->{index} / $MAX_SATA_DISKS);
            $pciaddr = print_pci_addr("ahci$controller", $bridges);
            push @$devices, '-device', "ahci,id=ahci$controller,multifunction=on$pciaddr" if !$ahcicontroller->{$controller};
            $ahcicontroller->{$controller}=1;
        }

        my $drive_cmd = print_drive_full($storecfg, $vmid, $drive);
        push @$devices, '-drive',$drive_cmd;
        push @$devices, '-device', print_drivedevice_full($storecfg, $conf, $vmid, $drive, $bridges);
    });

    for (my $i = 0; $i < $MAX_NETS; $i++) {
        next if !$conf->{"net$i"};
        my $d = parse_net($conf->{"net$i"});
        next if !$d;

        $use_virtio = 1 if $d->{model} eq 'virtio';

        if ($bootindex_hash->{n}) {
            $d->{bootindex} = $bootindex_hash->{n};
            $bootindex_hash->{n} += 1;
        }

        my $netdevfull = print_netdev_full($vmid,$conf,$d,"net$i");
        push @$devices, '-netdev', $netdevfull;

        my $netdevicefull = print_netdevice_full($vmid,$conf,$d,"net$i",$bridges);
        push @$devices, '-device', $netdevicefull;
    }

    if (!$q35) {
        # add pci bridges; they are put in front of the devices collected
        # so far
        foreach my $k (keys %$bridges) {
            $pciaddr = print_pci_addr("pci.$k");
            unshift @$devices, '-device', "pci-bridge,id=pci.$k,chassis_nr=$k$pciaddr" if $k > 0;
        }
    }

    # hack: virtio with fairsched is unreliable, so we do not use fairsched
    # when the VM uses virtio devices.
    if (!$use_virtio && $have_ovz) {

        my $cpuunits = defined($conf->{cpuunits}) ?
            $conf->{cpuunits} : $defaults->{cpuunits};

        push @$cmd, '-cpuunits', $cpuunits if $cpuunits;

        # fixme: cpulimit is currently ignored
        #push @$cmd, '-cpulimit', $conf->{cpulimit} if $conf->{cpulimit};
    }

    # add custom args
    if ($conf->{args}) {
        my $aa = PVE::Tools::split_args($conf->{args});
        push @$cmd, @$aa;
    }

    push @$cmd, @$devices;
    push @$cmd, '-rtc', join(',', @$rtcFlags)
        if scalar(@$rtcFlags);
    push @$cmd, '-machine', join(',', @$machineFlags)
        if scalar(@$machineFlags);
    push @$cmd, '-global', join(',', @$globalFlags)
        if scalar(@$globalFlags);

    return wantarray ? ($cmd, $vollist, $spice_port) : $cmd;
}
3101
# Return the path of the VNC unix socket of VM $vmid
# ('<vmid>.vnc' below $var_run_tmpdir).
sub vnc_socket {
    my ($vmid) = @_;

    return $var_run_tmpdir . "/$vmid.vnc";
}
3106
# Ask the running VM $vmid for its spice port ('query-spice' monitor
# command). The TLS port is preferred over the plain port; dies with
# "no spice port\n" when neither is set.
sub spice_port {
    my ($vmid) = @_;

    my $res = vm_mon_cmd($vmid, 'query-spice');

    my $port = $res->{'tls-port'} || $res->{'port'};
    die "no spice port\n" if !$port;

    return $port;
}
3114
# Return the path of a monitor socket of VM $vmid below $var_run_tmpdir:
# '<vmid>.qga' when $qga is true, '<vmid>.qmp' otherwise.
sub qmp_socket {
    my ($vmid, $qga) = @_;

    my $suffix = 'qmp';
    $suffix = 'qga' if $qga;

    return $var_run_tmpdir . "/$vmid.$suffix";
}
3120
# Return the path of the pid file of VM $vmid
# ('<vmid>.pid' below $var_run_tmpdir).
sub pidfile_name {
    my ($vmid) = @_;

    return $var_run_tmpdir . "/$vmid.pid";
}
3125
# Query the running VM $vmid and return a hash reference whose keys are
# the IDs of the devices that are currently present:
#  - the 'qdev_id' of every PCI device ('query-pci')
#  - the name of every block device 'drive-<name>' ('query-block')
#  - 'tablet' when a 'QEMU HID Tablet' is listed ('query-mice')
sub vm_devices_list {
    my ($vmid) = @_;

    my $devices = {};

    my $respci = vm_mon_cmd($vmid, 'query-pci');
    foreach my $pcibus (@$respci) {
        foreach my $device (@{$pcibus->{devices}}) {
            my $id = $device->{'qdev_id'};
            $devices->{$id} = 1 if $id;
        }
    }

    my $resblock = vm_mon_cmd($vmid, 'query-block');
    foreach my $block (@$resblock) {
        my ($id) = $block->{device} =~ m/^drive-(\S+)/;
        $devices->{$id} = 1 if defined($id);
    }

    my $resmice = vm_mon_cmd($vmid, 'query-mice');
    foreach my $mouse (@$resmice) {
        next if $mouse->{name} ne 'QEMU HID Tablet';
        $devices->{tablet} = 1;
        last;
    }

    return $devices;
}
3155
# Hotplug the device $deviceid into the running VM $vmid.
#
# Parameters:
#   $storecfg - storage configuration, passed on to the drive helpers
#   $conf     - VM configuration; hotplug must be enabled in it
#   $vmid     - ID of the VM
#   $deviceid - 'tablet', 'virtioN', 'scsihwN', 'scsiN', 'netN' or (on
#               non-q35 machines) 'pci.N'
#   $device   - parsed drive / network device for the drive and net cases
#
# Returns 1 on success and when the device is already present. Dies on
# error and for device IDs that cannot be hotplugged.
# NOTE(review): the net branch still returns undef when qemu_netdevadd()
# returns false - confirm whether that helper can fail without dying.
sub vm_deviceplug {
    my ($storecfg, $conf, $vmid, $deviceid, $device) = @_;

    die "internal error" if !$conf->{hotplug};

    my $q35 = machine_type_is_q35($conf);

    my $devices_list = vm_devices_list($vmid);
    return 1 if defined($devices_list->{$deviceid});

    qemu_add_pci_bridge($storecfg, $conf, $vmid, $deviceid); # add PCI bridge if we need it for the device

    if ($deviceid eq 'tablet') {

        qemu_deviceadd($vmid, print_tabletdevice_full($conf));

    } elsif ($deviceid =~ m/^(virtio)(\d+)$/) {

        qemu_driveadd($storecfg, $vmid, $device);
        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);

        # Remove the drive again when the device cannot be added or does
        # not show up. Adding the device is now covered as well (as in the
        # scsi branch); before, a failing qemu_deviceadd() left the drive
        # behind.
        eval {
            qemu_deviceadd($vmid, $devicefull);
            qemu_deviceaddverify($vmid, $deviceid);
        };
        if (my $err = $@) {
            eval { qemu_drivedel($vmid, $deviceid); };
            warn $@ if $@;
            die $err;
        }

    } elsif ($deviceid =~ m/^(scsihw)(\d+)$/) {

        my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : "lsi";
        my $pciaddr = print_pci_addr($deviceid);
        my $devicefull = "$scsihw,id=$deviceid$pciaddr";

        qemu_deviceadd($vmid, $devicefull);
        qemu_deviceaddverify($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        qemu_findorcreatescsihw($storecfg,$conf, $vmid, $device);
        qemu_driveadd($storecfg, $vmid, $device);

        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);
        eval { qemu_deviceadd($vmid, $devicefull); };
        if (my $err = $@) {
            eval { qemu_drivedel($vmid, $deviceid); };
            warn $@ if $@;
            die $err;
        }

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        return undef if !qemu_netdevadd($vmid, $conf, $device, $deviceid);
        my $netdevicefull = print_netdevice_full($vmid, $conf, $device, $deviceid);

        # same cleanup rule as for drives: do not leave the netdev
        # backend behind when the device itself cannot be added
        eval {
            qemu_deviceadd($vmid, $netdevicefull);
            qemu_deviceaddverify($vmid, $deviceid);
        };
        if (my $err = $@) {
            eval { qemu_netdevdel($vmid, $deviceid); };
            warn $@ if $@;
            die $err;
        }

    } elsif (!$q35 && $deviceid =~ m/^(pci\.)(\d+)$/) {

        my $bridgeid = $2;
        my $pciaddr = print_pci_addr($deviceid);
        my $devicefull = "pci-bridge,id=pci.$bridgeid,chassis_nr=$bridgeid$pciaddr";

        qemu_deviceadd($vmid, $devicefull);
        qemu_deviceaddverify($vmid, $deviceid);

    } else {
        die "can't hotplug device '$deviceid'\n";
    }

    return 1;
}
3234
# Hot-unplug the device $deviceid from the running VM $vmid.
#
# $conf     - VM configuration; $conf->{hotplug} must be set
# $deviceid - 'tablet', 'virtioN', 'scsihwN' (or legacy 'lsiN'),
#             'scsiN' or 'netN'
#
# Returns 1 on success, also when the device is not plugged at all.
# Raises an exception on error; the configured boot disk is refused.
sub vm_deviceunplug {
    my ($vmid, $conf, $deviceid) = @_;

    die "internal error" if !$conf->{hotplug};

    my $devices_list = vm_devices_list($vmid);
    return 1 if !defined($devices_list->{$deviceid});

    die "can't unplug bootdisk" if $conf->{bootdisk} && $conf->{bootdisk} eq $deviceid;

    if ($deviceid eq 'tablet') {

        qemu_devicedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(virtio)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);
        qemu_drivedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(lsi|scsihw)(\d+)$/) {

        # vm_deviceplug creates SCSI controllers with the id 'scsihwN';
        # 'lsiN' is still accepted for backward compatibility
        qemu_devicedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);
        qemu_drivedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        qemu_devicedel($vmid, $deviceid);
        qemu_devicedelverify($vmid, $deviceid);
        qemu_netdevdel($vmid, $deviceid);

    } else {
        die "can't unplug device '$deviceid'\n";
    }

    return 1;
}
3277
# Issue the QMP 'device_add' command for a "driver,key=value,..." device
# string. The string is split on '=' and ',' into option pairs, with the
# leading driver name stored under the key 'driver'.
sub qemu_deviceadd {
    my ($vmid, $devicefull) = @_;

    my %options = split(/[=,]/, "driver=" . $devicefull);

    return vm_mon_cmd($vmid, "device_add", %options);
}
3286
# Issue the QMP 'device_del' command for $deviceid and return its result.
sub qemu_devicedel {
    my ($vmid, $deviceid) = @_;

    my $result = vm_mon_cmd($vmid, "device_del", id => $deviceid);

    return $result;
}
3292
# Add the drive backend for $device through the human monitor command
# 'drive_add'. Returns 1 on success and dies with the monitor reply
# otherwise.
sub qemu_driveadd {
    my ($storecfg, $vmid, $device) = @_;

    my $drive = print_drive_full($storecfg, $vmid, $device);
    my $reply = vm_human_monitor_command($vmid, "drive_add auto $drive");

    # If the command succeeds qemu prints: "OK"
    die "adding drive failed: $reply\n" if $reply !~ m/OK/s;

    return 1;
}
3304
# Remove the drive backend 'drive-$deviceid' through the human monitor
# command 'drive_del'. Returns 1 on success and dies with the monitor
# reply otherwise.
sub qemu_drivedel {
    my ($vmid, $deviceid) = @_;

    my $reply = vm_human_monitor_command($vmid, "drive_del drive-$deviceid");
    $reply =~ s/^\s+//;

    # An empty reply means success.
    # NB: device not found errors mean the drive was auto-deleted and we ignore the error
    if ($reply eq "" || $reply =~ m/Device \'.*?\' not found/s) {
        return 1;
    }

    die "deleting drive $deviceid failed : $reply\n";
}
3318
# Wait until $deviceid shows up in the device list of the VM.
# Checks up to six times with a one second pause after each failed
# check. Returns 1 once the device is present, dies otherwise.
sub qemu_deviceaddverify {
    my ($vmid, $deviceid) = @_;

    foreach my $attempt (0 .. 5) {
        return 1 if defined(vm_devices_list($vmid)->{$deviceid});
        sleep 1;
    }

    die "error on hotplug device '$deviceid'\n";
}
3330
3331
# Wait until $deviceid has vanished from the device list of the VM.
# Checks up to six times with a one second pause after each failed
# check. Returns 1 once the device is gone, dies otherwise.
sub qemu_devicedelverify {
    my ($vmid, $deviceid) = @_;

    # device_del is asynchronous and its empty return value is not
    # reliable, so the removal has to be confirmed by polling

    foreach my $attempt (0 .. 5) {
        return 1 if !defined(vm_devices_list($vmid)->{$deviceid});
        sleep 1;
    }

    die "error on hot-unplugging device '$deviceid'\n";
}
3346
# Make sure the SCSI controller serving the drive $device exists in the
# running VM, hot-plugging it when it is missing. Always returns 1.
sub qemu_findorcreatescsihw {
    my ($storecfg, $conf, $vmid, $device) = @_;

    # 7 devices per controller for lsi models (the default), 256 otherwise
    my $is_lsi = !$conf->{scsihw} || $conf->{scsihw} =~ m/^lsi/;
    my $devs_per_controller = $is_lsi ? 7 : 256;

    my $scsihwid = "scsihw" . int($device->{index} / $devs_per_controller);

    my $plugged = vm_devices_list($vmid);
    vm_deviceplug($storecfg, $conf, $vmid, $scsihwid)
        if !defined($plugged->{$scsihwid});

    return 1;
}
3361
# Hot-plug the PCI bridge 'pci.N' needed by the device id $device, if
# one is needed and it is not plugged yet. Always returns 1.
sub qemu_add_pci_bridge {
    my ($storecfg, $conf, $vmid, $device) = @_;

    # print_pci_addr is expected to record the needed bridge ids as keys
    # of the hash passed as second argument
    my $bridges = {};
    print_pci_addr($device, $bridges);

    # use the last key in hash iteration order
    my $bridgeid = (keys %$bridges)[-1];

    return 1 if !defined($bridgeid);
    return 1 if $bridgeid < 1;

    my $bridge = "pci.$bridgeid";

    my $plugged = vm_devices_list($vmid);
    vm_deviceplug($storecfg, $conf, $vmid, $bridge)
        if !defined($plugged->{$bridge});

    return 1;
}
3385
# Add the network backend for $deviceid with the QMP 'netdev_add'
# command. The "key=value,..." string from print_netdev_full is split
# on '=' and ',' into option pairs. Returns 1.
sub qemu_netdevadd {
    my ($vmid, $conf, $device, $deviceid) = @_;

    my %options = split(/[=,]/, print_netdev_full($vmid, $conf, $device, $deviceid));

    vm_mon_cmd($vmid, "netdev_add", %options);

    return 1;
}
3395
# Remove the network backend $deviceid with the QMP 'netdev_del' command.
sub qemu_netdevdel {
    my ($vmid, $deviceid) = @_;

    return vm_mon_cmd($vmid, "netdev_del", id => $deviceid);
}
3401
# Hot-add CPUs to the running VM until it has $cores cores.
# Dies when the VM uses more than one socket, when 'maxcpus' is unset
# or exceeded, when $cores is lower than the configured core count, or
# when the running CPU count differs from the configuration.
sub qemu_cpu_hotplug {
    my ($vmid, $conf, $cores) = @_;

    if (($conf->{sockets} || 1) > 1) {
        die "cpu hotplug only works with one socket\n";
    }

    my $maxcpus = $conf->{maxcpus};
    if (!$maxcpus) {
        die "maxcpus is not defined\n";
    }
    if ($cores > $maxcpus) {
        die "you can't add more cores than maxcpus\n";
    }

    my $configured = $conf->{cores} || 1;
    if ($cores < $configured) {
        die "online cpu unplug is not yet possible\n";
    }

    my $running_cpus = vm_mon_cmd($vmid, "query-cpus");
    if (scalar(@$running_cpus) != $configured) {
        die "cores number if running vm is different than configuration\n";
    }

    # add the missing cpus one by one
    my $cpu_id = $configured;
    while ($cpu_id < $cores) {
        vm_mon_cmd($vmid, "cpu-add", id => int($cpu_id));
        $cpu_id++;
    }
}
3427
# Apply I/O throttling limits to the block device $deviceid with the QMP
# 'block_set_io_throttle' command. Does nothing if the VM is not running.
# All limits are passed on as integers.
sub qemu_block_set_io_throttle {
    my ($vmid, $deviceid, $bps, $bps_rd, $bps_wr, $iops, $iops_rd, $iops_wr) = @_;

    return if !check_running($vmid);

    my %limits = (
        bps     => int($bps),
        bps_rd  => int($bps_rd),
        bps_wr  => int($bps_wr),
        iops    => int($iops),
        iops_rd => int($iops_rd),
        iops_wr => int($iops_wr),
    );

    vm_mon_cmd($vmid, "block_set_io_throttle", device => $deviceid, %limits);
}
3436
# old code, only used to shutdown old VM after update
#
# Read from $fh until a chunk ends with the monitor prompt "(qemu) " or
# the handle reaches EOF, and return the collected text without the
# prompt. Dies on read errors and when nothing becomes readable within
# $timeout seconds.
sub __read_avail {
    my ($fh, $timeout) = @_;

    my $select = IO::Select->new($fh);

    my $output = '';
    my @ready;

    while (scalar(@ready = $select->can_read($timeout))) {
        my $chunk;
        my $nread = $fh->sysread($chunk, 8192);

        die "$!\n" if !defined($nread); # read error
        last if !$nread;                # EOF

        if ($chunk =~ /^(.*)\(qemu\) $/s) {
            $output .= $1;
            last;
        }

        $output .= $chunk;
    }

    # @ready is only empty here when can_read() ran into the timeout
    die "monitor read timeout\n" if !scalar(@ready);

    return $output;
}
3469
# old code, only used to shutdown old VM after update
#
# Send the human monitor command $cmdstr to the legacy monitor socket
# "${var_run_tmpdir}/$vmid.mon" and return the reply text.
#
# $nocheck is passed through to check_running().
#
# Returns the reply with the echoed command line removed, or undef for
# 'q'/'quit' (no reply is read for those). Any error is written to
# syslog and re-thrown.
sub vm_monitor_command {
    my ($vmid, $cmdstr, $nocheck) = @_;

    my $res;

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);

        my $sname = "${var_run_tmpdir}/$vmid.mon";

        my $sock = IO::Socket::UNIX->new( Peer => $sname ) ||
            die "unable to connect to VM $vmid socket - $!\n";

        # timeout (seconds) for reading the banner and for becoming writable
        my $timeout = 3;

        # hack: migrate sometime blocks the monitor (when migrate_downtime
        # is set)
        if ($cmdstr =~ m/^(info\s+migrate|migrate\s)/) {
            $timeout = 60*60; # 1 hour
        }

        # read banner;
        my $data = __read_avail($sock, $timeout);

        if ($data !~ m/^QEMU\s+(\S+)\s+monitor\s/) {
            die "got unexpected qemu monitor banner\n";
        }

        my $sel = new IO::Select;
        $sel->add($sock);

        if (!scalar(my @ready = $sel->can_write($timeout))) {
            die "monitor write error - timeout";
        }

        my $fullcmd = "$cmdstr\r";

        # syslog('info', "VM $vmid monitor command: $cmdstr");

        # the whole command has to be written with a single syswrite
        my $b;
        if (!($b = $sock->syswrite($fullcmd)) || ($b != length($fullcmd))) {
            die "monitor write error - $!";
        }

        # this only leaves the eval block; $res stays undef
        return if ($cmdstr eq 'q') || ($cmdstr eq 'quit');

        # timeout (seconds) for reading the reply
        $timeout = 20;

        if ($cmdstr =~ m/^(info\s+migrate|migrate\s)/) {
            $timeout = 60*60; # 1 hour
        } elsif ($cmdstr =~ m/^(eject|change)/) {
            $timeout = 60; # note: cdrom mount command is slow
        }
        if ($res = __read_avail($sock, $timeout)) {

            my @lines = split("\r?\n", $res);

            shift @lines if $lines[0] !~ m/^unknown command/; # skip echo

            $res = join("\n", @lines);
            $res .= "\n";
        }
    };

    my $err = $@;

    if ($err) {
        syslog("err", "VM $vmid monitor command failed - $err");
        die $err;
    }

    return $res;
}
3544
# Resize the volume $volid on the storage layer and, if the VM is
# running, tell qemu about the new size of the block device $deviceid.
# Nothing is sent to qemu when the storage layer returns a false value.
sub qemu_block_resize {
    my ($vmid, $deviceid, $storecfg, $volid, $size) = @_;

    my $running = check_running($vmid);

    my $resized = PVE::Storage::volume_resize($storecfg, $volid, $size, $running);
    return if !$resized || !$running;

    return vm_mon_cmd($vmid, "block_resize", device => $deviceid, size => int($size));
}
3557
# Create the snapshot $snap of the volume $volid on the storage layer
# and, if the VM is running, send 'snapshot-drive' for $deviceid to qemu.
# Nothing is sent to qemu when the storage layer returns a false value.
sub qemu_volume_snapshot {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $running = check_running($vmid);

    my $snapshotted = PVE::Storage::volume_snapshot($storecfg, $volid, $snap, $running);
    return if !$snapshotted || !$running;

    return vm_mon_cmd($vmid, "snapshot-drive", device => $deviceid, name => $snap);
}
3570
# Delete the snapshot $snap of the volume $volid on the storage layer
# and, if the VM is running, send 'delete-drive-snapshot' for $deviceid
# to qemu. Nothing is sent to qemu when the storage layer returns a
# false value.
sub qemu_volume_snapshot_delete {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $running = check_running($vmid);

    my $deleted = PVE::Storage::volume_snapshot_delete($storecfg, $volid, $snap, $running);
    return if !$deleted || !$running;

    return vm_mon_cmd($vmid, "delete-drive-snapshot", device => $deviceid, name => $snap);
}
3582
# Set every migration capability reported by the VM: 'auto-converge' is
# switched on, all other capabilities are switched off.
sub set_migration_caps {
    my ($vmid) = @_;

    # capabilities missing from this table are disabled as well
    my %want_enabled = (
        "auto-converge" => 1,
        "xbzrle" => 0,
        "x-rdma-pin-all" => 0,
        "zero-blocks" => 0,
    );

    my $supported = vm_mon_cmd_nocheck($vmid, "query-migrate-capabilities");

    my @caps = map {
        +{
            capability => $_->{capability},
            state => $want_enabled{$_->{capability}} ? JSON::true : JSON::false,
        }
    } @$supported;

    vm_mon_cmd_nocheck($vmid, "migrate-set-capabilities", capabilities => \@caps);
}
3606
# hotplug changes in [PENDING]
# $selection hash can be used to only apply specified options, for
# example: { cores => 1 } (only apply changed 'cores')
# $errors ref is used to return error messages
#
# Works in three steps:
#  1. options without impact on the running VM are committed directly
#  2. pending deletions are hot-applied
#  3. pending additions/changes are hot-applied
# After each successfully applied option the config is written and
# reloaded. Options which cannot be hot-applied stay pending (the
# internal "skip\n" exception is not reported as an error).
sub vmconfig_hotplug_pending {
    my ($vmid, $conf, $storecfg, $selection, $errors) = @_;

    my $defaults = load_defaults();

    # commit values which do not have any impact on running VM first
    # Note: those options cannot raise errors, so we do not care about
    # $selection and always apply them.

    # record a hotplug failure for $opt in the caller supplied $errors hash
    my $add_error = sub {
        my ($opt, $msg) = @_;
        $errors->{$opt} = "hotplug problem - $msg";
    };

    my $changes = 0;
    foreach my $opt (keys %{$conf->{pending}}) { # add/change
        if ($opt eq 'name' || $opt eq 'hotplug' || $opt eq 'onboot' || $opt eq 'shares') {
            $conf->{$opt} = $conf->{pending}->{$opt};
            delete $conf->{pending}->{$opt};
            $changes = 1;
        }
    }

    if ($changes) {
        update_config_nolock($vmid, $conf, 1);
        $conf = load_config($vmid); # update/reload
    }

    # evaluated after the commit above, so a pending 'hotplug' change
    # is already taken into account
    my $hotplug = defined($conf->{hotplug}) ? $conf->{hotplug} : $defaults->{hotplug};

    # step 2: pending deletions
    my @delete = PVE::Tools::split_list($conf->{pending}->{delete});
    foreach my $opt (@delete) {
        next if $selection && !$selection->{$opt};
        eval {
            if ($opt eq 'tablet') {
                die "skip\n" if !$hotplug;
                # deleting the option restores the default setting
                if ($defaults->{tablet}) {
                    vm_deviceplug($storecfg, $conf, $vmid, $opt);
                } else {
                    vm_deviceunplug($vmid, $conf, $opt);
                }
            } elsif ($opt eq 'cores') {
                die "skip\n" if !$hotplug;
                # deleting 'cores' requests a single core
                qemu_cpu_hotplug($vmid, $conf, 1);
            } elsif ($opt =~ m/^net(\d+)$/) {
                die "skip\n" if !$hotplug;
                vm_deviceunplug($vmid, $conf, $opt);
            } else {
                die "skip\n";
            }
        };
        if (my $err = $@) {
            &$add_error($opt, $err) if $err ne "skip\n";
        } else {
            # save new config if hotplug was successful
            delete $conf->{$opt};
            vmconfig_undelete_pending_option($conf, $opt);
            update_config_nolock($vmid, $conf, 1);
            $conf = load_config($vmid); # update/reload
        }
    }

    # step 3: pending additions/changes
    foreach my $opt (keys %{$conf->{pending}}) {
        next if $selection && !$selection->{$opt};
        my $value = $conf->{pending}->{$opt};
        eval {
            if ($opt eq 'tablet') {
                die "skip\n" if !$hotplug;
                if ($value == 1) {
                    vm_deviceplug($storecfg, $conf, $vmid, $opt);
                } elsif ($value == 0) {
                    vm_deviceunplug($vmid, $conf, $opt);
                }
            } elsif ($opt eq 'cores') {
                die "skip\n" if !$hotplug;
                qemu_cpu_hotplug($vmid, $conf, $value);
            } elsif ($opt eq 'balloon') {
                die "skip\n" if !(defined($conf->{shares}) && ($conf->{shares} == 0));
                # allow manual ballooning if shares is set to zero
                my $balloon = $conf->{pending}->{balloon} || $conf->{memory} || $defaults->{memory};
                vm_mon_cmd($vmid, "balloon", value => $balloon*1024*1024);
            } elsif ($opt =~ m/^net(\d+)$/) {
                # some changes can be done without hotplug
                vmconfig_update_net($storecfg, $conf, $vmid, $opt, $value);
            } else {
                die "skip\n"; # skip non-hot-pluggable options
            }
        };
        if (my $err = $@) {
            &$add_error($opt, $err) if $err ne "skip\n";
        } else {
            # save new config if hotplug was successful
            $conf->{$opt} = $value;
            delete $conf->{pending}->{$opt};
            update_config_nolock($vmid, $conf, 1);
            $conf = load_config($vmid); # update/reload
        }
    }
}
3710
# Apply all pending changes to the configuration of VM $vmid without
# touching a running VM (cold plug).
#
# Pending deletions are processed first, then pending additions and
# changes. The configuration is reloaded before and written after each
# option. A drive which gets deleted or replaced is handed to
# vmconfig_register_unused_drive().
sub vmconfig_apply_pending {
    my ($vmid, $conf, $storecfg) = @_;

    # cold plug

    my @delete = PVE::Tools::split_list($conf->{pending}->{delete});
    foreach my $opt (@delete) { # delete
        die "internal error" if $opt =~ m/^unused/;
        $conf = load_config($vmid); # update/reload
        if (!defined($conf->{$opt})) {
            # option is not set at all - just drop it from the delete list
            vmconfig_undelete_pending_option($conf, $opt);
            update_config_nolock($vmid, $conf, 1);
        } elsif (valid_drivename($opt)) {
            vmconfig_register_unused_drive($storecfg, $vmid, $conf, parse_drive($opt, $conf->{$opt}));
            vmconfig_undelete_pending_option($conf, $opt);
            delete $conf->{$opt};
            update_config_nolock($vmid, $conf, 1);
        } else {
            vmconfig_undelete_pending_option($conf, $opt);
            delete $conf->{$opt};
            update_config_nolock($vmid, $conf, 1);
        }
    }

    $conf = load_config($vmid); # update/reload

    foreach my $opt (keys %{$conf->{pending}}) { # add/change
        $conf = load_config($vmid); # update/reload

        if (defined($conf->{$opt}) && ($conf->{$opt} eq $conf->{pending}->{$opt})) {
            # skip if nothing changed
        } elsif (valid_drivename($opt)) {
            # the drive currently configured under $opt gets replaced
            vmconfig_register_unused_drive($storecfg, $vmid, $conf, parse_drive($opt, $conf->{$opt}))
                if defined($conf->{$opt});
            $conf->{$opt} = $conf->{pending}->{$opt};
        } else {
            $conf->{$opt} = $conf->{pending}->{$opt};
        }

        # the pending entry is dropped in all three cases
        delete $conf->{pending}->{$opt};
        update_config_nolock($vmid, $conf, 1);
    }
}
3754
# Numeric "not equal" which tolerates undefined operands: two undefined
# values are equal, an undefined and a defined value differ.
my $safe_num_ne = sub {
    my ($lhs, $rhs) = @_;

    if (defined($lhs) && defined($rhs)) {
        return $lhs != $rhs;
    }

    # at least one operand is undefined
    return (defined($lhs) || defined($rhs)) ? 1 : 0;
};
3764
# String "not equal" which tolerates undefined operands: two undefined
# values are equal, an undefined and a defined value differ.
my $safe_string_ne = sub {
    my ($lhs, $rhs) = @_;

    if (defined($lhs) && defined($rhs)) {
        return $lhs ne $rhs;
    }

    # at least one operand is undefined
    return (defined($lhs) || defined($rhs)) ? 1 : 0;
};
3774
# Apply the new value $value of the network option $opt ('netN') to the
# running VM $vmid.
#
# If the device already exists and only rate, bridge, tag or firewall
# changed, the tap interface is reconfigured online; this works without
# hotplug support and returns 1. Any other change (model, macaddr,
# queues, bridge/nat mode) hot-unplugs the old device and hot-plugs the
# new one; a device that does not exist yet is hot-plugged.
#
# Dies with "skip\n" if hotplug would be required but is disabled in
# $conf. Other errors are raised as exceptions.
sub vmconfig_update_net {
    my ($storecfg, $conf, $vmid, $opt, $value) = @_;

    my $newnet = parse_net($value);

    if ($conf->{$opt}) {
        my $oldnet = parse_net($conf->{$opt});

        if (&$safe_string_ne($oldnet->{model}, $newnet->{model}) ||
            &$safe_string_ne($oldnet->{macaddr}, $newnet->{macaddr}) ||
            &$safe_num_ne($oldnet->{queues}, $newnet->{queues}) ||
            !($newnet->{bridge} && $oldnet->{bridge})) { # bridge/nat mode change

            # for non online change, we try to hot-unplug
            die "skip\n" if !$conf->{hotplug};
            vm_deviceunplug($vmid, $conf, $opt);
        } else {

            die "internal error" if $opt !~ m/net(\d+)/;
            my $iface = "tap${vmid}i$1";

            if (&$safe_num_ne($oldnet->{rate}, $newnet->{rate})) {
                PVE::Network::tap_rate_limit($iface, $newnet->{rate});
            }

            if (&$safe_string_ne($oldnet->{bridge}, $newnet->{bridge}) ||
                &$safe_num_ne($oldnet->{tag}, $newnet->{tag}) ||
                &$safe_num_ne($oldnet->{firewall}, $newnet->{firewall})) {
                PVE::Network::tap_unplug($iface);
                PVE::Network::tap_plug($iface, $newnet->{bridge}, $newnet->{tag}, $newnet->{firewall});
            }

            # the change was applied online and the device stays plugged.
            # Falling through to vm_deviceplug would raise "internal error"
            # whenever hotplug is disabled.
            return 1;
        }
    }

    # a (re-)plug is required from here on; without hotplug the change
    # has to stay pending
    die "skip\n" if !$conf->{hotplug};

    vm_deviceplug($storecfg, $conf, $vmid, $opt, $newnet);
}
3811
# Start the VM $vmid while holding the config lock.
#
# $statefile    - 'tcp' to wait for an incoming migration (qemu is
#                 started with '-incoming' and '-S'), any other true
#                 value is passed to qemu with '-loadstate'
# $skiplock     - do not call check_lock()
# $migratedfrom - passed to load_config() and check_running(), and
#                 exported as PVE_MIGRATED_FROM to the environment
# $paused       - start with '-S' (only used without $statefile)
# $forcemachine - passed through to config_to_command()
# $spice_ticket - spice password, set when $migratedfrom is given and
#                 a spice port is in use
#
# Dies if the VM is a template, is locked (unless $skiplock), is
# already running, if a host PCI device cannot be prepared, or if the
# qemu command fails.
sub vm_start {
    my ($storecfg, $vmid, $statefile, $skiplock, $migratedfrom, $paused, $forcemachine, $spice_ticket) = @_;

    lock_config($vmid, sub {
        my $conf = load_config($vmid, $migratedfrom);

        die "you can't start a vm if it's a template\n" if is_template($conf);

        check_lock($conf) if !$skiplock;

        die "VM $vmid already running\n" if check_running($vmid, undef, $migratedfrom);

        # pending changes are only applied when no state gets loaded
        if (!$statefile && scalar(keys %{$conf->{pending}})) {
            vmconfig_apply_pending($vmid, $conf, $storecfg);
            $conf = load_config($vmid); # update/reload
        }

        my $defaults = load_defaults();

        # set environment variable useful inside network script
        $ENV{PVE_MIGRATED_FROM} = $migratedfrom if $migratedfrom;

        my ($cmd, $vollist, $spice_port) = config_to_command($storecfg, $vmid, $conf, $defaults, $forcemachine);

        my $migrate_port = 0;
        my $migrate_uri;
        if ($statefile) {
            if ($statefile eq 'tcp') {
                # listen on localhost, unless 'migration_unsecure' is set
                # in datacenter.cfg
                my $localip = "localhost";
                my $datacenterconf = PVE::Cluster::cfs_read_file('datacenter.cfg');
                if ($datacenterconf->{migration_unsecure}) {
                    my $nodename = PVE::INotify::nodename();
                    $localip = PVE::Cluster::remote_node_ip($nodename, 1);
                }
                $migrate_port = PVE::Tools::next_migrate_port();
                $migrate_uri = "tcp:${localip}:${migrate_port}";
                push @$cmd, '-incoming', $migrate_uri;
                push @$cmd, '-S';
            } else {
                push @$cmd, '-loadstate', $statefile;
            }
        } elsif ($paused) {
            push @$cmd, '-S';
        }

        # host pci devices
        for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
            my $d = parse_hostpci($conf->{"hostpci$i"});
            next if !$d;
            my $pcidevices = $d->{pciid};
            foreach my $pcidevice (@$pcidevices) {
                my $pciid = $pcidevice->{id}.".".$pcidevice->{function};

                my $info = pci_device_info("0000:$pciid");
                die "IOMMU not present\n" if !check_iommu_support();
                die "no pci device info for device '$pciid'\n" if !$info;

                # bind the device to the vfio or the pci-stub driver
                if ($d->{driver} && $d->{driver} eq "vfio") {
                    die "can't unbind/bind pci group to vfio '$pciid'\n" if !pci_dev_group_bind_to_vfio($pciid);
                } else {
                    die "can't unbind/bind to stub pci device '$pciid'\n" if !pci_dev_bind_to_stub($info);
                }

                die "can't reset pci device '$pciid'\n" if $info->{has_fl_reset} and !pci_dev_reset($info);
            }
        }

        PVE::Storage::activate_volumes($storecfg, $vollist);

        # no timeout when a state file is given, 30 otherwise
        eval { run_command($cmd, timeout => $statefile ? undef : 30,
                           umask => 0077); };
        my $err = $@;
        die "start failed: $err" if $err;

        print "migration listens on $migrate_uri\n" if $migrate_uri;

        # send 'cont' after starting from a state file (errors are only warned)
        if ($statefile && $statefile ne 'tcp') {
            eval { vm_mon_cmd_nocheck($vmid, "cont"); };
            warn $@ if $@;
        }

        if ($migratedfrom) {

            eval {
                set_migration_caps($vmid);
            };
            warn $@ if $@;

            if ($spice_port) {
                print "spice listens on port $spice_port\n";
                if ($spice_ticket) {
                    vm_mon_cmd_nocheck($vmid, "set_password", protocol => 'spice', password => $spice_ticket);
                    vm_mon_cmd_nocheck($vmid, "expire_password", protocol => 'spice', time => "+30");
                }
            }

        } else {

            # balloon is undefined or non-zero, and no state was loaded
            if (!$statefile && (!defined($conf->{balloon}) || $conf->{balloon})) {
                vm_mon_cmd_nocheck($vmid, "balloon", value => $conf->{balloon}*1024*1024)
                    if $conf->{balloon};
                vm_mon_cmd_nocheck($vmid, 'qom-set',
                                   path => "machine/peripheral/balloon0",
                                   property => "guest-stats-polling-interval",
                                   value => 2);
            }
        }
    });
}
3921
# Run the QMP command $execute with the arguments %params on VM $vmid
# and return the result of vm_qmp_command().
sub vm_mon_cmd {
    my ($vmid, $execute, %params) = @_;

    return vm_qmp_command($vmid, { execute => $execute, arguments => \%params });
}
3928
# Same as vm_mon_cmd(), but passes a true $nocheck flag on to
# vm_qmp_command().
sub vm_mon_cmd_nocheck {
    my ($vmid, $execute, %params) = @_;

    return vm_qmp_command($vmid, { execute => $execute, arguments => \%params }, 1);
}
3935
# Execute the QMP command $cmd on VM $vmid.
#
# $cmd     - hash with 'execute' (command name) and optional 'arguments'
#            (hash ref). A true 'timeout' argument is removed from the
#            arguments and used as the client timeout instead.
# $nocheck - passed through to check_running()
#
# Returns the result of the QMP client. VMs which only provide the old
# human monitor socket accept commands without arguments only; nothing
# is returned for them.
#
# Errors are written to syslog and re-thrown.
sub vm_qmp_command {
    my ($vmid, $cmd, $nocheck) = @_;

    my $res;

    my $timeout;
    if ($cmd->{arguments} && $cmd->{arguments}->{timeout}) {
        $timeout = $cmd->{arguments}->{timeout};
        delete $cmd->{arguments}->{timeout};
    }

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);
        my $sname = qmp_socket($vmid);
        if (-e $sname) { # test if VM is reasonably new and supports qmp/qga
            my $qmpclient = PVE::QMPClient->new();

            $res = $qmpclient->cmd($vmid, $cmd, $timeout);
        } elsif (-e "${var_run_tmpdir}/$vmid.mon") {
            # 'arguments' is optional (vm_stop passes commands without
            # it), so check that it exists before dereferencing it
            die "can't execute complex command on old monitor - stop/start your vm to fix the problem\n"
                if $cmd->{arguments} && scalar(%{$cmd->{arguments}});
            vm_monitor_command($vmid, $cmd->{execute}, $nocheck);
        } else {
            die "unable to open monitor socket\n";
        }
    };
    if (my $err = $@) {
        syslog("err", "VM $vmid qmp command failed - $err");
        die $err;
    }

    return $res;
}
3969
# Run the human monitor command line $cmdline on VM $vmid through the
# QMP command 'human-monitor-command' and return the result.
sub vm_human_monitor_command {
    my ($vmid, $cmdline) = @_;

    my %arguments = ('command-line' => $cmdline);

    return vm_qmp_command($vmid, {
        execute => 'human-monitor-command',
        arguments => \%arguments,
    });
}
3982
# Return the command line used to start VM $vmid as a single string,
# with the arguments joined by spaces.
sub vm_commandline {
    my ($storecfg, $vmid) = @_;

    my $conf = load_config($vmid);
    my $defaults = load_defaults();

    my $argv = config_to_command($storecfg, $vmid, $conf, $defaults);

    return join(' ', @{$argv});
}
3994
# Reset VM $vmid with the QMP command 'system_reset' while holding the
# config lock. The lock setting of the config is checked unless
# $skiplock is set.
sub vm_reset {
    my ($vmid, $skiplock) = @_;

    my $reset = sub {
        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        vm_mon_cmd($vmid, "system_reset");
    };

    lock_config($vmid, $reset);
}
4007
# Return an array ref with the volume IDs used by the configuration
# $conf. Entries starting with '/' and entries for which
# PVE::Storage::parse_volume_id() finds no storage ID are left out.
sub get_vm_volumes {
    my ($conf) = @_;

    my @volids;

    my $collect = sub {
        my ($volid, $is_cdrom) = @_;

        return if $volid =~ m|^/|;

        my ($sid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        push @volids, $volid;
    };

    foreach_volid($conf, $collect);

    return \@volids;
}
4025
# Clean up after VM $vmid was stopped: remove the fairsched group,
# deactivate the volumes of $conf (unless $keepActive is set) and unlink
# the runtime files of the VM. Errors are only reported as warnings.
sub vm_stop_cleanup {
    my ($storecfg, $vmid, $conf, $keepActive) = @_;

    eval {
        fairsched_rmnod($vmid); # try to destroy group

        PVE::Storage::deactivate_volumes($storecfg, get_vm_volumes($conf))
            if !$keepActive;

        foreach my $suffix (qw(mon qmp pid vnc qga)) {
            my $runfile = "/var/run/qemu-server/${vmid}.$suffix";
            unlink $runfile;
        }
    };
    warn $@ if $@; # avoid errors - just warn
}
4043
# Stop or shut down the VM $vmid.
#
# Note: use $nocheck to skip tests if VM configuration file exists.
# We need that when migrating VMs to other nodes (files already moved)
# Note: we set $keepActive in vzdump stop mode - volumes need to stay active
#
# $skiplock     - do not call check_lock()
# $timeout      - seconds to wait for the VM to terminate (default 60,
#                 or the 'down' value of the startup option on shutdown)
# $shutdown     - request a shutdown of the guest instead of sending 'quit'
# $force        - terminate the VM with SIGTERM if it does not stop in
#                 time or if the command fails (defaults to 1 without
#                 $shutdown)
# $migratedfrom - only send SIGTERM to the running process and clean up,
#                 without taking the config lock
sub vm_stop {
    my ($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive, $migratedfrom) = @_;

    $force = 1 if !defined($force) && !$shutdown;

    if ($migratedfrom){
        my $pid = check_running($vmid, $nocheck, $migratedfrom);
        kill 15, $pid if $pid;
        my $conf = load_config($vmid, $migratedfrom);
        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive);
        return;
    }

    lock_config($vmid, sub {

        my $pid = check_running($vmid, $nocheck);
        return if !$pid;

        # $conf stays undefined with $nocheck - no cleanup is done then
        my $conf;
        if (!$nocheck) {
            $conf = load_config($vmid);
            check_lock($conf) if !$skiplock;
            if (!defined($timeout) && $shutdown && $conf->{startup}) {
                my $opts = parse_startup($conf->{startup});
                $timeout = $opts->{down} if $opts->{down};
            }
        }

        $timeout = 60 if !defined($timeout);

        eval {
            if ($shutdown) {
                # use 'guest-shutdown' if the 'agent' option is set
                if (!$nocheck && $conf->{agent}) {
                    vm_qmp_command($vmid, { execute => "guest-shutdown" }, $nocheck);
                } else {
                    vm_qmp_command($vmid, { execute => "system_powerdown" }, $nocheck);
                }
            } else {
                vm_qmp_command($vmid, { execute => "quit" }, $nocheck);
            }
        };
        my $err = $@;

        if (!$err) {
            # poll once per second until the VM is gone or $timeout is reached
            my $count = 0;
            while (($count < $timeout) && check_running($vmid, $nocheck)) {
                $count++;
                sleep 1;
            }

            if ($count >= $timeout) {
                if ($force) {
                    warn "VM still running - terminating now with SIGTERM\n";
                    kill 15, $pid;
                } else {
                    die "VM quit/powerdown failed - got timeout\n";
                }
            } else {
                vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
                return;
            }
        } else {
            if ($force) {
                warn "VM quit/powerdown failed - terminating now with SIGTERM\n";
                kill 15, $pid;
            } else {
                die "VM quit/powerdown failed\n";
            }
        }

        # only reached after SIGTERM was sent
        # wait again
        $timeout = 10;

        my $count = 0;
        while (($count < $timeout) && check_running($vmid, $nocheck)) {
            $count++;
            sleep 1;
        }

        if ($count >= $timeout) {
            warn "VM still running - terminating now with SIGKILL\n";
            kill 9, $pid;
            sleep 1;
        }

        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
    });
}
4135
# Pause VM $vmid with the QMP command 'stop' while holding the config
# lock. The lock setting of the config is not checked when $skiplock is
# set or when the VM is locked for 'backup'.
sub vm_suspend {
    my ($vmid, $skiplock) = @_;

    my $suspend = sub {
        my $conf = load_config($vmid);

        my $backup_lock = $conf->{lock} && $conf->{lock} eq 'backup';
        check_lock($conf) unless $skiplock || $backup_lock;

        vm_mon_cmd($vmid, "stop");
    };

    lock_config($vmid, $suspend);
}
4148
# Resume VM $vmid with the QMP command 'cont' while holding the config
# lock. The lock setting of the config is not checked when $skiplock is
# set or when the VM is locked for 'backup'.
sub vm_resume {
    my ($vmid, $skiplock) = @_;

    my $resume = sub {
        my $conf = load_config($vmid);

        my $backup_lock = $conf->{lock} && $conf->{lock} eq 'backup';
        check_lock($conf) unless $skiplock || $backup_lock;

        vm_mon_cmd($vmid, "cont");
    };

    lock_config($vmid, $resume);
}
4161
# Send the key $key to VM $vmid while holding the config lock.
# NOTE(review): $skiplock is accepted but not used here - the lock
# setting of the config is never checked.
sub vm_sendkey {
    my ($vmid, $skiplock, $key) = @_;

    my $sendkey = sub {
        # the loaded config itself is not used
        my $conf = load_config($vmid);

        # there is no qmp command, so we use the human monitor command
        vm_human_monitor_command($vmid, "sendkey $key");
    };

    lock_config($vmid, $sendkey);
}
4173
# Destroy VM $vmid while holding the config lock. Dies if the VM is
# locked (unless $skiplock is set) or still running.
sub vm_destroy {
    my ($storecfg, $vmid, $skiplock) = @_;

    my $destroy = sub {
        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        die "VM $vmid is running - destroy failed\n" if check_running($vmid);

        fairsched_rmnod($vmid); # try to destroy group
        destroy_vm($storecfg, $vmid);
    };

    lock_config($vmid, $destroy);
}
4191
4192 # pci helpers
4193
# Write $buf to the file $filename, replacing its previous content.
# Returns undef if the file cannot be opened, otherwise the result of
# print. The result of close is not checked.
sub file_write {
    my ($filename, $buf) = @_;

    my $fh = IO::File->new($filename, "w")
        or return undef;

    my $printed = print {$fh} $buf;

    $fh->close();

    return $printed;
}
4206
# Collect information about the PCI device $name, given as
# "dddd:bb:ss.f" (lowercase hex), from sysfs.
#
# Returns a hash ref with the keys name, vendor, product (both without
# the leading "0x"), domain, bus, slot, func, irq and has_fl_reset.
# Returns undef if $name is malformed or if the irq, vendor or device
# attribute cannot be read in the expected format.
sub pci_device_info {
    my ($name) = @_;

    return undef if $name !~ m/^([a-f0-9]{4}):([a-f0-9]{2}):([a-f0-9]{2})\.([a-f0-9])$/;
    my ($domain, $bus, $slot, $func) = ($1, $2, $3, $4);

    my $sysdir = "$pcisysfs/devices/$name";

    my $irq = file_read_firstline("$sysdir/irq");
    unless (defined($irq) && $irq =~ m/^\d+$/) {
        return undef;
    }

    # the substitutions strip the "0x" prefix and fail if it is missing
    my $vendor = file_read_firstline("$sysdir/vendor");
    unless (defined($vendor) && $vendor =~ s/^0x//) {
        return undef;
    }

    my $product = file_read_firstline("$sysdir/device");
    unless (defined($product) && $product =~ s/^0x//) {
        return undef;
    }

    return {
        name => $name,
        vendor => $vendor,
        product => $product,
        domain => $domain,
        bus => $bus,
        slot => $slot,
        func => $func,
        irq => $irq,
        has_fl_reset => -f "$sysdir/reset" || 0,
    };
}
4238
# Reset the PCI device described by $dev (see pci_device_info) by
# writing "1" to its sysfs 'reset' file. Returns the result of
# file_write().
sub pci_dev_reset {
    my ($dev) = @_;

    my $reset_file = "$pcisysfs/devices/$dev->{name}/reset";

    return file_write($reset_file, "1");
}
4248
# Bind the PCI device described by $dev (see pci_device_info) to the
# pci-stub driver. Returns a true value if the device is bound to
# pci-stub afterwards, undef if one of the sysfs writes fails.
sub pci_dev_bind_to_stub {
    my ($dev) = @_;

    my $name = $dev->{name};

    my $stubdir = "$pcisysfs/drivers/pci-stub";
    my $bound = "$stubdir/$name"; # exists while the device is bound

    return 1 if -d $bound;

    # announce the vendor/product id to the driver
    file_write("$stubdir/new_id", "$dev->{vendor} $dev->{product}")
        or return undef;

    # unbind from the current driver; a failed write is only an error
    # if the unbind file exists
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    if (! -d $bound) {
        file_write("$stubdir/bind", $name) or return undef;
    }

    return -d $bound;
}
4272
# Bind the PCI device described by $dev (see pci_device_info) to the
# vfio-pci driver, loading the module with modprobe if its sysfs
# directory is missing. Returns a true value if the device is bound to
# vfio-pci afterwards, undef if one of the sysfs writes fails. Dies if
# the vfio-pci driver directory is still missing after modprobe.
sub pci_dev_bind_to_vfio {
    my ($dev) = @_;

    my $name = $dev->{name};

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null")
        if !-d $vfio_basedir;

    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    my $bound = "$vfio_basedir/$name"; # exists while the device is bound
    return 1 if -d $bound;

    # announce the vendor/product id to the driver
    file_write("$vfio_basedir/new_id", "$dev->{vendor} $dev->{product}")
        or return undef;

    # unbind from the current driver; a failed write is only an error
    # if the unbind file exists
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    if (! -d $bound) {
        file_write("$vfio_basedir/bind", $name) or return undef;
    }

    return -d $bound;
}
4303
# Bind all devices in the IOMMU group of the PCI device $pciid (given
# without the "0000:" domain prefix) to the vfio-pci driver, loading the
# module with modprobe if its sysfs directory is missing.
#
# Returns 1 on success. Dies if the vfio-pci driver directory is still
# missing after modprobe, if the IOMMU group cannot be read, or if a
# device of the group is invalid, unknown or cannot be bound.
sub pci_dev_group_bind_to_vfio {
    my ($pciid) = @_;

    my $vfio_basedir = "$pcisysfs/drivers/vfio-pci";

    if (!-d $vfio_basedir) {
        system("/sbin/modprobe vfio-pci >/dev/null 2>/dev/null");
    }
    die "Cannot find vfio-pci module!\n" if !-d $vfio_basedir;

    # get IOMMU group devices
    opendir(my $D, "$pcisysfs/devices/0000:$pciid/iommu_group/devices/") || die "Cannot open iommu_group: $!\n";
    my @devs = grep /^0000:/, readdir($D);
    closedir($D);

    foreach my $groupdev (@devs) {
        $groupdev =~ m/^([:\.\da-f]+)$/ or die "PCI ID $groupdev not valid!\n";

        # without device info pci_dev_bind_to_vfio would test the driver
        # directory itself and report success without binding anything
        my $info = pci_device_info($1);
        die "no pci device info for device '$groupdev'\n" if !$info;

        pci_dev_bind_to_vfio($info) || die "Cannot bind $groupdev to vfio\n";
    }

    return 1;
}
4327
# Return the ",bus=pci.N,addr=0xXX" suffix for the well-known device $id,
# or an empty string if $id has no fixed PCI slot.
#
# When $bridges (hash ref) is given, the bus number used by the device is
# recorded in it ($bridges->{$bus} = 1).
sub print_pci_addr {
    my ($id, $bridges) = @_;

    # fixed slots on bus 0
    # (addr 2: first videocard, addr 29: usb-host (pve-usb.cfg))
    my %bus0_addr = (
        piix3    => 1,
        balloon0 => 3,
        watchdog => 4,
        scsihw0  => 5,
        scsihw1  => 6,
        ahci0    => 7,
        qga0     => 8,
        spice    => 9,
        virtio0  => 10,
        virtio1  => 11,
        virtio2  => 12,
        virtio3  => 13,
        virtio4  => 14,
        virtio5  => 15,
        hostpci0 => 16,
        hostpci1 => 17,
        net0     => 18,
        net1     => 19,
        net2     => 20,
        net3     => 21,
        net4     => 22,
        net5     => 23,
        vga1     => 24,
        vga2     => 25,
        vga3     => 26,
        hostpci2 => 27,
        hostpci3 => 28,
        'pci.1'  => 30,
        'pci.2'  => 31,
    );

    # device id => [bus, addr]
    my %slot_of = map { $_ => [0, $bus0_addr{$_}] } keys %bus0_addr;

    # net6 .. net31 occupy addr 1 .. 26 on bus 1
    $slot_of{"net$_"} = [1, $_ - 5] for 6 .. 31;

    # virtio6 .. virtio15 occupy addr 1 .. 10 on bus 2
    $slot_of{"virtio$_"} = [2, $_ - 5] for 6 .. 15;

    my $slot = $slot_of{$id};
    return '' if !$slot;

    my ($bus, $addr) = @$slot;
    $bridges->{$bus} = 1 if $bridges;

    return sprintf(",bus=pci.%s,addr=0x%x", $bus, $addr);
}
4411
# Return the ",bus=<pcie port>,addr=0x0" suffix for the passthrough device
# $id (hostpci0 .. hostpci3), or an empty string for any other id.
sub print_pcie_addr {
    my ($id) = @_;

    # each hostpci device sits alone (addr 0) on its own ich9 pcie port
    my %port_of = (
        hostpci0 => "ich9-pcie-port-1",
        hostpci1 => "ich9-pcie-port-2",
        hostpci2 => "ich9-pcie-port-3",
        hostpci3 => "ich9-pcie-port-4",
    );

    my $port = $port_of{$id};
    return '' if !defined($port);

    return sprintf(",bus=%s,addr=0x%x", $port, 0);
}
4431
# vzdump restore implementation
4433
# Return the name of the first member of tar archive $archive.
#
# Dies if $archive is not a regular file, if 'tar' cannot be started, or
# if the listing is empty.
sub tar_archive_read_firstfile {
    my $archive = shift;

    die "ERROR: file '$archive' does not exist\n" if ! -f $archive;

    # try to detect archive type first
    # List-form pipe open: tar is executed directly, without a shell, so
    # quotes or other meta characters in $archive cannot break or alter
    # the command.
    my $pid = open(my $fh, '-|', 'tar', 'tf', $archive) ||
        die "unable to open file '$archive'\n";
    my $firstfile = <$fh>;

    # only the first line is needed - stop tar instead of letting it list
    # the whole archive (the close status is therefore meaningless)
    kill 15, $pid;
    close $fh;

    die "ERROR: archive contaions no data\n" if !$firstfile;
    chomp $firstfile;

    return $firstfile;
}
4451
# Remove the volumes recorded in $statfile after a failed tar restore.
#
# Every line matching 'vzdump:<id>:<volume>' names a volume to remove:
# absolute paths are unlinked, anything else is freed through
# PVE::Storage::vdisk_free using $storecfg. Failures are reported on
# STDERR and do not stop the cleanup. A missing or unreadable $statfile
# is silently ignored.
sub tar_restore_cleanup {
    my ($storecfg, $statfile) = @_;

    print STDERR "starting cleanup\n";

    if (my $fd = IO::File->new($statfile, "r")) {
        while (defined(my $line = <$fd>)) {
            if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                my $volid = $2;
                eval {
                    if ($volid =~ m|^/|) {
                        # parenthesised on purpose: 'unlink $volid || die'
                        # would never evaluate the die
                        unlink($volid) || die "unlink failed - $!\n";
                    } else {
                        PVE::Storage::vdisk_free($storecfg, $volid);
                    }
                    print STDERR "temporary volume '$volid' sucessfuly removed\n";
                };
                print STDERR "unable to cleanup '$volid' - $@" if $@;
            } else {
                print STDERR "unable to parse line in statfile - $line";
            }
        }
        $fd->close();
    }
}
4477
# Restore VM $vmid from backup $archive, dispatching on the archive format.
#
# The format is taken from $opts->{format} if set, otherwise guessed from
# the file name extension ('vma' being the default). The compression
# ('gzip' or 'lzop') is always guessed from the extension and is only
# forwarded to the vma restore. Returns whatever restore_tar_archive or
# restore_vma_archive returns.
sub restore_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    my $format = $opts->{format};
    my $comp;

    if ($archive =~ m/\.tgz$/ || $archive =~ m/\.tar\.gz$/) {
        $format = 'tar' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.tar$/) {
        $format = 'tar' if !$format;
    } elsif ($archive =~ m/\.tar\.lzo$/) {
        # dots are escaped so that only a real '.tar.lzo' suffix matches
        $format = 'tar' if !$format;
        $comp = 'lzop';
    } elsif ($archive =~ m/\.vma$/) {
        $format = 'vma' if !$format;
    } elsif ($archive =~ m/\.vma\.gz$/) {
        $format = 'vma' if !$format;
        $comp = 'gzip';
    } elsif ($archive =~ m/\.vma\.lzo$/) {
        $format = 'vma' if !$format;
        $comp = 'lzop';
    } else {
        $format = 'vma' if !$format; # default
    }

    # try to detect archive format
    if ($format eq 'tar') {
        return restore_tar_archive($archive, $vmid, $user, $opts);
    } else {
        return restore_vma_archive($archive, $vmid, $user, $opts, $comp);
    }
}
4511
# Filter/rewrite one line of a backed up VM config and print the result
# to $outfd.
#
#   $cookie - hash ref; 'netcount' numbers the net devices generated from
#             old 'vlanN' settings
#   $map    - hash ref: drive name => newly allocated volume
#   $unique - if true, network devices get fresh random MAC addresses
#
# Backup markers, 'lock', 'unusedN', 'parent' and 'template' lines are
# dropped. Drives flagged 'backup=no' are written commented out, drives
# found in $map are pointed at their new volume, everything else is
# copied verbatim.
sub restore_update_config_line {
    my ($outfd, $cookie, $vmid, $map, $line, $unique) = @_;

    my @dropped = (
        qr/^\#qmdump\#/,
        qr/^\#vzdump\#/,
        qr/^lock:/,
        qr/^unused\d+:/,
        qr/^parent:/,
        qr/^template:/, # restored VM is never a template
    );
    foreach my $re (@dropped) {
        return if $line =~ $re;
    }

    if ($line =~ m/^(vlan(\d+)):\s*(\S+)\s*$/) {
        # try to convert old 1.X settings
        my ($bridge_idx, $ethcfg) = ($2, $3);
        foreach my $devconfig (PVE::Tools::split_list($ethcfg)) {
            my ($model, $macaddr) = split(/\=/, $devconfig);
            $macaddr = PVE::Tools::random_ether_addr() if !$macaddr || $unique;

            my $netstr = print_net({
                model => $model,
                bridge => "vmbr$bridge_idx",
                macaddr => $macaddr,
            });

            print $outfd "net$cookie->{netcount}: $netstr\n";
            $cookie->{netcount}++;
        }
        return;
    }

    if ($unique && $line =~ m/^(net\d+):\s*(\S+)\s*$/) {
        my ($netid, $netstr) = ($1, $2);
        my $net = parse_net($netstr);
        $net->{macaddr} = PVE::Tools::random_ether_addr() if $net->{macaddr};
        $netstr = print_net($net);
        print $outfd "$netid: $netstr\n";
        return;
    }

    if ($line =~ m/^((ide|scsi|virtio|sata)\d+):\s*(\S+)\s*$/) {
        my ($virtdev, $value) = ($1, $3);

        if ($line =~ m/backup=no/) {
            # disk was excluded from the backup - keep it as a comment
            print $outfd "#$line";
            return;
        }

        if ($virtdev && $map->{$virtdev}) {
            my $di = parse_drive($virtdev, $value);
            delete $di->{format}; # format can change on restore
            $di->{file} = $map->{$virtdev};
            $value = print_drive($vmid, $di);
            print $outfd "$virtdev: $value\n";
            return;
        }
    }

    print $outfd $line;
}
4562
# List the volumes PVE::Storage::vdisk_list reports for $vmid (all VMs if
# $vmid is undef) and return them as a hash ref: volid => volume info.
#
# Entries lacking a volid or a size are skipped; each returned info hash
# gets an additional 'path' key holding the resolved storage path.
sub scan_volids {
    my ($cfg, $vmid) = @_;

    my $per_storage = PVE::Storage::vdisk_list($cfg, undef, $vmid);

    my $found = {};
    foreach my $items (values %$per_storage) {
        foreach my $vol (@$items) {
            next if !$vol->{volid};
            next if !$vol->{size};

            $vol->{path} = PVE::Storage::path($cfg, $vol->{volid});
            $found->{$vol->{volid}} = $vol;
        }
    }

    return $found;
}
4579
# Collect the file system paths of all non-cdrom drives referenced by the
# VM config $conf and, if $scan_snapshots is set, by its snapshots.
#
# Returns a hash ref: path => number of references. $skip_drive names a
# drive to ignore in the current config; it is not ignored in snapshots.
# Volumes whose storage is not defined in $storecfg are skipped.
sub get_used_paths {
    my ($vmid, $storecfg, $conf, $scan_snapshots, $skip_drive) = @_;

    my $used_path = {};

    my $collect = sub {
        my ($cref, $snapname) = @_;

        foreach my $key (keys %$cref) {
            next if !valid_drivename($key);
            next if $skip_drive && $key eq $skip_drive;

            my $drive = parse_drive($key, $cref->{$key});
            next if !$drive || !$drive->{file} || drive_is_cdrom($drive);

            my $file = $drive->{file};
            if ($file =~ m!^/!) {
                # absolute path, no storage lookup needed
                $used_path->{$file}++;
                next;
            }

            my ($storeid, $volname) = PVE::Storage::parse_volume_id($file, 1);
            next if !$storeid;
            next if !PVE::Storage::storage_config($storecfg, $storeid, 1);

            my $path = PVE::Storage::path($storecfg, $file, $snapname);
            $used_path->{$path}++;
        }
    };

    $collect->($conf);

    # the skip only applies to the current config
    undef $skip_drive;

    if ($scan_snapshots) {
        foreach my $snapname (keys %{$conf->{snapshots}}) {
            $collect->($conf->{snapshots}->{$snapname}, $snapname);
        }
    }

    return $used_path;
}
4620
# Synchronize the drive entries of VM config $conf with the volumes found
# on storage.
#
#   $volid_hash - hash ref: volid => info hash with 'size' and 'path'
#
# Three steps are performed on $conf (in place):
#   1. the 'size' of every non-cdrom drive with a known volume is updated
#   2. 'unusedN' entries whose volume (or path) is used by a drive are
#      removed
#   3. volumes referenced nowhere are passed to add_unused_volume
#      (VM state volumes 'vm-$vmid-state-*' excepted)
#
# Returns a true value if $conf was modified, undef otherwise.
sub update_disksize {
    my ($vmid, $conf, $volid_hash) = @_;

    my $changes;

    my $used = {};

    # Note: it is allowed to define multiple storages with same path (alias), so
    # we need to check both 'volid' and real 'path' (two different volid can point
    # to the same path).

    my $usedpath = {};

    # update size info
    foreach my $opt (keys %$conf) {
        next if !valid_drivename($opt);

        my $drive = parse_drive($opt, $conf->{$opt});
        my $volid = $drive->{file};
        next if !$volid;

        $used->{$volid} = 1;
        if ($volid_hash->{$volid} &&
            (my $path = $volid_hash->{$volid}->{path})) {
            $usedpath->{$path} = 1;
        }

        next if drive_is_cdrom($drive);
        next if !$volid_hash->{$volid};

        $drive->{size} = $volid_hash->{$volid}->{size};
        my $new = print_drive($vmid, $drive);
        if ($new ne $conf->{$opt}) {
            $changes = 1;
            $conf->{$opt} = $new;
        }
    }

    # remove 'unusedX' entry if volume is used
    foreach my $opt (keys %$conf) {
        next if $opt !~ m/^unused\d+$/;
        my $volid = $conf->{$opt};

        # Always (re)initialize $path: the former 'my $path = ... if COND'
        # has undefined behaviour and may keep the value of a previous
        # iteration when COND is false.
        my $info = $volid_hash->{$volid};
        my $path = $info ? $info->{path} : undef;

        if ($used->{$volid} || ($path && $usedpath->{$path})) {
            $changes = 1;
            delete $conf->{$opt};
        }
    }

    foreach my $volid (sort keys %$volid_hash) {
        next if $volid =~ m/vm-$vmid-state-/;
        next if $used->{$volid};
        my $path = $volid_hash->{$volid}->{path};
        next if !$path; # just to be sure
        next if $usedpath->{$path};
        $changes = 1;
        add_unused_volume($conf, $volid);
        $usedpath->{$path} = 1; # avoid to add more than once (aliases)
    }

    return $changes;
}
4683
# Rescan the storages and update the disk information (sizes, unused
# volumes) in the config of VM $vmid, or of all VMs if $vmid is undef.
#
# Unless $nolock is set, each config is updated under its config lock.
# The config is only written when update_disksize reports changes.
sub rescan {
    my ($vmid, $nolock) = @_;

    my $cfg = PVE::Cluster::cfs_read_file("storage.cfg");

    my $volid_hash = scan_volids($cfg, $vmid);

    my $update_one = sub {
        my ($id) = @_;

        my $conf = load_config($id);

        check_lock($conf);

        # only consider volumes owned by this VM
        my $own_volids = {};
        while (my ($volid, $info) = each %$volid_hash) {
            next if !$info->{vmid};
            next if $info->{vmid} != $id;
            $own_volids->{$volid} = $info;
        }

        my $changes = update_disksize($id, $conf, $own_volids);

        update_config_nolock($id, $conf, 1) if $changes;
    };

    my @targets;
    if (defined($vmid)) {
        @targets = ($vmid);
    } else {
        my $vmlist = config_list();
        @targets = keys %$vmlist;
    }

    foreach my $id (@targets) {
        if ($nolock) {
            $update_one->($id);
        } else {
            lock_config($id, $update_one, $id);
        }
    }
}
4726
# Restore VM $vmid from a 'vma' backup archive.
#
#   $archive - archive file name, or '-' to read the archive from STDIN
#   $user    - user doing the restore; anyone but 'root@pam' needs the
#              'Datastore.AllocateSpace' privilege on each target storage
#   $opts    - hash ref; 'storage' (target storage override) and 'unique'
#              (generate new MAC addresses) are evaluated here
#   $comp    - optional compression of the archive: 'gzip' or 'lzop'
#
# 'vma extract' is run with a fifo passed as its '-r' argument and its
# verbose output is parsed: 'DEV:' lines announce the contained devices,
# the 'CTIME:' line triggers the allocation of the target volumes, whose
# mapping is written to the fifo. The new config is assembled in a
# temporary file and renamed to the final config file at the end.
#
# On error all volumes allocated so far are freed again and the error is
# re-thrown.
sub restore_vma_archive {
    my ($archive, $vmid, $user, $opts, $comp) = @_;

    my $input = $archive eq '-' ? "<&STDIN" : undef;

    # The name ends up on a shell command line, so it has to be quoted
    # ('-' is passed through untouched).
    my $readfrom = $archive eq '-' ? $archive : PVE::Tools::shellquote($archive);

    my $uncomp = '';
    if ($comp) {
        # the decompressor reads the archive and pipes it into vma
        $readfrom = '-';
        my $qarchive = PVE::Tools::shellquote($archive);
        if ($comp eq 'gzip') {
            $uncomp = "zcat $qarchive|";
        } elsif ($comp eq 'lzop') {
            $uncomp = "lzop -d -c $qarchive|";
        } else {
            die "unknown compression method '$comp'\n";
        }
    }

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    rmtree $tmpdir;

    # disable interrupts (always do cleanups)
    # Note: each signal needs its own 'local' - in a plain chained
    # assignment only the first one would be restored on scope exit.
    local $SIG{INT} =
        local $SIG{TERM} =
        local $SIG{QUIT} =
        local $SIG{HUP} = sub { warn "got interrupt - ignored\n"; };

    my $mapfifo = "/var/tmp/vzdumptmp$$.fifo";
    POSIX::mkfifo($mapfifo, 0600);
    my $fifofh;

    # run by run_command after forking the extract command
    my $openfifo = sub {
        open($fifofh, '>', $mapfifo) || die $!;
    };

    my $cmd = "${uncomp}vma extract -v -r $mapfifo $readfrom $tmpdir";

    my $oldtimeout;
    my $timeout = 5;

    # device name => { size, dev_id, ... }, filled while parsing the output
    my $devinfo = {};

    my $rpcenv = PVE::RPCEnvironment::get();

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # Note: $oldconf is undef if VM does not exists
    my $oldconf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid));

    # allocate the target volumes, tell vma where to write each device and
    # write the updated config to $tmpfn
    my $print_devmap = sub {
        my $virtdev_hash = {};

        my $cfgfn = "$tmpdir/qemu-server.conf";

        # we can read the config - that is already extracted
        my $fh = IO::File->new($cfgfn, "r") ||
            die "unable to read qemu-server.conf - $!\n";

        while (defined(my $line = <$fh>)) {
            if ($line =~ m/^\#qmdump\#map:(\S+):(\S+):(\S*):(\S*):$/) {
                my ($virtdev, $devname, $storeid, $format) = ($1, $2, $3, $4);
                die "archive does not contain data for drive '$virtdev'\n"
                    if !$devinfo->{$devname};
                if (defined($opts->{storage})) {
                    $storeid = $opts->{storage} || 'local';
                } elsif (!$storeid) {
                    $storeid = 'local';
                }
                $format = 'raw' if !$format;
                $devinfo->{$devname}->{devname} = $devname;
                $devinfo->{$devname}->{virtdev} = $virtdev;
                $devinfo->{$devname}->{format} = $format;
                $devinfo->{$devname}->{storeid} = $storeid;

                # check permission on storage
                # todo: do we need to consider $opts->{pool} here?
                if ($user ne 'root@pam') {
                    $rpcenv->check($user, "/storage/$storeid", ['Datastore.AllocateSpace']);
                }

                $virtdev_hash->{$virtdev} = $devinfo->{$devname};
            }
        }

        foreach my $devname (keys %$devinfo) {
            die "found no device mapping information for device '$devname'\n"
                if !$devinfo->{$devname}->{virtdev};
        }

        my $cfg = cfs_read_file('storage.cfg');

        # create empty/temp config
        if ($oldconf) {
            PVE::Tools::file_set_contents($conffile, "memory: 128\n");
            foreach_drive($oldconf, sub {
                my ($ds, $drive) = @_;

                return if drive_is_cdrom($drive);

                my $volid = $drive->{file};

                return if !$volid || $volid =~ m|^/|;

                my ($path, $owner) = PVE::Storage::path($cfg, $volid);
                return if !$path || !$owner || ($owner != $vmid);

                # Note: only delete disk we want to restore
                # other volumes will become unused
                if ($virtdev_hash->{$ds}) {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
            });
        }

        my $map = {};
        foreach my $virtdev (sort keys %$virtdev_hash) {
            my $d = $virtdev_hash->{$virtdev};
            # round the reported size up to the next multiple of 1024
            my $alloc_size = int(($d->{size} + 1024 - 1)/1024);
            my $scfg = PVE::Storage::storage_config($cfg, $d->{storeid});

            # test if requested format is supported
            my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($cfg, $d->{storeid});
            my $supported = grep { $_ eq $d->{format} } @$validFormats;
            $d->{format} = $defFormat if !$supported;

            my $volid = PVE::Storage::vdisk_alloc($cfg, $d->{storeid}, $vmid,
                                                  $d->{format}, undef, $alloc_size);
            print STDERR "new volume ID is '$volid'\n";
            # remembered so that the error path can free the volume again
            $d->{volid} = $volid;
            my $path = PVE::Storage::path($cfg, $volid);

            my $write_zeros = 1;
            # fixme: what other storages types initialize volumes with zero?
            if ($scfg->{type} eq 'dir' || $scfg->{type} eq 'nfs' || $scfg->{type} eq 'glusterfs' ||
                $scfg->{type} eq 'sheepdog' || $scfg->{type} eq 'rbd') {
                $write_zeros = 0;
            }

            print $fifofh "${write_zeros}:$d->{devname}=$path\n";

            print "map '$d->{devname}' to '$path' (write zeros = ${write_zeros})\n";
            $map->{$virtdev} = $volid;
        }

        # second pass over the archived config: write the new config
        $fh->seek(0, 0) || die "seek failed - $!\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined(my $line = <$fh>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $fh->close();
        $outfd->close();
    };

    eval {
        # enable interrupts
        local $SIG{INT} =
            local $SIG{TERM} =
            local $SIG{QUIT} =
            local $SIG{HUP} =
            local $SIG{PIPE} = sub { die "interrupted by signal\n"; };
        local $SIG{ALRM} = sub { die "got timeout\n"; };

        $oldtimeout = alarm($timeout);

        my $parser = sub {
            my $line = shift;

            print "$line\n";

            if ($line =~ m/^DEV:\sdev_id=(\d+)\ssize:\s(\d+)\sdevname:\s(\S+)$/) {
                my ($dev_id, $size, $devname) = ($1, $2, $3);
                $devinfo->{$devname} = { size => $size, dev_id => $dev_id };
            } elsif ($line =~ m/^CTIME: /) {
                # we correctly received the vma config, so we can disable
                # the timeout now for disk allocation (set to 10 minutes, so
                # that we always timeout if something goes wrong)
                alarm(600);
                $print_devmap->();
                print $fifofh "done\n";
                my $tmp = $oldtimeout || 0;
                $oldtimeout = undef;
                alarm($tmp);
                close($fifofh);
            }
        };

        print "restore vma archive: $cmd\n";
        run_command($cmd, input => $input, outfunc => $parser, afterfork => $openfifo);
    };
    my $err = $@;

    alarm($oldtimeout) if $oldtimeout;

    unlink $mapfifo;

    if ($err) {
        rmtree $tmpdir;
        unlink $tmpfn;

        # free everything allocated so far
        my $cfg = cfs_read_file('storage.cfg');
        foreach my $devname (keys %$devinfo) {
            my $volid = $devinfo->{$devname}->{volid};
            next if !$volid;
            eval {
                if ($volid =~ m|^/|) {
                    # parenthesised on purpose: 'unlink $volid || die'
                    # would never evaluate the die
                    unlink($volid) || die "unlink failed - $!\n";
                } else {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
                print STDERR "temporary volume '$volid' sucessfuly removed\n";
            };
            print STDERR "unable to cleanup '$volid' - $@" if $@;
        }
        die $err;
    }

    rmtree $tmpdir;

    rename($tmpfn, $conffile) ||
        die "unable to commit configuration file '$conffile'\n";

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
4958
# Restore VM $vmid from an old style tar backup archive.
#
#   $archive - archive file name, or '-' to read the archive from STDIN
#   $user    - user doing the restore (exported as VZDUMP_USER)
#   $opts    - hash ref; 'storage', 'pool', 'prealloc' and 'info' are
#              forwarded to qmextract, 'unique' requests new MAC addresses
#
# The archive members are piped through /usr/lib/qemu-server/qmextract
# (tar --to-command). The volume mapping is then read from the
# 'qmrestore.stat' file in the temporary directory and used to rewrite
# the archived config, which is finally renamed to the VM config file.
#
# On error the temporary files and the volumes listed in the stat file
# are removed and the error is re-thrown.
sub restore_tar_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    if ($archive ne '-') {
        my $firstfile = tar_archive_read_firstfile($archive);
        die "ERROR: file '$archive' dos not lock like a QemuServer vzdump backup\n"
            if $firstfile ne 'qemu-server.conf';
    }

    my $storecfg = cfs_read_file('storage.cfg');

    # destroy existing data - keep empty config
    my $vmcfgfn = config_file($vmid);
    destroy_vm($storecfg, $vmid, 1) if -f $vmcfgfn;

    my $tocmd = "/usr/lib/qemu-server/qmextract";

    $tocmd .= " --storage " . PVE::Tools::shellquote($opts->{storage}) if $opts->{storage};
    $tocmd .= " --pool " . PVE::Tools::shellquote($opts->{pool}) if $opts->{pool};
    $tocmd .= ' --prealloc' if $opts->{prealloc};
    $tocmd .= ' --info' if $opts->{info};

    # tar option "xf" does not autodetect compression when read from STDIN,
    # so we pipe to zcat
    my $cmd = "zcat -f|tar xf " . PVE::Tools::shellquote($archive) . " " .
        PVE::Tools::shellquote("--to-command=$tocmd");

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    mkpath $tmpdir;

    local $ENV{VZDUMP_TMPDIR} = $tmpdir;
    local $ENV{VZDUMP_VMID} = $vmid;
    local $ENV{VZDUMP_USER} = $user;

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # disable interrupts (always do cleanups)
    # Note: each signal needs its own 'local' - in a plain chained
    # assignment only the first one would be restored on scope exit.
    local $SIG{INT} =
        local $SIG{TERM} =
        local $SIG{QUIT} =
        local $SIG{HUP} = sub { print STDERR "got interrupt - ignored\n"; };

    eval {
        # enable interrupts
        local $SIG{INT} =
            local $SIG{TERM} =
            local $SIG{QUIT} =
            local $SIG{HUP} =
            local $SIG{PIPE} = sub { die "interrupted by signal\n"; };

        if ($archive eq '-') {
            print "extracting archive from STDIN\n";
            run_command($cmd, input => "<&STDIN");
        } else {
            print "extracting archive '$archive'\n";
            run_command($cmd);
        }

        # leaves the eval only - nothing more to do in 'info' mode
        return if $opts->{info};

        # read new mapping
        my $map = {};
        my $statfile = "$tmpdir/qmrestore.stat";
        if (my $fd = IO::File->new($statfile, "r")) {
            while (defined (my $line = <$fd>)) {
                if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                    $map->{$1} = $2 if $1;
                } else {
                    print STDERR "unable to parse line in statfile - $line\n";
                }
            }
            $fd->close();
        }

        my $confsrc = "$tmpdir/qemu-server.conf";

        my $srcfd = IO::File->new($confsrc, "r") ||
            die "unable to open file '$confsrc'\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined (my $line = <$srcfd>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $srcfd->close();
        $outfd->close();
    };
    my $err = $@;

    if ($err) {

        unlink $tmpfn;

        tar_restore_cleanup($storecfg, "$tmpdir/qmrestore.stat") if !$opts->{info};

        # the stat file has been processed, do not leave the temp dir behind
        rmtree $tmpdir;

        die $err;
    }

    rmtree $tmpdir;

    # In 'info' mode no temporary config was written, so there is nothing
    # to commit. Otherwise a failing rename must not go unnoticed (the
    # call is parenthesised, else '||' would bind to $conffile).
    if (!$opts->{info}) {
        rename($tmpfn, $conffile) ||
            die "unable to commit configuration file '$conffile'\n";
    }

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
5068
5069
5070 # Internal snapshots
5071
# NOTE: Snapshot create/delete involves several non-atomic
# actions, and can take a long time.
# So we try to avoid locking the file and use the 'lock' variable
# inside the config file instead.
5076
# Copy all settings from hash $source to hash $dest, except for the
# snapshot bookkeeping keys, 'lock', 'digest', 'description' and the
# 'unusedN' entries. Existing keys in $dest are overwritten.
my $snapshot_copy_config = sub {
    my ($source, $dest) = @_;

    my %not_copied = map { $_ => 1 }
        qw(snapshots snapstate snaptime vmstate lock digest description);

    foreach my $key (keys %$source) {
        next if $not_copied{$key} || $key =~ m/^unused\d+$/;

        $dest->{$key} = $source->{$key};
    }
};
5093
# Build and return a new config from snapshot $snap.
#
# The snapshot list, the description and the 'unusedN' entries are taken
# from the current config $conf, everything else is what
# $snapshot_copy_config copies from $snap. $conf itself is not modified.
my $snapshot_apply_config = sub {
    my ($conf, $snap) = @_;

    # copy snapshot list
    my $newconf = { snapshots => $conf->{snapshots} };

    # keep description and list of unused disks
    my @kept = grep { $_ eq 'description' || m/^unused\d+$/ } keys %$conf;
    $newconf->{$_} = $conf->{$_} foreach @kept;

    $snapshot_copy_config->($snap, $newconf);

    return $newconf;
};
5112
# Call $func->($storeid) once for every storage that holds a non-cdrom
# drive of config $conf, in sorted storage ID order. Drives whose file
# does not parse as a volume ID are ignored.
sub foreach_writable_storage {
    my ($conf, $func) = @_;

    my %seen;

    foreach my $ds (keys %$conf) {
        next if !valid_drivename($ds);

        my $drive = parse_drive($ds, $conf->{$ds});
        next if !$drive;
        next if drive_is_cdrom($drive);

        my ($sid, $volname) = PVE::Storage::parse_volume_id($drive->{file}, 1);
        $seen{$sid} = $sid if $sid;
    }

    foreach my $sid (sort keys %seen) {
        $func->($sid);
    }
}
5135
# Allocate a raw volume for the VM state of snapshot $snapname and return
# its volume ID.
#
# Target storage: a shared storage used by the VM's drives if there is
# one, otherwise a non-shared one, otherwise 'local'. Within each class a
# storage with a 'path' (file based) is preferred.
my $alloc_vmstate_volid = sub {
    my ($storecfg, $vmid, $conf, $snapname) = @_;

    # Note: we try to be smart when selecting a $target storage

    my $target;

    # consider the storages whose 'shared' flag equals $want_shared
    my $select_target = sub {
        my ($want_shared) = @_;

        foreach_writable_storage($conf, sub {
            my ($sid) = @_;
            my $scfg = PVE::Storage::storage_config($storecfg, $sid);
            return if ($scfg->{shared} ? 1 : 0) != $want_shared;

            $target = $sid if !$target || $scfg->{path}; # prefer file based storage
        });
    };

    # search shared storage first
    $select_target->(1);

    # now search local storage
    $select_target->(0) if !$target;

    $target = 'local' if !$target;

    # space reserved for the driver state
    # NOTE(review): the previous comment said 32MB while the value is 500 -
    # confirm which one is intended
    my $driver_state_size = 500;
    # we abort live save after $conf->{memory}, so we need at max twice that space
    my $size = $conf->{memory}*2 + $driver_state_size;

    my $scfg = PVE::Storage::storage_config($storecfg, $target);
    my $name = "vm-$vmid-state-$snapname";
    $name .= ".raw" if $scfg->{path}; # add filename extension for file base storage

    my $volid = PVE::Storage::vdisk_alloc($storecfg, $target, $vmid, 'raw', $name, $size*1024);

    return $volid;
};
5176
# First phase of snapshot creation, executed under the config lock.
#
# Sets the 'snapshot' lock in the VM config and adds a new snapshot
# section in state 'prepare', holding a copy of the current settings.
# If $save_vmstate is set and the VM is running, a state volume is
# allocated too. Returns the new snapshot section (hash ref).
#
# Dies if the VM is a template, is locked, lacks the snapshot feature, or
# if $snapname is already in use.
my $snapshot_prepare = sub {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap;

    lock_config($vmid, sub {
        my $conf = load_config($vmid);

        die "you can't take a snapshot if it's a template\n"
            if is_template($conf);

        check_lock($conf);

        $conf->{lock} = 'snapshot';

        die "snapshot name '$snapname' already used\n"
            if defined($conf->{snapshots}->{$snapname});

        my $storecfg = PVE::Storage::config();
        has_feature('snapshot', $conf, $storecfg)
            or die "snapshot feature is not available";

        $snap = {};
        $conf->{snapshots}->{$snapname} = $snap;

        if ($save_vmstate && check_running($vmid)) {
            $snap->{vmstate} = $alloc_vmstate_volid->($storecfg, $vmid, $conf, $snapname);
        }

        $snapshot_copy_config->($conf, $snap);

        $snap->{snapstate} = "prepare";
        $snap->{snaptime} = time();
        $snap->{description} = $comment if $comment;

        # always overwrite machine if we save vmstate. This makes sure we
        # can restore it later using correct machine type
        $snap->{machine} = get_current_qemu_machine($vmid) if $snap->{vmstate};

        update_config_nolock($vmid, $conf, 1);
    });

    return $snap;
};
5222
# Final phase of snapshot creation, executed under the config lock.
#
# Verifies that the config carries the 'snapshot' lock and that snapshot
# $snapname is in state 'prepare', then clears both markers and writes a
# config whose 'parent' is the new snapshot. A 'machine' setting is only
# kept if the config had one before.
my $snapshot_commit = sub {
    my ($vmid, $snapname) = @_;

    lock_config($vmid, sub {
        my $conf = load_config($vmid);

        my $locked_for_snapshot = $conf->{lock} && $conf->{lock} eq 'snapshot';
        die "missing snapshot lock\n" if !$locked_for_snapshot;

        my $has_machine_config = defined($conf->{machine});

        my $snap = $conf->{snapshots}->{$snapname};
        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        my $prepared = $snap->{snapstate} && $snap->{snapstate} eq "prepare";
        die "wrong snapshot state\n" if !$prepared;

        delete $snap->{snapstate};
        delete $conf->{lock};

        my $newconf = $snapshot_apply_config->($conf, $snap);

        delete $newconf->{machine} if !$has_machine_config;

        $newconf->{parent} = $snapname;

        update_config_nolock($vmid, $newconf, 1);
    });
};
5256
# Roll VM $vmid back to snapshot $snapname.
#
# Works in three steps:
#   1. under the config lock: stop the VM and set the 'rollback' lock
#   2. roll back the volume of every non-cdrom drive of the snapshot
#   3. under the config lock: replace the config with the snapshot
#      config, drop the lock and, if the snapshot includes a VM state,
#      start the VM from that state
#
# Dies if the VM is a template, if the snapshot is missing or incomplete,
# or if the VM is still running after the stop request.
sub snapshot_rollback {
    my ($vmid, $snapname) = @_;

    my $snap;

    # true during step 1, false during step 3
    my $prepare = 1;

    my $storecfg = PVE::Storage::config();

    my $updatefn = sub {
        my $conf = load_config($vmid);

        die "you can't rollback if vm is a template\n" if is_template($conf);

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        die "unable to rollback to incomplete snapshot (snapstate = $snap->{snapstate})\n"
            if $snap->{snapstate};

        if ($prepare) {
            check_lock($conf);
            vm_stop($storecfg, $vmid, undef, undef, 5, undef, undef);
        }

        die "unable to rollback vm $vmid: vm is running\n"
            if check_running($vmid);

        my $forcemachine;

        if ($prepare) {
            $conf->{lock} = 'rollback';
        } else {
            my $locked_for_rollback = $conf->{lock} && $conf->{lock} eq 'rollback';
            die "got wrong lock\n" if !$locked_for_rollback;
            delete $conf->{lock};

            my $has_machine_config = defined($conf->{machine});

            # copy snapshot config to current config
            $conf = $snapshot_apply_config->($conf, $snap);
            $conf->{parent} = $snapname;

            # Note: old code did not store 'machine', so we try to be smart
            # and guess the snapshot was generated with kvm 1.4 (pc-i440fx-1.4).
            $forcemachine = $conf->{machine} || 'pc-i440fx-1.4';
            # we remove the 'machine' configuration if not explicitly specified
            # in the original config.
            delete $conf->{machine} if $snap->{vmstate} && !$has_machine_config;
        }

        update_config_nolock($vmid, $conf, 1);

        if (!$prepare && $snap->{vmstate}) {
            my $statefile = PVE::Storage::path($storecfg, $snap->{vmstate});
            vm_start($storecfg, $vmid, $statefile, undef, undef, undef, $forcemachine);
        }
    };

    # step 1
    lock_config($vmid, $updatefn);

    # step 2
    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        PVE::Storage::volume_snapshot_rollback($storecfg, $drive->{file}, $snapname);
    });

    # step 3
    $prepare = 0;
    lock_config($vmid, $updatefn);
}
5335
# Poll 'query-savevm' once per second until it reports status
# 'completed'. Dies if no status is reported or if the status is anything
# but 'active' or 'completed'.
my $savevm_wait = sub {
    my ($vmid) = @_;

    while (1) {
        my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");

        die "savevm not active\n" if !$stat->{status};

        last if $stat->{status} eq 'completed';

        die "query-savevm returned status '$stat->{status}'\n"
            if $stat->{status} ne 'active';

        # still active - try again
        sleep(1);
    }
};
5353
# Create snapshot $snapname of VM $vmid, optionally including the VM
# state ($save_vmstate); $comment becomes the snapshot description.
#
# After $snapshot_prepare has registered the snapshot, all non-cdrom
# drives are snapshotted. For a running VM this happens between
# 'savevm-start' and 'savevm-end'; if the guest agent is configured and
# no VM state is saved, the guest file systems are frozen meanwhile.
# On success the snapshot is committed, on failure it is deleted again
# and the error is re-thrown.
sub snapshot_create {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap = $snapshot_prepare->($vmid, $snapname, $save_vmstate, $comment);

    $save_vmstate = 0 if !$snap->{vmstate}; # vm is not running

    my $config = load_config($vmid);

    my $running = check_running($vmid);

    my $freezefs = $running && $config->{agent};
    $freezefs = 0 if $snap->{vmstate}; # not needed if we save RAM

    # drives snapshotted so far (needed for cleanup)
    my $drivehash = {};

    if ($freezefs) {
        eval { vm_mon_cmd($vmid, "guest-fsfreeze-freeze"); };
        warn "guest-fsfreeze-freeze problems - $@" if $@;
    }

    eval {
        # create internal snapshots of all drives

        my $storecfg = PVE::Storage::config();

        if ($running && $snap->{vmstate}) {
            my $statepath = PVE::Storage::path($storecfg, $snap->{vmstate});
            vm_mon_cmd($vmid, "savevm-start", statefile => $statepath);
            $savevm_wait->($vmid);
        } elsif ($running) {
            vm_mon_cmd($vmid, "savevm-start");
        }

        foreach_drive($snap, sub {
            my ($ds, $drive) = @_;

            return if drive_is_cdrom($drive);

            qemu_volume_snapshot($vmid, "drive-$ds", $storecfg, $drive->{file}, $snapname);
            $drivehash->{$ds} = 1;
        });
    };
    my $err = $@;

    if ($running) {
        eval { vm_mon_cmd($vmid, "savevm-end") };
        warn $@ if $@;

        if ($freezefs) {
            eval { vm_mon_cmd($vmid, "guest-fsfreeze-thaw"); };
            warn "guest-fsfreeze-thaw problems - $@" if $@;
        }

        # savevm-end is async, we need to wait
        while (1) {
            my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");
            last if !$stat->{bytes};

            print "savevm not yet finished\n";
            sleep(1);
        }
    }

    if ($err) {
        warn "snapshot create failed: starting cleanup\n";
        eval { snapshot_delete($vmid, $snapname, 0, $drivehash); };
        warn $@ if $@;
        die $err;
    }

    $snapshot_commit->($vmid, $snapname);
}
5435
# Delete snapshot $snapname of VM $vmid: free the saved vmstate volume,
# remove the per-drive volume snapshots and finally drop the snapshot
# section from the VM config.
#
# $force     - storage errors are only warned about instead of being fatal,
#              and the intermediate config updates are skipped
# $drivehash - only set when called from snapshot_create. It restricts the
#              volume snapshot removal to the drives listed in it, skips the
#              lock/template checks and makes the final config update remove
#              the 'lock' setting.
sub snapshot_delete {
    my ($vmid, $snapname, $force, $drivehash) = @_;

    # state shared with the $update_conf closure below
    my $prepare = 1; # 1: mark snapshot as being deleted, 0: final cleanup
    my $snap;
    my $unused = [];

    # re-point (or drop) a 'parent' reference to the snapshot being deleted
    my $unlink_parent = sub {
        my ($confref, $new_parent) = @_;

        return if !$confref->{parent} || $confref->{parent} ne $snapname;

        if ($new_parent) {
            $confref->{parent} = $new_parent;
        } else {
            delete $confref->{parent};
        }
    };

    # config update step, always executed through lock_config()
    my $update_conf = sub {
        my ($remove_drive) = @_;

        my $conf = load_config($vmid);

        if (!$drivehash) {
            check_lock($conf);
            die "you can't delete a snapshot if vm is a template\n"
                if is_template($conf);
        }

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        # remove parent refs
        if (!$prepare) {
            my $new_parent = $snap->{parent};
            $unlink_parent->($conf, $new_parent);
            foreach my $other (keys %{$conf->{snapshots}}) {
                next if $other eq $snapname;
                $unlink_parent->($conf->{snapshots}->{$other}, $new_parent);
            }
        }

        if ($remove_drive) {
            my $is_drive = $remove_drive ne 'vmstate';

            # the volume id has to be read before the entry is deleted
            my $volid;
            if ($is_drive) {
                my $drive = parse_drive($remove_drive, $snap->{$remove_drive});
                $volid = $drive->{file};
            }

            delete $snap->{$remove_drive};
            add_unused_volume($conf, $volid) if $is_drive;
        }

        if ($prepare) {
            $snap->{snapstate} = 'delete';
        } else {
            delete $conf->{snapshots}->{$snapname};
            delete $conf->{lock} if $drivehash;
            foreach my $volid (@$unused) {
                add_unused_volume($conf, $volid);
            }
        }

        update_config_nolock($vmid, $conf, 1);
    };

    # storage errors are fatal unless $force is set, then they are only reported
    my $check_error = sub {
        my ($err) = @_;

        return if !$err;
        die $err if !$force;
        warn $err;
    };

    lock_config($vmid, $update_conf);

    my $storecfg = PVE::Storage::config();

    # now remove vmstate file
    if ($snap->{vmstate}) {
        eval { PVE::Storage::vdisk_free($storecfg, $snap->{vmstate}); };
        $check_error->($@);

        # save changes (remove vmstate from snapshot)
        lock_config($vmid, $update_conf, 'vmstate') if !$force;
    }

    # now remove all internal snapshots
    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};

        if (!$drivehash || $drivehash->{$ds}) {
            eval { qemu_volume_snapshot_delete($vmid, "drive-$ds", $storecfg, $volid, $snapname); };
            $check_error->($@);
        }

        # save changes (remove drive from snapshot)
        lock_config($vmid, $update_conf, $ds) if !$force;
        push @$unused, $volid;
    });

    # now cleanup config
    $prepare = 0;
    lock_config($vmid, $update_conf);
}
5547
# Return 1 if PVE::Storage::volume_has_feature() reports $feature for the
# volume of every non-cdrom drive in $conf, 0 otherwise.
sub has_feature {
    my ($feature, $conf, $storecfg, $snapname, $running) = @_;

    my $supported = 1;

    # no early exit: every drive is queried, a single failure clears the flag
    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        $supported = 0
            if !PVE::Storage::volume_has_feature($storecfg, $feature, $drive->{file}, $snapname, $running);
    });

    return $supported;
}
5562
# Turn the drive volumes of $conf into base volumes using
# PVE::Storage::vdisk_create_base(). If $disk is given, only that drive is
# processed. Cdrom drives and volumes without the 'template' storage
# feature are skipped. The config is written after every converted drive.
sub template_create {
    my ($vmid, $conf, $disk) = @_;

    my $storecfg = PVE::Storage::config();

    my $convert_drive = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);
        return if $disk && $ds ne $disk;
        return if !PVE::Storage::volume_has_feature($storecfg, 'template', $drive->{file});

        $drive->{file} = PVE::Storage::vdisk_create_base($storecfg, $drive->{file});
        $conf->{$ds} = print_drive($vmid, $drive);
        update_config_nolock($vmid, $conf, 1);
    };

    foreach_drive($conf, $convert_drive);
}
5583
# Return 1 if the VM config hash $conf has its 'template' setting defined
# and equal to 1, 0 otherwise.
#
# The result is always an explicit 1 or 0; it no longer depends on the
# implicit value of a fall-through return.
sub is_template {
    my ($conf) = @_;

    return (defined($conf->{template}) && $conf->{template} == 1) ? 1 : 0;
}
5589
# Copy volume $src_volid (or its snapshot $snapname, if given) to volume
# $dst_volid by running '/usr/bin/qemu-img convert'.
#
# $size is only used to compute the byte counts of the progress output.
# Nothing is done unless both volume IDs resolve to a storage ID.
# Dies with "copy failed: ..." if the command fails.
sub qemu_img_convert {
    my ($src_volid, $dst_volid, $size, $snapname) = @_;

    my $storecfg = PVE::Storage::config();
    my ($src_storeid, $src_volname) = PVE::Storage::parse_volume_id($src_volid, 1);
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid, 1);

    return if !$src_storeid || !$dst_storeid;

    my $src_scfg = PVE::Storage::storage_config($storecfg, $src_storeid);
    my $dst_scfg = PVE::Storage::storage_config($storecfg, $dst_storeid);

    my $src_format = qemu_img_format($src_scfg, $src_volname);
    my $dst_format = qemu_img_format($dst_scfg, $dst_volname);

    my $src_path = PVE::Storage::path($storecfg, $src_volid, $snapname);
    my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

    my @cmd = ('/usr/bin/qemu-img', 'convert', '-t', 'writeback', '-p', '-n');
    # the snapshot is passed by name only for qcow2 sources
    push @cmd, '-s', $snapname if $snapname && $src_format eq "qcow2";
    push @cmd, '-f', $src_format, '-O', $dst_format, $src_path, $dst_path;

    # turn the "(NN.NN/100%)" progress lines of qemu-img into byte counts
    my $report_progress = sub {
        my ($line) = @_;

        return if $line !~ m/\((\S+)\/100\%\)/;

        my $percent = $1;
        my $transferred = int($size * $percent / 100);
        my $remaining = $size - $transferred;

        print "transferred: $transferred bytes remaining: $remaining bytes total: $size bytes progression: $percent %\n";
    };

    eval { run_command(\@cmd, timeout => undef, outfunc => $report_progress); };
    if (my $err = $@) {
        die "copy failed: $err";
    }
}
5629
# Return the qemu image format name to use for volume $volname on the
# storage described by $scfg:
#  - the file extension (raw, qcow2, qed or vmdk) if the storage config has
#    a 'path' and the volume name ends in one of those extensions
#  - "host_device" for storages of type 'iscsi'
#  - "raw" for everything else
sub qemu_img_format {
    my ($scfg, $volname) = @_;

    if ($scfg->{path}) {
        my ($extension) = $volname =~ m/\.(raw|qcow2|qed|vmdk)$/;
        return $extension if defined($extension);
    }

    return $scfg->{type} eq 'iscsi' ? "host_device" : "raw";
}
5641
# Mirror the block device "drive-$drive" of VM $vmid onto volume $dst_volid
# with the 'drive-mirror' monitor command and poll 'query-block-jobs' once
# per second until the job's offset has reached its length.
#
# If $vmiddst equals $vmid, the job is finished with 'block-job-complete'
# (switching the disk to the new volume). Otherwise the volume is a clone
# for another VM and the job is ended with 'block-job-cancel' once it is in
# sync.
#
# If the job does not get idle for more than $maxwait polls after reaching
# sync, the guest is suspended so the mirror can complete; it is resumed
# afterwards, also when mirroring fails.
#
# Dies with "mirroring error: ..." on failure, after trying to cancel the
# block job.
sub qemu_drive_mirror {
    my ($vmid, $drive, $dst_volid, $vmiddst) = @_;

    my $count = 0;
    my $frozen = undef;
    my $maxwait = 120;

    my $storecfg = PVE::Storage::config();
    my ($dst_storeid, $dst_volname) = PVE::Storage::parse_volume_id($dst_volid);

    # result is not needed; call kept as in the original code
    # NOTE(review): presumably this dies for an unknown storage - confirm
    PVE::Storage::storage_config($storecfg, $dst_storeid);

    my $format;
    if ($dst_volname =~ m/\.(raw|qcow2)$/){
        $format = $1;
    }

    my $dst_path = PVE::Storage::path($storecfg, $dst_volid);

    my $opts = { timeout => 10, device => "drive-$drive", mode => "existing", sync => "full", target => $dst_path };
    $opts->{format} = $format if $format;

    # fixme: drive-mirror sometimes times out but works fine afterwards
    # (seen with big volumes > 200GB), so we need to eval
    eval { vm_mon_cmd($vmid, "drive-mirror", %$opts); };
    # ignore errors here

    eval {
        while (1) {
            my $stats = vm_mon_cmd($vmid, "query-block-jobs");
            my $stat = $stats->[0];
            die "mirroring job seem to have die. Maybe do you have bad sectors?" if !$stat;
            die "error job is not mirroring" if $stat->{type} ne "mirror";

            my $busy = $stat->{busy};

            if (my $total = $stat->{len}) {
                my $transferred = $stat->{offset} || 0;
                my $remaining = $total - $transferred;
                my $percent = sprintf "%.2f", ($transferred * 100 / $total);

                print "transferred: $transferred bytes remaining: $remaining bytes total: $total bytes progression: $percent % busy: $busy\n";
            }

            if ($stat->{len} == $stat->{offset}) {
                if ($busy eq 'false') {

                    last if $vmiddst != $vmid;

                    # try to switch the disk if source and destination are on the same guest
                    eval { vm_mon_cmd($vmid, "block-job-complete", device => "drive-$drive") };
                    last if !$@;
                    die $@ if $@ !~ m/cannot be completed/;
                }

                if ($count > $maxwait) {
                    # if too many writes to the disk occur at the end of the
                    # migration, the guest needs to be frozen to be able to
                    # complete the migration
                    vm_suspend($vmid,1);
                    $frozen = 1;
                }
                $count++;
            }
            sleep 1;
        }

        vm_resume($vmid, 1) if $frozen;

    };
    my $err = $@;

    # cancel the block job and wait until it is gone from query-block-jobs
    my $cancel_job = sub {
        vm_mon_cmd($vmid, "block-job-cancel", device => "drive-$drive");
        while (1) {
            my $stats = vm_mon_cmd($vmid, "query-block-jobs");
            my $stat = $stats->[0];
            last if !$stat;
            sleep 1;
        }
    };

    if ($err) {
        # The loop may have died after the guest was suspended; the resume
        # inside the eval above is skipped in that case, so do it here to
        # avoid leaving the VM paused.
        if ($frozen) {
            eval { vm_resume($vmid, 1); };
            warn $@ if $@;
        }
        eval { &$cancel_job(); };
        die "mirroring error: $err";
    }

    if ($vmiddst != $vmid) {
        # if we clone a disk for a new target vm, we don't switch the disk
        &$cancel_job(); # so we call block-job-cancel
    }
}
5735
# Create a clone of the volume behind $drive for VM $newvmid.
#
# Without $full a linked clone is created with PVE::Storage::vdisk_clone().
# With $full a new volume is allocated (on $storage if given, else on the
# source volume's storage) and filled either offline with
# qemu_img_convert() or, for a running VM without $snapname, online with
# qemu_drive_mirror().
#
# Every newly created volume ID is pushed onto $newvollist.
# Returns $drive itself (no copy is made), updated in place with the new
# 'file' and 'size' and with 'format' reset to undef.
sub clone_disk {
    my ($storecfg, $vmid, $running, $drivename, $drive, $snapname,
        $newvmid, $storage, $format, $full, $newvollist) = @_;

    my $newvolid;

    if ($full) {
        my ($storeid) = PVE::Storage::parse_volume_id($drive->{file});
        $storeid = $storage if $storage;

        my ($defFormat, $validFormats) = PVE::Storage::storage_default_format($storecfg, $storeid);
        $format ||= $drive->{format} || $defFormat;

        # test if requested format is supported - else use default
        my $format_ok = scalar(grep { $_ eq $format } @$validFormats);
        $format = $defFormat if !$format_ok;

        my ($src_size) = PVE::Storage::volume_size_info($storecfg, $drive->{file}, 3);

        print "create full clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_alloc($storecfg, $storeid, $newvmid, $format, undef, ($src_size/1024));
        push @$newvollist, $newvolid;

        if ($running && !$snapname) {
            qemu_drive_mirror($vmid, $drivename, $newvolid, $newvmid);
        } else {
            qemu_img_convert($drive->{file}, $newvolid, $src_size, $snapname);
        }
    } else {
        print "create linked clone of drive $drivename ($drive->{file})\n";
        $newvolid = PVE::Storage::vdisk_clone($storecfg, $drive->{file}, $newvmid, $snapname);
        push @$newvollist, $newvolid;
    }

    my ($new_size) = PVE::Storage::volume_size_info($storecfg, $newvolid, 3);

    # the caller's drive hash is modified directly
    $drive->{format} = undef;
    $drive->{file} = $newvolid;
    $drive->{size} = $new_size;

    return $drive;
}
5781
# Return the name of the machine type reported as 'is-current' by the
# 'query-machines' QMP command of VM $vmid. Falls back to the entry marked
# 'is-default' and finally to 'pc'.
# This only works if the VM is running.
sub get_current_qemu_machine {
    my ($vmid) = @_;

    my $machines = vm_qmp_command($vmid, { execute => 'query-machines', arguments => {} });

    # if several entries carry the same flag, the last one wins
    my %name_of;
    foreach my $machine (@$machines) {
        $name_of{default} = $machine->{name} if $machine->{'is-default'};
        $name_of{current} = $machine->{name} if $machine->{'is-current'};
    }

    # fallback to the default machine if current is not supported by qemu
    return $name_of{current} || $name_of{default} || 'pc';
}
5798
# Collect the entries below "$pcisysfs/devices" whose names match the
# pattern passed to dir_glob_foreach().
# Returns a hash ref keyed by the first capture group of that pattern (the
# two colon separated hex pairs, e.g. "00:1f"); each value is an array ref
# of { id => ..., function => ... } hashes, one per matching entry.
sub lspci {
    my %functions_of;

    my $add_entry = sub {
        my (undef, $id, $function) = @_;
        push @{$functions_of{$id}}, { id => $id, function => $function };
    };

    dir_glob_foreach("$pcisysfs/devices", '[a-f0-9]{4}:([a-f0-9]{2}:[a-f0-9]{2})\.([0-9])', $add_entry);

    return \%functions_of;
}
5811
5812 1;