]> git.proxmox.com Git - qemu-server.git/blame_incremental - PVE/QemuServer.pm
usb-tablet : always use uhci controller
[qemu-server.git] / PVE / QemuServer.pm
... / ...
CommitLineData
1package PVE::QemuServer;
2
3use strict;
4use POSIX;
5use IO::Handle;
6use IO::Select;
7use IO::File;
8use IO::Dir;
9use IO::Socket::UNIX;
10use File::Basename;
11use File::Path;
12use File::stat;
13use Getopt::Long;
14use Digest::SHA;
15use Fcntl ':flock';
16use Cwd 'abs_path';
17use IPC::Open3;
18use JSON;
19use Fcntl;
20use PVE::SafeSyslog;
21use Storable qw(dclone);
22use PVE::Exception qw(raise raise_param_exc);
23use PVE::Storage;
24use PVE::Tools qw(run_command lock_file file_read_firstline);
25use PVE::JSONSchema qw(get_standard_option);
26use PVE::Cluster qw(cfs_register_file cfs_read_file cfs_write_file cfs_lock_file);
27use PVE::INotify;
28use PVE::ProcFSTools;
29use PVE::QMPClient;
30use PVE::RPCEnvironment;
31use Time::HiRes qw(gettimeofday);
32
33my $cpuinfo = PVE::ProcFSTools::read_cpuinfo();
34
# Note about locking: we use flock on the config file to protect
# against concurrent actions.
# Additionally, we have a 'lock' setting in the config file. This
# can be set to 'migrate', 'backup', 'snapshot' or 'rollback'. Most actions are not
# allowed when such a lock is set. But you can ignore this kind of
# lock with the --skiplock flag.
41
# Register the parser/writer callbacks used for files below '/qemu-server/'.
cfs_register_file('/qemu-server/', \&parse_vm_config, \&write_vm_config);

# Standard JSON schema options defined by this module, registered in order.
foreach my $option (
    [
        'skiplock' => {
            description => "Ignore locks - only root is allowed to use this option.",
            type => 'boolean',
            optional => 1,
        },
    ],
    [
        'pve-qm-stateuri' => {
            description => "Some command save/restore state from this location.",
            type => 'string',
            maxLength => 128,
            optional => 1,
        },
    ],
    [
        'pve-snapshot-name' => {
            description => "The name of the snapshot.",
            type => 'string', format => 'pve-configid',
            maxLength => 40,
        },
    ],
) {
    my ($name, $schema) = @$option;
    PVE::JSONSchema::register_standard_option($name, $schema);
}
64
65#no warnings 'redefine';
66
# Define the fair-scheduler syscall numbers and the KVM_GET_API_VERSION ioctl
# request code, unless they were already defined. The constants are created
# with string eval so that definitions which already exist (for example from
# the system .ph files) are never overridden.
unless (defined(&_VZSYSCALLS_H_)) {
    # marker sub: its existence is what the guard above tests for
    eval 'sub _VZSYSCALLS_H_ () {1;}';
    require 'sys/syscall.ph';
    if (defined(&__x86_64__)) {
        eval 'sub __NR_fairsched_vcpus () {499;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_fairsched_mknod () {504;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {505;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {506;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {507;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {508;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_setluid () {501;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {502;}' unless defined(&__NR_setublimit);
    } elsif (defined(&__i386__)) {
        eval 'sub __NR_fairsched_mknod () {500;}' unless defined(&__NR_fairsched_mknod);
        eval 'sub __NR_fairsched_rmnod () {501;}' unless defined(&__NR_fairsched_rmnod);
        eval 'sub __NR_fairsched_chwt () {502;}' unless defined(&__NR_fairsched_chwt);
        eval 'sub __NR_fairsched_mvpr () {503;}' unless defined(&__NR_fairsched_mvpr);
        eval 'sub __NR_fairsched_rate () {504;}' unless defined(&__NR_fairsched_rate);
        eval 'sub __NR_fairsched_vcpus () {505;}' unless defined(&__NR_fairsched_vcpus);
        eval 'sub __NR_setluid () {511;}' unless defined(&__NR_setluid);
        eval 'sub __NR_setublimit () {512;}' unless defined(&__NR_setublimit);
    } else {
        die("no fairsched syscall for this arch");
    }
    require 'asm/ioctl.ph';
    # request number written out as 0x00 instead of the digit-less literal '0x'
    eval 'sub KVM_GET_API_VERSION () { &_IO(0xAE, 0x00);}' unless defined(&KVM_GET_API_VERSION);
}
95
# Invoke the fairsched_mknod syscall with ($parent, $weight, $desired), each
# coerced to an integer, and return the raw syscall result.
sub fairsched_mknod {
    my @args = map { int($_) } @_[0 .. 2];

    return syscall(&__NR_fairsched_mknod, $args[0], $args[1], $args[2]);
}
101
# Invoke the fairsched_rmnod syscall for node $id (coerced to an integer) and
# return the raw syscall result.
sub fairsched_rmnod {
    my $node_id = int($_[0]);

    return syscall(&__NR_fairsched_rmnod, $node_id);
}
107
# Invoke the fairsched_mvpr syscall with ($pid, $newid), both coerced to
# integers, and return the raw syscall result.
sub fairsched_mvpr {
    my @args = map { int($_) } @_[0 .. 1];

    return syscall(&__NR_fairsched_mvpr, $args[0], $args[1]);
}
113
# Invoke the fairsched_vcpus syscall with ($id, $vcpus), both coerced to
# integers, and return the raw syscall result.
sub fairsched_vcpus {
    my @args = map { int($_) } @_[0 .. 1];

    return syscall(&__NR_fairsched_vcpus, $args[0], $args[1]);
}
119
# Invoke the fairsched_rate syscall with ($id, $op, $rate), each coerced to an
# integer, and return the raw syscall result. $op is one of the
# FAIRSCHED_*_RATE constants.
sub fairsched_rate {
    my @args = map { int($_) } @_[0 .. 2];

    return syscall(&__NR_fairsched_rate, $args[0], $args[1], $args[2]);
}
125
# Operation codes passed as $op to fairsched_rate().
use constant {
    FAIRSCHED_SET_RATE => 0,
    FAIRSCHED_DROP_RATE => 1,
    FAIRSCHED_GET_RATE => 2,
};

# Apply a CPU limit, given in per cent, to fair-scheduler node $id.
# The percentage is rescaled to units of 1/1024; a resulting rate of zero
# drops the limit instead of setting it. Returns what fairsched_rate() returns.
sub fairsched_cpulimit {
    my ($id, $limit) = @_;

    my $rate = int($limit * 1024 / 100);

    return fairsched_rate($id, FAIRSCHED_SET_RATE, $rate) if $rate;

    return fairsched_rate($id, FAIRSCHED_DROP_RATE, $rate);
}
138
# Per-node paths used by this module.
my $nodename = PVE::INotify::nodename();
my $confdir = "/etc/pve/nodes/$nodename/qemu-server";
my $var_run_tmpdir = "/var/run/qemu-server";
my $lock_dir = "/var/lock/qemu-server";
my $pcisysfs = "/sys/bus/pci";

# Create the directories at load time; failures (e.g. the directory already
# exists) are ignored. The node directory is created before its child.
foreach my $dir ("/etc/pve/nodes/$nodename", $confdir, $var_run_tmpdir, $lock_dir) {
    mkdir $dir;
}
152
# JSON schema description of every scalar VM configuration option.
# Indexed options (netN, ideN, scsiN, ...) are added to this hash further
# down in the file.
my $confdesc = {
    onboot => {
        optional => 1,
        type => 'boolean',
        description => "Specifies whether a VM will be started during system bootup.",
        default => 0,
    },
    autostart => {
        optional => 1,
        type => 'boolean',
        description => "Automatic restart after crash (currently ignored).",
        default => 0,
    },
    hotplug => {
        optional => 1,
        type => 'boolean',
        description => "Allow hotplug for disk and network device",
        default => 0,
    },
    reboot => {
        optional => 1,
        type => 'boolean',
        description => "Allow reboot. If set to '0' the VM exits on reboot.",
        default => 1,
    },
    lock => {
        optional => 1,
        type => 'string',
        description => "Lock/unlock the VM.",
        enum => [qw(migrate backup snapshot rollback)],
    },
    cpulimit => {
        optional => 1,
        type => 'integer',
        description => "Limit of CPU usage in per cent. Note if the computer has 2 CPUs, it has total of 200% CPU time. Value '0' indicates no CPU limit.\n\nNOTE: This option is currently ignored.",
        minimum => 0,
        default => 0,
    },
    cpuunits => {
        optional => 1,
        type => 'integer',
        description => "CPU weight for a VM. Argument is used in the kernel fair scheduler. The larger the number is, the more CPU time this VM gets. Number is relative to weights of all the other running VMs.\n\nNOTE: You can disable fair-scheduler configuration by setting this to 0.",
        minimum => 0,
        maximum => 500000,
        default => 1000,
    },
    memory => {
        optional => 1,
        type => 'integer',
        description => "Amount of RAM for the VM in MB. This is the maximum available memory when you use the balloon device.",
        minimum => 16,
        default => 512,
    },
    balloon => {
        optional => 1,
        type => 'integer',
        description => "Amount of target RAM for the VM in MB. Using zero disables the balloon driver.",
        minimum => 0,
    },
    shares => {
        optional => 1,
        type => 'integer',
        description => "Amount of memory shares for auto-ballooning. The larger the number is, the more memory this VM gets. Number is relative to weights of all other running VMs. Using zero disables auto-ballooning",
        minimum => 0,
        maximum => 50000,
        default => 1000,
    },
    keyboard => {
        optional => 1,
        type => 'string',
        description => "Keyboard layout for vnc server. Default is read from the datacenter configuration file.",
        enum => PVE::Tools::kvmkeymaplist(),
        default => 'en-us',
    },
    name => {
        optional => 1,
        type => 'string', format => 'dns-name',
        description => "Set a name for the VM. Only used on the configuration web interface.",
    },
    scsihw => {
        optional => 1,
        type => 'string',
        description => "scsi controller model",
        enum => [qw(lsi virtio-scsi-pci megasas)],
        default => 'lsi',
    },
    description => {
        optional => 1,
        type => 'string',
        description => "Description for the VM. Only used on the configuration web interface. This is saved as comment inside the configuration file.",
    },
    ostype => {
        optional => 1,
        type => 'string',
        enum => [qw(other wxp w2k w2k3 w2k8 wvista win7 win8 l24 l26)],
        description => <<EODESC,
Used to enable special optimization/features for specific
operating systems:

other => unspecified OS
wxp => Microsoft Windows XP
w2k => Microsoft Windows 2000
w2k3 => Microsoft Windows 2003
w2k8 => Microsoft Windows 2008
wvista => Microsoft Windows Vista
win7 => Microsoft Windows 7
win8 => Microsoft Windows 8/2012
l24 => Linux 2.4 Kernel
l26 => Linux 2.6/3.X Kernel

other|l24|l26 ... no special behaviour
wxp|w2k|w2k3|w2k8|wvista|win7|win8 ... use --localtime switch
EODESC
    },
    boot => {
        optional => 1,
        type => 'string',
        description => "Boot on floppy (a), hard disk (c), CD-ROM (d), or network (n).",
        pattern => '[acdn]{1,4}',
        default => 'cdn',
    },
    bootdisk => {
        optional => 1,
        type => 'string', format => 'pve-qm-bootdisk',
        description => "Enable booting from specified disk.",
        pattern => '(ide|sata|scsi|virtio)\d+',
    },
    smp => {
        optional => 1,
        type => 'integer',
        description => "The number of CPUs. Please use option -sockets instead.",
        minimum => 1,
        default => 1,
    },
    sockets => {
        optional => 1,
        type => 'integer',
        description => "The number of CPU sockets.",
        minimum => 1,
        default => 1,
    },
    cores => {
        optional => 1,
        type => 'integer',
        description => "The number of cores per socket.",
        minimum => 1,
        default => 1,
    },
    acpi => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable ACPI.",
        default => 1,
    },
    agent => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable Qemu GuestAgent.",
        default => 0,
    },
    kvm => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable KVM hardware virtualization.",
        default => 1,
    },
    tdf => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable time drift fix.",
        default => 0,
    },
    localtime => {
        optional => 1,
        type => 'boolean',
        description => "Set the real time clock to local time. This is enabled by default if ostype indicates a Microsoft OS.",
    },
    freeze => {
        optional => 1,
        type => 'boolean',
        description => "Freeze CPU at startup (use 'c' monitor command to start execution).",
    },
    vga => {
        optional => 1,
        type => 'string',
        description => "Select VGA type. If you want to use high resolution modes (>= 1280x1024x16) then you should use option 'std' or 'vmware'. Default is 'std' for win8/win7/w2k8, and 'cirrus' for other OS types",
        enum => [qw(std cirrus vmware)],
    },
    watchdog => {
        optional => 1,
        type => 'string', format => 'pve-qm-watchdog',
        typetext => '[[model=]i6300esb|ib700] [,[action=]reset|shutdown|poweroff|pause|debug|none]',
        description => "Create a virtual hardware watchdog device. Once enabled (by a guest action), the watchdog must be periodically polled by an agent inside the guest or else the guest will be restarted (or execute the action specified)",
    },
    startdate => {
        optional => 1,
        type => 'string',
        typetext => "(now | YYYY-MM-DD | YYYY-MM-DDTHH:MM:SS)",
        description => "Set the initial date of the real time clock. Valid format for date are: 'now' or '2006-06-17T16:01:21' or '2006-06-17'.",
        pattern => '(now|\d{4}-\d{1,2}-\d{1,2}(T\d{1,2}:\d{1,2}:\d{1,2})?)',
        default => 'now',
    },
    startup => {
        optional => 1,
        type => 'string', format => 'pve-qm-startup',
        typetext => '[[order=]\d+] [,up=\d+] [,down=\d+] ',
        description => "Startup and shutdown behavior. Order is a non-negative number defining the general startup order. Shutdown is done with reverse ordering. Additionally you can set the 'up' or 'down' delay in seconds, which specifies a delay to wait before the next VM is started or stopped.",
    },
    args => {
        optional => 1,
        type => 'string',
        description => <<EODESCR,
Note: this option is for experts only. It allows you to pass arbitrary arguments to kvm, for example:

args: -no-reboot -no-hpet
EODESCR
    },
    tablet => {
        optional => 1,
        type => 'boolean',
        default => 1,
        description => "Enable/disable the usb tablet device. This device is usually needed to allow absolute mouse positioning. Else the mouse runs out of sync with normal vnc clients. If you're running lots of console-only guests on one host, you may consider disabling this to save some context switches.",
    },
    migrate_speed => {
        optional => 1,
        type => 'integer',
        description => "Set maximum speed (in MB/s) for migrations. Value 0 is no limit.",
        minimum => 0,
        default => 0,
    },
    migrate_downtime => {
        optional => 1,
        type => 'number',
        description => "Set maximum tolerated downtime (in seconds) for migrations.",
        minimum => 0,
        default => 0.1,
    },
    cdrom => {
        optional => 1,
        type => 'string', format => 'pve-qm-drive',
        typetext => 'volume',
        description => "This is an alias for option -ide2",
    },
    cpu => {
        optional => 1,
        description => "Emulated CPU type.",
        type => 'string',
        enum => [ qw(486 athlon pentium pentium2 pentium3 coreduo core2duo kvm32 kvm64 qemu32 qemu64 phenom Conroe Penryn Nehalem Westmere SandyBridge Haswell Opteron_G1 Opteron_G2 Opteron_G3 Opteron_G4 Opteron_G5 host) ],
        default => 'qemu64',
    },
    parent => get_standard_option('pve-snapshot-name', {
        optional => 1,
        description => "Parent snapshot name. This is used internally, and should not be modified.",
    }),
    snaptime => {
        optional => 1,
        description => "Timestamp for snapshots.",
        type => 'integer',
        minimum => 0,
    },
    vmstate => {
        optional => 1,
        type => 'string', format => 'pve-volume-id',
        description => "Reference to a volume which stores the VM state. This is used internally for snapshots.",
    },
};
419
420# what about other qemu settings ?
421#cpu => 'string',
422#machine => 'string',
423#fda => 'file',
424#fdb => 'file',
425#mtdblock => 'file',
426#sd => 'file',
427#pflash => 'file',
428#snapshot => 'bool',
429#bootp => 'file',
430##tftp => 'dir',
431##smb => 'dir',
432#kernel => 'file',
433#append => 'string',
434#initrd => 'file',
435##soundhw => 'string',
436
# Expose every option defined so far as standard option 'pve-qm-<name>'.
foreach my $name (keys %$confdesc) {
    PVE::JSONSchema::register_standard_option("pve-qm-$name", $confdesc->{$name});
}
440
# Number of indexed configuration slots per device class
# (valid indices run from 0 to MAX - 1).

# disk buses
my $MAX_IDE_DISKS    = 4;
my $MAX_SCSI_DISKS   = 14;
my $MAX_VIRTIO_DISKS = 16;
my $MAX_SATA_DISKS   = 6;

# other devices
my $MAX_USB_DEVICES     = 5;
my $MAX_NETS            = 32;
my $MAX_UNUSED_DISKS    = 8;
my $MAX_HOSTPCI_DEVICES = 2;
my $MAX_SERIAL_PORTS    = 4;
my $MAX_PARALLEL_PORTS  = 3;
451
# Supported NIC models; the sorted, space separated form is embedded in the
# option description below.
my $nic_model_list = [
    qw(rtl8139 ne2k_pci e1000 pcnet virtio ne2k_isa i82551 i82557b i82559er)
];
my $nic_model_list_txt = join(' ', sort @{$nic_model_list});

# Schema shared by all netN options.
my $netdesc = {
    optional => 1,
    type => 'string',
    format => 'pve-qm-net',
    typetext => "MODEL=XX:XX:XX:XX:XX:XX [,bridge=<dev>][,rate=<mbps>][,tag=<vlanid>]",
    description => <<EODESCR,
Specify network devices.

MODEL is one of: $nic_model_list_txt

XX:XX:XX:XX:XX:XX should be an unique MAC address. This is
automatically generated if not specified.

The bridge parameter can be used to automatically add the interface to a bridge device. The Proxmox VE standard bridge is called 'vmbr0'.

Option 'rate' is used to limit traffic bandwidth from and to this interface. It is specified as floating point number, unit is 'Megabytes per second'.

If you specify no bridge, we create a kvm 'user' (NATed) network device, which provides DHCP and DNS services. The following addresses are used:

10.0.2.2 Gateway
10.0.2.3 DNS Server
10.0.2.4 SMB Server

The DHCP server assign addresses to the guest starting from 10.0.2.15.

EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-net", $netdesc);

# net0 .. net($MAX_NETS - 1) all share the same descriptor
foreach my $idx (0 .. $MAX_NETS - 1) {
    $confdesc->{"net$idx"} = $netdesc;
}
487
# Set of valid drive option names (ide0, scsi3, ...); filled further down.
my $drivename_hash;

# Option syntax shared by all disk bus types. Kept in one place so the four
# descriptors below cannot drift apart.
my $drive_typetext = '[volume=]volume [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe|directsync] [,format=f] [,backup=yes|no] [,rerror=ignore|report|stop] [,werror=enospc|ignore|report|stop] [,aio=native|threads]';

# Schema for ideN options.
my $idedesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as IDE hard disk or CD-ROM (n is 0 to " . ($MAX_IDE_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-ide", $idedesc);

# Schema for scsiN options.
my $scsidesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as SCSI hard disk or CD-ROM (n is 0 to " . ($MAX_SCSI_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-scsi", $scsidesc);

# Schema for sataN options.
my $satadesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as SATA hard disk or CD-ROM (n is 0 to " . ($MAX_SATA_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-sata", $satadesc);

# Schema for virtioN options.
my $virtiodesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-drive',
    typetext => $drive_typetext,
    description => "Use volume as VIRTIO hard disk (n is 0 to " . ($MAX_VIRTIO_DISKS - 1) . ").",
};
PVE::JSONSchema::register_standard_option("pve-qm-virtio", $virtiodesc);
521
# Highest valid index per device class, derived from the MAX_* limits so the
# help texts below cannot get out of sync with them.
my $usb_last_index = $MAX_USB_DEVICES - 1;
my $serial_last_index = $MAX_SERIAL_PORTS - 1;
my $parallel_last_index = $MAX_PARALLEL_PORTS - 1;

# Schema for usbN options (USB pass-through).
my $usbdesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-usb-device',
    typetext => 'host=HOSTUSBDEVICE',
    description => <<EODESCR,
Configure an USB device (n is 0 to $usb_last_index). This can be used to
pass-through usb devices to the guest. HOSTUSBDEVICE syntax is:

'bus-port(.port)*' (decimal numbers) or
'vendor_id:product_id' (hexadecimal numbers)

You can use the 'lsusb -t' command to list existing usb devices.

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-usb", $usbdesc);

# Schema for hostpciN options (PCI pass-through).
my $hostpcidesc = {
    optional => 1,
    type => 'string', format => 'pve-qm-hostpci',
    typetext => "HOSTPCIDEVICE",
    description => <<EODESCR,
Map host pci devices. HOSTPCIDEVICE syntax is:

'bus:dev.func' (hexadecimal numbers)

You can use the 'lspci' command to list existing pci devices.

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};
PVE::JSONSchema::register_standard_option("pve-qm-hostpci", $hostpcidesc);

# Schema for serialN options (host serial port mapping).
my $serialdesc = {
    optional => 1,
    type => 'string',
    pattern => '/dev/ttyS\d+',
    description => <<EODESCR,
Map host serial devices (n is 0 to $serial_last_index).

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};

# Schema for parallelN options (host parallel port mapping).
my $paralleldesc= {
    optional => 1,
    type => 'string',
    pattern => '/dev/parport\d+',
    description => <<EODESCR,
Map host parallel devices (n is 0 to $parallel_last_index).

Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.

Experimental: user reported problems with this option.
EODESCR
};
584
# Port and pass-through options: one entry per index, all sharing the
# descriptor of their class.
foreach my $class (
    [ parallel => $MAX_PARALLEL_PORTS, $paralleldesc ],
    [ serial => $MAX_SERIAL_PORTS, $serialdesc ],
    [ hostpci => $MAX_HOSTPCI_DEVICES, $hostpcidesc ],
) {
    my ($prefix, $count, $desc) = @$class;
    $confdesc->{"$prefix$_"} = $desc foreach (0 .. $count - 1);
}

# Disk buses: besides the option descriptor, remember each name as a valid
# drive name.
foreach my $bus (
    [ ide => $MAX_IDE_DISKS, $idedesc ],
    [ sata => $MAX_SATA_DISKS, $satadesc ],
    [ scsi => $MAX_SCSI_DISKS, $scsidesc ],
    [ virtio => $MAX_VIRTIO_DISKS, $virtiodesc ],
) {
    my ($prefix, $count, $desc) = @$bus;
    foreach my $idx (0 .. $count - 1) {
        $drivename_hash->{"$prefix$idx"} = 1;
        $confdesc->{"$prefix$idx"} = $desc;
    }
}

$confdesc->{"usb$_"} = $usbdesc foreach (0 .. $MAX_USB_DEVICES - 1);

# Schema for unusedN options.
my $unuseddesc = {
    optional => 1,
    type => 'string', format => 'pve-volume-id',
    description => "Reference to unused volumes.",
};

$confdesc->{"unused$_"} = $unuseddesc foreach (0 .. $MAX_UNUSED_DISKS - 1);
630
# Cached result of kvm_version(); 0 means "not determined yet".
my $kvm_api_version = 0;

# Return the value reported by the KVM_GET_API_VERSION ioctl on /dev/kvm.
# A true result is cached for later calls. Returns 0 when /dev/kvm cannot be
# opened or the ioctl yields no true value.
sub kvm_version {
    return $kvm_api_version if $kvm_api_version;

    my $fh = IO::File->new("</dev/kvm");
    return 0 if !$fh;

    my $version = $fh->ioctl(KVM_GET_API_VERSION(), 0);
    $kvm_api_version = $version if $version;

    $fh->close();

    return $kvm_api_version;
}
648
# Cached result of kvm_user_version().
my $kvm_user_version;

# Return the version string printed by 'kvm -help', or 'unknown' when the
# output cannot be parsed. The result is computed once and then cached.
sub kvm_user_version {
    if (!$kvm_user_version) {
        $kvm_user_version = 'unknown';

        my $help_text = `kvm -help 2>/dev/null`;
        my $matched = $help_text =~ m/^QEMU( PC)? emulator version (\d+\.\d+(\.\d+)?)[,\s]/;
        $kvm_user_version = $2 if $matched;
    }

    return $kvm_user_version;
}
666
667my $kernel_has_vhost_net = -c '/dev/vhost-net';
668
# Return the list of all possible drive option names.
# The order (ide, scsi, virtio, sata) is significant: it is used to
# autoselect the boot disk.
sub disknames {
    my $enumerate = sub {
        my ($prefix, $count) = @_;
        return map { "$prefix$_" } (0 .. ($count - 1));
    };

    my @ide = $enumerate->('ide', $MAX_IDE_DISKS);
    my @scsi = $enumerate->('scsi', $MAX_SCSI_DISKS);
    my @virtio = $enumerate->('virtio', $MAX_VIRTIO_DISKS);
    my @sata = $enumerate->('sata', $MAX_SATA_DISKS);

    return (@ide, @scsi, @virtio, @sata);
}
676
# Return true if $dev is a known drive option name (e.g. 'ide0').
sub valid_drivename {
    my ($dev) = @_;

    return defined($drivename_hash->{$dev});
}
682
# Return true if $key is a known VM configuration option.
sub option_exists {
    my ($key) = @_;

    return defined($confdesc->{$key});
}
687
# Return the array reference holding the supported NIC model names.
# Note that the shared list itself is returned, not a copy.
sub nic_models {
    my $models = $nic_model_list;

    return $models;
}
691
# Return a hash reference mapping each 'ostype' value to a short
# human-readable operating system name.
sub os_list_description {

    return {
        other => 'Other',
        wxp => 'Windows XP',
        w2k => 'Windows 2000',
        w2k3 => 'Windows 2003',
        w2k8 => 'Windows 2008',
        wvista => 'Windows Vista',
        win7 => 'Windows 7',
        win8 => 'Windows 8/2012',
        l24 => 'Linux 2.4',
        l26 => 'Linux 2.6',
    };
}
707
# Cached result of get_cdrom_path().
my $cdrom_path;

# Return the path of the host CD-ROM device: the first of /dev/cdrom,
# /dev/cdrom1 and /dev/cdrom2 that is a symbolic link. A found path is cached.
# Returns undef when none of the candidates is a symbolic link.
sub get_cdrom_path {

    return $cdrom_path if $cdrom_path;

    foreach my $candidate (qw(/dev/cdrom /dev/cdrom1 /dev/cdrom2)) {
        return $cdrom_path = $candidate if -l $candidate;
    }

    # explicit result instead of falling off the end of the sub
    return undef;
}
718
# Resolve the 'file' value of a CD-ROM drive to a path:
#   'cdrom'           -> whatever get_cdrom_path() returns
#   'none'            -> empty string
#   absolute path     -> returned unchanged
#   anything else     -> resolved through PVE::Storage::path()
# $vmid is accepted but not used here.
sub get_iso_path {
    my ($storecfg, $vmid, $cdrom) = @_;

    return get_cdrom_path() if $cdrom eq 'cdrom';
    return '' if $cdrom eq 'none';
    return $cdrom if $cdrom =~ m|^/|;

    return PVE::Storage::path($storecfg, $cdrom);
}
732
733# try to convert old style file names to volume IDs
# Try to convert an old style file name into a volume ID.
# 'none', 'cdrom', '/dev/...' paths and anything that already looks like
# 'storage:volume' are returned unchanged. Any other value containing a '/'
# yields undef. A plain file name becomes 'local:iso/<file>' for cdrom media
# and 'local:<vmid>/<file>' otherwise.
sub filename_to_volume_id {
    my ($vmid, $file, $media) = @_;

    my $needs_no_conversion = $file eq 'none'
        || $file eq 'cdrom'
        || $file =~ m|^/dev/.+|
        || $file =~ m/^([^:]+):(.+)$/;
    return $file if $needs_no_conversion;

    return undef if $file =~ m|/|;

    my $is_cdrom = $media && $media eq 'cdrom';

    return $is_cdrom ? "local:iso/$file" : "local:$vmid/$file";
}
751
# Check that storage content type $vtype matches the drive's media type:
# 'disk' expects 'images', 'cdrom' expects 'iso'. Nothing is checked when
# $media is not set. A mismatch is reported with raise_param_exc() under the
# option name $opt; any other media value dies with "internal error".
sub verify_media_type {
    my ($opt, $vtype, $media) = @_;

    return if !$media;

    my %expected_type_for = (
        disk => 'images',
        cdrom => 'iso',
    );

    my $etype = $expected_type_for{$media};
    die "internal error" if !defined($etype);

    return if $vtype eq $etype;

    raise_param_exc({ $opt => "unexpected media type ($vtype != $etype)" });
}
770
# Normalize $drive->{file} in place: a filesystem path is converted to a
# volume ID via PVE::Storage::path_to_volume_id(). Values that are 'cdrom',
# 'none', a /dev/ path, a 'storage:volume' ID or purely numeric are left
# alone. Media defaults to 'cdrom' for iso volumes and for 'cdrom'/'none'.
# Raises a parameter exception under $opt if the path belongs to no storage
# or the media type does not fit.
sub cleanup_drive_path {
    my ($opt, $storecfg, $drive) = @_;

    my $file = $drive->{file};

    my $leave_untouched = $file =~ m/^(cdrom|none)$/
        || $file =~ m|^/dev/.+|
        || $file =~ m/^([^:]+):(.+)$/
        || $file =~ m/^\d+$/;

    if (!$leave_untouched) {
        my ($vtype, $volid) = PVE::Storage::path_to_volume_id($storecfg, $drive->{file});
        raise_param_exc({ $opt => "unable to associate path '$drive->{file}' to any storage"}) if !$vtype;
        if (!$drive->{media} && $vtype eq 'iso') {
            $drive->{media} = 'cdrom';
        }
        verify_media_type($opt, $vtype, $drive->{media});
        $drive->{file} = $volid;
    }

    $drive->{media} = 'cdrom' if !$drive->{media} && $drive->{file} =~ m/^(cdrom|none)$/;
}
789
# Write the initial configuration file for VM $vmid from the $settings hash.
# The caller is expected to hold the config lock (hence 'nolock').
# Dies if the configuration file already exists. 'name' defaults to
# "vm$vmid" and 'memory' to the configured default. Keys unknown to
# $confdesc are skipped.
sub create_conf_nolock {
    my ($vmid, $settings) = @_;

    my $filename = config_file($vmid);

    die "configuration file '$filename' already exists\n" if -f $filename;

    my $defaults = load_defaults();

    $settings->{name} = "vm$vmid" if !$settings->{name};
    $settings->{memory} = $defaults->{memory} if !$settings->{memory};

    my $data = '';
    # sorted so the generated file is deterministic
    foreach my $opt (sort keys %$settings) {
        next if !$confdesc->{$opt};

        my $value = $settings->{$opt};
        # Only skip unset values. An explicit 0 (e.g. 'kvm: 0', 'acpi: 0')
        # is meaningful and must be written, otherwise the option silently
        # falls back to its default.
        next if !defined($value) || $value eq '';

        $data .= "$opt: $value\n";
    }

    PVE::Tools::file_set_contents($filename, $data);
}
814
# Convert a size string such as '512', '1.5M' or '32G' into an integer number
# of bytes. The optional suffix K, M or G multiplies by powers of 1024.
# Returns undef when the value does not have that form.
my $parse_size = sub {
    my ($value) = @_;

    return undef unless $value =~ m/^(\d+(\.\d+)?)([KMG])?$/;

    my ($number, $suffix) = ($1, $3);

    my %factor_for = (
        K => 1024,
        M => 1024 * 1024,
        G => 1024 * 1024 * 1024,
    );
    $number = $number * $factor_for{$suffix} if $suffix;

    return int($number);
};
831
# Format a byte count using the largest of the suffixes K, M, G that divides
# it without remainder. A value that is not a multiple of 1024 is returned as
# a plain integer.
my $format_size = sub {
    my ($size) = @_;

    my $value = int($size);
    my $suffix = '';

    # step up one unit at a time while the value divides evenly by 1024
    foreach my $next_suffix (qw(K M G)) {
        my $scaled = int($value / 1024);
        last if $scaled * 1024 != $value;
        ($value, $suffix) = ($scaled, $next_suffix);
    }

    return $suffix ? "$value$suffix" : $value;
};
848
# ideX = [volume=]volume-id[,media=d][,cyls=c,heads=h,secs=s[,trans=t]]
#        [,snapshot=on|off][,cache=none|writethrough|writeback|unsafe|directsync]
#        [,format=f][,backup=yes|no]
#        [,rerror=ignore|report|stop][,werror=enospc|ignore|report|stop]
#        [,aio=native|threads]

# Parse the value of a drive option into a hash reference.
#
# $key  - option name such as 'ide0'; split into {interface} and {index}.
#         May be undef (used to verify JSON parameters), in which case the
#         interface is reported as 'unknown'.
# $data - comma separated option string, see the syntax above.
#
# Throttling values given in bytes (bps, bps_rd, bps_wr) are converted to the
# corresponding mbps* keys. A 'size' value is converted to bytes.
# Returns undef if the key or any part of the value is invalid.
sub parse_drive {
    my ($key, $data) = @_;

    my $res = {};

    # $key may be undefined - used to verify JSON parameters
    if (!defined($key)) {
        $res->{interface} = 'unknown'; # should not harm when used to verify parameters
        $res->{index} = 0;
    } elsif ($key =~ m/^([^\d]+)(\d+)$/) {
        $res->{interface} = $1;
        $res->{index} = $2;
    } else {
        return undef;
    }

    # nothing to parse - treated like a value without volume
    return undef if !defined($data);

    foreach my $p (split (/,/, $data)) {
        next if $p =~ m/^\s*$/;

        if ($p =~ m/^(file|volume|cyls|heads|secs|trans|media|snapshot|cache|format|rerror|werror|backup|aio|bps|mbps|bps_rd|mbps_rd|bps_wr|mbps_wr|iops|iops_rd|iops_wr|size)=(.+)$/) {
            my ($k, $v) = ($1, $2);

            $k = 'file' if $k eq 'volume';

            # every setting may be given only once
            return undef if defined $res->{$k};

            if ($k eq 'bps' || $k eq 'bps_rd' || $k eq 'bps_wr') {
                # must be a plain positive integer; anchored at both ends so
                # that values like '123abc' are rejected
                return undef if !$v || $v !~ m/^\d+$/;
                $k = "m$k";
                $v = sprintf("%.3f", $v / (1024*1024));
            }
            $res->{$k} = $v;
        } else {
            # a bare word without '=' is the volume, but only once
            if (!$res->{file} && $p !~ m/=/) {
                $res->{file} = $p;
            } else {
                return undef;
            }
        }
    }

    return undef if !$res->{file};

    # allowed values per setting; only settings with a true value are checked
    my %pattern_for = (
        cache => qr/^(off|none|writethrough|writeback|unsafe|directsync)$/,
        snapshot => qr/^(on|off)$/,
        cyls => qr/^\d+$/,
        heads => qr/^\d+$/,
        secs => qr/^\d+$/,
        media => qr/^(disk|cdrom)$/,
        trans => qr/^(none|lba|auto)$/,
        format => qr/^(raw|cow|qcow|qcow2|vmdk|cloop)$/,
        rerror => qr/^(ignore|report|stop)$/,
        werror => qr/^(enospc|ignore|report|stop)$/,
        backup => qr/^(yes|no)$/,
        aio => qr/^(native|threads)$/,
        mbps => qr/^\d+(\.\d+)?$/,
        mbps_rd => qr/^\d+(\.\d+)?$/,
        mbps_wr => qr/^\d+(\.\d+)?$/,
        iops => qr/^\d+$/,
        iops_rd => qr/^\d+$/,
        iops_wr => qr/^\d+$/,
    );
    foreach my $opt (keys %pattern_for) {
        return undef if $res->{$opt} && $res->{$opt} !~ $pattern_for{$opt};
    }

    # a total limit excludes separate read/write limits
    return undef if $res->{mbps} && ($res->{mbps_rd} || $res->{mbps_wr});
    return undef if $res->{iops} && ($res->{iops_rd} || $res->{iops_wr});

    if ($res->{size}) {
        return undef if !defined($res->{size} = &$parse_size($res->{size}));
    }

    if ($res->{media} && ($res->{media} eq 'cdrom')) {
        return undef if $res->{snapshot} || $res->{trans} || $res->{format};
        return undef if $res->{heads} || $res->{secs} || $res->{cyls};
        return undef if $res->{interface} eq 'virtio';
    }

    # rerror does not work with scsi drives
    if ($res->{rerror}) {
        return undef if $res->{interface} eq 'scsi';
    }

    return $res;
}
943
# Drive settings that print_drive() emits first, in this order.
my @qemu_drive_options = qw(heads secs cyls trans media format cache snapshot rerror werror aio iops iops_rd iops_wr);

# Serialize a parsed drive hash back into its configuration string:
# the volume followed by ',key=value' for every setting with a true value,
# and finally the size, if set. $vmid is accepted but not used.
sub print_drive {
    my ($vmid, $drive) = @_;

    my @parts = ($drive->{file});

    my @printable = (@qemu_drive_options, 'mbps', 'mbps_rd', 'mbps_wr', 'backup');
    push @parts, map { "$_=$drive->{$_}" } grep { $drive->{$_} } @printable;

    push @parts, "size=" . &$format_size($drive->{size}) if $drive->{size};

    return join(',', @parts);
}
960
# Send a SCSI INQUIRY command to the device behind file handle $fh using the
# SCSI generic (sg) ioctl interface.
#
# Returns a hash reference with the keys device, removable, vendor, product
# and revision, unpacked from the 36 byte response. The vendor string is also
# stored under the historic, misspelled key 'venodor' for existing callers.
#
# On failure the function dies, or returns undef if $noerr is true.
sub scsi_inquiry {
    my($fh, $noerr) = @_;

    # ioctl request codes of the sg driver
    my $SG_IO = 0x2285;
    my $SG_GET_VERSION_NUM = 0x2282;

    my $versionbuf = "\x00" x 8;
    my $ret = ioctl($fh, $SG_GET_VERSION_NUM, $versionbuf);
    if (!$ret) {
        die "scsi ioctl SG_GET_VERSION_NUM failed - $!\n" if !$noerr;
        return undef;
    }
    my $version = unpack("I", $versionbuf);
    if ($version < 30000) {
        die "scsi generic interface too old\n" if !$noerr;
        return undef;
    }

    my $buf = "\x00" x 36;
    my $sensebuf = "\x00" x 8;
    # command block: opcode 0x12, with the response length (36) in byte 4
    my $cmd = pack("C x3 C x11", 0x12, 36);

    # see /usr/include/scsi/sg.h
    my $sg_io_hdr_t = "i i C C s I P P P I I i P C C C C S S i I I";

    # 'P' packs pointers to $buf, $cmd and $sensebuf, so these variables must
    # stay alive and unmodified until the ioctl has returned
    my $packet = pack($sg_io_hdr_t, ord('S'), -3, length($cmd),
                      length($sensebuf), 0, length($buf), $buf,
                      $cmd, $sensebuf, 6000);

    $ret = ioctl($fh, $SG_IO, $packet);
    if (!$ret) {
        die "scsi ioctl SG_IO failed - $!\n" if !$noerr;
        return undef;
    }

    my @res = unpack($sg_io_hdr_t, $packet);
    # fields 17 and 18 of the template above: any non-zero value is an error
    if ($res[17] || $res[18]) {
        die "scsi ioctl SG_IO status error - $!\n" if !$noerr;
        return undef;
    }

    my $res = {};
    ($res->{device}, $res->{removable}, $res->{vendor},
     $res->{product}, $res->{revision}) = unpack("C C x6 A8 A16 A4", $buf);

    # backward compatibility: earlier versions only provided this key
    $res->{venodor} = $res->{vendor};

    return $res;
}
1008
# Test whether $path answers a SCSI inquiry.
#
# Opens $path read/write and runs scsi_inquiry() on it in "noerr" mode.
# Returns the inquiry result (hash ref) on success, undef if the path can
# not be opened or the inquiry fails.
sub path_is_scsi {
    my ($path) = @_;

    # pass the mode as a separate argument - with a single "+<$path"
    # argument the path itself takes part in the open mode parsing
    my $fh = IO::File->new($path, '+<') || return undef;
    my $res = scsi_inquiry($fh, 1);
    close($fh);

    return $res;
}
1018
# Build the value of the QEMU '-device' argument for one drive.
#
# $storecfg - storage configuration, used to resolve volume IDs to paths
# $conf     - VM configuration (only 'scsihw' is read here)
# $vmid     - not used by this function
# $drive    - parsed drive hash (interface, index, file, media, bootindex)
# $bridges  - passed through to print_pci_addr()
#
# Dies for the 'usb' interface (not implemented) and for unknown interfaces.
sub print_drivedevice_full {
    my ($storecfg, $conf, $vmid, $drive, $bridges) = @_;

    my $interface = $drive->{interface};
    my $index = $drive->{index};

    # every device string ends with the same drive/id pair, e.g.
    # "drive=drive-virtio0,id=virtio0"
    my $id = "$interface$index";
    my $common = "drive=drive-$id,id=$id";

    my $device = '';

    if ($interface eq 'virtio') {
        my $pciaddr = print_pci_addr($id, $bridges);
        $device = "virtio-blk-pci,$common$pciaddr";
    } elsif ($interface eq 'scsi') {
        # no scsihw setting means the lsi controller
        my $is_lsi = !$conf->{scsihw} || $conf->{scsihw} eq 'lsi';
        my $maxdev = $is_lsi ? 7 : 256;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;

        my $devicetype = 'hd';
        if (drive_is_cdrom($drive)) {
            $devicetype = 'cd';
        } else {
            my $file = $drive->{file};
            my $path = ($file =~ m|^/|) ? $file : PVE::Storage::path($storecfg, $file);

            if ($path =~ m/^iscsi\:\/\//) {
                $devicetype = 'generic';
            } elsif (path_is_scsi($path)) {
                $devicetype = 'block';
            }
        }

        if ($is_lsi) {
            $device = "scsi-$devicetype,bus=scsihw$controller.0,scsi-id=$unit,$common";
        } else {
            $device = "scsi-$devicetype,bus=scsihw$controller.0,channel=0,scsi-id=0,lun=$index,$common";
        }
    } elsif ($interface eq 'ide') {
        my $maxdev = 2;
        my $controller = int($index / $maxdev);
        my $unit = $index % $maxdev;
        my $is_cdrom = $drive->{media} && $drive->{media} eq 'cdrom';
        my $devicetype = $is_cdrom ? "cd" : "hd";

        $device = "ide-$devicetype,bus=ide.$controller,unit=$unit,$common";
    } elsif ($interface eq 'sata') {
        my $controller = int($index / $MAX_SATA_DISKS);
        my $unit = $index % $MAX_SATA_DISKS;

        $device = "ide-drive,bus=ahci$controller.$unit,$common";
    } elsif ($interface eq 'usb') {
        # -device ide-drive,bus=ide.1,unit=0,drive=drive-ide0-1-0,id=ide0-1-0
        die "implement me";
    } else {
        die "unsupported interface type";
    }

    if ($drive->{bootindex}) {
        $device .= ",bootindex=$drive->{bootindex}";
    }

    return $device;
}
1079
# Build the value of the QEMU '-drive' argument for one drive.
#
# $storecfg - storage configuration, used to resolve volume IDs to paths
# $vmid     - VM id, passed to get_iso_path() for cdrom drives
# $drive    - parsed drive hash
#
# The mbps* settings of the drive are converted to bytes per second
# (bps, bps_rd, bps_wr).
sub print_drive_full {
    my ($storecfg, $vmid, $drive) = @_;

    my @opts;

    foreach my $name (grep { $_ ne 'bootindex' } @qemu_drive_options) {
        my $value = $drive->{$name};
        push @opts, "$name=$value" if $value;
    }

    foreach my $limit (qw(bps bps_rd bps_wr)) {
        my $mbps = $drive->{"m$limit"};
        push @opts, "$limit=" . int($mbps*1024*1024) if $mbps;
    }

    # use linux-aio by default (qemu default is threads)
    push @opts, "aio=native" if !$drive->{aio};

    my $volid = $drive->{file};
    my $path;
    if (drive_is_cdrom($drive)) {
        $path = get_iso_path($storecfg, $vmid, $volid);
    } elsif ($volid =~ m|^/|) {
        # absolute paths are used as they are
        $path = $volid;
    } else {
        $path = PVE::Storage::path($storecfg, $volid);
    }

    my $pathinfo = '';
    $pathinfo = "file=$path," if $path;

    return join(',', "${pathinfo}if=none,id=drive-$drive->{interface}$drive->{index}", @opts);
}
1113
# Build the value of the QEMU '-device' argument for one network card.
#
# $vmid    - not used by this function
# $conf    - VM configuration (only 'boot' is read here)
# $net     - parsed network hash (model, macaddr, bootindex)
# $netid   - device id, also used as the netdev name
# $bridges - passed through to print_pci_addr()
sub print_netdevice_full {
    my ($vmid, $conf, $net, $netid, $bridges) = @_;

    my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};

    # the 'virtio' model is called virtio-net-pci on the qemu side
    my $device = ($net->{model} eq 'virtio') ? 'virtio-net-pci' : $net->{model};

    # qemu > 0.15 always try to boot from network - we disable that by
    # not loading the pxe rom file
    my $extra = ($bootorder =~ m/n/) ? '' : "romfile=,";

    my $pciaddr = print_pci_addr("$netid", $bridges);

    my @parts = (
        "$device,${extra}mac=$net->{macaddr}",
        "netdev=$netid$pciaddr",
        "id=$netid",
    );
    push @parts, "bootindex=$net->{bootindex}" if $net->{bootindex};

    return join(',', @parts);
}
1132
# Build the value of the QEMU '-netdev' argument for one network card.
#
# $vmid  - VM id, part of the tap interface name
# $conf  - VM configuration (only 'name' is read here)
# $net   - parsed network hash (model, bridge)
# $netid - device id, must look like "net<N>" with N below $MAX_NETS
#
# Returns a "type=tap,..." string when the card is attached to a bridge,
# otherwise a "type=user,..." string.
# Dies on an invalid $netid or if the tap interface name gets too long.
sub print_netdev_full {
    my ($vmid, $conf, $net, $netid) = @_;

    # reject everything that is not "net<N>" - an unparsable id must not
    # silently end up as interface "tap<vmid>i"
    die "got strange net id '$netid'\n" if $netid !~ m/^net(\d+)$/;
    my $i = int($1);

    die "got strange net id '$netid'\n" if $i >= ${MAX_NETS};

    my $ifname = "tap${vmid}i$i";

    # kvm uses TUNSETIFF ioctl, and that limits ifname length
    die "interface name '$ifname' is too long (max 15 character)\n"
        if length($ifname) >= 16;

    my $vhostparam = '';
    $vhostparam = ',vhost=on' if $kernel_has_vhost_net && $net->{model} eq 'virtio';

    my $vmname = $conf->{name} || "vm$vmid";

    if ($net->{bridge}) {
        return "type=tap,id=$netid,ifname=${ifname},script=/var/lib/qemu-server/pve-bridge$vhostparam";
    } else {
        return "type=user,id=$netid,hostname=$vmname";
    }
}
1160
# Return a true value if the parsed drive hash describes a cdrom
# (media eq 'cdrom'), a false value otherwise - also for a missing drive.
sub drive_is_cdrom {
    my ($drive) = @_;

    return $drive if !$drive;

    my $media = $drive->{media};
    return $media if !$media;

    return $media eq 'cdrom';
}
1167
# Parse a host PCI device id of the form "bb:dd.f" (lower case hex digits).
#
# Returns { pciid => $value } for a valid id, undef for an empty or
# malformed value.
sub parse_hostpci {
    my ($value) = @_;

    return undef if !$value;

    # \A and \z instead of ^ and $: '$' also matches in front of a trailing
    # newline, which would let "00:1f.0\n" through
    return undef if $value !~ m/\A[a-f0-9]{2}:[a-f0-9]{2}\.[a-f0-9]\z/;

    return { pciid => $value };
}
1183
# netX: e1000=XX:XX:XX:XX:XX:XX,bridge=vmbr0,rate=<mbps>,tag=<number>
#
# Parse a network device setting into a hash with the keys model, macaddr
# and (optional) bridge, rate, tag. The model name is lower-cased, the MAC
# address upper-cased; a missing MAC address is replaced by a random one.
#
# Returns undef if an item is not understood or if no model is given.
sub parse_net {
    my ($data) = @_;

    my $net = {};

    foreach my $item (split(/,/, $data)) {

        if ($item =~ m/^(ne2k_pci|e1000|rtl8139|pcnet|virtio|ne2k_isa|i82551|i82557b|i82559er)(=([0-9a-f]{2}(:[0-9a-f]{2}){5}))?$/i) {
            $net->{model} = lc($1);
            $net->{macaddr} = uc($3) || PVE::Tools::random_ether_addr();
            next;
        }

        if ($item =~ m/^bridge=(\S+)$/) {
            $net->{bridge} = $1;
            next;
        }

        if ($item =~ m/^rate=(\d+(\.\d+)?)$/) {
            $net->{rate} = $1;
            next;
        }

        if ($item =~ m/^tag=(\d+)$/) {
            $net->{tag} = $1;
            next;
        }

        # unknown item
        return undef;
    }

    return undef if !$net->{model};

    return $net;
}
1213
# Serialize a parsed network hash (see parse_net) into its configuration
# string: "<model>[=<macaddr>][,bridge=..][,rate=..][,tag=..]".
# Settings with a false value are left out.
sub print_net {
    my $net = shift;

    my $head = "$net->{model}";
    $head .= "=$net->{macaddr}" if $net->{macaddr};

    my @parts = ($head);
    foreach my $opt (qw(bridge rate tag)) {
        push @parts, "$opt=$net->{$opt}" if $net->{$opt};
    }

    return join(',', @parts);
}
1225
# Rewrite all parsable "net<N>" entries of $settings (in place) through
# parse_net()/print_net(). parse_net() fills in a random MAC address when
# none is given, so afterwards every such entry carries one.
# Entries which can not be parsed are left untouched.
sub add_random_macs {
    my ($settings) = @_;

    my @netkeys = grep { m/^net(\d+)$/ } keys %$settings;

    foreach my $key (@netkeys) {
        my $parsed = parse_net($settings->{$key});
        $settings->{$key} = print_net($parsed) if $parsed;
    }
}
1236
# Store $volid in the free "unused<N>" slot with the lowest index.
#
# Returns the key used. Returns nothing (and changes nothing) if the volume
# is already listed in one of the slots. Dies if all slots are occupied.
sub add_unused_volume {
    my ($config, $volid) = @_;

    my $free_key;

    # walk down from the highest index, so the last free slot remembered
    # is the one with the lowest index
    foreach my $ind (reverse(0 .. $MAX_UNUSED_DISKS - 1)) {
        my $name = "unused$ind";
        my $current = $config->{$name};

        if (!$current) {
            $free_key = $name;
            next;
        }

        return if $current eq $volid; # do not add duplicates
    }

    die "To many unused volume - please delete them first.\n" if !$free_key;

    $config->{$free_key} = $volid;

    return $free_key;
}
1256
PVE::JSONSchema::register_format('pve-qm-bootdisk', \&verify_bootdisk);
# Checker for the 'pve-qm-bootdisk' format: the value has to be a valid
# drive name. Returns the value if it is valid; otherwise returns undef
# when $noerr is set and dies when it is not.
sub verify_bootdisk {
    my ($value, $noerr) = @_;

    if (!valid_drivename($value)) {
        die "invalid boot disk '$value'\n" if !$noerr;
        return undef;
    }

    return $value;
}
1267
PVE::JSONSchema::register_format('pve-qm-net', \&verify_net);
# Checker for the 'pve-qm-net' format: the value has to be accepted by
# parse_net(). Returns the value if it is valid; otherwise returns undef
# when $noerr is set and dies when it is not.
sub verify_net {
    my ($value, $noerr) = @_;

    if (!parse_net($value)) {
        die "unable to parse network options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1278
PVE::JSONSchema::register_format('pve-qm-drive', \&verify_drive);
# Checker for the 'pve-qm-drive' format: the value has to be accepted by
# parse_drive() (called without a drive key). Returns the value if it is
# valid; otherwise returns undef when $noerr is set and dies when it is not.
sub verify_drive {
    my ($value, $noerr) = @_;

    if (!parse_drive(undef, $value)) {
        die "unable to parse drive options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1289
PVE::JSONSchema::register_format('pve-qm-hostpci', \&verify_hostpci);
# Checker for the 'pve-qm-hostpci' format: the value has to be accepted by
# parse_hostpci(). Returns the value if it is valid; otherwise returns undef
# when $noerr is set and dies when it is not.
sub verify_hostpci {
    my ($value, $noerr) = @_;

    if (!parse_hostpci($value)) {
        die "unable to parse pci id\n" if !$noerr;
        return undef;
    }

    return $value;
}
1300
PVE::JSONSchema::register_format('pve-qm-watchdog', \&verify_watchdog);
# Checker for the 'pve-qm-watchdog' format: the value has to be accepted by
# parse_watchdog(). Returns the value if it is valid; otherwise returns
# undef when $noerr is set and dies when it is not.
sub verify_watchdog {
    my ($value, $noerr) = @_;

    if (!parse_watchdog($value)) {
        die "unable to parse watchdog options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1311
# Parse a watchdog setting: a comma separated list of
#   [model=](i6300esb|ib700)
#   [action=](reset|shutdown|poweroff|pause|debug|none)
#
# Returns a hash ref with the keys found (model, action); undef for an
# empty value or if an item is not understood. Blank items are skipped.
sub parse_watchdog {
    my ($value) = @_;

    return undef if !$value;

    my %watchdog;

    foreach my $item (grep { $_ !~ m/^\s*$/ } split(/,/, $value)) {
        if ($item =~ m/^(model=)?(i6300esb|ib700)$/) {
            $watchdog{model} = $2;
        } elsif ($item =~ m/^(action=)?(reset|shutdown|poweroff|pause|debug|none)$/) {
            $watchdog{action} = $2;
        } else {
            return undef;
        }
    }

    return \%watchdog;
}
1333
PVE::JSONSchema::register_format('pve-qm-startup', \&verify_startup);
# Checker for the 'pve-qm-startup' format: the value has to be accepted by
# parse_startup(). Returns the value if it is valid; otherwise returns undef
# when $noerr is set and dies when it is not.
sub verify_startup {
    my ($value, $noerr) = @_;

    if (!parse_startup($value)) {
        die "unable to parse startup options\n" if !$noerr;
        return undef;
    }

    return $value;
}
1344
# Parse a startup setting: a comma separated list of
#   [order=]<number>, up=<number>, down=<number>
#
# Returns a hash ref with the keys found (order, up, down); undef for an
# empty value or if an item is not understood. Blank items are skipped.
sub parse_startup {
    my ($value) = @_;

    return undef if !$value;

    my %startup;

    foreach my $item (grep { $_ !~ m/^\s*$/ } split(/,/, $value)) {
        if ($item =~ m/^(order=)?(\d+)$/) {
            $startup{order} = $2;
        } elsif ($item =~ m/^up=(\d+)$/) {
            $startup{up} = $1;
        } elsif ($item =~ m/^down=(\d+)$/) {
            $startup{down} = $1;
        } else {
            return undef;
        }
    }

    return \%startup;
}
1368
# Parse a USB device setting. Each comma separated item is either
#   host=[0x]<vendor>:[0x]<product>   (4 hex digits each), or
#   host=<bus>-<port>[.<port>...]
#
# Returns a hash ref with vendorid/productid and/or hostbus/hostport;
# undef for an empty value, an unknown item, or if no item was found.
sub parse_usb_device {
    my ($value) = @_;

    return undef if !$value;

    my $usb = {};
    my $matched = 0;

    foreach my $spec (split(/,/, $value)) {
        if ($spec =~ m/^host=(0x)?([0-9A-Fa-f]{4}):(0x)?([0-9A-Fa-f]{4})$/) {
            @$usb{qw(vendorid productid)} = ($2, $4);
        } elsif ($spec =~ m/^host=(\d+)\-(\d+(\.\d+)*)$/) {
            @$usb{qw(hostbus hostport)} = ($1, $2);
        } else {
            return undef;
        }
        $matched++;
    }

    return $matched ? $usb : undef;
}
1395
PVE::JSONSchema::register_format('pve-qm-usb-device', \&verify_usb_device);
# Checker for the 'pve-qm-usb-device' format: the value has to be accepted
# by parse_usb_device(). Returns the value if it is valid; otherwise returns
# undef when $noerr is set and dies when it is not.
sub verify_usb_device {
    my ($value, $noerr) = @_;

    if (!parse_usb_device($value)) {
        die "unable to parse usb device\n" if !$noerr;
        return undef;
    }

    return $value;
}
1406
# add JSON properties for create and set function
#
# Copies every option description from $confdesc into the hash $prop,
# except for 'parent', 'snaptime' and 'vmstate'. Returns $prop.
sub json_config_properties {
    my $prop = shift;

    my %skip = map { $_ => 1 } qw(parent snaptime vmstate);

    foreach my $opt (grep { !$skip{$_} } keys %$confdesc) {
        $prop->{$opt} = $confdesc->{$opt};
    }

    return $prop;
}
1418
# Validate $value against the type declared for setting $key in $confdesc
# and return the normalized value:
#   boolean - 1 or 0 (accepts 1/on/yes/true and 0/off/no/false)
#   integer - int() of an unsigned decimal number
#   number  - the value itself (unsigned decimal, optional fraction)
#   string  - the value itself; checked against the declared format, if
#             any, else one pair of surrounding double quotes is removed
#
# Dies on unknown settings, undefined values, values containing a line
# feed or carriage return, and on values which fail the type check.
sub check_type {
    my ($key, $value) = @_;

    my $desc = $confdesc->{$key};
    die "unknown setting '$key'\n" if !$desc;

    die "got undefined value\n" if !defined($value);

    die "property contains a line feed\n" if $value =~ m/[\n\r]/;

    my $type = $desc->{type};

    if ($type eq 'boolean') {
        return 1 if ($value eq '1') || ($value =~ m/^(on|yes|true)$/i);
        return 0 if ($value eq '0') || ($value =~ m/^(off|no|false)$/i);
        die "type check ('boolean') failed - got '$value'\n";
    }

    if ($type eq 'integer') {
        return int($1) if $value =~ m/^(\d+)$/;
        die "type check ('integer') failed - got '$value'\n";
    }

    if ($type eq 'number') {
        return $value if $value =~ m/^(\d+)(\.\d+)?$/;
        die "type check ('number') failed - got '$value'\n";
    }

    die "internal error" if $type ne 'string';

    my $fmt = $desc->{format};
    if (!$fmt) {
        $value =~ s/^\"(.*)\"$/$1/;
        return $value;
    }

    if ($fmt eq 'pve-qm-drive') {
        # special case - we need to pass $key to parse_drive()
        return $value if parse_drive($key, $value);
        die "unable to parse drive options\n";
    }

    PVE::JSONSchema::check_format($fmt, $value);
    return $value;
}
1461
# Run $code->(@param) through lock_file() on the lock file of VM $vmid,
# using $timeout as the lock timeout.
#
# Returns what lock_file() returns; an error left in $@ by lock_file()
# is re-thrown.
sub lock_config_full {
    my ($vmid, $timeout, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);

    my $result = lock_file($lockfile, $timeout, $code, @param);

    if ($@) {
        die $@;
    }

    return $result;
}
1473
# Same as lock_config_full(), with a fixed timeout value of 10.
sub lock_config {
    my ($vmid, $code, @param) = @_;

    my $timeout = 10;

    return lock_config_full($vmid, $timeout, $code, @param);
}
1479
# Return the configuration path of VM $vmid relative to the cluster file
# system: "nodes/<node>/qemu-server/<vmid>.conf".
# $node defaults to $nodename when it is not given.
sub cfs_config_path {
    my ($vmid, $node) = @_;

    $node ||= $nodename;

    return join('/', 'nodes', $node, 'qemu-server', "$vmid.conf");
}
1486
# Report whether IOMMU is supported. Placeholder: always returns 1.
sub check_iommu_support {
    #fixme : need to check IOMMU support
    #http://www.linux-kvm.org/page/How_to_assign_devices_with_VT-d_in_KVM

    return 1;
}
1495
# Return the absolute path of the configuration file of VM $vmid:
# "/etc/pve/" followed by cfs_config_path($vmid, $node).
sub config_file {
    my ($vmid, $node) = @_;

    return "/etc/pve/" . cfs_config_path($vmid, $node);
}
1502
# Return the path of the lock file used for VM $vmid:
# "<$lock_dir>/lock-<vmid>.conf".
sub config_file_lock {
    my ($vmid) = @_;

    return join('/', $lock_dir, "lock-$vmid.conf");
}
1508
# Set access and modification time of the configuration file of VM $vmid
# to the current time (utime with undef timestamps).
sub touch_config {
    my ($vmid) = @_;

    my $path = config_file($vmid);

    utime(undef, undef, $path);
}
1515
# Destroy VM $vmid: free its disks and remove (or reset) its configuration.
#
# $storecfg          - storage configuration
# $vmid              - id of the VM
# $keep_empty_config - if true, the configuration file is replaced by a
#                      minimal one ("memory: 128") instead of being deleted
#
# Dies if the configuration can not be loaded or if the VM is locked.
# Errors while removing left-over volumes are only reported as warnings.
sub destroy_vm {
    my ($storecfg, $vmid, $keep_empty_config) = @_;

    my $conffile = config_file($vmid);

    my $conf = load_config($vmid);

    check_lock($conf);

    # only remove disks owned by this VM
    my $free_owned_disk = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};

        # nothing to free for empty entries and absolute paths
        return if !$volid || $volid =~ m|^/|;

        my ($path, $owner) = PVE::Storage::path($storecfg, $volid);
        return if !$path || !$owner || ($owner != $vmid);

        PVE::Storage::vdisk_free($storecfg, $volid);
    };
    foreach_drive($conf, $free_owned_disk);

    if (!$keep_empty_config) {
        unlink $conffile;
    } else {
        PVE::Tools::file_set_contents($conffile, "memory: 128\n");
    }

    # also remove unused disk
    eval {
        my $dl = PVE::Storage::vdisk_list($storecfg, undef, $vmid);

        my $free_volume = sub {
            my ($volid, $sid, $volname, $d) = @_;
            PVE::Storage::vdisk_free($storecfg, $volid);
        };

        eval { PVE::Storage::foreach_volid($dl, $free_volume); };
        warn $@ if $@;

    };
    warn $@ if $@;
}
1562
# Read the configuration of VM $vmid (on node $node, see cfs_config_path)
# through PVE::Cluster::cfs_read_file().
# Dies with "no such VM" if no configuration is returned.
sub load_config {
    my ($vmid, $node) = @_;

    my $conf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid, $node));

    if (!defined($conf)) {
        die "no such VM ('$vmid')\n";
    }

    return $conf;
}
1574
# Parse the raw text of a VM configuration file.
#
# $filename - path of the file; has to end in "/qemu-server/<vmid>.conf"
# $raw      - file content, or undef
#
# Returns undef if $raw is undef. Otherwise returns a hash ref with
#   digest    - SHA1 hex digest of $raw
#   snapshots - { <name> => { settings... } }, one entry per "[name]" section
#   ...       - the settings in front of the first section
# Comment lines ("#...") and 'description:' lines are collected into the
# 'description' of the section they belong to. Values which fail
# check_type() are skipped with a warning. A 'cdrom' setting is stored
# as 'ide2'.
#
# Dies if $filename does not have the expected form.
sub parse_vm_config {
    my ($filename, $raw) = @_;

    return undef if !defined($raw);

    my $res = {
        digest => Digest::SHA::sha1_hex($raw),
        snapshots => {},
    };

    $filename =~ m|/qemu-server/(\d+)\.conf$|
        || die "got strange filename '$filename'";

    my $vmid = $1;

    # $conf always points to the section currently being filled
    my $conf = $res;
    my $descr = '';

    my @lines = split(/\n/, $raw);
    foreach my $line (@lines) {
        next if $line =~ m/^\s*$/;

        if ($line =~ m/^\[([a-z][a-z0-9_\-]+)\]\s*$/i) {
            # a new snapshot section starts - finish the previous section
            my $snapname = $1;
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{snapshots}->{$snapname} = {};
            next;
        }

        if ($line =~ m/^\#(.*)\s*$/) {
            $descr .= PVE::Tools::decode_text($1) . "\n";
            next;
        }

        if ($line =~ m/^(description):\s*(.*\S)\s*$/) {
            $descr .= PVE::Tools::decode_text($2);
        } elsif ($line =~ m/^snapstate:\s*(prepare|delete)\s*$/) {
            # anchored at the start of the line: this test runs before the
            # free-form 'args:' test below, and must not match an args
            # value which merely ends in "snapstate: <state>"
            $conf->{snapstate} = $1;
        } elsif ($line =~ m/^(args):\s*(.*\S)\s*$/) {
            my $key = $1;
            my $value = $2;
            $conf->{$key} = $value;
        } elsif ($line =~ m/^([a-z][a-z_]*\d*):\s*(\S+)\s*$/) {
            my $key = $1;
            my $value = $2;
            eval { $value = check_type($key, $value); };
            if ($@) {
                warn "vm $vmid - unable to parse value of '$key' - $@";
            } else {
                my $fmt = $confdesc->{$key}->{format};
                if ($fmt && $fmt eq 'pve-qm-drive') {
                    # store drives with the file name converted to a volume ID
                    my $v = parse_drive($key, $value);
                    if (my $volid = filename_to_volume_id($vmid, $v->{file}, $v->{media})) {
                        $v->{file} = $volid;
                        $value = print_drive($vmid, $v);
                    } else {
                        warn "vm $vmid - unable to parse value of '$key'\n";
                        next;
                    }
                }

                if ($key eq 'cdrom') {
                    $conf->{ide2} = $value;
                } else {
                    $conf->{$key} = $value;
                }
            }
        }
    }

    $conf->{description} = $descr if $descr;

    delete $res->{snapstate}; # just to be sure

    return $res;
}
1652
# Serialize a VM configuration hash into the raw text of its config file.
#
# $filename - not used by this function
# $conf     - configuration hash; it is normalized in place:
#             'snapstate' is removed from the top level, 'cdrom' becomes
#             'ide2', 'smp' is converted to 'sockets', every value is
#             replaced by the result of check_type(), and 'unusedX' entries
#             pointing to a volume used by a drive are dropped
#
# Returns the text: the main section followed by one "[name]" section per
# snapshot, each with its description as leading comment lines.
# Dies if 'cdrom' conflicts with 'ide2' or if a value fails check_type().
sub write_vm_config {
    my ($filename, $conf) = @_;

    delete $conf->{snapstate}; # just to be sure

    if ($conf->{cdrom}) {
        die "option ide2 conflicts with cdrom\n" if $conf->{ide2};
        $conf->{ide2} = delete $conf->{cdrom};
    }

    # we do not use 'smp' any longer
    if (!$conf->{sockets} && $conf->{smp}) {
        $conf->{sockets} = $conf->{smp};
        delete $conf->{cores};
    }
    delete $conf->{smp} if $conf->{sockets};

    my $used_volids = {};

    # keys which are not checked by check_type()
    my %unchecked = map { $_ => 1 } qw(digest description snapshots snapstate);

    my $check_section = sub {
        my ($section) = @_;

        foreach my $key (grep { !$unchecked{$_} } keys %$section) {
            my $checked = eval { check_type($key, $section->{$key}) };
            die "unable to parse value of '$key' - $@" if $@;

            $section->{$key} = $checked;

            next if !valid_drivename($key);

            # remember the volumes referenced by drives
            my $drive = parse_drive($key, $checked);
            $used_volids->{$drive->{file}} = 1 if $drive && $drive->{file};
        }
    };

    $check_section->($conf);
    foreach my $snapname (keys %{$conf->{snapshots}}) {
        $check_section->($conf->{snapshots}->{$snapname});
    }

    # remove 'unusedX' settings if we re-add a volume
    foreach my $key (grep { m/^unused/ } keys %$conf) {
        delete $conf->{$key} if $used_volids->{$conf->{$key}};
    }

    # keys which are not written as "key: value" lines
    my %unwritten = map { $_ => 1 } qw(digest description snapshots);

    my $section_to_text = sub {
        my ($section) = @_;

        # add description as comment to top of file
        my @lines = map { '#' . PVE::Tools::encode_text($_) }
            split(/\n/, $section->{description} || '');

        foreach my $key (sort keys %$section) {
            next if $unwritten{$key};
            push @lines, "$key: $section->{$key}";
        }

        return join('', map { "$_\n" } @lines);
    };

    my $raw = $section_to_text->($conf);
    foreach my $snapname (sort keys %{$conf->{snapshots}}) {
        $raw .= "\n[$snapname]\n" . $section_to_text->($conf->{snapshots}->{$snapname});
    }

    return $raw;
}
1733
# Write the configuration $conf of VM $vmid using
# PVE::Cluster::cfs_write_file(), without taking the config file lock.
# Unless $skiplock is set, dies if $conf carries a 'lock' setting
# (see check_lock).
sub update_config_nolock {
    my ($vmid, $conf, $skiplock) = @_;

    check_lock($conf) unless $skiplock;

    PVE::Cluster::cfs_write_file(cfs_config_path($vmid), $conf);
}
1743
# Write the configuration $conf of VM $vmid while holding the config file
# lock (see lock_config). $skiplock is passed on to update_config_nolock().
sub update_config {
    my ($vmid, $conf, $skiplock) = @_;

    # Pass a code reference: a bare "&update_config_nolock" would call the
    # function right here - before the lock is taken - and hand its return
    # value to lock_config() as the callback. lock_config() forwards the
    # remaining arguments as callback parameters, so $vmid is repeated.
    lock_config($vmid, \&update_config_nolock, $vmid, $conf, $skiplock);
}
1749
# Return a hash with the default value of every setting which declares one
# in $confdesc. The 'keyboard' default is overridden by the 'keyboard'
# setting of datacenter.cfg, if that is set.
sub load_defaults {

    my $defaults = {};

    # we use static defaults from our JSON schema configuration
    foreach my $key (keys %$confdesc) {
        my $default = $confdesc->{$key}->{default};
        $defaults->{$key} = $default if defined($default);
    }

    my $dccfg = PVE::Cluster::cfs_read_file('datacenter.cfg');
    if (my $keyboard = $dccfg->{keyboard}) {
        $defaults->{keyboard} = $keyboard;
    }

    return $defaults;
}
1766
# List the qemu VMs of this node, based on PVE::Cluster::get_vmlist().
# Returns { <vmid> => { exists => 1 } } for every entry whose node is
# $nodename and whose type is 'qemu'.
sub config_list {
    my $vmlist = PVE::Cluster::get_vmlist();

    my $res = {};
    return $res if !$vmlist || !$vmlist->{ids};

    my $ids = $vmlist->{ids};

    foreach my $vmid (keys %$ids) {
        my $entry = $ids->{$vmid};

        my $is_local = $entry->{node} && $entry->{node} eq $nodename;
        my $is_qemu = $entry->{type} && $entry->{type} eq 'qemu';

        $res->{$vmid}->{exists} = 1 if $is_local && $is_qemu;
    }

    return $res;
}
1781
# test if VM uses local resources (to prevent migration)
#
# Local resources are the settings 'hostusb' and 'hostpci' (old syntax) and
# any key named usb<N>, hostpci<N>, serial<N> or parallel<N>.
# Returns 1 if such a setting is found, 0 otherwise. Dies instead of
# returning 1 unless $noerr is set.
sub check_local_resources {
    my ($conf, $noerr) = @_;

    my $loc_res = 0;

    # old syntax
    $loc_res = 1 if $conf->{hostusb} || $conf->{hostpci};

    $loc_res = 1 if grep { m/^(usb|hostpci|serial|parallel)\d+$/ } keys %$conf;

    if ($loc_res && !$noerr) {
        die "VM uses local resources\n";
    }

    return $loc_res;
}
1799
# check if used storages are available on all nodes (used by migrate)
#
# For every drive of $conf whose file parses as a volume ID, calls
# PVE::Storage::storage_check_node() once without a node argument and once
# for $node. Drives without a file or with an unparsable volume ID are
# skipped.
sub check_storage_availability {
    my ($storecfg, $conf, $node) = @_;

    my $check_drive = sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};
        return if !$volid;

        my ($sid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        # check if storage is available on both nodes
        PVE::Storage::storage_check_node($storecfg, $sid);
        PVE::Storage::storage_check_node($storecfg, $sid, $node);
    };

    foreach_drive($conf, $check_drive);
}
1818
# Die with "VM is locked (<lock>)" if the configuration $conf has a
# 'lock' setting.
sub check_lock {
    my ($conf) = @_;

    my $lock = $conf->{lock};

    die "VM is locked ($lock)\n" if $lock;
}
1824
# Check whether process $pid is a kvm/qemu process that was started with
# pid file $pidfile, by inspecting /proc/<pid>/cmdline.
#
# Returns 1 if the command ends in "kvm" or "qemu-system-x86_64" and the
# argument following -pidfile/--pidfile equals $pidfile; a false value
# otherwise (also if the cmdline can not be read).
sub check_cmdline {
    my ($pidfile, $pid) = @_;

    my $fh = IO::File->new("/proc/$pid/cmdline", "r");
    return undef if !defined($fh);

    my $line = <$fh>;
    $fh->close;
    return undef if !$line;

    # the arguments are separated by NUL bytes
    my @param = split(/\0/, $line);

    my $cmd = $param[0];
    return if !$cmd || ($cmd !~ m|kvm$| && $cmd !~ m|qemu-system-x86_64$|);

    foreach my $i (0 .. $#param) {
        my $arg = $param[$i];
        next if !$arg;
        next if ($arg ne '-pidfile') && ($arg ne '--pidfile');

        # only the first pidfile option is considered
        my $value = $param[$i+1];
        return 1 if $value && ($value eq $pidfile);
        return undef;
    }

    return undef;
}
1850
# Return the PID of the running kvm process of VM $vmid, or undef if the
# VM is not running.
#
# $vmid    - id of the VM
# $nocheck - if true, do not require the configuration file to exist
# $node    - node used to locate the configuration file
#
# The PID is read from the pid file of the VM and only returned if
# check_cmdline() accepts it and the process is reported as running by
# PVE::ProcFSTools::check_process_running().
# Dies if the configuration file is missing (unless $nocheck is set).
sub check_running {
    my ($vmid, $nocheck, $node) = @_;

    my $filename = config_file($vmid, $node);

    die "unable to find configuration file for VM $vmid - no such machine\n"
        if !$nocheck && ! -f $filename;

    my $pidfile = pidfile_name($vmid);

    my $fd = IO::File->new($pidfile, "r");
    return undef if !$fd;

    my $st = stat($fd);
    my $line = <$fd>;
    close($fd);

    # it is the pid file whose time stamp is tested, so name that file
    if ($st && $st->mtime > time()) {
        warn "file '$pidfile' modified in future\n";
    }

    # an empty pid file yields no line at all
    return undef if !defined($line) || $line !~ m/^(\d+)$/;
    my $pid = $1;

    return undef if !check_cmdline($pidfile, $pid);
    return undef if !PVE::ProcFSTools::check_process_running($pid);

    return $pid;
}
1883
# Return the VM list of config_list(), with a 'pid' entry added for every
# VM that has a "<vmid>.pid" file in $var_run_tmpdir and is running
# according to check_running().
# If the directory can not be opened, the plain list is returned.
sub vzlist {

    my $vzlist = config_list();

    my $dir = IO::Dir->new($var_run_tmpdir) || return $vzlist;

    while (defined(my $entry = $dir->read)) {
        # only pid files of VMs known to config_list() are of interest
        if ($entry =~ m/^(\d+)\.pid$/ && defined($vzlist->{$1})) {
            my $vmid = $1;
            my $pid = check_running($vmid);
            $vzlist->{$vmid}->{pid} = $pid if $pid;
        }
    }

    return $vzlist;
}
1901
# Return the 'size' value of the boot disk configured in $conf.
#
# Returns undef if no valid boot disk is configured, if the drive can not
# be parsed, is a cdrom, or has no file. $storecfg is not used.
sub disksize {
    my ($storecfg, $conf) = @_;

    my $bootdisk = $conf->{bootdisk};
    return undef if !$bootdisk || !valid_drivename($bootdisk) || !$conf->{$bootdisk};

    my $drive = parse_drive($bootdisk, $conf->{$bootdisk});
    return undef if !defined($drive) || drive_is_cdrom($drive) || !$drive->{file};

    return $drive->{size};
}
1921
# CPU accounting remembered between vmstatus() calls:
# pid => { time => ..., used => ..., cpu => ... }
my $last_proc_pid_stat;

# get VM status information
# This must be fast and should not block ($full == false)
# We only query KVM using QMP if $full == true (this can be slow)
#
# $opt_vmid - if set, only this VM is reported
# $full     - if true, also query status, block statistics and balloon
#             information of running VMs through QMP
#
# Returns a hash: vmid => { pid, status, disk, maxdisk, cpus, name, maxmem,
# uptime, cpu, mem, netin, netout, diskread, diskwrite, template, ... }
sub vmstatus {
    my ($opt_vmid, $full) = @_;

    my $res = {};

    my $storecfg = PVE::Storage::config();

    my $list = vzlist();
    my ($uptime) = PVE::ProcFSTools::read_proc_uptime(1);

    my $cpucount = $cpuinfo->{cpus} || 1;
    my $mib = 1024*1024;

    # step 1: values taken from the configuration
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);

        my $conf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid)) || {};

        my $pid = $list->{$vmid}->{pid};
        my $size = disksize($storecfg, $conf);

        # never report more cpus than the host has
        my $cpus = ($conf->{sockets} || 1) * ($conf->{cores} || 1);
        $cpus = $cpucount if $cpus > $cpucount;

        my $d = {
            pid => $pid,
            # fixme: better status?
            status => $pid ? 'running' : 'stopped',
            disk => 0, # no info available
            maxdisk => defined($size) ? $size : 0,
            cpus => $cpus,
            name => $conf->{name} || "VM $vmid",
            maxmem => $conf->{memory} ? $conf->{memory}*$mib : 0,
            uptime => 0,
            cpu => 0,
            mem => 0,
            netout => 0,
            netin => 0,
            diskread => 0,
            diskwrite => 0,
        };

        if ($conf->{balloon}) {
            $d->{balloon_min} = $conf->{balloon}*$mib;
            $d->{shares} = defined($conf->{shares}) ? $conf->{shares} : 1000;
        }

        $d->{template} = is_template($conf);

        $res->{$vmid} = $d;
    }

    # step 2: network counters of the tap devices (tap<vmid>i...)
    my $netdev = PVE::ProcFSTools::read_proc_net_dev();
    foreach my $dev (keys %$netdev) {
        next if $dev !~ m/^tap([1-9]\d*)i/;
        my $d = $res->{$1};
        next if !$d;

        # 'receive' of the device is added to netout, 'transmit' to netin
        $d->{netout} += $netdev->{$dev}->{receive};
        $d->{netin} += $netdev->{$dev}->{transmit};
    }

    # step 3: uptime, memory and cpu usage from /proc
    my $ctime = gettimeofday;

    foreach my $vmid (keys %$list) {

        my $d = $res->{$vmid};
        my $pid = $d->{pid};
        next if !$pid;

        my $pstat = PVE::ProcFSTools::read_proc_pid_stat($pid);
        next if !$pstat; # not running

        my $used = $pstat->{utime} + $pstat->{stime};

        $d->{uptime} = int(($uptime - $pstat->{starttime})/$cpuinfo->{user_hz});

        if ($pstat->{vsize}) {
            $d->{mem} = int(($pstat->{rss}/$pstat->{vsize})*$d->{maxmem});
        }

        my $old = $last_proc_pid_stat->{$pid};
        if (!$old) {
            # first sample for this pid - no cpu usage can be computed yet
            $last_proc_pid_stat->{$pid} = {
                time => $ctime,
                used => $used,
                cpu => 0,
            };
            next;
        }

        my $dtime = ($ctime - $old->{time}) * $cpucount * $cpuinfo->{user_hz};

        if ($dtime <= 1000) {
            # interval too short - reuse the previous value
            $d->{cpu} = $old->{cpu};
            next;
        }

        my $dutime = $used - $old->{used};

        $d->{cpu} = (($dutime/$dtime)* $cpucount) / $d->{cpus};
        $last_proc_pid_stat->{$pid} = {
            time => $ctime,
            used => $used,
            cpu => $d->{cpu},
        };
    }

    return $res if !$full;

    # step 4: ask the running VMs through QMP
    my $qmpclient = PVE::QMPClient->new();

    my $ballooncb = sub {
        my ($vmid, $resp) = @_;

        my $info = $resp->{'return'};
        return if !$info->{max_mem};

        my $d = $res->{$vmid};

        # use memory assigned to VM
        $d->{maxmem} = $info->{max_mem};
        $d->{balloon} = $info->{actual};

        if (defined($info->{total_mem}) && defined($info->{free_mem})) {
            $d->{mem} = $info->{total_mem} - $info->{free_mem};
            $d->{freemem} = $info->{free_mem};
        }
    };

    my $blockstatscb = sub {
        my ($vmid, $resp) = @_;

        my $stats = $resp->{'return'} || [];

        my ($rdbytes, $wrbytes) = (0, 0);
        foreach my $blockstat (@$stats) {
            $rdbytes += $blockstat->{stats}->{rd_bytes};
            $wrbytes += $blockstat->{stats}->{wr_bytes};
        }

        $res->{$vmid}->{diskread} = $rdbytes;
        $res->{$vmid}->{diskwrite} = $wrbytes;
    };

    my $statuscb = sub {
        my ($vmid, $resp) = @_;

        $qmpclient->queue_cmd($vmid, $blockstatscb, 'query-blockstats');
        # this fails if the balloon driver is not loaded, so this must be
        # the last command (following commands are aborted if this fails).
        $qmpclient->queue_cmd($vmid, $ballooncb, 'query-balloon');

        my $status = $resp->{'return'}->{status};
        if (!defined($status)) {
            warn "unable to get VM status\n";
            return;
        }

        $res->{$vmid}->{qmpstatus} = $status;
    };

    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        next if !$res->{$vmid}->{pid}; # not running
        $qmpclient->queue_cmd($vmid, $statuscb, 'query-status');
    }

    $qmpclient->queue_execute();

    # fall back to the plain status where QMP delivered nothing
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);
        my $d = $res->{$vmid};
        $d->{qmpstatus} = $d->{status} if !$d->{qmpstatus};
    }

    return $res;
}
2110
# Call $func->($key, $drive) for every key of $conf that is a valid drive
# name and whose value can be parsed by parse_drive(). $drive is the
# parsed drive hash.
sub foreach_drive {
    my ($conf, $func) = @_;

    my @drivekeys = grep { valid_drivename($_) } keys %$conf;

    foreach my $ds (@drivekeys) {
        my $drive = parse_drive($ds, $conf->{$ds});
        next if !$drive;

        $func->($ds, $drive);
    }
}
2123
# Call $func->($volid, $is_cdrom) once for every volume referenced by
# $conf: the drive files of the main configuration, and the 'vmstate'
# volume and drive files of every snapshot.
# $is_cdrom is taken from the last reference seen for a volume
# (0 for vmstate volumes).
sub foreach_volid {
    my ($conf, $func) = @_;

    my $volhash = {};

    my $remember = sub {
        my ($volid, $is_cdrom) = @_;

        $volhash->{$volid} = $is_cdrom || 0 if $volid;
    };

    my $remember_drive = sub {
        my ($ds, $drive) = @_;
        $remember->($drive->{file}, drive_is_cdrom($drive));
    };

    foreach_drive($conf, $remember_drive);

    foreach my $snapname (keys %{$conf->{snapshots}}) {
        my $snap = $conf->{snapshots}->{$snapname};
        $remember->($snap->{vmstate}, 0);
        foreach_drive($snap, $remember_drive);
    }

    foreach my $volid (keys %$volhash) {
        $func->($volid, $volhash->{$volid});
    }
}
2155
# Build the kvm command line for a VM from its configuration.
#
# Parameters:
#   $storecfg - storage configuration, handed to the drive helpers
#   $vmid     - VM id (used for -id, the socket/pid paths and the default name)
#   $conf     - VM configuration hash
#   $defaults - fallback values for options not set in $conf
#
# Returns the command as an array reference. In list context it returns
# ($cmd, $vollist), where $vollist lists the drive files that parse as
# storage volume ids.
#
# Dies if the kvm binary is older than 0.15, if a configured serial or
# parallel path is not a character device, or if kvm is not disabled and
# $cpuinfo->{hvm} is not set.
sub config_to_command {
    my ($storecfg, $vmid, $conf, $defaults) = @_;

    my $cmd = [];
    my $globalFlags = [];
    my $machineFlags = [];
    my $rtcFlags = [];
    my $devices = [];
    my $pciaddr = '';
    my $bridges = {};

    # encode the version as major*1000000 + minor*1000 + patch
    my $kvmver = kvm_user_version();
    my $vernum = 0; # unknown
    if ($kvmver =~ m/^(\d+)\.(\d+)$/) {
        $vernum = $1*1000000+$2*1000;
    } elsif ($kvmver =~ m/^(\d+)\.(\d+)\.(\d+)$/) {
        $vernum = $1*1000000+$2*1000+$3;
    }

    die "detected old qemu-kvm binary ($kvmver)\n" if $vernum < 15000;

    my $have_ovz = -f '/proc/vz/vestat';

    push @$cmd, '/usr/bin/kvm';

    push @$cmd, '-id', $vmid;

    my $use_virtio = 0;

    my $qmpsocket = qmp_socket($vmid);
    push @$cmd, '-chardev', "socket,id=qmp,path=$qmpsocket,server,nowait";
    push @$cmd, '-mon', "chardev=qmp,mode=control";

    my $socket = vnc_socket($vmid);
    push @$cmd, '-vnc', "unix:$socket,x509,password";

    push @$cmd, '-pidfile' , pidfile_name($vmid);

    push @$cmd, '-daemonize';

    $pciaddr = print_pci_addr("piix3", $bridges);
    push @$devices, '-device', "piix3-usb-uhci,id=uhci$pciaddr.0x2";

    my $use_usb2 = 0;
    for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
        next if !$conf->{"usb$i"};
        $use_usb2 = 1;
    }
    # include usb device config
    push @$devices, '-readconfig', '/usr/share/qemu-server/pve-usb.cfg' if $use_usb2;

    # enable absolute mouse coordinates (needed by vnc)
    my $tablet = defined($conf->{tablet}) ? $conf->{tablet} : $defaults->{tablet};
    push @$devices, '-device', 'usb-tablet,id=tablet,bus=uhci.0,port=1' if $tablet;

    # host pci devices
    for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
        my $d = parse_hostpci($conf->{"hostpci$i"});
        next if !$d;
        $pciaddr = print_pci_addr("hostpci$i", $bridges);
        push @$devices, '-device', "pci-assign,host=$d->{pciid},id=hostpci$i$pciaddr";
    }

    # usb devices
    for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
        my $d = parse_usb_device($conf->{"usb$i"});
        next if !$d;
        if ($d->{vendorid} && $d->{productid}) {
            push @$devices, '-device', "usb-host,vendorid=0x$d->{vendorid},productid=0x$d->{productid}";
        } elsif (defined($d->{hostbus}) && defined($d->{hostport})) {
            push @$devices, '-device', "usb-host,hostbus=$d->{hostbus},hostport=$d->{hostport}";
        }
    }

    # serial devices
    for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
        if (my $path = $conf->{"serial$i"}) {
            die "no such serial device\n" if ! -c $path;
            push @$devices, '-chardev', "tty,id=serial$i,path=$path";
            push @$devices, '-device', "isa-serial,chardev=serial$i";
        }
    }

    # parallel devices
    for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
        if (my $path = $conf->{"parallel$i"}) {
            die "no such parallel device\n" if ! -c $path;
            push @$devices, '-chardev', "parport,id=parallel$i,path=$path";
            push @$devices, '-device', "isa-parallel,chardev=parallel$i";
        }
    }

    my $vmname = $conf->{name} || "vm$vmid";

    push @$cmd, '-name', $vmname;

    my $sockets = 1;
    $sockets = $conf->{smp} if $conf->{smp}; # old style - no longer used
    $sockets = $conf->{sockets} if $conf->{sockets};

    my $cores = $conf->{cores} || 1;

    push @$cmd, '-smp', "sockets=$sockets,cores=$cores";

    push @$cmd, '-cpu', $conf->{cpu} if $conf->{cpu};

    push @$cmd, '-nodefaults';

    my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};

    # every letter of the boot order gets its own range of boot indexes
    # (100, 200, ...); devices of that class count up from there
    my $bootindex_hash = {};
    my $i = 1;
    foreach my $o (split(//, $bootorder)) {
        $bootindex_hash->{$o} = $i*100;
        $i++;
    }

    push @$cmd, '-boot', "menu=on";

    push @$cmd, '-no-acpi' if defined($conf->{acpi}) && $conf->{acpi} == 0;

    push @$cmd, '-no-reboot' if defined($conf->{reboot}) && $conf->{reboot} == 0;

    my $vga = $conf->{vga};
    if (!$vga) {
        if ($conf->{ostype} && ($conf->{ostype} eq 'win8' || $conf->{ostype} eq 'win7' || $conf->{ostype} eq 'w2k8')) {
            $vga = 'std';
        } else {
            $vga = 'cirrus';
        }
    }

    push @$cmd, '-vga', $vga if $vga; # for kvm 77 and later

    # time drift fix
    my $tdf = defined($conf->{tdf}) ? $conf->{tdf} : $defaults->{tdf};

    my $nokvm = defined($conf->{kvm}) && $conf->{kvm} == 0 ? 1 : 0;
    my $useLocaltime = $conf->{localtime};

    if (my $ost = $conf->{ostype}) {
        # other, wxp, w2k, w2k3, w2k8, wvista, win7, win8, l24, l26

        if ($ost =~ m/^w/) { # windows
            $useLocaltime = 1 if !defined($conf->{localtime});

            # use time drift fix when acpi is enabled
            if (!(defined($conf->{acpi}) && $conf->{acpi} == 0)) {
                $tdf = 1 if !defined($conf->{tdf});
            }
        }

        if ($ost eq 'win7' || $ost eq 'win8' || $ost eq 'w2k8' ||
            $ost eq 'wvista') {
            push @$globalFlags, 'kvm-pit.lost_tick_policy=discard';
            push @$cmd, '-no-hpet';
        }
    }

    push @$rtcFlags, 'driftfix=slew' if $tdf;

    if ($nokvm) {
        push @$machineFlags, 'accel=tcg';
    } else {
        die "No accelerator found!\n" if !$cpuinfo->{hvm};
    }

    if ($conf->{startdate}) {
        push @$rtcFlags, "base=$conf->{startdate}";
    } elsif ($useLocaltime) {
        push @$rtcFlags, 'base=localtime';
    }

    push @$cmd, '-S' if $conf->{freeze};

    # set keyboard layout
    my $kb = $conf->{keyboard} || $defaults->{keyboard};
    push @$cmd, '-k', $kb if $kb;

    # enable sound
    #my $soundhw = $conf->{soundhw} || $defaults->{soundhw};
    #push @$cmd, '-soundhw', 'es1370';
    #push @$cmd, '-soundhw', $soundhw if $soundhw;

    if($conf->{agent}) {
        my $qgasocket = qga_socket($vmid);
        $pciaddr = print_pci_addr("qga0", $bridges);
        push @$devices, '-chardev', "socket,path=$qgasocket,server,nowait,id=qga0";
        push @$devices, '-device', "virtio-serial,id=qga0$pciaddr";
        push @$devices, '-device', 'virtserialport,chardev=qga0,name=org.qemu.guest_agent.0';
    }

    # enable balloon by default, unless explicitly disabled
    if (!defined($conf->{balloon}) || $conf->{balloon}) {
        $pciaddr = print_pci_addr("balloon0", $bridges);
        push @$devices, '-device', "virtio-balloon-pci,id=balloon0$pciaddr";
    }

    if ($conf->{watchdog}) {
        my $wdopts = parse_watchdog($conf->{watchdog});
        $pciaddr = print_pci_addr("watchdog", $bridges);
        my $watchdog = $wdopts->{model} || 'i6300esb';
        push @$devices, '-device', "$watchdog$pciaddr";
        push @$devices, '-watchdog-action', $wdopts->{action} if $wdopts->{action};
    }

    my $vollist = [];
    my $scsicontroller = {};
    my $ahcicontroller = {};
    my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : $defaults->{scsihw};
    # same fallback the hotplug code uses when no controller type is configured
    $scsihw = 'lsi' if !defined($scsihw);

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        if (PVE::Storage::parse_volume_id($drive->{file}, 1)) {
            push @$vollist, $drive->{file};
        }

        $use_virtio = 1 if $ds =~ m/^virtio/;

        if (drive_is_cdrom ($drive)) {
            if ($bootindex_hash->{d}) {
                $drive->{bootindex} = $bootindex_hash->{d};
                $bootindex_hash->{d} += 1;
            }
        } else {
            if ($bootindex_hash->{c}) {
                # only the configured boot disk gets a boot index
                $drive->{bootindex} = $bootindex_hash->{c} if $conf->{bootdisk} && ($conf->{bootdisk} eq $ds);
                $bootindex_hash->{c} += 1;
            }
        }

        if ($drive->{interface} eq 'scsi') {

            my $maxdev = ($scsihw ne 'lsi') ? 256 : 7;
            my $controller = int($drive->{index} / $maxdev);
            $pciaddr = print_pci_addr("scsihw$controller", $bridges);
            # add each controller only once
            push @$devices, '-device', "$scsihw,id=scsihw$controller$pciaddr" if !$scsicontroller->{$controller};
            $scsicontroller->{$controller}=1;
        }

        if ($drive->{interface} eq 'sata') {
            my $controller = int($drive->{index} / $MAX_SATA_DISKS);
            $pciaddr = print_pci_addr("ahci$controller", $bridges);
            push @$devices, '-device', "ahci,id=ahci$controller,multifunction=on$pciaddr" if !$ahcicontroller->{$controller};
            $ahcicontroller->{$controller}=1;
        }

        push @$devices, '-drive',print_drive_full($storecfg, $vmid, $drive);
        push @$devices, '-device',print_drivedevice_full($storecfg, $conf, $vmid, $drive, $bridges);
    });

    push @$cmd, '-m', $conf->{memory} || $defaults->{memory};

    for (my $i = 0; $i < $MAX_NETS; $i++) {
        next if !$conf->{"net$i"};
        my $d = parse_net($conf->{"net$i"});
        next if !$d;

        $use_virtio = 1 if $d->{model} eq 'virtio';

        if ($bootindex_hash->{n}) {
            $d->{bootindex} = $bootindex_hash->{n};
            $bootindex_hash->{n} += 1;
        }

        my $netdevfull = print_netdev_full($vmid,$conf,$d,"net$i");
        push @$devices, '-netdev', $netdevfull;

        my $netdevicefull = print_netdevice_full($vmid,$conf,$d,"net$i",$bridges);
        push @$devices, '-device', $netdevicefull;
    }

    # bridges: put them in front of the devices that reference them
    while (my ($k, $v) = each %$bridges) {
        $pciaddr = print_pci_addr("pci.$k");
        unshift @$devices, '-device', "pci-bridge,id=pci.$k,chassis_nr=$k$pciaddr" if $k > 0;
    }


    # hack: virtio with fairsched is unreliable, so we do not use fairsched
    # when the VM uses virtio devices.
    if (!$use_virtio && $have_ovz) {

        my $cpuunits = defined($conf->{cpuunits}) ?
            $conf->{cpuunits} : $defaults->{cpuunits};

        push @$cmd, '-cpuunits', $cpuunits if $cpuunits;

        # fixme: cpulimit is currently ignored
        #push @$cmd, '-cpulimit', $conf->{cpulimit} if $conf->{cpulimit};
    }

    # add custom args
    if ($conf->{args}) {
        my $aa = PVE::Tools::split_args($conf->{args});
        push @$cmd, @$aa;
    }

    push @$cmd, @$devices;
    push @$cmd, '-rtc', join(',', @$rtcFlags)
        if scalar(@$rtcFlags);
    push @$cmd, '-machine', join(',', @$machineFlags)
        if scalar(@$machineFlags);

    # -global takes exactly one driver.prop=value per option, so every
    # flag needs its own -global (a comma-joined list would end up as
    # part of the first property's value)
    foreach my $flag (@$globalFlags) {
        push @$cmd, '-global', $flag;
    }

    return wantarray ? ($cmd, $vollist) : $cmd;
}
2464
# Path of the VNC unix socket of VM $vmid.
sub vnc_socket {
    my $vmid = shift;

    return join('/', $var_run_tmpdir, "$vmid.vnc");
}
2469
# Path of the QMP monitor socket of VM $vmid.
sub qmp_socket {
    my $vmid = shift;

    return join('/', $var_run_tmpdir, "$vmid.qmp");
}
2474
# Path of the guest agent socket of VM $vmid.
sub qga_socket {
    my $vmid = shift;

    return join('/', $var_run_tmpdir, "$vmid.qga");
}
2479
# Path of the pid file of VM $vmid.
sub pidfile_name {
    my $vmid = shift;

    return join('/', $var_run_tmpdir, "$vmid.pid");
}
2484
# Probe the ports 60000..60009 on localhost and return the first one a
# listening socket can be created on. The probe socket is closed again
# before returning. Dies if none of the ports is available.
sub next_migrate_port {

    foreach my $port (60000 .. 60009) {

        my $probe = IO::Socket::INET->new(
            Listen => 5,
            LocalAddr => 'localhost',
            LocalPort => $port,
            ReuseAddr => 1,
            Proto => 0,
        );

        next if !$probe;

        close($probe);
        return $port;
    }

    die "unable to find free migration port";
}
2503
# Ask the running VM for its PCI devices ('query-pci') and return a hash
# reference mapping each device's qdev_id to its device entry. Devices
# without a qdev_id are left out.
sub vm_devices_list {
    my ($vmid) = @_;

    my $buses = vm_mon_cmd($vmid, 'query-pci');

    my %by_id;
    foreach my $bus (@$buses) {
        foreach my $dev (@{$bus->{devices}}) {
            my $qdev_id = $dev->{'qdev_id'};
            $by_id{$qdev_id} = $dev if $qdev_id;
        }
    }

    return \%by_id;
}
2519
# Hot-plug the device $deviceid into VM $vmid.
#
# Returns 1 when nothing has to be done (VM not running, hotplug
# disabled, device already present) or when plugging succeeded, and
# undef when one of the plug steps failed. The 'tablet' device is
# handled even when hotplug is disabled.
sub vm_deviceplug {
    my ($storecfg, $conf, $vmid, $deviceid, $device) = @_;

    return 1 if !check_running($vmid);

    if ($deviceid eq 'tablet') {
        qemu_deviceadd($vmid, "usb-tablet,id=tablet,bus=uhci.0,port=1");
        return 1;
    }

    return 1 if !$conf->{hotplug};

    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$deviceid});

    qemu_bridgeadd($storecfg, $conf, $vmid, $deviceid); #add bridge if we need it for the device

    if ($deviceid =~ m/^(virtio)(\d+)$/) {

        return undef if !qemu_driveadd($storecfg, $vmid, $device);
        qemu_deviceadd($vmid, print_drivedevice_full($storecfg, $conf, $vmid, $device));
        if (!qemu_deviceaddverify($vmid, $deviceid)) {
            # roll back the drive when the device did not show up
            qemu_drivedel($vmid, $deviceid);
            return undef;
        }

    } elsif ($deviceid =~ m/^(scsihw)(\d+)$/) {

        my $scsihw = defined($conf->{scsihw}) ? $conf->{scsihw} : "lsi";
        my $pciaddr = print_pci_addr($deviceid);
        qemu_deviceadd($vmid, "$scsihw,id=$deviceid$pciaddr");
        return undef if(!qemu_deviceaddverify($vmid, $deviceid));

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        return 1 if ($conf->{scsihw} && $conf->{scsihw} ne 'lsi'); #virtio-scsi not yet support hotplug
        return undef if !qemu_findorcreatescsihw($storecfg,$conf, $vmid, $device);
        return undef if !qemu_driveadd($storecfg, $vmid, $device);
        my $devicefull = print_drivedevice_full($storecfg, $conf, $vmid, $device);
        if (!qemu_deviceadd($vmid, $devicefull)) {
            qemu_drivedel($vmid, $deviceid);
            return undef;
        }

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        return undef if !qemu_netdevadd($vmid, $conf, $device, $deviceid);
        qemu_deviceadd($vmid, print_netdevice_full($vmid, $conf, $device, $deviceid));
        if (!qemu_deviceaddverify($vmid, $deviceid)) {
            # roll back the netdev when the device did not show up
            qemu_netdevdel($vmid, $deviceid);
            return undef;
        }

    } elsif ($deviceid =~ m/^(pci\.)(\d+)$/) {

        my $bridgeid = $2;
        my $pciaddr = print_pci_addr($deviceid);
        qemu_deviceadd($vmid, "pci-bridge,id=pci.$bridgeid,chassis_nr=$bridgeid$pciaddr");
        return undef if !qemu_deviceaddverify($vmid, $deviceid);
    }

    return 1;
}
2587
# Hot-unplug the device $deviceid from VM $vmid.
#
# Returns 1 when nothing has to be done (VM not running, hotplug
# disabled, device not present) or when unplugging succeeded, and undef
# when one of the unplug steps failed. Dies when asked to unplug the
# configured boot disk. The 'tablet' device is handled even when hotplug
# is disabled.
sub vm_deviceunplug {
    my ($vmid, $conf, $deviceid) = @_;

    return 1 if !check_running ($vmid);

    if ($deviceid eq 'tablet') {
        qemu_devicedel($vmid, $deviceid);
        return 1;
    }

    return 1 if !$conf->{hotplug};

    my $present = vm_devices_list($vmid);
    return 1 if !defined($present->{$deviceid});

    die "can't unplug bootdisk" if $conf->{bootdisk} && $conf->{bootdisk} eq $deviceid;

    if ($deviceid =~ m/^(virtio)(\d+)$/) {

        return undef if !qemu_drivedel($vmid, $deviceid);
        qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_devicedelverify($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(lsi)(\d+)$/) {

        # NOTE(review): vm_deviceplug adds SCSI controllers under the id
        # 'scsihwN', so this 'lsiN' match looks stale - confirm
        return undef if !qemu_devicedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        return undef if !qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_drivedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        return undef if !qemu_netdevdel($vmid, $deviceid);
        qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_devicedelverify($vmid, $deviceid);
    }

    return 1;
}
2628
# Send 'device_add' for a device given in command line notation
# ("driver,key=value,..."). The string is split on '=' and ',' into the
# argument hash, with the leading driver name stored under 'driver'.
# Always returns 1.
sub qemu_deviceadd {
    my ($vmid, $devicefull) = @_;

    my %options = split(/[=,]/, "driver=" . $devicefull);

    vm_mon_cmd($vmid, "device_add" , %options);

    return 1;
}
2638
# Send 'device_del' for $deviceid. The reply is not inspected; always
# returns 1.
sub qemu_devicedel {
    my ($vmid, $deviceid) = @_;

    my $reply = vm_mon_cmd($vmid, "device_del", id => $deviceid);

    return 1;
}
2644
# Add the drive described by $device through the human monitor
# ('drive_add auto ...'). Returns 1 on success; logs the monitor reply
# and returns undef otherwise.
sub qemu_driveadd {
    my ($storecfg, $vmid, $device) = @_;

    my $drivespec = print_drive_full($storecfg, $vmid, $device);
    my $reply = vm_human_monitor_command($vmid, "drive_add auto $drivespec");

    # If the command succeeds qemu prints: "OK"
    return 1 if $reply =~ m/OK/s;

    syslog("err", "adding drive failed: $reply");
    return undef;
}
2657
# Delete the drive 'drive-$deviceid' through the human monitor. Returns
# 1 when the monitor reply is empty or reports the device as not found;
# logs any other reply and returns undef.
sub qemu_drivedel {
    my ($vmid, $deviceid) = @_;

    my $reply = vm_human_monitor_command($vmid, "drive_del drive-$deviceid");
    $reply =~ s/^\s+//;

    # NB: device not found errors mean the drive was auto-deleted and we ignore the error
    return 1 if $reply =~ m/Device \'.*?\' not found/s;

    return 1 if $reply eq "";

    syslog("err", "deleting drive $deviceid failed : $reply");
    return undef;
}
2672
# Check up to six times, one second apart, whether $deviceid shows up in
# the device list of the VM. Returns 1 as soon as it does; logs an error
# and returns undef otherwise.
sub qemu_deviceaddverify {
    my ($vmid, $deviceid) = @_;

    foreach my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if defined($present->{$deviceid});
        sleep 1;
    }

    syslog("err", "error on hotplug device $deviceid");
    return undef;
}
2684
2685
# Check up to six times, one second apart, whether $deviceid is gone
# from the device list of the VM. Returns 1 as soon as it is; logs an
# error and returns undef otherwise.
sub qemu_devicedelverify {
    my ($vmid, $deviceid) = @_;

    # need to verify that the device is really removed, as device_del is
    # async and its empty return value is not reliable
    foreach my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if !defined($present->{$deviceid});
        sleep 1;
    }

    syslog("err", "error on hot-unplugging device $deviceid");
    return undef;
}
2698
# Make sure the SCSI controller serving $device exists in the running
# VM, hot-plugging it if necessary. Returns 1 when the controller is
# present afterwards and undef when plugging it failed.
sub qemu_findorcreatescsihw {
    my ($storecfg, $conf, $vmid, $device) = @_;

    # 7 devices per controller for 'lsi' (or no scsihw set), else 256
    my $per_controller = 7;
    $per_controller = 256 if $conf->{scsihw} && $conf->{scsihw} ne 'lsi';

    my $scsihwid = "scsihw" . int($device->{index} / $per_controller);

    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$scsihwid});

    return undef if !vm_deviceplug($storecfg, $conf, $vmid, $scsihwid);

    return 1;
}
2712
# Hot-plug the PCI bridge that $device sits on, if there is one.
# print_pci_addr() records the bridge in the hash passed to it.
# Returns nothing when the recorded bridge id is below 1, 1 when the
# bridge is present afterwards, and undef when plugging it failed.
sub qemu_bridgeadd {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $bridges = {};
    print_pci_addr($device, $bridges);

    # take the last key recorded in the hash
    my $bridgeid = undef;
    foreach my $id (keys %$bridges) {
        $bridgeid = $id;
    }
    return if $bridgeid < 1;

    my $bridge = "pci.$bridgeid";

    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$bridge});

    return undef if !vm_deviceplug($storecfg, $conf, $vmid, $bridge);

    return 1;
}
2732
# Send 'netdev_add' for the network backend of $deviceid. The netdev
# string is split on '=' and ',' into the argument hash. Always
# returns 1.
sub qemu_netdevadd {
    my ($vmid, $conf, $device, $deviceid) = @_;

    my %options = split(/[=,]/, print_netdev_full($vmid, $conf, $device, $deviceid));

    vm_mon_cmd($vmid, "netdev_add", %options);

    return 1;
}
2742
# Send 'netdev_del' for $deviceid. Always returns 1.
sub qemu_netdevdel {
    my ($vmid, $deviceid) = @_;

    my %args = (id => $deviceid);
    vm_mon_cmd($vmid, "netdev_del", %args);

    return 1;
}
2749
# Apply I/O throttle limits to block device $deviceid of a running VM.
# Limits that are unset or false are sent as 0; all limits are sent as
# integers. Does nothing when the VM is not running.
sub qemu_block_set_io_throttle {
    my ($vmid, $deviceid, $bps, $bps_rd, $bps_wr, $iops, $iops_rd, $iops_wr) = @_;

    return if !check_running($vmid) ;

    vm_mon_cmd($vmid, "block_set_io_throttle",
        device => $deviceid,
        bps => int($bps || 0),
        bps_rd => int($bps_rd || 0),
        bps_wr => int($bps_wr || 0),
        iops => int($iops || 0),
        iops_rd => int($iops_rd || 0),
        iops_wr => int($iops_wr || 0));
}
2765
# old code, only used to shutdown old VM after update
#
# Read from $fh until a chunk ends with the monitor prompt "(qemu) " or
# until end of file, and return everything read (without the prompt).
# Dies with "monitor read timeout" when nothing becomes readable within
# $timeout seconds, and with the system error when reading fails.
sub __read_avail {
    my ($fh, $timeout) = @_;

    my $sel = IO::Select->new();
    $sel->add($fh);

    my $res = '';
    my $buf;

    my @ready;
    while (@ready = $sel->can_read($timeout)) {
        my $count = $fh->sysread($buf, 8192);

        die "$!\n" if !defined($count);

        # end of file
        last if !$count;

        if ($buf =~ /^(.*)\(qemu\) $/s) {
            $res .= $1;
            last;
        }

        $res .= $buf;
    }

    die "monitor read timeout\n" if !@ready;

    return $res;
}
2798
# old code, only used to shutdown old VM after update
#
# Send $cmdstr to the human monitor socket "$vmid.mon" and return the
# reply, with the echoed command line removed and a trailing newline.
# Nothing is read back for 'q' and 'quit'. Errors are logged to syslog
# and then re-thrown.
sub vm_monitor_command {
    my ($vmid, $cmdstr, $nocheck) = @_;

    my $res;

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);

        my $sname = "${var_run_tmpdir}/$vmid.mon";

        my $sock = IO::Socket::UNIX->new( Peer => $sname ) ||
            die "unable to connect to VM $vmid socket - $!\n";

        # hack: migrate sometime blocks the monitor (when migrate_downtime
        # is set)
        my $is_migrate = $cmdstr =~ m/^(info\s+migrate|migrate\s)/;

        my $timeout = $is_migrate ? 60*60 : 3; # 1 hour for migrate

        # read banner;
        my $banner = __read_avail($sock, $timeout);
        die "got unexpected qemu monitor banner\n"
            if $banner !~ m/^QEMU\s+(\S+)\s+monitor\s/;

        my $sel = IO::Select->new();
        $sel->add($sock);

        my @writable = $sel->can_write($timeout);
        die "monitor write error - timeout" if !@writable;

        my $fullcmd = "$cmdstr\r";

        # syslog('info', "VM $vmid monitor command: $cmdstr");

        my $written = $sock->syswrite($fullcmd);
        die "monitor write error - $!"
            if !$written || ($written != length($fullcmd));

        return if ($cmdstr eq 'q') || ($cmdstr eq 'quit');

        if ($is_migrate) {
            $timeout = 60*60; # 1 hour
        } elsif ($cmdstr =~ m/^(eject|change)/) {
            $timeout = 60; # note: cdrom mount command is slow
        } else {
            $timeout = 20;
        }

        if ($res = __read_avail($sock, $timeout)) {

            my @lines = split("\r?\n", $res);

            shift @lines if $lines[0] !~ m/^unknown command/; # skip echo

            $res = join("\n", @lines) . "\n";
        }
    };

    if (my $err = $@) {
        syslog("err", "VM $vmid monitor command failed - $err");
        die $err;
    }

    return $res;
}
2873
# Resize volume $volid on the storage and, when the VM is running, tell
# qemu about the new size of block device $deviceid. Stops early when
# the storage resize returns false.
sub qemu_block_resize {
    my ($vmid, $deviceid, $storecfg, $volid, $size) = @_;

    my $is_running = check_running($vmid);

    my $resized = PVE::Storage::volume_resize($storecfg, $volid, $size, $is_running);
    return if !$resized;

    return if !$is_running;

    vm_mon_cmd($vmid, "block_resize", device => $deviceid, size => int($size));
}
2886
# Snapshot volume $volid as $snap. The storage layer is asked first;
# only when it returns true and the VM is running, the snapshot is
# taken through the monitor ('snapshot-drive').
sub qemu_volume_snapshot {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $is_running = check_running($vmid);

    my $via_monitor = PVE::Storage::volume_snapshot($storecfg, $volid, $snap, $is_running);
    return if !$via_monitor;

    return if !$is_running;

    vm_mon_cmd($vmid, "snapshot-drive", device => $deviceid, name => $snap);
}
2899
# Delete snapshot $snap of volume $volid. The storage layer is asked
# first; only when it returns true and the VM is running, the snapshot
# is deleted through the monitor ('delete-drive-snapshot').
sub qemu_volume_snapshot_delete {
    my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;

    my $is_running = check_running($vmid);

    my $via_monitor = PVE::Storage::volume_snapshot_delete($storecfg, $volid, $snap, $is_running);
    return if !$via_monitor;

    return if !$is_running;

    vm_mon_cmd($vmid, "delete-drive-snapshot", device => $deviceid, name => $snap);
}
2911
# Placeholder for freezing the guest file systems - does nothing yet.
sub qga_freezefs {
    # TODO: implement the call to qemu-ga
    my ($vm_id) = @_;
}
2917
# Placeholder for thawing the guest file systems - does nothing yet.
sub qga_unfreezefs {
    # TODO: implement the call to qemu-ga
    my ($vm_id) = @_;
}
2923
# Start VM $vmid while holding the config lock.
#
# Parameters:
#   $statefile    - 'tcp' to wait for an incoming migration on a free
#                   port, any other true value is passed to -loadstate
#   $skiplock     - do not check the 'lock' setting of the config
#   $migratedfrom - passed to load_config/check_running and exported as
#                   PVE_MIGRATED_FROM for the network script
#   $paused       - start with -S when no state file is given
#
# Dies if the VM is a template, is locked, is already running, if a
# host PCI device cannot be prepared or if the kvm command fails.
sub vm_start {
    my ($storecfg, $vmid, $statefile, $skiplock, $migratedfrom, $paused) = @_;

    my $start_locked = sub {
        my $conf = load_config($vmid, $migratedfrom);

        die "you can't start a vm if it's a template\n" if is_template($conf);

        check_lock($conf) if !$skiplock;

        die "VM $vmid already running\n" if check_running($vmid, undef, $migratedfrom);

        my $defaults = load_defaults();

        # set environment variable useful inside network script
        $ENV{PVE_MIGRATED_FROM} = $migratedfrom if $migratedfrom;

        my ($cmd, $vollist) = config_to_command($storecfg, $vmid, $conf, $defaults);

        my $migrate_port = 0;

        if ($statefile && $statefile eq 'tcp') {
            $migrate_port = next_migrate_port();
            push @$cmd, '-incoming', "tcp:localhost:${migrate_port}";
            push @$cmd, '-S';
        } elsif ($statefile) {
            push @$cmd, '-loadstate', $statefile;
        } elsif ($paused) {
            push @$cmd, '-S';
        }

        # host pci devices
        foreach my $i (0 .. $MAX_HOSTPCI_DEVICES - 1) {
            my $d = parse_hostpci($conf->{"hostpci$i"});
            next if !$d;
            my $pciid = $d->{pciid};
            my $info = pci_device_info("0000:$pciid");
            die "IOMMU not present\n" if !check_iommu_support();
            die "no pci device info for device '$pciid'\n" if !$info;
            die "can't unbind pci device '$pciid'\n" if !pci_dev_bind_to_stub($info);
            die "can't reset pci device '$pciid'\n" if !pci_dev_reset($info);
        }

        PVE::Storage::activate_volumes($storecfg, $vollist);

        # no timeout when a state has to be loaded or received
        eval {
            run_command($cmd, timeout => $statefile ? undef : 30, umask => 0077);
        };
        if (my $err = $@) {
            die "start failed: $err";
        }

        print "migration listens on port $migrate_port\n" if $migrate_port;

        if ($statefile && $statefile ne 'tcp') {
            eval { vm_mon_cmd_nocheck($vmid, "cont"); };
            warn $@ if $@;
        }

        if ($migratedfrom) {
            my $capabilities = {
                capability => "xbzrle",
                state => JSON::true,
            };
            # errors are ignored here
            eval { vm_mon_cmd_nocheck($vmid, "migrate-set-capabilities", capabilities => [$capabilities]); };
        } else {
            if (!defined($conf->{balloon}) || $conf->{balloon}) {
                vm_mon_cmd_nocheck($vmid, "balloon", value => $conf->{balloon}*1024*1024)
                    if $conf->{balloon};
                vm_mon_cmd_nocheck($vmid, 'qom-set',
                    path => "machine/peripheral/balloon0",
                    property => "guest-stats-polling-interval",
                    value => 2);
            }
        }
    };

    lock_config($vmid, $start_locked);
}
3002
# Run the QMP command $execute with the given named arguments on VM
# $vmid and return the result of vm_qmp_command().
sub vm_mon_cmd {
    my ($vmid, $execute, %params) = @_;

    return vm_qmp_command($vmid, { execute => $execute, arguments => \%params });
}
3009
# Like vm_mon_cmd(), but passes a true $nocheck flag on to
# vm_qmp_command().
sub vm_mon_cmd_nocheck {
    my ($vmid, $execute, %params) = @_;

    return vm_qmp_command($vmid, { execute => $execute, arguments => \%params }, 1);
}
3016
# Execute the QMP command hash $cmd ({ execute => ..., arguments => ... })
# on VM $vmid and return the client's result.
#
# A true 'timeout' entry in the arguments is removed from them and
# handed to the QMP client instead. When only the old "$vmid.mon" socket
# exists, commands without arguments are forwarded to the old monitor
# (their reply is not returned). Errors are logged and re-thrown.
sub vm_qmp_command {
    my ($vmid, $cmd, $nocheck) = @_;

    my $res;

    my $timeout;
    my $args = $cmd->{arguments};
    if ($args && $args->{timeout}) {
        $timeout = delete $args->{timeout};
    }

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);

        my $sname = qmp_socket($vmid);
        if (-e $sname) {
            $res = PVE::QMPClient->new()->cmd($vmid, $cmd, $timeout);
        } elsif (-e "${var_run_tmpdir}/$vmid.mon") {
            die "can't execute complex command on old monitor - stop/start your vm to fix the problem\n"
                if scalar(%{$cmd->{arguments}});
            vm_monitor_command($vmid, $cmd->{execute}, $nocheck);
        } else {
            die "unable to open monitor socket\n";
        }
    };

    my $err = $@;
    if ($err) {
        syslog("err", "VM $vmid qmp command failed - $err");
        die $err;
    }

    return $res;
}
3050
# Run the human monitor command line $cmdline through QMP
# ('human-monitor-command') and return the result.
sub vm_human_monitor_command {
    my ($vmid, $cmdline) = @_;

    return vm_qmp_command($vmid, {
        execute => 'human-monitor-command',
        arguments => { 'command-line' => $cmdline },
    });
}
3063
# Return the kvm command line of VM $vmid as a single string, with the
# arguments joined by spaces.
sub vm_commandline {
    my ($storecfg, $vmid) = @_;

    my $conf = load_config($vmid);
    my $defaults = load_defaults();

    # scalar context: only the command array reference is returned
    my $argv = config_to_command($storecfg, $vmid, $conf, $defaults);

    return join(' ', @$argv);
}
3075
# Send 'system_reset' to VM $vmid while holding the config lock. The
# 'lock' setting of the config is checked unless $skiplock is set.
sub vm_reset {
    my ($vmid, $skiplock) = @_;

    my $reset_locked = sub {
        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        vm_mon_cmd($vmid, "system_reset");
    };

    lock_config($vmid, $reset_locked);
}
3088
# Return an array reference with all volume ids referenced by $conf that
# parse as storage volume ids. Entries starting with '/' are skipped.
sub get_vm_volumes {
    my ($conf) = @_;

    my @volids;

    my $collect = sub {
        my ($volid, $is_cdrom) = @_;

        return if $volid =~ m|^/|;

        my ($sid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        push @volids, $volid;
    };

    foreach_volid($conf, $collect);

    return \@volids;
}
3106
# Clean up after a stopped VM: try to remove its fairsched group,
# deactivate its volumes (unless $keepActive is set) and remove the
# monitor, qmp, pid, vnc and guest agent files.
#
# Errors are only reported as warnings.
sub vm_stop_cleanup {
    my ($storecfg, $vmid, $conf, $keepActive) = @_;

    eval {
        fairsched_rmnod($vmid); # try to destroy group

        if (!$keepActive) {
            my $vollist = get_vm_volumes($conf);
            PVE::Storage::deactivate_volumes($storecfg, $vollist);
        }

        # use the same path helpers that are used to create these files,
        # so cleanup cannot drift away from the run directory in use
        my @runfiles = (
            "${var_run_tmpdir}/$vmid.mon", # socket of the old monitor
            qmp_socket($vmid),
            pidfile_name($vmid),
            vnc_socket($vmid),
            qga_socket($vmid),
        );

        foreach my $file (@runfiles) {
            unlink $file;
        }
    };
    warn $@ if $@; # avoid errors - just warn
}
3124
# Stop or shut down VM $vmid.
#
# Note: use $nocheck to skip tests if VM configuration file exists.
# We need that when migrating VMs to other nodes (files already moved)
# Note: we set $keepActive in vzdump stop mode - volumes need to stay active
#
# Parameters:
#   $skiplock     - do not check the 'lock' setting of the config
#   $timeout      - seconds to wait for the VM to exit; defaults to the
#                   'down' value of the startup option on shutdown,
#                   else to 60
#   $shutdown     - send 'system_powerdown' instead of 'quit'
#   $force        - terminate the process when it does not exit in time;
#                   defaults to 1 unless $shutdown is set
#   $migratedfrom - terminate the process and clean up without taking
#                   the config lock
#
# Dies when the VM cannot be stopped and $force is not set.
sub vm_stop {
    my ($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive, $migratedfrom) = @_;

    $force = 1 if !defined($force) && !$shutdown;

    if ($migratedfrom){
        my $pid = check_running($vmid, $nocheck, $migratedfrom);
        kill 15, $pid if $pid;
        my $conf = load_config($vmid, $migratedfrom);
        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive);
        return;
    }

    # Poll once per second, for at most $limit seconds, until the VM is
    # gone. Returns true if it is still running afterwards. The state is
    # checked once more after the last sleep, so a VM that exits during
    # the final second is not mistaken for a timeout.
    my $still_running_after = sub {
        my ($limit) = @_;

        my $count = 0;
        while (($count < $limit) && check_running($vmid, $nocheck)) {
            $count++;
            sleep 1;
        }

        return 0 if $count < $limit; # loop ended because the VM is gone

        return check_running($vmid, $nocheck) ? 1 : 0;
    };

    lock_config($vmid, sub {

        my $pid = check_running($vmid, $nocheck);
        return if !$pid;

        my $conf;
        if (!$nocheck) {
            $conf = load_config($vmid);
            check_lock($conf) if !$skiplock;
            if (!defined($timeout) && $shutdown && $conf->{startup}) {
                my $opts = parse_startup($conf->{startup});
                $timeout = $opts->{down} if $opts->{down};
            }
        }

        $timeout = 60 if !defined($timeout);

        eval {
            if ($shutdown) {
                $nocheck ? vm_mon_cmd_nocheck($vmid, "system_powerdown") : vm_mon_cmd($vmid, "system_powerdown");

            } else {
                $nocheck ? vm_mon_cmd_nocheck($vmid, "quit") : vm_mon_cmd($vmid, "quit");
            }
        };
        my $err = $@;

        if (!$err) {
            if ($still_running_after->($timeout)) {
                if ($force) {
                    warn "VM still running - terminating now with SIGTERM\n";
                    kill 15, $pid;
                } else {
                    die "VM quit/powerdown failed - got timeout\n";
                }
            } else {
                vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
                return;
            }
        } else {
            if ($force) {
                warn "VM quit/powerdown failed - terminating now with SIGTERM\n";
                kill 15, $pid;
            } else {
                die "VM quit/powerdown failed\n";
            }
        }

        # wait again, this time for the SIGTERM to take effect
        if ($still_running_after->(10)) {
            warn "VM still running - terminating now with SIGKILL\n";
            kill 9, $pid;
            sleep 1;
        }

        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
    });
}
3213
# Pause VM $vmid (monitor command 'stop') while holding the config lock.
# The 'lock' setting is not checked when $skiplock is set or when the
# lock is 'backup'.
sub vm_suspend {
    my ($vmid, $skiplock) = @_;

    my $suspend_locked = sub {
        my $conf = load_config($vmid);

        my $backup_locked = $conf->{lock} && $conf->{lock} eq 'backup';
        check_lock($conf) if !($skiplock || $backup_locked);

        vm_mon_cmd($vmid, "stop");
    };

    lock_config($vmid, $suspend_locked);
}
3226
# Resume VM $vmid (monitor command 'cont') while holding the config
# lock. The 'lock' setting is not checked when $skiplock is set or when
# the lock is 'backup'.
sub vm_resume {
    my ($vmid, $skiplock) = @_;

    my $resume_locked = sub {
        my $conf = load_config($vmid);

        my $backup_locked = $conf->{lock} && $conf->{lock} eq 'backup';
        check_lock($conf) if !($skiplock || $backup_locked);

        vm_mon_cmd($vmid, "cont");
    };

    lock_config($vmid, $resume_locked);
}
3239
# Send the key $key to VM $vmid while holding the config lock. The
# config is loaded but its 'lock' setting is not checked, so $skiplock
# has no effect here.
sub vm_sendkey {
    my ($vmid, $skiplock, $key) = @_;

    my $sendkey_locked = sub {
        my $conf = load_config($vmid);

        # there is no qmp command, so we use the human monitor command
        vm_human_monitor_command($vmid, "sendkey $key");
    };

    lock_config($vmid, $sendkey_locked);
}
3251
# Destroy VM $vmid while holding the config lock. The 'lock' setting of
# the config is checked unless $skiplock is set. Dies when the VM is
# still running.
sub vm_destroy {
    my ($storecfg, $vmid, $skiplock) = @_;

    my $destroy_locked = sub {
        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        die "VM $vmid is running - destroy failed\n" if check_running($vmid);

        fairsched_rmnod($vmid); # try to destroy group
        destroy_vm($storecfg, $vmid);
    };

    lock_config($vmid, $destroy_locked);
}
3269
3270# pci helpers
3271
# Write $buf to $filename, replacing its content.
#
# Returns a true value only when the data was really written, and undef
# when the file cannot be opened or the write fails.
sub file_write {
    my ($filename, $buf) = @_;

    my $fh = IO::File->new($filename, "w");
    return undef if !$fh;

    my $written = print $fh $buf;

    # print only fills the buffer - the data is written out on close, so
    # a write the kernel rejects (common for sysfs files) only shows up
    # in the result of close
    my $closed = $fh->close();

    return undef if !$written || !$closed;

    return $written;
}
3284
# Collect information about the PCI device $name
# ("domain:bus:slot.func", lower case hex) from sysfs.
#
# Returns a hash reference with name, vendor and product (without the
# '0x' prefix), domain, bus, slot, func, irq and has_fl_reset. Returns
# undef when $name is malformed or when irq, vendor or device id cannot
# be read in the expected format.
sub pci_device_info {
    my ($name) = @_;

    return undef if $name !~ m/^([a-f0-9]{4}):([a-f0-9]{2}):([a-f0-9]{2})\.([a-f0-9])$/;
    my ($domain, $bus, $slot, $func) = ($1, $2, $3, $4);

    my $sysdir = "$pcisysfs/devices/$name";

    my $irq = file_read_firstline("$sysdir/irq");
    return undef if !defined($irq) || $irq !~ m/^\d+$/;

    # the substitutions strip the '0x' prefix and fail when it is missing
    my $vendor = file_read_firstline("$sysdir/vendor");
    return undef if !defined($vendor) || $vendor !~ s/^0x//;

    my $product = file_read_firstline("$sysdir/device");
    return undef if !defined($product) || $product !~ s/^0x//;

    return {
        name => $name,
        vendor => $vendor,
        product => $product,
        domain => $domain,
        bus => $bus,
        slot => $slot,
        func => $func,
        irq => $irq,
        has_fl_reset => -f "$sysdir/reset" || 0,
    };
}
3316
# Reset the PCI device described by $dev (as returned by
# pci_device_info) by writing "1" to its sysfs 'reset' file. Returns the
# result of file_write().
sub pci_dev_reset {
    my ($dev) = @_;

    my $reset_file = "$pcisysfs/devices/$dev->{name}/reset";

    return file_write($reset_file, "1");
}
3326
# Bind the PCI device described by $dev (as returned by pci_device_info)
# to the pci-stub driver.
#
# Returns 1 when the device is already bound, undef when one of the
# sysfs writes fails, and otherwise whether the device directory exists
# below the pci-stub driver afterwards.
sub pci_dev_bind_to_stub {
    my ($dev) = @_;

    my $name = $dev->{name};

    my $stubdir = "$pcisysfs/drivers/pci-stub";
    my $bound_dir = "$stubdir/$name";
    return 1 if -d $bound_dir;

    # register the vendor/product id with pci-stub
    return undef if !file_write("$stubdir/new_id", "$dev->{vendor} $dev->{product}");

    # unbind from the current driver; a failed write only counts when
    # the unbind file exists
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    # bind explicitly unless the device got bound in the meantime
    return undef if ! -d $bound_dir && !file_write("$stubdir/bind", $name);

    return -d $bound_dir;
}
3350
# Return the ",bus=pci.<bus>,addr=0x<hex>" suffix for the device id $id,
# or an empty string when $id has no fixed PCI slot.
#
# When $bridges (hash reference) is given, the bus number used by a known
# device is recorded in it as $bridges->{$bus} = 1.
sub print_pci_addr {
    my ($id, $bridges) = @_;

    # device id => [ bus, addr ]
    my %location_of = (
        piix3 => [0, 1],
        # addr 2: first videocard
        balloon0 => [0, 3],
        watchdog => [0, 4],
        scsihw0 => [0, 5],
        scsihw1 => [0, 6],
        ahci0 => [0, 7],
        qga0 => [0, 8],
        virtio0 => [0, 10],
        virtio1 => [0, 11],
        virtio2 => [0, 12],
        virtio3 => [0, 13],
        virtio4 => [0, 14],
        virtio5 => [0, 15],
        hostpci0 => [0, 16],
        hostpci1 => [0, 17],
        net0 => [0, 18],
        net1 => [0, 19],
        net2 => [0, 20],
        net3 => [0, 21],
        net4 => [0, 22],
        net5 => [0, 23],
        # addr 29: usb-host (pve-usb.cfg)
        'pci.1' => [0, 30],
        'pci.2' => [0, 31],
    );

    # net6..net31 occupy addr 1..26 on bus 1
    $location_of{"net$_"} = [1, $_ - 5] foreach (6 .. 31);

    # virtio6..virtio15 occupy addr 1..10 on bus 2
    $location_of{"virtio$_"} = [2, $_ - 5] foreach (6 .. 15);

    my $location = $location_of{$id};
    return '' if !$location;

    my ($bus, $addr) = @$location;
    $bridges->{$bus} = 1 if $bridges;

    return sprintf(",bus=pci.%s,addr=0x%x", $bus, $addr);
}
3428
3429# vzdump restore implementation
3430
# Return the name of the first member of the tar archive $archive.
#
# Dies when the archive file does not exist, when tar cannot be started,
# or when the listing is empty.
sub tar_archive_read_firstfile {
    my $archive = shift;

    die "ERROR: file '$archive' does not exist\n" if ! -f $archive;

    # try to detect archive type first
    # The list form of open runs tar without a shell, so quotes or other
    # shell metacharacters in the archive name cannot break the command.
    my $pid = open(my $fh, '-|', 'tar', 'tf', $archive) ||
        die "unable to open file '$archive'\n";
    my $firstfile = <$fh>;

    # only the first line is needed, so stop tar instead of reading on
    kill 15, $pid;
    close $fh;

    die "ERROR: archive contaions no data\n" if !$firstfile;
    chomp $firstfile;

    return $firstfile;
}
3448
# Remove the volumes listed in $statfile after a failed tar restore.
#
# Each line of the form "vzdump:<name>:<volid>" names one volume: absolute
# paths are unlinked, everything else is released with
# PVE::Storage::vdisk_free() using $storecfg. Failures are reported on
# STDERR and do not stop the cleanup. A missing stat file is ignored.
sub tar_restore_cleanup {
    my ($storecfg, $statfile) = @_;

    print STDERR "starting cleanup\n";

    if (my $fd = IO::File->new($statfile, "r")) {
        while (defined(my $line = <$fd>)) {
            if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                my $volid = $2;
                eval {
                    if ($volid =~ m|^/|) {
                        # parentheses are required: without them '||' binds
                        # to $volid and a failed unlink goes unnoticed
                        unlink($volid) || die "unlink failed - $!\n";
                    } else {
                        PVE::Storage::vdisk_free($storecfg, $volid);
                    }
                    print STDERR "temporary volume '$volid' sucessfuly removed\n";
                };
                print STDERR "unable to cleanup '$volid' - $@" if $@;
            } else {
                print STDERR "unable to parse line in statfile - $line";
            }
        }
        $fd->close();
    }
}
3474
# Restore VM $vmid from $archive, dispatching on the archive format.
#
# The format is taken from $opts->{format} when set; otherwise it is guessed
# from the file name extension, falling back to 'vma'. The compression
# method is always derived from the extension and is only passed on to
# restore_vma_archive().
sub restore_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    # [ file name pattern, format, compression ] - first match wins
    my @known_types = (
        [ qr/\.tgz$/, 'tar', 'gzip' ],
        [ qr/\.tar\.gz$/, 'tar', 'gzip' ],
        [ qr/\.tar$/, 'tar', undef ],
        [ qr/\.tar\.lzo$/, 'tar', 'lzop' ], # dots must be escaped to match literally
        [ qr/\.vma$/, 'vma', undef ],
        [ qr/\.vma\.gz$/, 'vma', 'gzip' ],
        [ qr/\.vma\.lzo$/, 'vma', 'lzop' ],
    );

    my ($guessed, $comp) = ('vma', undef); # default
    foreach my $type (@known_types) {
        my ($pattern, $type_format, $type_comp) = @$type;
        next if $archive !~ $pattern;
        ($guessed, $comp) = ($type_format, $type_comp);
        last;
    }

    # an explicitly requested format takes precedence over the guess
    my $format = $opts->{format} || $guessed;

    if ($format eq 'tar') {
        return restore_tar_archive($archive, $vmid, $user, $opts);
    } else {
        return restore_vma_archive($archive, $vmid, $user, $opts, $comp);
    }
}
3508
# Rewrite one line of an archived VM config for the restored VM and print the
# result to $outfd.
#
# - backup markers, 'lock', 'unusedN' and 'parent' entries are dropped
# - old 1.X 'vlanN' entries are converted to 'netN' entries, numbered with
#   the running counter $cookie->{netcount}
# - with $unique set, 'netN' entries that have a MAC address get a new one
# - drive entries flagged 'backup=no' are commented out; drives listed in
#   $map ({ virtdev => new volume }) are pointed at their new volume
# - everything else is copied unchanged
sub restore_update_config_line {
    my ($outfd, $cookie, $vmid, $map, $line, $unique) = @_;

    foreach my $dropped (qr/^\#qmdump\#/, qr/^\#vzdump\#/, qr/^lock:/,
                         qr/^unused\d+:/, qr/^parent:/) {
        return if $line =~ $dropped;
    }

    if (($line =~ m/^(vlan(\d+)):\s*(\S+)\s*$/)) {
        # try to convert old 1.X settings
        my ($bridge_index, $ethcfg) = ($2, $3);
        foreach my $devconfig (PVE::Tools::split_list($ethcfg)) {
            my ($model, $macaddr) = split(/\=/, $devconfig);
            if (!$macaddr || $unique) {
                $macaddr = PVE::Tools::random_ether_addr();
            }
            my $netstr = print_net({
                model => $model,
                bridge => "vmbr$bridge_index",
                macaddr => $macaddr,
            });

            print $outfd "net$cookie->{netcount}: $netstr\n";
            $cookie->{netcount}++;
        }
    } elsif (($line =~ m/^(net\d+):\s*(\S+)\s*$/) && $unique) {
        my ($netid, $netcfg) = ($1, $2);
        my $net = parse_net($netcfg);
        if ($net->{macaddr}) {
            $net->{macaddr} = PVE::Tools::random_ether_addr();
        }
        my $netstr = print_net($net);
        print $outfd "$netid: $netstr\n";
    } elsif ($line =~ m/^((ide|scsi|virtio|sata)\d+):\s*(\S+)\s*$/) {
        my ($virtdev, $value) = ($1, $3);
        if ($line =~ m/backup=no/) {
            # keep the entry visible, but disabled
            print $outfd "#$line";
        } elsif ($virtdev && $map->{$virtdev}) {
            my $drive = parse_drive($virtdev, $value);
            $drive->{file} = $map->{$virtdev};
            my $newvalue = print_drive($vmid, $drive);
            print $outfd "$virtdev: $newvalue\n";
        } else {
            print $outfd $line;
        }
    } else {
        print $outfd $line;
    }
}
3557
# List the volumes PVE::Storage::vdisk_list() reports for $vmid (storage
# configuration $cfg) and return them as a hash reference keyed by volume id.
# Entries without a volume id or with a false size are left out.
sub scan_volids {
    my ($cfg, $vmid) = @_;

    my $info = PVE::Storage::vdisk_list($cfg, undef, $vmid);

    my %item_of;
    foreach my $items (values %$info) {
        foreach my $item (@$items) {
            next unless $item->{volid} && $item->{size};
            $item_of{$item->{volid}} = $item;
        }
    }

    return \%item_of;
}
3573
# Bring the drive entries of $conf in line with the volumes found on storage.
#
# $volid_hash maps volume ids to volume info (as returned by scan_volids()).
# The size of every non-cdrom drive with a known volume is refreshed, and
# volumes that no drive references (except "vm-$vmid-state-" volumes) are
# added as unused volumes.
#
# Returns a true value only when $conf was actually modified.
sub update_disksize {
    my ($vmid, $conf, $volid_hash) = @_;

    my $changes;

    my $used = {};

    # update size info
    foreach my $opt (keys %$conf) {
        next if !valid_drivename($opt);

        my $drive = parse_drive($opt, $conf->{$opt});
        my $volid = $drive->{file};
        next if !$volid;

        $used->{$volid} = 1;

        next if drive_is_cdrom($drive);
        next if !$volid_hash->{$volid};

        $drive->{size} = $volid_hash->{$volid}->{size};

        # only report a change when the resulting entry really differs, so
        # that callers do not rewrite an unchanged configuration
        my $new = print_drive($vmid, $drive);
        if ($new ne $conf->{$opt}) {
            $changes = 1;
            $conf->{$opt} = $new;
        }
    }

    foreach my $volid (sort keys %$volid_hash) {
        next if $volid =~ m/vm-$vmid-state-/;
        next if $used->{$volid};
        $changes = 1;
        add_unused_volume($conf, $volid);
    }

    return $changes;
}
3608
# Rescan the storages and update the disk entries of one VM ($vmid defined)
# or of all VMs returned by config_list() ($vmid undefined).
#
# Each config is updated under lock_config() unless $nolock is set, in which
# case the update runs directly. A config is only written back when
# update_disksize() reports changes.
sub rescan {
    my ($vmid, $nolock) = @_;

    my $cfg = PVE::Cluster::cfs_read_file("storage.cfg");

    my $volid_hash = scan_volids($cfg, $vmid);

    my $updatefn = sub {
        my ($id) = @_;

        my $conf = load_config($id);

        check_lock($conf);

        if (update_disksize($id, $conf, $volid_hash)) {
            update_config_nolock($id, $conf, 1);
        }
    };

    my @targets = defined($vmid) ? ($vmid) : keys %{config_list()};

    foreach my $id (@targets) {
        if ($nolock) {
            $updatefn->($id);
        } else {
            lock_config($id, $updatefn, $id);
        }
    }
}
3645
# Restore VM $vmid from the VMA archive $archive ('-' reads from STDIN).
#
# $comp selects an optional decompressor ('gzip' or 'lzop'), $user is the
# user whose storage permissions are checked, and $opts may contain
# 'storage' (target storage override), 'pool' and 'unique' (generate new MAC
# addresses).
#
# "vma extract" is started with a fifo as device map source. Once it has
# announced all devices (DEV: lines) and printed its CTIME: line, the target
# volumes are allocated, the device map is written to the fifo and the new
# VM config is prepared in a temporary file. On failure all volumes
# allocated so far are removed again and the error is re-thrown.
sub restore_vma_archive {
    my ($archive, $vmid, $user, $opts, $comp) = @_;

    my $input = $archive eq '-' ? "<&STDIN" : undef;
    my $readfrom = $archive;

    my $uncomp = '';
    if ($comp) {
        $readfrom = '-';
        my $qarchive = PVE::Tools::shellquote($archive);
        if ($comp eq 'gzip') {
            $uncomp = "zcat $qarchive|";
        } elsif ($comp eq 'lzop') {
            $uncomp = "lzop -d -c $qarchive|";
        } else {
            die "unknown compression method '$comp'\n";
        }
    }

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    rmtree $tmpdir;

    # disable interrupts (always do cleanups)
    # Every signal is localized on its own: a chained assignment behind a
    # single 'local' would only restore the first handler on return.
    local $SIG{INT} =
        local $SIG{TERM} =
        local $SIG{QUIT} =
        local $SIG{HUP} = sub { warn "got interrupt - ignored\n"; };

    my $mapfifo = "/var/tmp/vzdumptmp$$.fifo";
    POSIX::mkfifo($mapfifo, 0600);
    my $fifofh;

    # passed to run_command() as 'afterfork' callback
    my $openfifo = sub {
        open($fifofh, '>', $mapfifo) || die $!;
    };

    # the command is a shell pipeline, so the archive name must be quoted
    my $cmd = "${uncomp}vma extract -v -r $mapfifo " .
        PVE::Tools::shellquote($readfrom) . " $tmpdir";

    my $oldtimeout;
    my $timeout = 5;

    # devname => { size, dev_id, ... }, filled from the 'DEV:' output lines
    my $devinfo = {};

    my $rpcenv = PVE::RPCEnvironment::get();

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # Note: $oldconf is undef if VM does not exists
    my $oldconf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid));

    # allocate the target volumes, send the device map through the fifo and
    # write the adapted VM config to $tmpfn
    my $print_devmap = sub {
        my $virtdev_hash = {};

        my $cfgfn = "$tmpdir/qemu-server.conf";

        # we can read the config - that is already extracted
        my $fh = IO::File->new($cfgfn, "r") ||
            die "unable to read qemu-server.conf - $!\n";

        while (defined(my $line = <$fh>)) {
            if ($line =~ m/^\#qmdump\#map:(\S+):(\S+):(\S*):(\S*):$/) {
                my ($virtdev, $devname, $storeid, $format) = ($1, $2, $3, $4);
                die "archive does not contain data for drive '$virtdev'\n"
                    if !$devinfo->{$devname};
                if (defined($opts->{storage})) {
                    $storeid = $opts->{storage} || 'local';
                } elsif (!$storeid) {
                    $storeid = 'local';
                }
                $format = 'raw' if !$format;
                $devinfo->{$devname}->{devname} = $devname;
                $devinfo->{$devname}->{virtdev} = $virtdev;
                $devinfo->{$devname}->{format} = $format;
                $devinfo->{$devname}->{storeid} = $storeid;

                # check permission on storage
                my $pool = $opts->{pool}; # todo: do we need that?
                if ($user ne 'root@pam') {
                    $rpcenv->check($user, "/storage/$storeid", ['Datastore.AllocateSpace']);
                }

                $virtdev_hash->{$virtdev} = $devinfo->{$devname};
            }
        }

        foreach my $devname (keys %$devinfo) {
            die "found no device mapping information for device '$devname'\n"
                if !$devinfo->{$devname}->{virtdev};
        }

        my $cfg = cfs_read_file('storage.cfg');

        # create empty/temp config
        if ($oldconf) {
            PVE::Tools::file_set_contents($conffile, "memory: 128\n");
            foreach_drive($oldconf, sub {
                my ($ds, $drive) = @_;

                return if drive_is_cdrom($drive);

                my $volid = $drive->{file};

                return if !$volid || $volid =~ m|^/|;

                my ($path, $owner) = PVE::Storage::path($cfg, $volid);
                return if !$path || !$owner || ($owner != $vmid);

                # Note: only delete disk we want to restore
                # other volumes will become unused
                if ($virtdev_hash->{$ds}) {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
            });
        }

        my $map = {};
        foreach my $virtdev (sort keys %$virtdev_hash) {
            my $d = $virtdev_hash->{$virtdev};
            # round the device size up to the next multiple of 1024
            my $alloc_size = int(($d->{size} + 1024 - 1)/1024);
            my $scfg = PVE::Storage::storage_config($cfg, $d->{storeid});
            my $volid = PVE::Storage::vdisk_alloc($cfg, $d->{storeid}, $vmid,
                                                  $d->{format}, undef, $alloc_size);
            print STDERR "new volume ID is '$volid'\n";
            # remembered so that the volume can be removed again on failure
            $d->{volid} = $volid;
            my $path = PVE::Storage::path($cfg, $volid);

            my $write_zeros = 1;
            # fixme: what other storages types initialize volumes with zero?
            if ($scfg->{type} eq 'dir' || $scfg->{type} eq 'nfs') {
                $write_zeros = 0;
            }

            print $fifofh "${write_zeros}:$d->{devname}=$path\n";

            print "map '$d->{devname}' to '$path' (write zeros = ${write_zeros})\n";
            $map->{$virtdev} = $volid;
        }

        $fh->seek(0, 0) || die "seek failed - $!\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined(my $line = <$fh>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $fh->close();
        $outfd->close();
    };

    eval {
        # enable interrupts
        local $SIG{INT} =
            local $SIG{TERM} =
            local $SIG{QUIT} =
            local $SIG{HUP} =
            local $SIG{PIPE} = sub { die "interrupted by signal\n"; };
        local $SIG{ALRM} = sub { die "got timeout\n"; };

        $oldtimeout = alarm($timeout);

        my $parser = sub {
            my $line = shift;

            print "$line\n";

            if ($line =~ m/^DEV:\sdev_id=(\d+)\ssize:\s(\d+)\sdevname:\s(\S+)$/) {
                my ($dev_id, $size, $devname) = ($1, $2, $3);
                $devinfo->{$devname} = { size => $size, dev_id => $dev_id };
            } elsif ($line =~ m/^CTIME: /) {
                $print_devmap->();
                print $fifofh "done\n";
                # the device map is sent - restore the previous alarm
                my $tmp = $oldtimeout || 0;
                $oldtimeout = undef;
                alarm($tmp);
                close($fifofh);
            }
        };

        print "restore vma archive: $cmd\n";
        run_command($cmd, input => $input, outfunc => $parser, afterfork => $openfifo);
    };
    my $err = $@;

    alarm($oldtimeout) if $oldtimeout;

    unlink $mapfifo;

    if ($err) {
        rmtree $tmpdir;
        unlink $tmpfn;

        my $cfg = cfs_read_file('storage.cfg');
        foreach my $devname (keys %$devinfo) {
            my $volid = $devinfo->{$devname}->{volid};
            next if !$volid;
            eval {
                if ($volid =~ m|^/|) {
                    # parentheses are required: without them '||' binds to
                    # $volid and a failed unlink goes unnoticed
                    unlink($volid) || die "unlink failed - $!\n";
                } else {
                    PVE::Storage::vdisk_free($cfg, $volid);
                }
                print STDERR "temporary volume '$volid' sucessfuly removed\n";
            };
            print STDERR "unable to cleanup '$volid' - $@" if $@;
        }
        die $err;
    }

    rmtree $tmpdir;

    rename($tmpfn, $conffile) ||
        die "unable to commit configuration file '$conffile'\n";

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
3866
# Restore VM $vmid from the tar based vzdump archive $archive ('-' reads
# from STDIN).
#
# $user is passed to the extraction helper through the environment. $opts
# may contain 'storage', 'pool', 'prealloc', 'info' (passed on to
# qmextract) and 'unique' (generate new MAC addresses).
#
# An existing VM is destroyed first (keeping an empty config). The archive
# is unpacked through /usr/lib/qemu-server/qmextract, the volume mapping it
# records in qmrestore.stat is applied to the archived config, and the
# result replaces the VM config. On failure the volumes listed in the stat
# file are removed again and the error is re-thrown.
sub restore_tar_archive {
    my ($archive, $vmid, $user, $opts) = @_;

    if ($archive ne '-') {
        my $firstfile = tar_archive_read_firstfile($archive);
        die "ERROR: file '$archive' dos not lock like a QemuServer vzdump backup\n"
            if $firstfile ne 'qemu-server.conf';
    }

    my $storecfg = cfs_read_file('storage.cfg');

    # destroy existing data - keep empty config
    my $vmcfgfn = PVE::QemuServer::config_file($vmid);
    destroy_vm($storecfg, $vmid, 1) if -f $vmcfgfn;

    my $tocmd = "/usr/lib/qemu-server/qmextract";

    $tocmd .= " --storage " . PVE::Tools::shellquote($opts->{storage}) if $opts->{storage};
    $tocmd .= " --pool " . PVE::Tools::shellquote($opts->{pool}) if $opts->{pool};
    $tocmd .= ' --prealloc' if $opts->{prealloc};
    $tocmd .= ' --info' if $opts->{info};

    # tar option "xf" does not autodetect compression when read from STDIN,
    # so we pipe to zcat
    my $cmd = "zcat -f|tar xf " . PVE::Tools::shellquote($archive) . " " .
        PVE::Tools::shellquote("--to-command=$tocmd");

    my $tmpdir = "/var/tmp/vzdumptmp$$";
    mkpath $tmpdir;

    local $ENV{VZDUMP_TMPDIR} = $tmpdir;
    local $ENV{VZDUMP_VMID} = $vmid;
    local $ENV{VZDUMP_USER} = $user;

    my $conffile = config_file($vmid);
    my $tmpfn = "$conffile.$$.tmp";

    # disable interrupts (always do cleanups)
    # Every signal is localized on its own: a chained assignment behind a
    # single 'local' would only restore the first handler on return.
    local $SIG{INT} =
        local $SIG{TERM} =
        local $SIG{QUIT} =
        local $SIG{HUP} = sub { print STDERR "got interrupt - ignored\n"; };

    eval {
        # enable interrupts
        local $SIG{INT} =
            local $SIG{TERM} =
            local $SIG{QUIT} =
            local $SIG{HUP} =
            local $SIG{PIPE} = sub { die "interrupted by signal\n"; };

        if ($archive eq '-') {
            print "extracting archive from STDIN\n";
            run_command($cmd, input => "<&STDIN");
        } else {
            print "extracting archive '$archive'\n";
            run_command($cmd);
        }

        # this only leaves the eval block - no new config is written
        return if $opts->{info};

        # read new mapping
        my $map = {};
        my $statfile = "$tmpdir/qmrestore.stat";
        if (my $fd = IO::File->new($statfile, "r")) {
            while (defined (my $line = <$fd>)) {
                if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                    $map->{$1} = $2 if $1;
                } else {
                    print STDERR "unable to parse line in statfile - $line\n";
                }
            }
            $fd->close();
        }

        my $confsrc = "$tmpdir/qemu-server.conf";

        my $srcfd = IO::File->new($confsrc, "r") ||
            die "unable to open file '$confsrc'\n";

        my $outfd = IO::File->new($tmpfn, "w") ||
            die "unable to write config for VM $vmid\n";

        my $cookie = { netcount => 0 };
        while (defined (my $line = <$srcfd>)) {
            restore_update_config_line($outfd, $cookie, $vmid, $map, $line, $opts->{unique});
        }

        $srcfd->close();
        $outfd->close();
    };
    my $err = $@;

    if ($err) {

        unlink $tmpfn;

        tar_restore_cleanup($storecfg, "$tmpdir/qmrestore.stat") if !$opts->{info};

        die $err;
    }

    rmtree $tmpdir;

    # With 'info' set no temporary config was written, so there is nothing
    # to commit. The parentheses around the rename arguments are required:
    # without them '||' binds to $conffile and a failure goes unnoticed.
    if (!$opts->{info}) {
        rename($tmpfn, $conffile) ||
            die "unable to commit configuration file '$conffile'\n";
    }

    PVE::Cluster::cfs_update(); # make sure we read new file

    eval { rescan($vmid, 1); };
    warn $@ if $@;
}
3976
3977
3978# Internal snapshots
3979
3980# NOTE: Snapshot create/delete involves several non-atomic
3981# actions, and can take a long time.
3982# So we try to avoid locking the file and use 'lock' variable
3983# inside the config file instead.
3984
# Copy all settings from the hash $source into the hash $dest, except for
# the snapshot bookkeeping keys, 'lock', 'digest', 'description' and the
# 'unusedN' entries.
my $snapshot_copy_config = sub {
    my ($source, $dest) = @_;

    my %not_copied = map { $_ => 1 }
        qw(snapshots snapstate snaptime vmstate lock digest description);

    my @copied = grep { !$not_copied{$_} && $_ !~ m/^unused\d+$/ } keys %$source;

    foreach my $key (@copied) {
        $dest->{$key} = $source->{$key};
    }
};
4001
# Build the config that results from applying the snapshot settings $snap to
# the current config $conf: the snapshot list, the description and the
# unused disks are taken from $conf, everything else from $snap (as copied
# by $snapshot_copy_config). Returns the new config hash; $conf is not
# modified.
my $snapshot_apply_config = sub {
    my ($conf, $snap) = @_;

    # copy snapshot list
    my $newconf = { snapshots => $conf->{snapshots} };

    # keep description and list of unused disks
    foreach my $key (keys %$conf) {
        if ($key eq 'description' || $key =~ m/^unused\d+$/) {
            $newconf->{$key} = $conf->{$key};
        }
    }

    $snapshot_copy_config->($snap, $newconf);

    return $newconf;
};
4020
# Call $func->($storeid) once for every storage referenced by a non-cdrom
# drive of $conf, in sorted order of the storage ids. Drives whose volume id
# does not yield a storage id are ignored.
sub foreach_writable_storage {
    my ($conf, $func) = @_;

    my %storage_seen;

    foreach my $ds (keys %$conf) {
        next unless valid_drivename($ds);

        my $drive = parse_drive($ds, $conf->{$ds});
        next if !$drive || drive_is_cdrom($drive);

        # second argument 1: passed through unchanged from the original call
        my ($sid) = PVE::Storage::parse_volume_id($drive->{file}, 1);
        $storage_seen{$sid} = 1 if $sid;
    }

    foreach my $sid (sort keys %storage_seen) {
        $func->($sid);
    }
}
4043
# Allocate a raw volume for the saved VM state of snapshot $snapname and
# return its volume id.
#
# The target storage is chosen from the storages used by the drives of
# $conf: shared storages are searched first, then non-shared ones, and
# 'local' is the fallback. Within each group a storage with a 'path'
# setting is preferred.
my $alloc_vmstate_volid = sub {
    my ($storecfg, $vmid, $conf, $snapname) = @_;

    # Note: we try to be smart when selecting a $target storage

    # pick a storage among those whose 'shared' flag matches $want_shared
    my $find_storage = sub {
        my ($want_shared) = @_;

        my $found;
        foreach_writable_storage($conf, sub {
            my ($sid) = @_;
            my $scfg = PVE::Storage::storage_config($storecfg, $sid);
            return if ($scfg->{shared} xor $want_shared);

            $found = $sid if !$found || $scfg->{path}; # prefer file based storage
        });

        return $found;
    };

    # shared storage first, then local storage, then the default
    my $target = $find_storage->(1) || $find_storage->(0) || 'local';

    # extra space reserved for the driver state, in the same unit as
    # $conf->{memory} (NOTE(review): an older comment claimed 32MB here,
    # but the value is 500 - confirm what is intended)
    my $driver_state_size = 500;
    # we abort live save after $conf->{memory}, so we need at max twice that space
    my $size = $conf->{memory}*2 + $driver_state_size;

    my $scfg = PVE::Storage::storage_config($storecfg, $target);
    my $name = "vm-$vmid-state-$snapname";
    $name .= ".raw" if $scfg->{path}; # add filename extension for file base storage

    return PVE::Storage::vdisk_alloc($storecfg, $target, $vmid, 'raw', $name, $size*1024);
};
4084
# First phase of snapshot creation, executed under the config lock: set
# lock 'snapshot' in the VM config and register the new snapshot
# $snapname (a copy of the current settings, snapstate 'prepare', current
# time, optional description $comment). A vmstate volume is allocated when
# $save_vmstate is set and the VM is running.
#
# Dies for templates, locked configs, already used snapshot names and when
# the snapshot feature is not available. Returns the new snapshot entry.
my $snapshot_prepare = sub {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap;

    lock_config($vmid, sub {

        my $conf = load_config($vmid);

        if (is_template($conf)) {
            die "you can't take a snapshot if it's a template\n";
        }

        check_lock($conf);

        $conf->{lock} = 'snapshot';

        if (defined($conf->{snapshots}->{$snapname})) {
            die "snapshot name '$snapname' already used\n";
        }

        my $storecfg = PVE::Storage::config();
        if (!has_feature('snapshot', $conf, $storecfg)) {
            die "snapshot feature is not available";
        }

        $snap = {};
        $conf->{snapshots}->{$snapname} = $snap;

        if ($save_vmstate && check_running($vmid)) {
            $snap->{vmstate} = $alloc_vmstate_volid->($storecfg, $vmid, $conf, $snapname);
        }

        $snapshot_copy_config->($conf, $snap);

        $snap->{snapstate} = "prepare";
        $snap->{snaptime} = time();
        $snap->{description} = $comment if $comment;

        update_config_nolock($vmid, $conf, 1);
    });

    return $snap;
};
4126
# Final phase of snapshot creation, executed under the config lock: verify
# that the config carries lock 'snapshot' and that snapshot $snapname is in
# state 'prepare', then clear both markers and write a config that has the
# snapshot settings applied and $snapname as parent.
my $snapshot_commit = sub {
    my ($vmid, $snapname) = @_;

    lock_config($vmid, sub {

        my $conf = load_config($vmid);

        die "missing snapshot lock\n"
            unless $conf->{lock} && $conf->{lock} eq 'snapshot';

        my $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        die "wrong snapshot state\n"
            unless $snap->{snapstate} && $snap->{snapstate} eq "prepare";

        delete $snap->{snapstate};
        delete $conf->{lock};

        my $newconf = $snapshot_apply_config->($conf, $snap);

        $newconf->{parent} = $snapname;

        update_config_nolock($vmid, $newconf, 1);
    });
};
4156
# Roll VM $vmid back to snapshot $snapname.
#
# Runs in three steps:
# 1. under the config lock: validate the snapshot, stop the VM and set
#    lock 'rollback'
# 2. roll back the volume of every non-cdrom drive of the snapshot
# 3. under the config lock: remove the lock, replace the current config with
#    the snapshot config and, if the snapshot has a vmstate, start the VM
#    from that state
sub snapshot_rollback {
    my ($vmid, $snapname) = @_;

    my $storecfg = PVE::Storage::config();

    my $snap;

    # true during step 1, false during step 3
    my $prepare = 1;

    my $updatefn = sub {

        my $conf = load_config($vmid);

        die "you can't rollback if vm is a template\n" if is_template($conf);

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        die "unable to rollback to incomplete snapshot (snapstate = $snap->{snapstate})\n"
            if $snap->{snapstate};

        if ($prepare) {
            check_lock($conf);
            vm_stop($storecfg, $vmid, undef, undef, 5, undef, undef);
        }

        die "unable to rollback vm $vmid: vm is running\n"
            if check_running($vmid);

        if ($prepare) {
            $conf->{lock} = 'rollback';
        } else {
            die "got wrong lock\n"
                unless $conf->{lock} && $conf->{lock} eq 'rollback';
            delete $conf->{lock};

            # copy snapshot config to current config
            $conf = $snapshot_apply_config->($conf, $snap);
            $conf->{parent} = $snapname;
        }

        update_config_nolock($vmid, $conf, 1);

        if (!$prepare && $snap->{vmstate}) {
            my $statefile = PVE::Storage::path($storecfg, $snap->{vmstate});
            vm_start($storecfg, $vmid, $statefile);
        }
    };

    lock_config($vmid, $updatefn);

    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        PVE::Storage::volume_snapshot_rollback($storecfg, $drive->{file}, $snapname);
    });

    $prepare = 0;
    lock_config($vmid, $updatefn);
}
4224
# Poll "query-savevm" for VM $vmid once per second until the reported
# status is 'completed'. Dies when no status is reported or when the status
# is anything other than 'active' or 'completed'.
my $savevm_wait = sub {
    my ($vmid) = @_;

    while (1) {
        my $stat = vm_mon_cmd_nocheck($vmid, "query-savevm");
        my $status = $stat->{status};

        die "savevm not active\n" if !$status;

        last if $status eq 'completed';

        die "query-savevm returned status '$status'\n" if $status ne 'active';

        sleep(1);
    }
};
4242
# Create snapshot $snapname of VM $vmid.
#
# $save_vmstate requests saving the state of a running VM, $freezefs
# requests a guest filesystem freeze while the drive snapshots are taken and
# $comment becomes the snapshot description.
#
# The snapshot is registered with $snapshot_prepare, then the VM state is
# saved (if a vmstate volume was allocated) and every non-cdrom drive is
# snapshotted. On success the snapshot is committed; on failure the drive
# snapshots created so far are removed again and the error is re-thrown.
sub snapshot_create {
    my ($vmid, $snapname, $save_vmstate, $freezefs, $comment) = @_;

    my $snap = &$snapshot_prepare($vmid, $snapname, $save_vmstate, $comment);

    # no vmstate volume was allocated (state saving was not requested or the
    # vm is not running), so there is nothing to freeze or save
    $freezefs = $save_vmstate = 0 if !$snap->{vmstate};

    # drives that already got their snapshot - needed for cleanup on error
    my $drivehash = {};

    my $running = check_running($vmid);

    eval {
        # create internal snapshots of all drives

        my $storecfg = PVE::Storage::config();

        if ($running) {
            if ($snap->{vmstate}) {
                my $path = PVE::Storage::path($storecfg, $snap->{vmstate});
                vm_mon_cmd($vmid, "savevm-start", statefile => $path);
                &$savevm_wait($vmid);
            } else {
                vm_mon_cmd($vmid, "savevm-start");
            }
        }

        qga_freezefs($vmid) if $running && $freezefs;

        foreach_drive($snap, sub {
            my ($ds, $drive) = @_;

            return if drive_is_cdrom($drive);

            my $volid = $drive->{file};
            my $device = "drive-$ds";

            qemu_volume_snapshot($vmid, $device, $storecfg, $volid, $snapname);
            $drivehash->{$ds} = 1;
        });
    };
    my $err = $@;

    # Counterpart of qga_freezefs() above. The previous spelling
    # 'gqa_unfreezefs' did not match that name, so the call presumably
    # always failed inside this eval and the thaw never ran.
    eval { qga_unfreezefs($vmid) if $running && $freezefs; };
    warn $@ if $@;

    eval { vm_mon_cmd($vmid, "savevm-end") if $running; };
    warn $@ if $@;

    if ($err) {
        warn "snapshot create failed: starting cleanup\n";
        eval { snapshot_delete($vmid, $snapname, 0, $drivehash); };
        warn $@ if $@;
        die $err;
    }

    &$snapshot_commit($vmid, $snapname);
}
4300
# Delete snapshot $snapname of VM $vmid.
#
# With $force set, errors while removing the vmstate volume or a drive
# snapshot are only warned about, and the intermediate config updates are
# skipped.
#
# Note: $drivehash is only set when called from snapshot_create. In that
# case the lock and template checks are skipped, only the drives listed in
# it have their snapshot removed, and the config lock is cleared at the end.
sub snapshot_delete {
    my ($vmid, $snapname, $force, $drivehash) = @_;

    # true until the final config cleanup
    my $prepare = 1;

    my $snap;
    my $unused = [];

    # let a 'parent' reference to the deleted snapshot point to $new_parent,
    # or drop it when there is none
    my $unlink_parent = sub {
        my ($confref, $new_parent) = @_;

        return unless $confref->{parent} && $confref->{parent} eq $snapname;

        if ($new_parent) {
            $confref->{parent} = $new_parent;
        } else {
            delete $confref->{parent};
        }
    };

    # config update, always run under the config lock; $remove_drive names
    # the snapshot entry ('vmstate' or a drive) that was just cleaned up
    my $updatefn = sub {
        my ($remove_drive) = @_;

        my $conf = load_config($vmid);

        if (!$drivehash) {
            check_lock($conf);
            die "you can't delete a snapshot if vm is a template\n"
                if is_template($conf);
        }

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        # remove parent refs
        $unlink_parent->($conf, $snap->{parent});
        foreach my $other (keys %{$conf->{snapshots}}) {
            next if $other eq $snapname;
            $unlink_parent->($conf->{snapshots}->{$other}, $snap->{parent});
        }

        if ($remove_drive) {
            my $removed = delete $snap->{$remove_drive};
            if ($remove_drive ne 'vmstate') {
                # the volume of a removed drive entry becomes unused
                my $drive = parse_drive($remove_drive, $removed);
                add_unused_volume($conf, $drive->{file});
            }
        }

        if ($prepare) {
            $snap->{snapstate} = 'delete';
        } else {
            delete $conf->{snapshots}->{$snapname};
            delete $conf->{lock} if $drivehash;
            add_unused_volume($conf, $_) foreach @$unused;
        }

        update_config_nolock($vmid, $conf, 1);
    };

    lock_config($vmid, $updatefn);

    # now remove vmstate file

    my $storecfg = PVE::Storage::config();

    if ($snap->{vmstate}) {
        eval { PVE::Storage::vdisk_free($storecfg, $snap->{vmstate}); };
        if (my $err = $@) {
            die $err if !$force;
            warn $err;
        }
        # save changes (remove vmstate from snapshot)
        lock_config($vmid, $updatefn, 'vmstate') if !$force;
    }

    # now remove all internal snapshots
    foreach_drive($snap, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        my $volid = $drive->{file};

        if (!$drivehash || $drivehash->{$ds}) {
            eval {
                qemu_volume_snapshot_delete($vmid, "drive-$ds", $storecfg, $volid, $snapname);
            };
            if (my $err = $@) {
                die $err if !$force;
                warn $err;
            }
        }

        # save changes (remove drive from snapshot)
        lock_config($vmid, $updatefn, $ds) if !$force;
        push @$unused, $volid;
    });

    # now cleanup config
    $prepare = 0;
    lock_config($vmid, $updatefn);
}
4410
# Return a true value when every non-cdrom drive of $conf is on a volume for
# which PVE::Storage::volume_has_feature() confirms $feature (checked with
# the optional $snapname and $running), and a false value otherwise.
sub has_feature {
    my ($feature, $conf, $storecfg, $snapname, $running) = @_;

    my $unsupported = 0;

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        $unsupported = 1
            if !PVE::Storage::volume_has_feature($storecfg, $feature, $drive->{file}, $snapname, $running);
    });

    return !$unsupported;
}
4425
# Convert the disks of VM $vmid into base images. With $disk set only that
# drive is converted, otherwise all non-cdrom drives.
#
# Dies when the VM is running or when one of the affected volumes does not
# support the 'template' feature; that check covers all affected volumes
# before the first one is converted. The config is written after every
# converted drive. Existing snapshot entries and the parent reference are
# removed from the config at the end.
sub template_create {
    my ($vmid, $conf, $disk) = @_;

    die "you can't convert a vm to template if vm is running vm\n"
        if check_running($vmid);

    my $storecfg = PVE::Storage::config();

    # true for the drives this call has to convert
    my $is_selected = sub {
        my ($ds, $drive) = @_;

        return 0 if drive_is_cdrom($drive);
        return 0 if $disk && $ds ne $disk;
        return 1;
    };

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        return if !$is_selected->($ds, $drive);

        my $volid = $drive->{file};
        die "volume '$volid' does not support template/clone\n"
            if !PVE::Storage::volume_has_feature($storecfg, 'template', $volid);
    });

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        return if !$is_selected->($ds, $drive);

        $drive->{file} = PVE::Storage::vdisk_create_base($storecfg, $drive->{file});
        $conf->{$ds} = PVE::QemuServer::print_drive($vmid, $drive);
        PVE::QemuServer::update_config_nolock($vmid, $conf, 1);
    });

    if ($conf->{snapshots}) {
        delete $conf->{parent};
        delete $conf->{snapshots};
        PVE::QemuServer::update_config_nolock($vmid, $conf, 1);
        #fixme : do we need to delete disks snapshots ?
    }
}
4466
# Classify $conf by the number of non-cdrom drives whose volume is a base
# image according to PVE::Storage::volume_is_base():
#   0 - no base image
#   1 - all volumes are base images (full template)
#   2 - only some volumes are base images (semi-template)
sub is_template {
    my ($conf) = @_;

    my $storecfg = PVE::Storage::config();

    my ($base_count, $volume_count) = (0, 0);

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        $volume_count++;
        $base_count++ if PVE::Storage::volume_is_base($storecfg, $drive->{file});
    });

    return 0 if !$base_count;

    # $base_count can never exceed $volume_count here
    return $base_count == $volume_count ? 1 : 2;
}
4489
44901;