]> git.proxmox.com Git - qemu-server.git/blame - PVE/QemuServer.pm
fix cdrom permission check
[qemu-server.git] / PVE / QemuServer.pm
CommitLineData
1e3baf05
DM
1package PVE::QemuServer;
2
3use strict;
4use POSIX;
5use IO::Handle;
6use IO::Select;
7use IO::File;
8use IO::Dir;
9use IO::Socket::UNIX;
10use File::Basename;
11use File::Path;
12use File::stat;
13use Getopt::Long;
14use Digest::SHA1;
15use Fcntl ':flock';
16use Cwd 'abs_path';
17use IPC::Open3;
18use Fcntl;
19use PVE::SafeSyslog;
20use Storable qw(dclone);
21use PVE::Exception qw(raise raise_param_exc);
22use PVE::Storage;
23use PVE::Tools qw(run_command lock_file file_read_firstline);
24use PVE::Cluster qw(cfs_register_file cfs_read_file cfs_write_file cfs_lock_file);
25use PVE::INotify;
26use PVE::ProcFSTools;
6b64503e 27use Time::HiRes qw(gettimeofday);
1e3baf05 28
7f0b5beb 29my $cpuinfo = PVE::ProcFSTools::read_cpuinfo();
1e3baf05 30
# Note about locking: we use flock on the config file to protect
# against concurrent actions.
# Additionally, we have a 'lock' setting in the config file. This
# can be set to 'migrate' or 'backup'. Most actions are not
# allowed when such a lock is set. But you can ignore this kind of
# lock with the --skiplock flag.
37
1858638f
DM
38cfs_register_file('/qemu-server/',
39 \&parse_vm_config,
40 \&write_vm_config);
1e3baf05 41
3ea94c60
DM
42PVE::JSONSchema::register_standard_option('skiplock', {
43 description => "Ignore locks - only root is allowed to use this option.",
afdb31d5 44 type => 'boolean',
3ea94c60
DM
45 optional => 1,
46});
47
48PVE::JSONSchema::register_standard_option('pve-qm-stateuri', {
49 description => "Some command save/restore state from this location.",
50 type => 'string',
51 maxLength => 128,
52 optional => 1,
53});
54
1e3baf05
DM
55#no warnings 'redefine';
56
57unless(defined(&_VZSYSCALLS_H_)) {
58 eval 'sub _VZSYSCALLS_H_ () {1;}' unless defined(&_VZSYSCALLS_H_);
59 require 'sys/syscall.ph';
60 if(defined(&__x86_64__)) {
61 eval 'sub __NR_fairsched_vcpus () {499;}' unless defined(&__NR_fairsched_vcpus);
62 eval 'sub __NR_fairsched_mknod () {504;}' unless defined(&__NR_fairsched_mknod);
63 eval 'sub __NR_fairsched_rmnod () {505;}' unless defined(&__NR_fairsched_rmnod);
64 eval 'sub __NR_fairsched_chwt () {506;}' unless defined(&__NR_fairsched_chwt);
65 eval 'sub __NR_fairsched_mvpr () {507;}' unless defined(&__NR_fairsched_mvpr);
66 eval 'sub __NR_fairsched_rate () {508;}' unless defined(&__NR_fairsched_rate);
67 eval 'sub __NR_setluid () {501;}' unless defined(&__NR_setluid);
68 eval 'sub __NR_setublimit () {502;}' unless defined(&__NR_setublimit);
69 }
70 elsif(defined( &__i386__) ) {
71 eval 'sub __NR_fairsched_mknod () {500;}' unless defined(&__NR_fairsched_mknod);
72 eval 'sub __NR_fairsched_rmnod () {501;}' unless defined(&__NR_fairsched_rmnod);
73 eval 'sub __NR_fairsched_chwt () {502;}' unless defined(&__NR_fairsched_chwt);
74 eval 'sub __NR_fairsched_mvpr () {503;}' unless defined(&__NR_fairsched_mvpr);
75 eval 'sub __NR_fairsched_rate () {504;}' unless defined(&__NR_fairsched_rate);
76 eval 'sub __NR_fairsched_vcpus () {505;}' unless defined(&__NR_fairsched_vcpus);
77 eval 'sub __NR_setluid () {511;}' unless defined(&__NR_setluid);
78 eval 'sub __NR_setublimit () {512;}' unless defined(&__NR_setublimit);
79 } else {
80 die("no fairsched syscall for this arch");
81 }
82 require 'asm/ioctl.ph';
83 eval 'sub KVM_GET_API_VERSION () { &_IO(0xAE, 0x);}' unless defined(&KVM_GET_API_VERSION);
84}
85
# Thin wrapper around the fairsched_mknod syscall.
# $parent, $weight and $desired are coerced to integers before the call.
# Returns the raw result of syscall().
sub fairsched_mknod {
    my ($parent, $weight, $desired) = @_;

    my @int_args = map { int($_) } ($parent, $weight, $desired);

    return syscall(__NR_fairsched_mknod(), @int_args);
}
91
# Thin wrapper around the fairsched_rmnod syscall.
# $id is coerced to an integer; returns the raw result of syscall().
sub fairsched_rmnod {
    my ($id) = @_;

    my $node_id = int($id);

    return syscall(__NR_fairsched_rmnod(), $node_id);
}
97
# Thin wrapper around the fairsched_mvpr syscall.
# Both $pid and $newid are coerced to integers; returns the raw result
# of syscall().
sub fairsched_mvpr {
    my ($pid, $newid) = @_;

    my @int_args = map { int($_) } ($pid, $newid);

    return syscall(__NR_fairsched_mvpr(), @int_args);
}
103
# Thin wrapper around the fairsched_vcpus syscall.
# $id and $vcpus are coerced to integers; returns the raw result of
# syscall().
sub fairsched_vcpus {
    my ($id, $vcpus) = @_;

    my @int_args = map { int($_) } ($id, $vcpus);

    return syscall(__NR_fairsched_vcpus(), @int_args);
}
109
# Thin wrapper around the fairsched_rate syscall.
# $op is expected to be one of the FAIRSCHED_*_RATE constants; all three
# arguments are coerced to integers. Returns the raw result of syscall().
sub fairsched_rate {
    my ($id, $op, $rate) = @_;

    my @int_args = map { int($_) } ($id, $op, $rate);

    return syscall(__NR_fairsched_rate(), @int_args);
}
115
116use constant FAIRSCHED_SET_RATE => 0;
117use constant FAIRSCHED_DROP_RATE => 1;
118use constant FAIRSCHED_GET_RATE => 2;
119
# Apply a CPU limit (given in percent) to fair-scheduler node $id.
# The percentage is rescaled to units of 1/1024 and truncated to an
# integer. A resulting rate of 0 drops the rate limit instead of setting it.
# Returns the result of fairsched_rate().
sub fairsched_cpulimit {
    my ($id, $limit) = @_;

    my $rate = int($limit * 1024 / 100);

    return fairsched_rate($id, FAIRSCHED_DROP_RATE, $rate) if !$rate;

    return fairsched_rate($id, FAIRSCHED_SET_RATE, $rate);
}
128
129my $nodename = PVE::INotify::nodename();
130
131mkdir "/etc/pve/nodes/$nodename";
132my $confdir = "/etc/pve/nodes/$nodename/qemu-server";
133mkdir $confdir;
134
135my $var_run_tmpdir = "/var/run/qemu-server";
136mkdir $var_run_tmpdir;
137
138my $lock_dir = "/var/lock/qemu-server";
139mkdir $lock_dir;
140
141my $pcisysfs = "/sys/bus/pci";
142
1e3baf05
DM
143my $confdesc = {
144 onboot => {
145 optional => 1,
146 type => 'boolean',
147 description => "Specifies whether a VM will be started during system bootup.",
148 default => 0,
149 },
150 autostart => {
151 optional => 1,
152 type => 'boolean',
153 description => "Automatic restart after crash (currently ignored).",
154 default => 0,
155 },
2ff09f52
DA
156 hotplug => {
157 optional => 1,
e8b9c17c 158 type => 'boolean',
2ff09f52
DA
159 description => "Activate hotplug for disk and network device",
160 default => 0,
161 },
1e3baf05
DM
162 reboot => {
163 optional => 1,
164 type => 'boolean',
165 description => "Allow reboot. If set to '0' the VM exit on reboot.",
166 default => 1,
167 },
168 lock => {
169 optional => 1,
170 type => 'string',
171 description => "Lock/unlock the VM.",
172 enum => [qw(migrate backup)],
173 },
174 cpulimit => {
175 optional => 1,
176 type => 'integer',
177 description => "Limit of CPU usage in per cent. Note if the computer has 2 CPUs, it has total of 200% CPU time. Value '0' indicates no CPU limit.\n\nNOTE: This option is currently ignored.",
178 minimum => 0,
179 default => 0,
180 },
181 cpuunits => {
182 optional => 1,
183 type => 'integer',
184 description => "CPU weight for a VM. Argument is used in the kernel fair scheduler. The larger the number is, the more CPU time this VM gets. Number is relative to weights of all the other running VMs.\n\nNOTE: You can disable fair-scheduler configuration by setting this to 0.",
185 minimum => 0,
186 maximum => 500000,
187 default => 1000,
188 },
189 memory => {
190 optional => 1,
191 type => 'integer',
7878afeb 192 description => "Amount of RAM for the VM in MB. This is the maximum available memory when you use the balloon device.",
1e3baf05
DM
193 minimum => 16,
194 default => 512,
195 },
13a48620
DA
196 balloon => {
197 optional => 1,
198 type => 'integer',
199 description => "Amount of target RAM for the VM in MB.",
7878afeb 200 minimum => 16,
13a48620 201 },
1e3baf05
DM
202 keyboard => {
203 optional => 1,
204 type => 'string',
205 description => "Keybord layout for vnc server. Default is read from the datacenter configuration file.",
e95fe75f 206 enum => PVE::Tools::kvmkeymaplist(),
1e3baf05
DM
207 default => 'en-us',
208 },
209 name => {
210 optional => 1,
211 type => 'string',
212 description => "Set a name for the VM. Only used on the configuration web interface.",
213 },
214 description => {
215 optional => 1,
216 type => 'string',
217 description => "Description for the VM. Only used on the configuration web interface.",
218 },
219 ostype => {
220 optional => 1,
221 type => 'string',
222 enum => [qw(other wxp w2k w2k3 w2k8 wvista win7 l24 l26)],
223 description => <<EODESC,
224Used to enable special optimization/features for specific
225operating systems:
226
227other => unspecified OS
228wxp => Microsoft Windows XP
229w2k => Microsoft Windows 2000
230w2k3 => Microsoft Windows 2003
231w2k8 => Microsoft Windows 2008
232wvista => Microsoft Windows Vista
233win7 => Microsoft Windows 7
234l24 => Linux 2.4 Kernel
235l26 => Linux 2.6/3.X Kernel
236
237other|l24|l26 ... no special behaviour
238wxp|w2k|w2k3|w2k8|wvista|win7 ... use --localtime switch
239EODESC
240 },
241 boot => {
242 optional => 1,
243 type => 'string',
244 description => "Boot on floppy (a), hard disk (c), CD-ROM (d), or network (n).",
245 pattern => '[acdn]{1,4}',
32baffb4 246 default => 'cdn',
1e3baf05
DM
247 },
248 bootdisk => {
249 optional => 1,
250 type => 'string', format => 'pve-qm-bootdisk',
251 description => "Enable booting from specified disk.",
252 pattern => '(ide|scsi|virtio)\d+',
253 },
254 smp => {
255 optional => 1,
256 type => 'integer',
257 description => "The number of CPUs. Please use option -sockets instead.",
258 minimum => 1,
259 default => 1,
260 },
261 sockets => {
262 optional => 1,
263 type => 'integer',
264 description => "The number of CPU sockets.",
265 minimum => 1,
266 default => 1,
267 },
268 cores => {
269 optional => 1,
270 type => 'integer',
271 description => "The number of cores per socket.",
272 minimum => 1,
273 default => 1,
274 },
275 acpi => {
276 optional => 1,
277 type => 'boolean',
278 description => "Enable/disable ACPI.",
279 default => 1,
280 },
281 kvm => {
282 optional => 1,
283 type => 'boolean',
284 description => "Enable/disable KVM hardware virtualization.",
285 default => 1,
286 },
287 tdf => {
288 optional => 1,
289 type => 'boolean',
da21653b 290 description => "Enable/disable time drift fix. This is ignored for kvm versions newer that 1.0 (not needed anymore).",
1e3baf05
DM
291 default => 1,
292 },
19672434 293 localtime => {
1e3baf05
DM
294 optional => 1,
295 type => 'boolean',
296 description => "Set the real time clock to local time. This is enabled by default if ostype indicates a Microsoft OS.",
297 },
298 freeze => {
299 optional => 1,
300 type => 'boolean',
301 description => "Freeze CPU at startup (use 'c' monitor command to start execution).",
302 },
303 vga => {
304 optional => 1,
305 type => 'string',
306 description => "Select VGA type. If you want to use high resolution modes (>= 1280x1024x16) then you should use option 'std' or 'vmware'. Default is 'std' for win7/w2k8, and 'cirrur' for other OS types",
307 enum => [qw(std cirrus vmware)],
308 },
0ea9541d
DM
309 watchdog => {
310 optional => 1,
311 type => 'string', format => 'pve-qm-watchdog',
312 typetext => '[[model=]i6300esb|ib700] [,[action=]reset|shutdown|poweroff|pause|debug|none]',
313 description => "Create a virtual hardware watchdog device. Once enabled (by a guest action), the watchdog must be periodically polled by an agent inside the guest or else the guest will be restarted (or execute the action specified)",
314 },
1e3baf05
DM
315 startdate => {
316 optional => 1,
19672434 317 type => 'string',
1e3baf05
DM
318 typetext => "(now | YYYY-MM-DD | YYYY-MM-DDTHH:MM:SS)",
319 description => "Set the initial date of the real time clock. Valid format for date are: 'now' or '2006-06-17T16:01:21' or '2006-06-17'.",
320 pattern => '(now|\d{4}-\d{1,2}-\d{1,2}(T\d{1,2}:\d{1,2}:\d{1,2})?)',
321 default => 'now',
322 },
323 args => {
324 optional => 1,
325 type => 'string',
326 description => <<EODESCR,
327Note: this option is for experts only. It allows you to pass arbitrary arguments to kvm, for example:
328
329args: -no-reboot -no-hpet
330EODESCR
331 },
332 tablet => {
333 optional => 1,
334 type => 'boolean',
335 default => 1,
336 description => "Enable/disable the usb tablet device. This device is usually needed to allow absolute mouse positioning. Else the mouse runs out of sync with normal vnc clients. If you're running lots of console-only guests on one host, you may consider disabling this to save some context switches.",
337 },
338 migrate_speed => {
339 optional => 1,
340 type => 'integer',
341 description => "Set maximum speed (in MB/s) for migrations. Value 0 is no limit.",
342 minimum => 0,
343 default => 0,
344 },
345 migrate_downtime => {
346 optional => 1,
347 type => 'integer',
348 description => "Set maximum tolerated downtime (in seconds) for migrations.",
349 minimum => 0,
350 default => 1,
351 },
352 cdrom => {
353 optional => 1,
354 type => 'string', format => 'pve-qm-drive',
355 typetext => 'volume',
356 description => "This is an alias for option -ide2",
357 },
358 cpu => {
359 optional => 1,
360 description => "Emulated CPU type.",
361 type => 'string',
362 enum => [ qw(486 athlon pentium pentium2 pentium3 coreduo core2duo kvm32 kvm64 qemu32 qemu64 phenom host) ],
363 default => 'qemu64',
364 },
365};
366
367# what about other qemu settings ?
368#cpu => 'string',
369#machine => 'string',
370#fda => 'file',
371#fdb => 'file',
372#mtdblock => 'file',
373#sd => 'file',
374#pflash => 'file',
375#snapshot => 'bool',
376#bootp => 'file',
377##tftp => 'dir',
378##smb => 'dir',
379#kernel => 'file',
380#append => 'string',
381#initrd => 'file',
382##soundhw => 'string',
383
384while (my ($k, $v) = each %$confdesc) {
385 PVE::JSONSchema::register_standard_option("pve-qm-$k", $v);
386}
387
388my $MAX_IDE_DISKS = 4;
f62db2a4
DA
389my $MAX_SCSI_DISKS = 14;
390my $MAX_VIRTIO_DISKS = 6;
cdb0931f 391my $MAX_SATA_DISKS = 6;
1e3baf05 392my $MAX_USB_DEVICES = 5;
f62db2a4 393my $MAX_NETS = 6;
1e3baf05 394my $MAX_UNUSED_DISKS = 8;
040b06b7 395my $MAX_HOSTPCI_DEVICES = 2;
bae179aa 396my $MAX_SERIAL_PORTS = 4;
1989a89c 397my $MAX_PARALLEL_PORTS = 3;
1e3baf05
DM
398
399my $nic_model_list = ['rtl8139', 'ne2k_pci', 'e1000', 'pcnet', 'virtio',
400 'ne2k_isa', 'i82551', 'i82557b', 'i82559er'];
6b64503e 401my $nic_model_list_txt = join(' ', sort @$nic_model_list);
1e3baf05
DM
402
403# fixme:
404my $netdesc = {
405 optional => 1,
406 type => 'string', format => 'pve-qm-net',
407 typetext => "MODEL=XX:XX:XX:XX:XX:XX [,bridge=<dev>][,rate=<mbps>]",
408 description => <<EODESCR,
19672434 409Specify network devices.
1e3baf05
DM
410
411MODEL is one of: $nic_model_list_txt
412
19672434 413XX:XX:XX:XX:XX:XX should be an unique MAC address. This is
1e3baf05
DM
414automatically generated if not specified.
415
416The bridge parameter can be used to automatically add the interface to a bridge device. The Proxmox VE standard bridge is called 'vmbr0'.
417
418Option 'rate' is used to limit traffic bandwidth from and to this interface. It is specified as floating point number, unit is 'Megabytes per second'.
419
420If you specify no bridge, we create a kvm 'user' (NATed) network device, which provides DHCP and DNS services. The following addresses are used:
421
42210.0.2.2 Gateway
42310.0.2.3 DNS Server
42410.0.2.4 SMB Server
425
426The DHCP server assign addresses to the guest starting from 10.0.2.15.
427
428EODESCR
429};
430PVE::JSONSchema::register_standard_option("pve-qm-net", $netdesc);
431
432for (my $i = 0; $i < $MAX_NETS; $i++) {
433 $confdesc->{"net$i"} = $netdesc;
434}
435
436my $drivename_hash;
19672434 437
1e3baf05
DM
438my $idedesc = {
439 optional => 1,
440 type => 'string', format => 'pve-qm-drive',
5534dd1a 441 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe] [,format=f] [,backup=yes|no] [,aio=native|threads]',
1e3baf05
DM
442 description => "Use volume as IDE hard disk or CD-ROM (n is 0 to 3).",
443};
444PVE::JSONSchema::register_standard_option("pve-qm-ide", $idedesc);
445
446my $scsidesc = {
447 optional => 1,
448 type => 'string', format => 'pve-qm-drive',
231f2e13 449 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe] [,format=f] [,backup=yes|no] [,aio=native|threads]',
2fe1a152 450 description => "Use volume as SCSI hard disk or CD-ROM (n is 0 to 13).",
1e3baf05
DM
451};
452PVE::JSONSchema::register_standard_option("pve-qm-scsi", $scsidesc);
453
cdb0931f
DA
454my $satadesc = {
455 optional => 1,
456 type => 'string', format => 'pve-qm-drive',
457 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe] [,format=f] [,backup=yes|no] [,aio=native|threads]',
458 description => "Use volume as SATA hard disk or CD-ROM (n is 0 to 5).",
459};
460PVE::JSONSchema::register_standard_option("pve-qm-sata", $satadesc);
461
1e3baf05
DM
462my $virtiodesc = {
463 optional => 1,
464 type => 'string', format => 'pve-qm-drive',
5534dd1a 465 typetext => '[volume=]volume,] [,media=cdrom|disk] [,cyls=c,heads=h,secs=s[,trans=t]] [,snapshot=on|off] [,cache=none|writethrough|writeback|unsafe] [,format=f] [,backup=yes|no] [,aio=native|threads]',
2fe1a152 466 description => "Use volume as VIRTIO hard disk (n is 0 to 5).",
1e3baf05
DM
467};
468PVE::JSONSchema::register_standard_option("pve-qm-virtio", $virtiodesc);
469
470my $usbdesc = {
471 optional => 1,
472 type => 'string', format => 'pve-qm-usb-device',
473 typetext => 'host=HOSTUSBDEVICE',
474 description => <<EODESCR,
2fe1a152 475Configure an USB device (n is 0 to 4). This can be used to
1e3baf05
DM
476pass-through usb devices to the guest. HOSTUSBDEVICE syntax is:
477
19672434 478'bus-port(.port)*' (decimal numbers) or
1e3baf05
DM
479'vendor_id:product_id' (hexadeciaml numbers)
480
19672434 481You can use the 'lsusb -t' command to list existing usb devices.
1e3baf05
DM
482
483Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
484
485EODESCR
486};
487PVE::JSONSchema::register_standard_option("pve-qm-usb", $usbdesc);
488
040b06b7
DA
489my $hostpcidesc = {
490 optional => 1,
491 type => 'string', format => 'pve-qm-hostpci',
492 typetext => "HOSTPCIDEVICE",
493 description => <<EODESCR,
494Map host pci devices. HOSTPCIDEVICE syntax is:
495
496'bus:dev.func' (hexadecimal numbers)
497
498You can us the 'lspci' command to list existing pci devices.
499
500Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
501
502Experimental: user reported problems with this option.
503EODESCR
504};
505PVE::JSONSchema::register_standard_option("pve-qm-hostpci", $hostpcidesc);
506
bae179aa
DA
507my $serialdesc = {
508 optional => 1,
ca0cef26 509 type => 'string',
2fe1a152 510 pattern => '/dev/ttyS\d+',
bae179aa 511 description => <<EODESCR,
19672434 512Map host serial devices (n is 0 to 3).
bae179aa
DA
513
514Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
515
516Experimental: user reported problems with this option.
517EODESCR
518};
bae179aa 519
1989a89c
DA
520my $paralleldesc= {
521 optional => 1,
ca0cef26 522 type => 'string',
2fe1a152 523 pattern => '/dev/parport\d+',
1989a89c 524 description => <<EODESCR,
19672434 525Map host parallel devices (n is 0 to 2).
1989a89c
DA
526
527Note: This option allows direct access to host hardware. So it is no longer possible to migrate such machines - use with special care.
528
529Experimental: user reported problems with this option.
530EODESCR
531};
1989a89c
DA
532
# Register the numbered variants (parallel0, serial0, hostpci0, ...) of the
# per-device option descriptions in $confdesc.
foreach my $i (0 .. $MAX_PARALLEL_PORTS - 1) {
    $confdesc->{"parallel$i"} = $paralleldesc;
}

foreach my $i (0 .. $MAX_SERIAL_PORTS - 1) {
    $confdesc->{"serial$i"} = $serialdesc;
}

foreach my $i (0 .. $MAX_HOSTPCI_DEVICES - 1) {
    $confdesc->{"hostpci$i"} = $hostpcidesc;
}

# Drive buses are additionally recorded in $drivename_hash, which is what
# valid_drivename() consults.
foreach my $bus_spec (
    [ ide    => $MAX_IDE_DISKS,    $idedesc ],
    [ sata   => $MAX_SATA_DISKS,   $satadesc ],
    [ scsi   => $MAX_SCSI_DISKS,   $scsidesc ],
    [ virtio => $MAX_VIRTIO_DISKS, $virtiodesc ],
) {
    my ($bus, $count, $desc) = @$bus_spec;

    foreach my $i (0 .. $count - 1) {
        $drivename_hash->{"$bus$i"} = 1;
        $confdesc->{"$bus$i"} = $desc;
    }
}

foreach my $i (0 .. $MAX_USB_DEVICES - 1) {
    $confdesc->{"usb$i"} = $usbdesc;
}
568
569my $unuseddesc = {
570 optional => 1,
571 type => 'string', format => 'pve-volume-id',
572 description => "Reference to unused volumes.",
573};
574
575for (my $i = 0; $i < $MAX_UNUSED_DISKS; $i++) {
576 $confdesc->{"unused$i"} = $unuseddesc;
577}
578
my $kvm_api_version = 0;

# Return the KVM API version obtained via the KVM_GET_API_VERSION ioctl on
# /dev/kvm. A non-zero result is cached in $kvm_api_version for later calls.
# Returns 0 when /dev/kvm cannot be opened; when the ioctl yields a false
# value the cached value (initially 0) is returned unchanged.
sub kvm_version {

    if (!$kvm_api_version) {
        my $kvm_dev = IO::File->new("</dev/kvm");
        return 0 if !$kvm_dev;

        my $version = $kvm_dev->ioctl(KVM_GET_API_VERSION(), 0);
        $kvm_api_version = $version if $version;

        $kvm_dev->close();
    }

    return $kvm_api_version;
}
596
my $kvm_user_version;

# Return the version string printed by `kvm -help` (e.g. "1.0" or "0.15.1"),
# or the string 'unknown' when the output does not start with the expected
# "QEMU [PC ]emulator version X.Y[.Z] " banner. The result is cached in
# $kvm_user_version.
sub kvm_user_version {

    return $kvm_user_version if $kvm_user_version;

    my $help_text = `kvm -help 2>/dev/null`;

    $kvm_user_version =
        ($help_text =~ m/^QEMU( PC)? emulator version (\d+\.\d+(\.\d+)?) /)
        ? $2
        : 'unknown';

    return $kvm_user_version;
}
614
615my $kernel_has_vhost_net = -c '/dev/vhost-net';
616
# Return the list of all valid drive option names (ide0.., scsi0..,
# virtio0.., sata0..), sized by the $MAX_*_DISKS limits.
sub disknames {
    # Expand one bus prefix into "<bus>0" .. "<bus>(max-1)".
    my $expand = sub {
        my ($bus, $max) = @_;
        return map { "$bus$_" } (0 .. ($max - 1));
    };

    # order is important - used to autoselect boot disk
    return ($expand->('ide', $MAX_IDE_DISKS),
            $expand->('scsi', $MAX_SCSI_DISKS),
            $expand->('virtio', $MAX_VIRTIO_DISKS),
            $expand->('sata', $MAX_SATA_DISKS));
}
624
# Return true if $dev is one of the drive names recorded in $drivename_hash
# (ideN, sataN, scsiN, virtioN within their configured limits).
sub valid_drivename {
    my ($dev) = @_;

    my $known = $drivename_hash->{$dev};

    return defined($known);
}
630
# Return true if $key names an option that has an entry in $confdesc.
sub option_exists {
    my ($key) = @_;

    my $desc = $confdesc->{$key};

    return defined($desc);
}
1e3baf05
DM
635
# Return the array reference holding the supported NIC model names.
# Note: this is the shared $nic_model_list itself, not a copy.
sub nic_models {
    my $models = $nic_model_list;

    return $models;
}
639
# Return a new hash reference mapping each 'ostype' value to a short
# human-readable label.
sub os_list_description {

    my %label_for = (
        other  => 'Other',
        wxp    => 'Windows XP',
        w2k    => 'Windows 2000',
        w2k3   => 'Windows 2003',
        w2k8   => 'Windows 2008',
        wvista => 'Windows Vista',
        win7   => 'Windows 7',
        l24    => 'Linux 2.4',
        l26    => 'Linux 2.6',
    );

    return { %label_for };
}
654
1e3baf05
DM
# Split a drive name such as 'ide3' or 'scsi13' into bus, controller and
# unit. Only ide, scsi and virtio names are accepted; anything else dies
# with "unknown disk device format".
#
# Returns a hash reference with the keys:
#   bus        - 'ide', 'scsi' or 'virtio'
#   index      - the numeric suffix of the name, as captured from $dev
#   controller - index divided by the units per controller (integer part)
#   unit       - index modulo the units per controller
#   desc       - display string "<BUS> <controller>:<unit>"
sub disk_devive_info {
    my ($dev) = @_;

    my ($bus, $index) = $dev =~ m/^(ide|scsi|virtio)(\d+)$/
        or die "unknown disk device format '$dev'";

    # units per controller; buses not listed here use 1024
    my %units_per_controller = (ide => 2, scsi => 7);
    my $maxdev = $units_per_controller{$bus} || 1024;

    my $controller = int($index / $maxdev);
    my $unit = $index % $maxdev;

    return {
        bus        => $bus,
        desc       => sprintf("%s %s:%s", uc($bus), $controller, $unit),
        controller => $controller,
        unit       => $unit,
        index      => $index,
    };
}
678
# Build a drive name string from a drive option name and its media type.
# For ide and scsi the result is "<bus><controller>-cd<unit>" when $media
# is 'cdrom' and "<bus><controller>-hd<unit>" otherwise; for any other bus
# it is "<bus><index>". Dies (via disk_devive_info) on unknown names.
sub qemu_drive_name {
    my ($dev, $media) = @_;

    my $info = disk_devive_info($dev);
    my $bus = $info->{bus};

    if ($bus ne 'ide' && $bus ne 'scsi') {
        return sprintf("%s%i", $bus, $info->{index});
    }

    my $suffix = ($media eq 'cdrom') ? "-cd" : "-hd";

    return sprintf("%s%i%s%i", $bus, $info->{controller},
                   $suffix, $info->{unit});
}
693
my $cdrom_path;

# Return the path of the host CD-ROM device link. The first of /dev/cdrom,
# /dev/cdrom1 and /dev/cdrom2 that is a symbolic link is used, and the
# result is cached in $cdrom_path.
#
# Returns undef when none of the candidates is a symlink. Previously the
# sub fell off its end in that case and returned whatever the last file
# test produced (undef or ''); the value is still false, but now explicit.
sub get_cdrom_path {

    return $cdrom_path if $cdrom_path;

    foreach my $candidate (qw(/dev/cdrom /dev/cdrom1 /dev/cdrom2)) {
        return $cdrom_path = $candidate if -l $candidate;
    }

    # explicit single undef (not a bare return) so list-context callers
    # still receive exactly one value, as before
    return undef;
}
704
# Resolve the 'file' value of a CD-ROM drive to a filesystem path.
#   'cdrom'           -> host CD-ROM device (see get_cdrom_path)
#   'none'            -> empty string (no media)
#   absolute path     -> returned unchanged
#   anything else     -> treated as a volume ID and resolved through
#                        PVE::Storage::path
# $vmid is accepted but not used here.
sub get_iso_path {
    my ($storecfg, $vmid, $cdrom) = @_;

    return get_cdrom_path() if $cdrom eq 'cdrom';

    return '' if $cdrom eq 'none';

    return $cdrom if $cdrom =~ m|^/|;

    return PVE::Storage::path($storecfg, $cdrom);
}
718
719# try to convert old style file names to volume IDs
# Convert an old style bare file name into a volume ID on the 'local'
# storage. Values that are 'none', 'cdrom', a /dev/ path or already of the
# form "<storage>:<volume>" are returned unchanged. Any other value that
# contains a slash cannot be converted and yields undef. Remaining bare
# names become "local:iso/<file>" for cdrom media and
# "local:<vmid>/<file>" otherwise.
sub filename_to_volume_id {
    my ($vmid, $file, $media) = @_;

    return $file if $file eq 'none' || $file eq 'cdrom';
    return $file if $file =~ m|^/dev/.+|;
    return $file if $file =~ m/^([^:]+):(.+)$/;

    return undef if $file =~ m|/|;

    my $is_cdrom = $media && $media eq 'cdrom';

    return $is_cdrom ? "local:iso/$file" : "local:$vmid/$file";
}
737
# Check that a volume type matches the drive's media setting: media 'disk'
# requires volume type 'image', media 'cdrom' requires 'iso'.
# Returns silently when $media is not set or the types match. Raises a
# parameter exception keyed by $opt on mismatch, and dies with
# "internal error" for any other media value.
sub verify_media_type {
    my ($opt, $vtype, $media) = @_;

    return if !$media;

    my %expected_vtype = (disk => 'image', cdrom => 'iso');

    my $etype = $expected_vtype{$media};
    die "internal error" if !defined($etype);

    return if ($vtype eq $etype);

    raise_param_exc({ $opt => "unexpected media type ($vtype != $etype)" });
}
756
# Normalize the 'file' entry of a parsed drive hash in place.
# A value that is not 'cdrom'/'none', not a /dev/ path, not already a
# "<storage>:<volume>" ID and not purely numeric is treated as a filesystem
# path and mapped to a volume ID via PVE::Storage::path_to_volume_id; a
# parameter exception keyed by $opt is raised when no storage matches or
# the volume type contradicts the media setting.
# 'media' defaults to 'cdrom' for iso volumes and for 'cdrom'/'none'.
sub cleanup_drive_path {
    my ($opt, $storecfg, $drive) = @_;

    my $file = $drive->{file};

    # try to convert filesystem paths to volume IDs
    my $needs_lookup = ($file !~ m/^(cdrom|none)$/)
        && ($file !~ m|^/dev/.+|)
        && ($file !~ m/^([^:]+):(.+)$/)
        && ($file !~ m/^\d+$/);

    if ($needs_lookup) {
        my ($vtype, $volid) = PVE::Storage::path_to_volume_id($storecfg, $file);
        raise_param_exc({ $opt => "unable to associate path '$file' to any storage"}) if !$vtype;
        $drive->{media} = 'cdrom' if !$drive->{media} && $vtype eq 'iso';
        verify_media_type($opt, $vtype, $drive->{media});
        $drive->{file} = $volid;
    }

    $drive->{media} = 'cdrom' if !$drive->{media} && $drive->{file} =~ m/^(cdrom|none)$/;
}
775
# Write a new configuration file for VM $vmid from the $settings hash.
# The caller is responsible for locking. Dies if the file already exists.
#
# 'name' defaults to "vm<vmid>" and 'memory' to the default from
# load_defaults(); note that both defaults are stored back into $settings.
# Keys without an entry in $confdesc are ignored.
#
# Only undefined or empty values are skipped. The previous test,
# `next if !$value`, also dropped an explicit 0 and so silently lost
# settings such as "kvm: 0" or "acpi: 0" whose default is 1.
# Options are written in sorted order so the file content is deterministic.
sub create_conf_nolock {
    my ($vmid, $settings) = @_;

    my $filename = config_file($vmid);

    die "configuration file '$filename' already exists\n" if -f $filename;

    my $defaults = load_defaults();

    $settings->{name} = "vm$vmid" if !$settings->{name};
    $settings->{memory} = $defaults->{memory} if !$settings->{memory};

    my $data = '';
    foreach my $opt (sort keys %$settings) {
        next if !$confdesc->{$opt};

        my $value = $settings->{$opt};
        next if !defined($value) || $value eq '';

        $data .= "$opt: $value\n";
    }

    PVE::Tools::file_set_contents($filename, $data);
}
800
# ideX = [volume=]volume-id[,media=d][,cyls=c,heads=h,secs=s[,trans=t]]
#        [,snapshot=on|off][,cache=off|none|writethrough|writeback|unsafe]
#        [,format=f][,rerror=ignore|report|stop]
#        [,werror=enospc|ignore|report|stop][,backup=yes|no]
#        [,aio=native|threads]
804
# Parse a drive option string such as
#   "local:100/vm-100-disk-1.raw,cache=none,backup=no"
# into a hash reference.
#
# $key is the option name (e.g. 'ide0'); it supplies 'interface' and
# 'index'. $key may be undefined, which is used to verify JSON parameters;
# the interface is then 'unknown' and the index 0.
#
# Returns undef when $key is malformed, a property is unknown, duplicated
# or has an invalid value, no file/volume is given, or the combination is
# not allowed (cdrom with geometry/snapshot/trans/format or on virtio,
# rerror on scsi).
sub parse_drive {
    my ($key, $data) = @_;

    my $res = {};

    if (defined($key)) {
        return undef if $key !~ m/^([^\d]+)(\d+)$/;
        ($res->{interface}, $res->{index}) = ($1, $2);
    } else {
        # should not harm when used to verify parameters
        $res->{interface} = 'unknown';
        $res->{index} = 0;
    }

    my $property_re = qr/^(file|volume|cyls|heads|secs|trans|media|snapshot|cache|format|rerror|werror|backup|aio)=(.+)$/;

    foreach my $part (split(/,/, $data)) {
        next if $part =~ m/^\s*$/;

        if (my ($name, $value) = $part =~ $property_re) {
            # 'volume' is an alias for 'file'
            $name = 'file' if $name eq 'volume';

            return undef if defined $res->{$name};

            $res->{$name} = $value;
            next;
        }

        # a bare token is only accepted as the (first) file name
        return undef if $res->{file} || $part =~ m/=/;

        $res->{file} = $part;
    }

    return undef if !$res->{file};

    # allowed values for each property that was given
    my @value_checks = (
        [ cache    => qr/^(off|none|writethrough|writeback|unsafe)$/ ],
        [ snapshot => qr/^(on|off)$/ ],
        [ cyls     => qr/^\d+$/ ],
        [ heads    => qr/^\d+$/ ],
        [ secs     => qr/^\d+$/ ],
        [ media    => qr/^(disk|cdrom)$/ ],
        [ trans    => qr/^(none|lba|auto)$/ ],
        [ format   => qr/^(raw|cow|qcow|qcow2|vmdk|cloop)$/ ],
        [ rerror   => qr/^(ignore|report|stop)$/ ],
        [ werror   => qr/^(enospc|ignore|report|stop)$/ ],
        [ backup   => qr/^(yes|no)$/ ],
        [ aio      => qr/^(native|threads)$/ ],
    );

    foreach my $check (@value_checks) {
        my ($name, $allowed) = @$check;
        return undef if $res->{$name} && $res->{$name} !~ $allowed;
    }

    if ($res->{media} && ($res->{media} eq 'cdrom')) {
        foreach my $name (qw(snapshot trans format heads secs cyls)) {
            return undef if $res->{$name};
        }
        return undef if $res->{interface} eq 'virtio';
    }

    # rerror does not work with scsi drives
    return undef if $res->{rerror} && $res->{interface} eq 'scsi';

    return $res;
}
870
my @qemu_drive_options = qw(heads secs cyls trans media format cache snapshot rerror werror aio);

# Serialize a parsed drive hash back into its config-file string form:
# the file/volume followed by ",name=value" for every set property, in the
# order of @qemu_drive_options with 'backup' last. Properties with a false
# value are omitted. $vmid is accepted but not used here.
sub print_drive {
    my ($vmid, $drive) = @_;

    my @settings = map { "$_=$drive->{$_}" }
        grep { $drive->{$_} } (@qemu_drive_options, 'backup');

    return join(',', $drive->{file}, @settings);
}
883
ca916ecc
DA
# Build the value of a kvm "-device" argument for the given parsed drive.
# Supported interfaces are virtio, scsi, ide and sata; 'usb' dies with
# "implement me" and anything else with "unsupported interface type".
# For scsi the device type is 'cd' for CD-ROMs, 'block' when the resolved
# path lives under /dev/, and 'hd' otherwise. A ",bootindex=N" suffix is
# appended when the drive has a bootindex. $vmid is not used here.
sub print_drivedevice_full {
    my ($storecfg, $vmid, $drive) = @_;

    my $iface = $drive->{interface};
    my $drive_id = "$drive->{interface}$drive->{index}";

    my $device = '';

    if ($iface eq 'virtio') {
        my $pciaddr = print_pci_addr($drive_id);
        $device = "virtio-blk-pci,drive=drive-${drive_id},id=${drive_id}${pciaddr}";
    } elsif ($iface eq 'scsi') {
        my $units_per_controller = 7;
        my $controller = int($drive->{index} / $units_per_controller);
        my $unit = $drive->{index} % $units_per_controller;

        my $devicetype = 'hd';
        if (drive_is_cdrom($drive)) {
            $devicetype = 'cd';
        } else {
            my $path = ($drive->{file} =~ m|^/|)
                ? $drive->{file}
                : PVE::Storage::path($storecfg, $drive->{file});
            $devicetype = 'block' if $path =~ m|^/dev/|;
        }

        $device = "scsi-${devicetype},bus=lsi${controller}.0,scsi-id=${unit},drive=drive-${drive_id},id=${drive_id}";
    } elsif ($iface eq 'ide') {
        my $units_per_controller = 2;
        my $controller = int($drive->{index} / $units_per_controller);
        my $unit = $drive->{index} % $units_per_controller;

        my $is_cdrom = $drive->{media} && $drive->{media} eq 'cdrom';
        my $devicetype = $is_cdrom ? "cd" : "hd";

        $device = "ide-${devicetype},bus=ide.${controller},unit=${unit},drive=drive-${drive_id},id=${drive_id}";
    } elsif ($iface eq 'sata') {
        my $controller = int($drive->{index} / $MAX_SATA_DISKS);
        my $unit = $drive->{index} % $MAX_SATA_DISKS;

        $device = "ide-drive,bus=ahci${controller}.${unit},drive=drive-${drive_id},id=${drive_id}";
    } elsif ($iface eq 'usb') {
        die "implement me";
        # -device ide-drive,bus=ide.1,unit=0,drive=drive-ide0-1-0,id=ide0-1-0
    } else {
        die "unsupported interface type";
    }

    $device .= ",bootindex=$drive->{bootindex}" if $drive->{bootindex};

    return $device;
}
935
1e3baf05
DM
# Build the value of a kvm "-drive" argument for the given parsed drive.
# The result is "[file=<path>,]if=none,id=drive-<iface><index>" followed by
# the set drive options, then "aio=native" when no aio mode was chosen, and
# "cache=none" for non-CD-ROM drives without an explicit cache mode whose
# path is under /dev/ or ends in ".raw".
sub print_drive_full {
    my ($storecfg, $vmid, $drive) = @_;

    my @opts = map { "$_=$drive->{$_}" }
        grep { $_ ne 'bootindex' && $drive->{$_} } @qemu_drive_options;

    # use linux-aio by default (qemu default is threads)
    push @opts, "aio=native" if !$drive->{aio};

    my $volid = $drive->{file};
    my $path;

    if (drive_is_cdrom($drive)) {
        $path = get_iso_path($storecfg, $vmid, $volid);
    } else {
        $path = ($volid =~ m|^/|)
            ? $volid
            : PVE::Storage::path($storecfg, $volid);

        my $is_raw_or_dev = ($path =~ m|^/dev/| || $path =~ m|\.raw$|);
        push @opts, "cache=none" if !$drive->{cache} && $is_raw_or_dev;
    }

    # an empty path (e.g. CD-ROM 'none') produces no file= part at all
    my $pathinfo = $path ? "file=$path," : '';
    my $optstr = join('', map { ",$_" } @opts);

    return "${pathinfo}if=none,id=drive-$drive->{interface}$drive->{index}$optstr";
}
967
cc4d6182
DA
# Build the argument string for the qemu '-device' option of the network
# interface $netid, using the parsed network settings in $net.
sub print_netdevice_full {
    my ($vmid, $conf, $net, $netid) = @_;

    my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};

    # the 'virtio' model is passed to qemu as 'virtio-net-pci'
    my $device = ($net->{model} eq 'virtio') ? 'virtio-net-pci' : $net->{model};

    # qemu > 0.15 always try to boot from network - we disable that by
    # not loading the pxe rom file
    my $extra = '';
    $extra = "romfile=," if $bootorder !~ m/n/;

    my $pciaddr = print_pci_addr("$netid");

    my @parts = ("$device,${extra}mac=$net->{macaddr},netdev=$netid$pciaddr,id=$netid");
    push @parts, "bootindex=$net->{bootindex}" if $net->{bootindex};

    return join(',', @parts);
}
986
# Build the argument string for the qemu '-netdev' option of the network
# interface $netid (expected form: 'net<N>').
#
# Returns a 'type=tap,...' description when the interface has a bridge
# configured and a 'type=user,...' description otherwise. Dies when $netid
# is not of the form 'net<N>', when N is not below $MAX_NETS, or when the
# resulting tap interface name is too long.
sub print_netdev_full {
    my ($vmid, $conf, $net, $netid) = @_;

    # Refuse ids that do not look like 'net<N>'. Without this check a
    # malformed id would pass the range test below as index 0 and produce
    # an interface name without any index.
    my ($i) = ($netid =~ m/^net(\d+)$/);
    die "got strange net id '$netid'\n" if !defined($i);
    $i = int($i);

    die "got strange net id '$i'\n" if $i >= ${MAX_NETS};

    my $ifname = "tap${vmid}i$i";

    # kvm uses TUNSETIFF ioctl, and that limits ifname length
    die "interface name '$ifname' is too long (max 15 character)\n"
        if length($ifname) >= 16;

    my $vhostparam = '';
    $vhostparam = ',vhost=on' if $kernel_has_vhost_net && $net->{model} eq 'virtio';

    my $vmname = $conf->{name} || "vm$vmid";

    if ($net->{bridge}) {
        return "type=tap,id=$netid,ifname=${ifname},script=/var/lib/qemu-server/pve-bridge$vhostparam";
    } else {
        return "type=user,id=$netid,hostname=$vmname";
    }
}
1e3baf05
DM
1014
# Return a true value if the parsed drive $drive has its media type set
# to 'cdrom', and a false value otherwise (including for a missing drive).
sub drive_is_cdrom {
    my ($drive) = @_;

    my $media = $drive && $drive->{media};
    return $media if !$media;

    return $media eq 'cdrom';
}
1021
040b06b7
DA
# Parse a host PCI id of the form 'xx:xx.x' (lower case hex digits).
# Returns { pciid => $value } on success and undef for an empty or
# malformed value.
sub parse_hostpci {
    my ($value) = @_;

    return undef if !$value;
    return undef if $value !~ m/^[a-f0-9]{2}:[a-f0-9]{2}\.[a-f0-9]$/;

    return { pciid => $value };
}
1037
1e3baf05
DM
# netX: e1000=XX:XX:XX:XX:XX:XX,bridge=vmbr0,rate=<mbps>
#
# Parse a 'netX' configuration value into a hash with the keys 'model' and
# 'macaddr' and, when present, 'bridge' and 'rate'. When no MAC address is
# given, the result of PVE::Tools::random_ether_addr() is used instead.
# Returns undef if an element cannot be parsed or no model is specified.
sub parse_net {
    my ($data) = @_;

    my $res = {};

    foreach my $item (split(/,/, $data)) {

        if ($item =~ m/^(ne2k_pci|e1000|rtl8139|pcnet|virtio|ne2k_isa|i82551|i82557b|i82559er)(=([0-9a-f]{2}(:[0-9a-f]{2}){5}))?$/i) {
            my ($model, $mac) = (lc($1), uc($3));
            $mac = PVE::Tools::random_ether_addr() if !$mac;
            $res->{model} = $model;
            $res->{macaddr} = $mac;
            next;
        }

        if ($item =~ m/^bridge=(\S+)$/) {
            $res->{bridge} = $1;
            next;
        }

        if ($item =~ m/^rate=(\d+(\.\d+)?)$/) {
            $res->{rate} = $1;
            next;
        }

        # unknown element
        return undef;
    }

    return undef if !$res->{model};

    return $res;
}
1065
# Convert a parsed network hash back into its configuration string
# ('model[=macaddr][,bridge=...][,rate=...]').
sub print_net {
    my ($net) = @_;

    my $text = "$net->{model}";
    $text .= "=$net->{macaddr}" if $net->{macaddr};

    foreach my $opt (qw(bridge rate)) {
        $text .= ",$opt=$net->{$opt}" if $net->{$opt};
    }

    return $text;
}
1076
# Re-write every parseable 'netX' entry of $settings through
# parse_net()/print_net(), so that the stored value always contains the
# MAC address chosen by parse_net(). Unparseable entries are left alone.
sub add_random_macs {
    my ($settings) = @_;

    my @netkeys = grep { m/^net(\d+)$/ } keys %$settings;

    foreach my $opt (@netkeys) {
        my $net = parse_net($settings->{$opt});
        next if !$net;
        $settings->{$opt} = print_net($net);
    }
}
1087
# Record $volid in the free 'unusedN' slot with the lowest index of
# $config and return the name of that slot. Returns nothing when the
# volume is already listed in one of the slots; dies when no slot is free.
sub add_unused_volume {
    my ($config, $volid) = @_;

    my $key;
    foreach my $ind (0 .. $MAX_UNUSED_DISKS - 1) {
        my $slot = "unused$ind";
        my $vid = $config->{$slot};
        if ($vid) {
            return if $vid eq $volid; # do not add duplicates
        } elsif (!defined($key)) {
            # remember the first (lowest) free slot
            $key = $slot;
        }
    }

    die "To many unused volume - please delete them first.\n" if !$key;

    $config->{$key} = $volid;

    return $key;
}
1107
# fixme: remove all those $noerr parameters?
1109
PVE::JSONSchema::register_format('pve-qm-bootdisk', \&verify_bootdisk);
# Format check for 'pve-qm-bootdisk': returns $value if it is a valid
# drive name. Otherwise returns undef when $noerr is set, else dies.
sub verify_bootdisk {
    my ($value, $noerr) = @_;

    if (!valid_drivename($value)) {
        return undef if $noerr;
        die "invalid boot disk '$value'\n";
    }

    return $value;
}
1120
PVE::JSONSchema::register_format('pve-qm-net', \&verify_net);
# Format check for 'pve-qm-net': returns $value if parse_net() accepts
# it. Otherwise returns undef when $noerr is set, else dies.
sub verify_net {
    my ($value, $noerr) = @_;

    if (!parse_net($value)) {
        return undef if $noerr;
        die "unable to parse network options\n";
    }

    return $value;
}
1131
PVE::JSONSchema::register_format('pve-qm-drive', \&verify_drive);
# Format check for 'pve-qm-drive': returns $value if parse_drive()
# (called without a drive key) accepts it. Otherwise returns undef when
# $noerr is set, else dies.
sub verify_drive {
    my ($value, $noerr) = @_;

    if (!parse_drive(undef, $value)) {
        return undef if $noerr;
        die "unable to parse drive options\n";
    }

    return $value;
}
1142
PVE::JSONSchema::register_format('pve-qm-hostpci', \&verify_hostpci);
# Format check for 'pve-qm-hostpci': returns $value if parse_hostpci()
# accepts it. Otherwise returns undef when $noerr is set, else dies.
sub verify_hostpci {
    my ($value, $noerr) = @_;

    if (!parse_hostpci($value)) {
        return undef if $noerr;
        die "unable to parse pci id\n";
    }

    return $value;
}
1153
0ea9541d
DM
PVE::JSONSchema::register_format('pve-qm-watchdog', \&verify_watchdog);
# Format check for 'pve-qm-watchdog': returns $value if parse_watchdog()
# accepts it. Otherwise returns undef when $noerr is set, else dies.
sub verify_watchdog {
    my ($value, $noerr) = @_;

    if (!parse_watchdog($value)) {
        return undef if $noerr;
        die "unable to parse watchdog options\n";
    }

    return $value;
}
1164
# Parse a comma separated watchdog setting. Each element is either a
# model ('i6300esb' or 'ib700', optionally prefixed with 'model=') or an
# action (optionally prefixed with 'action='). Returns a hash with the
# keys found, or undef for an empty value or an unknown element.
sub parse_watchdog {
    my ($value) = @_;

    return undef if !$value;

    my %wd;

    foreach my $part (split(/,/, $value)) {
        # ignore empty elements
        next if $part =~ m/^\s*$/;

        if ($part =~ m/^(model=)?(i6300esb|ib700)$/) {
            $wd{model} = $2;
        } elsif ($part =~ m/^(action=)?(reset|shutdown|poweroff|pause|debug|none)$/) {
            $wd{action} = $2;
        } else {
            return undef;
        }
    }

    return \%wd;
}
1186
1e3baf05
DM
# Parse a host USB device specification. Accepted elements are
# 'host=<vendorid>:<productid>' (4 hex digits each) and
# 'host=<bus>-<port>[.<port>...]'. Returns a hash with 'vendorid' and
# 'productid' and/or 'hostbus' and 'hostport'; returns undef for an empty
# value, an unknown element, or when no device was specified at all.
sub parse_usb_device {
    my ($value) = @_;

    return undef if !$value;

    my $res = {};

    foreach my $spec (split(/,/, $value)) {
        if ($spec =~ m/^host=([0-9A-Fa-f]{4}):([0-9A-Fa-f]{4})$/) {
            ($res->{vendorid}, $res->{productid}) = ($1, $2);
        } elsif ($spec =~ m/^host=(\d+)\-(\d+(\.\d+)*)$/) {
            ($res->{hostbus}, $res->{hostport}) = ($1, $2);
        } else {
            return undef;
        }
    }

    # every accepted element stores keys, so an empty hash means that
    # nothing was found
    return undef if !%$res;

    return $res;
}
19672434 1213
1e3baf05
DM
PVE::JSONSchema::register_format('pve-qm-usb-device', \&verify_usb_device);
# Format check for 'pve-qm-usb-device': returns $value if
# parse_usb_device() accepts it. Otherwise returns undef when $noerr is
# set, else dies.
sub verify_usb_device {
    my ($value, $noerr) = @_;

    if (!parse_usb_device($value)) {
        return undef if $noerr;
        die "unable to parse usb device\n";
    }

    return $value;
}
1224
1e3baf05
DM
# add JSON properties for create and set function
#
# Copies every entry of $confdesc into the hash $prop and returns $prop.
sub json_config_properties {
    my ($prop) = @_;

    $prop->{$_} = $confdesc->{$_} for keys %$confdesc;

    return $prop;
}
1235
# Validate $value against the type declared for $key in $confdesc and
# return the normalized value:
#  - boolean: 1 or 0 (accepts 1/on/yes/true and 0/off/no/false)
#  - integer: the numeric value (digits only)
#  - string:  the value itself; values with a declared format are checked
#             against that format, values without one have a surrounding
#             pair of double quotes removed
# Dies for unknown keys, undefined values, values containing a line feed
# or carriage return, and values failing the type check.
sub check_type {
    my ($key, $value) = @_;

    my $desc = $confdesc->{$key};
    die "unknown setting '$key'\n" if !$desc;

    my $type = $desc->{type};

    die "got undefined value\n" if !defined($value);

    die "property contains a line feed\n" if $value =~ m/[\n\r]/;

    if ($type eq 'boolean') {
        return 1 if ($value eq '1') || ($value =~ m/^(on|yes|true)$/i);
        return 0 if ($value eq '0') || ($value =~ m/^(off|no|false)$/i);
        die "type check ('boolean') failed - got '$value'\n";
    }

    if ($type eq 'integer') {
        return int($1) if $value =~ m/^(\d+)$/;
        die "type check ('integer') failed - got '$value'\n";
    }

    if ($type eq 'string') {
        my $fmt = $desc->{format};

        if (!$fmt) {
            $value =~ s/^\"(.*)\"$/$1/;
            return $value;
        }

        if ($fmt eq 'pve-qm-drive') {
            # special case - we need to pass $key to parse_drive()
            return $value if parse_drive($key, $value);
            die "unable to parse drive options\n";
        }

        PVE::JSONSchema::check_format($fmt, $value);
        return $value;
    }

    die "internal error";
}
1275
# Call lock_file() on the lock file of VM $vmid with a timeout argument
# of 10, handing over $code and @param. Re-throws an error left in $@ and
# returns the value returned by lock_file().
sub lock_config {
    my ($vmid, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);

    my $res = lock_file($lockfile, 10, $code, @param);
    if ($@) {
        die $@;
    }

    return $res;
}
1287
# Return the cluster file system path (relative, without leading slash)
# of the configuration of VM $vmid on $node; $node defaults to $nodename.
sub cfs_config_path {
    my ($vmid, $node) = @_;

    my $target = $node ? $node : $nodename;

    return "nodes/$target/qemu-server/$vmid.conf";
}
1294
040b06b7
DA
# Placeholder for an IOMMU availability check; currently always returns 1.
sub check_iommu_support {
    #fixme : need to check IOMMU support
    #http://www.linux-kvm.org/page/How_to_assign_devices_with_VT-d_in_KVM

    return 1;
}
1303
# Return the absolute path below /etc/pve of the configuration file of
# VM $vmid on $node (see cfs_config_path() for the node default).
sub config_file {
    my ($vmid, $node) = @_;

    return "/etc/pve/" . cfs_config_path($vmid, $node);
}
1310
# Return the path of the lock file used for VM $vmid (below $lock_dir).
sub config_file_lock {
    my ($vmid) = @_;

    return $lock_dir . "/lock-$vmid.conf";
}
1316
# Set access and modification time of the configuration file of VM $vmid
# to the current time (utime with undefined timestamps).
sub touch_config {
    my ($vmid) = @_;

    my $path = config_file($vmid);

    return utime(undef, undef, $path);
}
1323
# Destroy VM $vmid: free the disks owned by the VM, remove its
# configuration file (or replace it by a minimal one when
# $keep_empty_config is set) and finally free all volumes that the
# storage layer still lists for this VM. Dies when the configuration
# cannot be loaded or is locked; errors while freeing the remaining
# volumes are only reported as warnings.
sub destroy_vm {
    my ($storecfg, $vmid, $keep_empty_config) = @_;

    my $conffile = config_file($vmid);

    my $conf = load_config($vmid);

    check_lock($conf);

    # only remove disks owned by this VM
    my $free_owned_disk = sub {
        my ($ds, $drive) = @_;

        return if drive_is_cdrom($drive);

        # skip drives without a volume and drives given as absolute path
        my $volid = $drive->{file};
        return if !$volid || $volid =~ m|^/|;

        my ($path, $owner) = PVE::Storage::path($storecfg, $volid);
        return if !$path || !$owner || ($owner != $vmid);

        PVE::Storage::vdisk_free($storecfg, $volid);
    };
    foreach_drive($conf, $free_owned_disk);

    if (!$keep_empty_config) {
        unlink $conffile;
    } else {
        PVE::Tools::file_set_contents($conffile, "memory: 128\n");
    }

    # also remove unused disk
    eval {
        my $dl = PVE::Storage::vdisk_list($storecfg, undef, $vmid);

        eval {
            PVE::Storage::foreach_volid($dl, sub {
                my ($volid, $sid, $volname, $d) = @_;
                PVE::Storage::vdisk_free($storecfg, $volid);
            });
        };
        warn $@ if $@;

    };
    warn $@ if $@;
}
1369
# fixme: remove?
#
# Return a hash mapping each drive name found in $conf to its parsed
# drive settings, extended by 'disksize' (the known size divided by
# 1024*1024, or 0 when no size information is available). Errors while
# listing the volumes are only reported as warnings.
sub load_diskinfo_old {
    my ($storecfg, $vmid, $conf) = @_;

    my $sizeinfo = {};
    my $drives = {};
    my $vollist;

    foreach_drive($conf, sub {
        my ($ds, $di) = @_;

        $drives->{$ds} = $di;

        return if drive_is_cdrom($di);

        my $file = $di->{file};
        if ($file =~ m|^/dev/.+|) {
            # device nodes are queried directly
            $sizeinfo->{$file}->{size} = PVE::Storage::file_size_info($file);
        } else {
            push @$vollist, $file;
        }
    });

    eval {
        my $dl = PVE::Storage::vdisk_list($storecfg, undef, $vmid, $vollist);

        PVE::Storage::foreach_volid($dl, sub {
            my ($volid, $sid, $volname, $d) = @_;
            $sizeinfo->{$volid} = $d;
        });
    };
    warn $@ if $@;

    foreach my $di (values %$drives) {
        my $known = $sizeinfo->{$di->{file}};
        $di->{disksize} = $known ? $known->{size} / (1024*1024) : 0;
    }

    return $drives;
}
1411
# Read and return the configuration of VM $vmid via
# PVE::Cluster::cfs_read_file(); dies if no configuration is returned.
sub load_config {
    my ($vmid) = @_;

    my $conf = PVE::Cluster::cfs_read_file(cfs_config_path($vmid));
    if (!defined($conf)) {
        die "no such VM ('$vmid')\n";
    }

    return $conf;
}
1e3baf05
DM
1423
# Parse the raw content $raw of the VM configuration file $filename into
# a hash. The vmid is taken from the file name, the SHA1 hex digest of
# the raw data is stored as 'digest'. Lines that cannot be parsed are
# skipped (values failing the type check produce a warning). The legacy
# options 'cdrom' and 'smp' are mapped to 'ide2' and 'sockets'.
# Returns undef when $raw is undefined.
sub parse_vm_config {
    my ($filename, $raw) = @_;

    return undef if !defined($raw);

    my $res = { digest => Digest::SHA1::sha1_hex($raw) };

    die "got strange filename '$filename'"
        if $filename !~ m|/qemu-server/(\d+)\.conf$|;

    my $vmid = $1;

    # consume the raw data line by line
    while ($raw && $raw =~ s/^(.*?)(\n|$)//) {
        my $line = $1;

        # skip comments and empty lines
        next if $line =~ m/^\#/;
        next if $line =~ m/^\s*$/;

        if ($line =~ m/^(description):\s*(.*\S)\s*$/) {
            my ($key, $text) = ($1, $2);
            $res->{$key} = PVE::Tools::decode_text($text);
            next;
        }

        if ($line =~ m/^(args):\s*(.*\S)\s*$/) {
            my ($key, $args) = ($1, $2);
            $res->{$key} = $args;
            next;
        }

        next if $line !~ m/^([a-z][a-z_]*\d*):\s*(\S+)\s*$/;

        my ($key, $value) = ($1, $2);

        eval { $value = check_type($key, $value); };
        if ($@) {
            warn "vm $vmid - unable to parse value of '$key' - $@";
            next;
        }

        my $fmt = $confdesc->{$key}->{format};
        if ($fmt && $fmt eq 'pve-qm-drive') {
            # store drives with their file name converted to a volume id
            my $v = parse_drive($key, $value);
            my $volid = filename_to_volume_id($vmid, $v->{file}, $v->{media});
            if (!$volid) {
                warn "vm $vmid - unable to parse value of '$key'\n";
                next;
            }
            $v->{file} = $volid;
            $value = print_drive($vmid, $v);
        }

        # 'cdrom' is stored as 'ide2'
        my $target = ($key eq 'cdrom') ? 'ide2' : $key;
        $res->{$target} = $value;
    }

    # convert old smp to sockets
    $res->{sockets} = $res->{smp} if $res->{smp} && !$res->{sockets};
    delete $res->{smp};

    return $res;
}
1489
1858638f
DM
# Serialize the configuration hash $conf into the raw text written to the
# VM configuration file and return that text. $conf is normalized in
# place: 'cdrom' becomes 'ide2', 'smp' is replaced by 'sockets', every
# value is passed through check_type(), and 'unusedN' entries are removed
# when their volume is referenced by one of the drives. The 'digest' key
# is neither checked nor written. Dies when 'cdrom' and 'ide2' are both
# set or when a value fails the type check.
sub write_vm_config {
    my ($filename, $conf) = @_;

    if ($conf->{cdrom}) {
        die "option ide2 conflicts with cdrom\n" if $conf->{ide2};
        $conf->{ide2} = delete $conf->{cdrom};
    }

    # we do not use 'smp' any longer
    if (!$conf->{sockets} && $conf->{smp}) {
        $conf->{sockets} = $conf->{smp};
        delete $conf->{cores};
    }
    delete $conf->{smp} if $conf->{sockets};

    # validate all values and collect the volumes used by drives
    my $new_volids = {};
    foreach my $key (keys %$conf) {
        next if $key eq 'digest';

        my $value = $conf->{$key};
        $value = PVE::Tools::encode_text($value) if $key eq 'description';

        eval { $value = check_type($key, $value); };
        die "unable to parse value of '$key' - $@" if $@;

        $conf->{$key} = $value;

        next if !valid_drivename($key);

        my $drive = PVE::QemuServer::parse_drive($key, $value);
        $new_volids->{$drive->{file}} = 1 if $drive && $drive->{file};
    }

    # remove 'unusedX' settings if we re-add a volume
    foreach my $key (grep { m/^unused/ } keys %$conf) {
        delete $conf->{$key} if $new_volids->{$conf->{$key}};
    }

    # generate RAW data
    my @lines = map { "$_: $conf->{$_}\n" } grep { $_ ne 'digest' } sort keys %$conf;

    return join('', @lines);
}
1e3baf05 1543
1858638f
DM
# Write the configuration $conf of VM $vmid via
# PVE::Cluster::cfs_write_file() without taking the config lock file.
# Unless $skiplock is set, check_lock() is applied to $conf first.
sub update_config_nolock {
    my ($vmid, $conf, $skiplock) = @_;

    if (!$skiplock) {
        check_lock($conf);
    }

    PVE::Cluster::cfs_write_file(cfs_config_path($vmid), $conf);
}
1e3baf05 1553
1858638f
DM
# Write the configuration $conf of VM $vmid while holding the config lock
# file (see lock_config()). Unless $skiplock is set, the write is refused
# when the configuration carries a 'lock' setting.
sub update_config {
    my ($vmid, $conf, $skiplock) = @_;

    # Pass a code reference: a bare '&update_config_nolock' would call the
    # function immediately (with our own @_) outside of the lock and hand
    # its return value to lock_config() as callback. lock_config() only
    # forwards the parameters following the callback, so $vmid has to be
    # repeated for update_config_nolock().
    lock_config($vmid, \&update_config_nolock, $vmid, $conf, $skiplock);
}
1559
# Return a hash with the default value of every option in $confdesc that
# declares one. The 'keyboard' default is overridden by the value from
# 'datacenter.cfg' when that file sets one.
sub load_defaults {

    my $res = {};

    # we use static defaults from our JSON schema configuration
    foreach my $key (keys %$confdesc) {
        my $default = $confdesc->{$key}->{default};
        $res->{$key} = $default if defined($default);
    }

    my $dccfg = PVE::Cluster::cfs_read_file('datacenter.cfg');
    my $keyboard = $dccfg->{keyboard};
    $res->{keyboard} = $keyboard if $keyboard;

    return $res;
}
1576
# Return a hash { $vmid => { exists => 1 } } for every entry of the
# cluster VM list whose node is $nodename and whose type is 'qemu'.
sub config_list {
    my $res = {};

    my $vmlist = PVE::Cluster::get_vmlist();
    return $res if !$vmlist || !$vmlist->{ids};

    my $ids = $vmlist->{ids};

    foreach my $vmid (keys %$ids) {
        my $d = $ids->{$vmid};

        my $on_this_node = $d->{node} && $d->{node} eq $nodename;
        next if !$on_this_node;

        my $is_qemu = $d->{type} && $d->{type} eq 'qemu';
        next if !$is_qemu;

        $res->{$vmid}->{exists} = 1;
    }

    return $res;
}
1591
64e13401
DM
# test if VM uses local resources (to prevent migration)
#
# Returns 1 if $conf contains 'hostusb' or 'hostpci' (old syntax) or any
# 'usbN', 'hostpciN', 'serialN' or 'parallelN' key, and 0 otherwise.
# Dies instead of returning 1 unless $noerr is set.
sub check_local_resources {
    my ($conf, $noerr) = @_;

    # old syntax
    my $loc_res = ($conf->{hostusb} || $conf->{hostpci}) ? 1 : 0;

    if (!$loc_res) {
        my @local_keys = grep { m/^(usb|hostpci|serial|parallel)\d+$/ } keys %$conf;
        $loc_res = 1 if @local_keys;
    }

    die "VM uses local resources\n" if $loc_res && !$noerr;

    return $loc_res;
}
1609
1e3baf05
DM
# Die if the configuration $conf carries a 'lock' setting.
sub check_lock {
    my ($conf) = @_;

    my $lock = $conf->{lock};

    die "VM is locked ($lock)\n" if $lock;
}
1615
# Check /proc/$pid/cmdline: returns 1 if the command name of the process
# ends in 'kvm' and the argument following its first '-pidfile' (or
# '--pidfile') option equals $pidfile. Returns a false value otherwise,
# also when the cmdline file cannot be opened.
sub check_cmdline {
    my ($pidfile, $pid) = @_;

    my $fh = IO::File->new("/proc/$pid/cmdline", "r");
    return undef if !defined($fh);

    my $line = <$fh>;
    $fh->close;
    return undef if !$line;

    # arguments are separated by NUL bytes
    my @argv = split(/\0/, $line);

    my $cmd = $argv[0];
    return if !$cmd || ($cmd !~ m|kvm$|);

    foreach my $idx (0 .. $#argv) {
        my $arg = $argv[$idx];
        next if !$arg;
        next if ($arg ne '-pidfile') && ($arg ne '--pidfile');

        # only the first pidfile option is considered
        my $given = $argv[$idx + 1];
        return 1 if $given && ($given eq $pidfile);
        return undef;
    }

    return undef;
}
1641
# Return the pid of the running kvm process of VM $vmid, or undef when
# the VM is not running.
#
# The pid is read from the pid file of the VM and only accepted when
# check_cmdline() confirms that the process was started with this pid
# file and PVE::ProcFSTools::check_process_running() reports it as
# running. Unless $nocheck is set, dies when the VM has no configuration
# file.
sub check_running {
    my ($vmid, $nocheck) = @_;

    my $filename = config_file($vmid);

    die "unable to find configuration file for VM $vmid - no such machine\n"
        if !$nocheck && ! -f $filename;

    my $pidfile = pidfile_name($vmid);

    # pass the mode separately instead of embedding it into the file name
    my $fd = IO::File->new($pidfile, "r");
    return undef if !$fd;

    my $st = stat($fd);
    my $line = <$fd>;
    close($fd);

    # the time stamp checked here belongs to the pid file, so name that
    # file in the warning (and do not fail if stat returned nothing)
    if ($st && $st->mtime > time()) {
        warn "file '$pidfile' modified in future\n";
    }

    # an empty pid file yields an undefined line
    return undef if !defined($line);

    if ($line =~ m/^(\d+)$/) {
        my $pid = $1;
        if (check_cmdline($pidfile, $pid)) {
            if (my $pinfo = PVE::ProcFSTools::check_process_running($pid)) {
                return $pid;
            }
        }
    }

    return undef;
}
1674
# Return the hash built by config_list(), with the 'pid' of every VM
# that has a '<vmid>.pid' file in $var_run_tmpdir and for which
# check_running() returns a pid. If the directory cannot be opened, the
# list is returned without pid information.
sub vzlist {

    my $vzlist = config_list();

    my $fd = IO::Dir->new($var_run_tmpdir);
    return $vzlist if !$fd;

    while (defined(my $de = $fd->read)) {
        my ($vmid) = ($de =~ m/^(\d+)\.pid$/);
        next if !defined($vmid);
        next if !defined($vzlist->{$vmid});

        my $pid = check_running($vmid);
        $vzlist->{$vmid}->{pid} = $pid if $pid;
    }

    return $vzlist;
}
1692
# time stamps of the last failed size query, indexed by timeout id
my $storage_timeout_hash = {};

# Return the size of the boot disk of the configuration $conf as reported
# by PVE::Storage::file_size_info(): ($size, $used) in list context, $size
# in scalar context. Returns undef when there is no usable boot disk
# (not configured, invalid, a cdrom, or without volume), when the volume
# cannot be resolved, or when the size query returns no format. After
# such a failed query, further queries for the same timeout id are
# skipped while less than 30 seconds have passed.
sub disksize {
    my ($storecfg, $conf) = @_;

    my $bootdisk = $conf->{bootdisk};
    return undef if !$bootdisk || !valid_drivename($bootdisk);

    my $setting = $conf->{$bootdisk};
    return undef if !$setting;

    my $drive = parse_drive($bootdisk, $setting);
    return undef if !defined($drive);

    return undef if drive_is_cdrom($drive);

    my $volid = $drive->{file};
    return undef if !$volid;

    my ($path, $timeoutid);

    if ($volid =~ m|^/|) {
        # absolute path - used directly and as timeout id
        $path = $volid;
        $timeoutid = $volid;
    } else {
        eval {
            $timeoutid = PVE::Storage::parse_volume_id($volid);
            $path = PVE::Storage::path($storecfg, $volid);
        };
        if (my $err = $@) {
            warn $err;
            return undef;
        }
    }

    if (my $last_timeout = $storage_timeout_hash->{$timeoutid}) {
        # skip storage with errors
        return undef if (time() - $last_timeout) < 30;

        delete $storage_timeout_hash->{$timeoutid};
    }

    my ($size, $format, $used) = PVE::Storage::file_size_info($path, 1);

    if (!defined($format)) {
        # got timeout
        $storage_timeout_hash->{$timeoutid} = time();
        return undef;
    }

    return wantarray ? ($size, $used) : $size;
}
1750
# cpu accounting data of the previous vmstatus() call, indexed by pid
my $last_proc_pid_stat;

# Collect status information for all VMs returned by vzlist(), or only
# for $opt_vmid when given. Returns a hash mapping each vmid to a hash
# with the keys pid, status, disk, maxdisk, cpus, name, maxmem, uptime,
# cpu, mem, netin, netout, diskread and diskwrite. The run time values
# stay 0 for VMs without a pid.
sub vmstatus {
    my ($opt_vmid) = @_;

    my $res = {};

    my $storecfg = PVE::Storage::config();

    my $list = vzlist();
    my ($uptime) = PVE::ProcFSTools::read_proc_uptime(1);

    my $cpucount = $cpuinfo->{cpus} || 1;

    # first pass: values taken from the configuration, counters zeroed
    foreach my $vmid (keys %$list) {
        next if $opt_vmid && ($vmid ne $opt_vmid);

        my $cfspath = cfs_config_path($vmid);
        my $conf = PVE::Cluster::cfs_read_file($cfspath) || {};

        my $pid = $list->{$vmid}->{pid};

        my ($size, $used) = disksize($storecfg, $conf);
        my $have_size = defined($size) && defined($used);

        # never report more cpus than the host has
        my $cpus = ($conf->{sockets} || 1) * ($conf->{cores} || 1);
        $cpus = $cpucount if $cpus > $cpucount;

        $res->{$vmid} = {
            pid => $pid,
            # fixme: better status?
            status => $pid ? 'running' : 'stopped',
            disk => $have_size ? $used : 0,
            maxdisk => $have_size ? $size : 0,
            cpus => $cpus,
            name => $conf->{name} || "VM $vmid",
            maxmem => $conf->{memory} ? $conf->{memory}*(1024*1024) : 0,
            uptime => 0,
            cpu => 0,
            mem => 0,
            netout => 0,
            netin => 0,
            diskread => 0,
            diskwrite => 0,
        };
    }

    # second pass: sum up the counters of the tap devices of each VM
    # (the 'receive' counter is added to netout, 'transmit' to netin)
    my $netdev = PVE::ProcFSTools::read_proc_net_dev();
    foreach my $dev (keys %$netdev) {
        my ($vmid) = ($dev =~ m/^tap([1-9]\d*)i/);
        next if !defined($vmid);

        my $d = $res->{$vmid};
        next if !$d;

        my $counters = $netdev->{$dev};
        $d->{netout} += $counters->{receive};
        $d->{netin} += $counters->{transmit};
    }

    my $ctime = gettimeofday();

    # third pass: per process values of VMs with a pid
    foreach my $vmid (keys %$list) {

        my $d = $res->{$vmid};
        my $pid = $d->{pid};
        next if !$pid;

        if (my $fh = IO::File->new("/proc/$pid/io", "r")) {
            my $io = {};
            while (defined(my $line = <$fh>)) {
                $io->{$1} = $2 if $line =~ m/^([rw]char):\s+(\d+)$/;
            }
            close($fh);
            $d->{diskread} = $io->{rchar} || 0;
            $d->{diskwrite} = $io->{wchar} || 0;
        }

        my $pstat = PVE::ProcFSTools::read_proc_pid_stat($pid);
        next if !$pstat; # not running

        my $used = $pstat->{utime} + $pstat->{stime};

        $d->{uptime} = int(($uptime - $pstat->{starttime})/$cpuinfo->{user_hz});

        if ($pstat->{vsize}) {
            $d->{mem} = int(($pstat->{rss}/$pstat->{vsize})*$d->{maxmem});
        }

        my $old = $last_proc_pid_stat->{$pid};
        if (!$old) {
            # first sample for this pid - no cpu usage can be computed yet
            $last_proc_pid_stat->{$pid} = { time => $ctime, used => $used, cpu => 0 };
            next;
        }

        my $dtime = ($ctime - $old->{time}) * $cpucount * $cpuinfo->{user_hz};

        if ($dtime <= 1000) {
            # interval too short - keep the previously computed value
            $d->{cpu} = $old->{cpu};
            next;
        }

        my $dutime = $used - $old->{used};

        $d->{cpu} = (($dutime/$dtime)* $cpucount) / $d->{cpus};
        $last_proc_pid_stat->{$pid} = { time => $ctime, used => $used, cpu => $d->{cpu} };
    }

    return $res;
}
1875
# Call $func->($drivename, $drive) for every key of $conf that is a valid
# drive name and whose value can be parsed by parse_drive().
sub foreach_drive {
    my ($conf, $func) = @_;

    foreach my $name (keys %$conf) {
        next if !valid_drivename($name);

        my $parsed = parse_drive($name, $conf->{$name});
        next if !$parsed;

        $func->($name, $parsed);
    }
}
1888
1889sub config_to_command {
1890 my ($storecfg, $vmid, $conf, $defaults, $migrate_uri) = @_;
1891
1892 my $cmd = [];
b78ebef7 1893 my $pciaddr = '';
1e3baf05
DM
1894 my $kvmver = kvm_user_version();
1895 my $vernum = 0; # unknown
a3c52213
DM
1896 if ($kvmver =~ m/^(\d+)\.(\d+)$/) {
1897 $vernum = $1*1000000+$2*1000;
1898 } elsif ($kvmver =~ m/^(\d+)\.(\d+)\.(\d+)$/) {
1e3baf05
DM
1899 $vernum = $1*1000000+$2*1000+$3;
1900 }
1901
a3c52213 1902 die "detected old qemu-kvm binary ($kvmver)\n" if $vernum < 15000;
1e3baf05
DM
1903
1904 my $have_ovz = -f '/proc/vz/vestat';
1905
1906 push @$cmd, '/usr/bin/kvm';
1907
1908 push @$cmd, '-id', $vmid;
1909
1910 my $use_virtio = 0;
1911
6b64503e 1912 my $socket = monitor_socket($vmid);
abb39b66
DA
1913 push @$cmd, '-chardev', "socket,id=monitor,path=$socket,server,nowait";
1914 push @$cmd, '-mon', "chardev=monitor,mode=readline";
1e3baf05 1915
6b64503e 1916 $socket = vnc_socket($vmid);
1e3baf05
DM
1917 push @$cmd, '-vnc', "unix:$socket,x509,password";
1918
6b64503e 1919 push @$cmd, '-pidfile' , pidfile_name($vmid);
19672434 1920
1e3baf05
DM
1921 push @$cmd, '-daemonize';
1922
1923 push @$cmd, '-incoming', $migrate_uri if $migrate_uri;
1924
1c060867
DM
1925 my $use_usb2 = 0;
1926 for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
1927 next if !$conf->{"usb$i"};
1928 $use_usb2 = 1;
1929 }
1e3baf05 1930 # include usb device config
1c060867 1931 push @$cmd, '-readconfig', '/usr/share/qemu-server/pve-usb.cfg' if $use_usb2;
19672434 1932
1e3baf05 1933 # enable absolute mouse coordinates (needed by vnc)
6b64503e 1934 my $tablet = defined($conf->{tablet}) ? $conf->{tablet} : $defaults->{tablet};
1c060867
DM
1935 if ($tablet) {
1936 if ($use_usb2) {
1937 push @$cmd, '-device', 'usb-tablet,bus=ehci.0,port=6';
1938 } else {
1939 push @$cmd, '-usbdevice', 'tablet';
1940 }
1941 }
1e3baf05
DM
1942
1943 # host pci devices
040b06b7
DA
1944 for (my $i = 0; $i < $MAX_HOSTPCI_DEVICES; $i++) {
1945 my $d = parse_hostpci($conf->{"hostpci$i"});
1946 next if !$d;
b78ebef7
DA
1947 $pciaddr = print_pci_addr("hostpci$i");
1948 push @$cmd, '-device', "pci-assign,host=$d->{pciid},id=hostpci$i$pciaddr";
1e3baf05
DM
1949 }
1950
1951 # usb devices
1952 for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
1953 my $d = parse_usb_device($conf->{"usb$i"});
1954 next if !$d;
1955 if ($d->{vendorid} && $d->{productid}) {
1956 push @$cmd, '-device', "usb-host,vendorid=$d->{vendorid},productid=$d->{productid}";
1957 } elsif (defined($d->{hostbus}) && defined($d->{hostport})) {
1958 push @$cmd, '-device', "usb-host,hostbus=$d->{hostbus},hostport=$d->{hostport}";
1959 }
1960 }
1961
1e3baf05 1962 # serial devices
bae179aa 1963 for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
34978be3 1964 if (my $path = $conf->{"serial$i"}) {
19672434 1965 die "no such serial device\n" if ! -c $path;
34978be3
DM
1966 push @$cmd, '-chardev', "tty,id=serial$i,path=$path";
1967 push @$cmd, '-device', "isa-serial,chardev=serial$i";
1968 }
1e3baf05
DM
1969 }
1970
1971 # parallel devices
1989a89c 1972 for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
34978be3 1973 if (my $path = $conf->{"parallel$i"}) {
19672434 1974 die "no such parallel device\n" if ! -c $path;
34978be3
DM
1975 push @$cmd, '-chardev', "parport,id=parallel$i,path=$path";
1976 push @$cmd, '-device', "isa-parallel,chardev=parallel$i";
1977 }
1e3baf05
DM
1978 }
1979
1980 my $vmname = $conf->{name} || "vm$vmid";
1981
1982 push @$cmd, '-name', $vmname;
19672434 1983
1e3baf05
DM
1984 my $sockets = 1;
1985 $sockets = $conf->{smp} if $conf->{smp}; # old style - no longer iused
1986 $sockets = $conf->{sockets} if $conf->{sockets};
1987
1988 my $cores = $conf->{cores} || 1;
1989
1e3baf05
DM
1990 push @$cmd, '-smp', "sockets=$sockets,cores=$cores";
1991
1992 push @$cmd, '-cpu', $conf->{cpu} if $conf->{cpu};
1993
1e3baf05
DM
1994 push @$cmd, '-nodefaults';
1995
32baffb4 1996 my $bootorder = $conf->{boot} || $confdesc->{boot}->{default};
3b408e82 1997
0888fdce
DM
1998 my $bootindex_hash = {};
1999 my $i = 1;
2000 foreach my $o (split(//, $bootorder)) {
2001 $bootindex_hash->{$o} = $i*100;
2002 $i++;
afdb31d5 2003 }
3b408e82
DM
2004
2005 push @$cmd, '-boot', "menu=on";
1e3baf05 2006
6b64503e 2007 push @$cmd, '-no-acpi' if defined($conf->{acpi}) && $conf->{acpi} == 0;
1e3baf05 2008
6b64503e 2009 push @$cmd, '-no-reboot' if defined($conf->{reboot}) && $conf->{reboot} == 0;
1e3baf05
DM
2010
2011 my $vga = $conf->{vga};
2012 if (!$vga) {
2013 if ($conf->{ostype} && ($conf->{ostype} eq 'win7' || $conf->{ostype} eq 'w2k8')) {
2014 $vga = 'std';
2015 } else {
2016 $vga = 'cirrus';
2017 }
2018 }
19672434 2019
1e3baf05
DM
2020 push @$cmd, '-vga', $vga if $vga; # for kvm 77 and later
2021
2022 # time drift fix
6b64503e 2023 my $tdf = defined($conf->{tdf}) ? $conf->{tdf} : $defaults->{tdf};
da21653b
DM
2024 # ignore - no longer supported by newer kvm
2025 # push @$cmd, '-tdf' if $tdf;
1e3baf05 2026
6b64503e 2027 my $nokvm = defined($conf->{kvm}) && $conf->{kvm} == 0 ? 1 : 0;
1e3baf05
DM
2028
2029 if (my $ost = $conf->{ostype}) {
2030 # other, wxp, w2k, w2k3, w2k8, wvista, win7, l24, l26
2031
2032 if ($ost =~ m/^w/) { # windows
6b64503e 2033 push @$cmd, '-localtime' if !defined($conf->{localtime});
1e3baf05
DM
2034
2035 # use rtc-td-hack when acpi is enabled
6b64503e 2036 if (!(defined($conf->{acpi}) && $conf->{acpi} == 0)) {
1e3baf05
DM
2037 push @$cmd, '-rtc-td-hack';
2038 }
2039 }
2040
2041 # -tdf ?
19672434
DM
2042 # -no-acpi
2043 # -no-kvm
1e3baf05
DM
2044 # -win2k-hack ?
2045 }
2046
7f0b5beb
DM
2047 if ($nokvm) {
2048 push @$cmd, '-no-kvm';
2049 } else {
2050 die "No accelerator found!\n" if !$cpuinfo->{hvm};
2051 }
1e3baf05
DM
2052
2053 push @$cmd, '-localtime' if $conf->{localtime};
2054
2055 push @$cmd, '-startdate', $conf->{startdate} if $conf->{startdate};
2056
2057 push @$cmd, '-S' if $conf->{freeze};
2058
2059 # set keyboard layout
2060 my $kb = $conf->{keyboard} || $defaults->{keyboard};
2061 push @$cmd, '-k', $kb if $kb;
2062
2063 # enable sound
2064 #my $soundhw = $conf->{soundhw} || $defaults->{soundhw};
2065 #push @$cmd, '-soundhw', 'es1370';
2066 #push @$cmd, '-soundhw', $soundhw if $soundhw;
b78ebef7 2067 $pciaddr = print_pci_addr("balloon0");
13b5a753 2068 push @$cmd, '-device', "virtio-balloon-pci,id=balloon0$pciaddr" if $conf->{balloon};
1e3baf05 2069
0ea9541d
DM
2070 if ($conf->{watchdog}) {
2071 my $wdopts = parse_watchdog($conf->{watchdog});
0a40e8ea
DA
2072 $pciaddr = print_pci_addr("watchdog");
2073 my $watchdog = $wdopts->{model} || 'i6300esb';
2074 push @$cmd, '-device', "$watchdog$pciaddr";
0ea9541d
DM
2075 push @$cmd, '-watchdog-action', $wdopts->{action} if $wdopts->{action};
2076 }
2077
1e3baf05 2078 my $vollist = [];
941e0c42 2079 my $scsicontroller = {};
26ee04b6 2080 my $ahcicontroller = {};
1e3baf05
DM
2081
2082 foreach_drive($conf, sub {
2083 my ($ds, $drive) = @_;
2084
ff1a2432 2085 if (PVE::Storage::parse_volume_id($drive->{file}, 1)) {
1e3baf05 2086 push @$vollist, $drive->{file};
ff1a2432 2087 }
afdb31d5 2088
1e3baf05 2089 $use_virtio = 1 if $ds =~ m/^virtio/;
3b408e82
DM
2090
2091 if (drive_is_cdrom ($drive)) {
2092 if ($bootindex_hash->{d}) {
2093 $drive->{bootindex} = $bootindex_hash->{d};
2094 $bootindex_hash->{d} += 1;
2095 }
2096 } else {
2097 if ($bootindex_hash->{c}) {
2098 $drive->{bootindex} = $bootindex_hash->{c} if $conf->{bootdisk} && ($conf->{bootdisk} eq $ds);
2099 $bootindex_hash->{c} += 1;
2100 }
2101 }
2102
941e0c42
DA
2103 if ($drive->{interface} eq 'scsi') {
2104 my $maxdev = 7;
6b64503e 2105 my $controller = int($drive->{index} / $maxdev);
69b6ae0c
DA
2106 $pciaddr = print_pci_addr("lsi$controller");
2107 push @$cmd, '-device', "lsi,id=lsi$controller$pciaddr" if !$scsicontroller->{$controller};
58dc808d 2108 $scsicontroller->{$controller}=1;
941e0c42 2109 }
3b408e82 2110
26ee04b6
DA
2111 if ($drive->{interface} eq 'sata') {
2112 my $controller = int($drive->{index} / $MAX_SATA_DISKS);
2113 $pciaddr = print_pci_addr("ahci$controller");
2114 push @$cmd, '-device', "ahci,id=ahci$controller,multifunction=on$pciaddr" if !$ahcicontroller->{$controller};
2115 $ahcicontroller->{$controller}=1;
2116 }
2117
2118 push @$cmd, '-drive',print_drive_full($storecfg, $vmid, $drive);
6b64503e 2119 push @$cmd, '-device',print_drivedevice_full($storecfg,$vmid, $drive);
1e3baf05
DM
2120 });
2121
2122 push @$cmd, '-m', $conf->{memory} || $defaults->{memory};
19672434 2123
cc4d6182 2124 for (my $i = 0; $i < $MAX_NETS; $i++) {
5f0c4c32 2125 next if !$conf->{"net$i"};
cc4d6182
DA
2126 my $d = parse_net($conf->{"net$i"});
2127 next if !$d;
1e3baf05 2128
cc4d6182 2129 $use_virtio = 1 if $d->{model} eq 'virtio';
1e3baf05 2130
cc4d6182
DA
2131 if ($bootindex_hash->{n}) {
2132 $d->{bootindex} = $bootindex_hash->{n};
2133 $bootindex_hash->{n} += 1;
2134 }
1e3baf05 2135
cc4d6182
DA
2136 my $netdevfull = print_netdev_full($vmid,$conf,$d,"net$i");
2137 push @$cmd, '-netdev', $netdevfull;
1e3baf05 2138
cc4d6182
DA
2139 my $netdevicefull = print_netdevice_full($vmid,$conf,$d,"net$i");
2140 push @$cmd, '-device', $netdevicefull;
19672434
DM
2141 }
2142
1e3baf05
DM
2143
2144 # hack: virtio with fairsched is unreliable, so we do not use fairsched
2145 # when the VM uses virtio devices.
19672434
DM
2146 if (!$use_virtio && $have_ovz) {
2147
6b64503e 2148 my $cpuunits = defined($conf->{cpuunits}) ?
1e3baf05
DM
2149 $conf->{cpuunits} : $defaults->{cpuunits};
2150
2151 push @$cmd, '-cpuunits', $cpuunits if $cpuunits;
2152
2153 # fixme: cpulimit is currently ignored
2154 #push @$cmd, '-cpulimit', $conf->{cpulimit} if $conf->{cpulimit};
2155 }
2156
2157 # add custom args
2158 if ($conf->{args}) {
3ada46c9 2159 my $aa = PVE::Tools::split_args($conf->{args});
1e3baf05
DM
2160 push @$cmd, @$aa;
2161 }
2162
2163 return wantarray ? ($cmd, $vollist) : $cmd;
2164}
19672434 2165
1e3baf05
DM
# Build the per-VM path "<$var_run_tmpdir>/<vmid>.vnc".
sub vnc_socket {
    my $vmid = shift;

    return "$var_run_tmpdir/$vmid.vnc";
}
2170
# Build the per-VM path "<$var_run_tmpdir>/<vmid>.mon"; vm_monitor_command()
# connects to this path as a UNIX socket.
sub monitor_socket {
    my $vmid = shift;

    return "$var_run_tmpdir/$vmid.mon";
}
2175
# Build the per-VM path "<$var_run_tmpdir>/<vmid>.pid".
sub pidfile_name {
    my $vmid = shift;

    return "$var_run_tmpdir/$vmid.pid";
}
2180
1e3baf05
DM
# Probe the TCP ports 60000..60009 on localhost and return the first one
# we are able to listen on. Dies if none of them can be opened.
sub next_migrate_port {

    foreach my $port (60000 .. 60009) {

        my $probe = IO::Socket::INET->new(
            Listen => 5,
            LocalAddr => 'localhost',
            LocalPort => $port,
            ReuseAddr => 1,
            Proto => 0,
        );

        next if !$probe;

        # the socket was only a probe - release the port again
        close($probe);
        return $port;
    }

    die "unable to find free migration port";
}
2199
86fdcfb2
DA
# Ask the monitor of VM $vmid for "info pci" and collect every device that
# reports an id.
#
# Returns a hash reference { $id => { bus => $bus, addr => $addr } }, where
# bus/addr are taken from the most recent "Bus ..., device ..., function ...:"
# header line seen before the id line. Returns undef when no id line was found.
# Errors from vm_monitor_command() are not caught here.
sub vm_devices_list {
    my ($vmid) = @_;

    my $res = vm_monitor_command($vmid, "info pci");

    my $devices;
    my ($bus, $addr);

    foreach my $line (split("\n", $res)) {
        $line =~ s/^\s+//;

        # the monitor right-aligns the numbers, so the amount of whitespace
        # between the fields varies with the number of digits
        if ($line =~ m/^Bus\s+(\d+),\s+device\s+(\d+),\s+function\s+(\d+):$/) {
            ($bus, $addr) = ($1, $2);
        }

        if ($line =~ m/^id "([a-z][a-z_\-]*\d*)"$/) {
            my $id = $1;
            $devices->{$id}->{bus} = $bus;
            $devices->{$id}->{addr} = $addr;
        }
    }

    return $devices;
}
2226
# Hot-plug device $deviceid into the running VM $vmid.
#
# Handles ids of the form virtioN, lsiN, scsiN and netN; any other id is
# accepted without doing anything. Returns 1 on success (also when the VM is
# not running, hotplug is disabled in $conf, or the device is already listed
# by the monitor) and undef when one of the monitor steps failed.
sub vm_deviceplug {
    my ($storecfg, $conf, $vmid, $deviceid, $device) = @_;

    return 1 if !check_running($vmid) || !$conf->{hotplug};

    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$deviceid});

    if ($deviceid =~ m/^(virtio)(\d+)$/) {

        return undef if !qemu_driveadd($storecfg, $vmid, $device);

        qemu_deviceadd($vmid, print_drivedevice_full($storecfg, $vmid, $device));

        if (!qemu_deviceaddverify($vmid, $deviceid)) {
            # roll back the drive we added above
            qemu_drivedel($vmid, $deviceid);
            return undef;
        }

    } elsif ($deviceid =~ m/^(lsi)(\d+)$/) {

        my $slot = print_pci_addr($deviceid);
        qemu_deviceadd($vmid, "lsi,id=$deviceid$slot");

        return undef if !qemu_deviceaddverify($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        return undef if !qemu_findorcreatelsi($storecfg, $conf, $vmid, $device);
        return undef if !qemu_driveadd($storecfg, $vmid, $device);

        my $drivedevice = print_drivedevice_full($storecfg, $vmid, $device);
        if (!qemu_deviceadd($vmid, $drivedevice)) {
            # roll back the drive we added above
            qemu_drivedel($vmid, $deviceid);
            return undef;
        }

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        return undef if !qemu_netdevadd($vmid, $conf, $device, $deviceid);

        qemu_deviceadd($vmid, print_netdevice_full($vmid, $conf, $device, $deviceid));

        if (!qemu_deviceaddverify($vmid, $deviceid)) {
            # roll back the netdev backend we added above
            qemu_netdevdel($vmid, $deviceid);
            return undef;
        }
    }

    return 1;
}
2274
# Hot-unplug device $deviceid from the running VM $vmid.
#
# Returns 1 on success (also when the VM is not running, hotplug is disabled
# in $conf, or the monitor does not list the device) and undef when one of
# the monitor steps failed. Dies when asked to unplug the configured bootdisk.
sub vm_deviceunplug {
    my ($vmid, $conf, $deviceid) = @_;

    return 1 if !check_running($vmid) || !$conf->{hotplug};

    my $present = vm_devices_list($vmid);
    return 1 if !defined($present->{$deviceid});

    die "can't unplug bootdisk" if $conf->{bootdisk} && $conf->{bootdisk} eq $deviceid;

    if ($deviceid =~ m/^(virtio)(\d+)$/) {

        return undef if !qemu_drivedel($vmid, $deviceid);
        qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_devicedelverify($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(lsi)(\d+)$/) {

        return undef if !qemu_devicedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {

        return undef if !qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_drivedel($vmid, $deviceid);

    } elsif ($deviceid =~ m/^(net)(\d+)$/) {

        return undef if !qemu_netdevdel($vmid, $deviceid);
        qemu_devicedel($vmid, $deviceid);
        return undef if !qemu_devicedelverify($vmid, $deviceid);
    }

    return 1;
}
2308
# Send "device_add $devicefull" to the monitor of VM $vmid.
# Returns 1 when the monitor answered with nothing but whitespace, otherwise
# logs the answer to syslog and returns undef.
sub qemu_deviceadd {
    my ($vmid, $devicefull) = @_;

    my $answer = vm_monitor_command($vmid, "device_add $devicefull");
    $answer =~ s/^\s+//;

    # If the command succeeds, no output is sent. So any non-empty string shows an error
    if ($answer ne "") {
        syslog("err", "error on hotplug device : $answer");
        return undef;
    }

    return 1;
}
afdb31d5 2320
5e5dcb73
DA
# Send "device_del $deviceid" to the monitor of VM $vmid.
# Returns 1 when the monitor answered with nothing but whitespace, otherwise
# logs the answer to syslog and returns undef.
sub qemu_devicedel {
    my ($vmid, $deviceid) = @_;

    my $answer = vm_monitor_command($vmid, "device_del $deviceid");
    $answer =~ s/^\s+//;

    if ($answer ne "") {
        syslog("err", "detaching device $deviceid failed : $answer");
        return undef;
    }

    return 1;
}
2330
# Send "drive_add auto <drive>" to the monitor of VM $vmid, where <drive> is
# built by print_drive_full(). Returns 1 when the answer contains "OK",
# otherwise logs the answer to syslog and returns undef.
sub qemu_driveadd {
    my ($storecfg, $vmid, $device) = @_;

    my $drivespec = print_drive_full($storecfg, $vmid, $device);
    my $answer = vm_monitor_command($vmid, "drive_add auto $drivespec");

    # If the command succeeds qemu prints: "OK"
    return 1 if $answer =~ m/OK/s;

    syslog("err", "adding drive failed: $answer");
    return undef;
}
afdb31d5 2343
5e5dcb73
DA
# Send "drive_del drive-$deviceid" to the monitor of VM $vmid.
# Returns 1 when the monitor answered with nothing, or with a
# "Device '...' not found" message; any other answer is logged to syslog
# and undef is returned.
sub qemu_drivedel {
    my ($vmid, $deviceid) = @_;

    my $answer = vm_monitor_command($vmid, "drive_del drive-$deviceid");
    $answer =~ s/^\s+//;

    # NB: device not found errors mean the drive was auto-deleted and we ignore the error
    return 1 if $answer =~ m/Device \'.*?\' not found/s;

    return 1 if $answer eq "";

    syslog("err", "deleting drive $deviceid failed : $answer");
    return undef;
}
f19d1c47 2358
5e5dcb73
DA
# Poll vm_devices_list() up to six times, sleeping one second after every
# unsuccessful look, until $deviceid shows up. Returns 1 once the device is
# listed; otherwise logs an error to syslog and returns undef.
sub qemu_deviceaddverify {
    my ($vmid, $deviceid) = @_;

    foreach my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if defined($present->{$deviceid});
        sleep 1;
    }

    syslog("err", "error on hotplug device $deviceid");
    return undef;
}
afdb31d5 2370
5e5dcb73
DA
2371
# Poll vm_devices_list() up to six times, sleeping one second after every
# unsuccessful look, until $deviceid is gone. Returns 1 once the device is no
# longer listed; otherwise logs an error to syslog and returns undef.
sub qemu_devicedelverify {
    my ($vmid, $deviceid) = @_;

    # we need to verify that the device is really removed, because device_del
    # is async and an empty answer is not reliable
    foreach my $attempt (0 .. 5) {
        my $present = vm_devices_list($vmid);
        return 1 if !defined($present->{$deviceid});
        sleep 1;
    }

    syslog("err", "error on hot-unplugging device $deviceid");
    return undef;
}
2384
cfc817c7
DA
# Make sure the controller "lsi<N>" for drive $device exists in VM $vmid,
# with N = int($device->{index} / 7). The controller is hot-plugged via
# vm_deviceplug() when the monitor does not list it yet.
# Returns 1 on success and undef when plugging the controller failed.
sub qemu_findorcreatelsi {
    my ($storecfg, $conf, $vmid, $device) = @_;

    my $maxdev = 7;
    my $lsiid = "lsi" . int($device->{index} / $maxdev);

    my $present = vm_devices_list($vmid);
    return 1 if defined($present->{$lsiid});

    return undef if !vm_deviceplug($storecfg, $conf, $vmid, $lsiid);

    return 1;
}
2398
2630d2a9
DA
# Send "netdev_add <netdev>" to the monitor of VM $vmid, where <netdev> is
# built by print_netdev_full(). Returns 1 when the monitor answered with
# nothing but whitespace, otherwise logs the answer and returns undef.
sub qemu_netdevadd {
    my ($vmid, $conf, $device, $deviceid) = @_;

    my $netdevspec = print_netdev_full($vmid, $conf, $device, $deviceid);
    my $answer = vm_monitor_command($vmid, "netdev_add $netdevspec");
    $answer =~ s/^\s+//;

    # if the command succeeds, no output is sent. So any non-empty string shows an error
    if ($answer ne "") {
        syslog("err", "adding netdev failed: $answer");
        return undef;
    }

    return 1;
}
2411
# Send "netdev_del $deviceid" to the monitor of VM $vmid.
# Returns 1 when the monitor answered with nothing but whitespace, otherwise
# logs the answer to syslog and returns undef.
sub qemu_netdevdel {
    my ($vmid, $deviceid) = @_;

    my $answer = vm_monitor_command($vmid, "netdev_del $deviceid");
    $answer =~ s/^\s+//;

    # if the command succeeds, no output is sent. So any non-empty string shows an error
    if ($answer ne "") {
        syslog("err", "deleting netdev failed: $answer");
        return undef;
    }

    return 1;
}
2422
1e3baf05
DM
# Start VM $vmid while holding its config lock.
#
# $statefile - optional; the string 'tcp' makes the VM wait for an incoming
#              migration on a port chosen by next_migrate_port(), any other
#              value is treated as the path of a state file to load
#              (the file is unlinked after a successful start).
# $skiplock  - when true, the 'lock' setting in the config is not checked.
#
# Dies if the VM is already running, if a configured hostpci device can not
# be prepared, or if the start command fails. Monitor commands issued after
# the start (cont, migrate_set_speed, migrate_set_downtime) are best-effort.
sub vm_start {
    my ($storecfg, $vmid, $statefile, $skiplock) = @_;

    lock_config($vmid, sub {
        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        die "VM $vmid already running\n" if check_running($vmid);

        my $migrate_uri;
        my $migrate_port = 0;

        if ($statefile && $statefile eq 'tcp') {
            $migrate_port = next_migrate_port();
            $migrate_uri = "tcp:localhost:${migrate_port}";
        } elsif ($statefile) {
            if (-f $statefile) {
                $migrate_uri = "exec:cat $statefile";
            } else {
                warn "state file '$statefile' does not exist - doing normal startup\n";
            }
        }

        my $defaults = load_defaults();

        my ($cmd, $vollist) = config_to_command($storecfg, $vmid, $conf, $defaults, $migrate_uri);

        # host pci devices
        foreach my $i (0 .. $MAX_HOSTPCI_DEVICES - 1) {
            my $d = parse_hostpci($conf->{"hostpci$i"});
            next if !$d;

            my $info = pci_device_info("0000:$d->{pciid}");
            die "IOMMU not present\n" if !check_iommu_support();
            die "no pci device info for device '$d->{pciid}'\n" if !$info;
            die "can't unbind pci device '$d->{pciid}'\n" if !pci_dev_bind_to_stub($info);
            die "can't reset pci device '$d->{pciid}'\n" if !pci_dev_reset($info);
        }

        PVE::Storage::activate_volumes($storecfg, $vollist);

        # no timeout when we wait for incoming state, else 30 seconds
        eval { run_command($cmd, timeout => $migrate_uri ? undef : 30); };
        if (my $err = $@) {
            die "start failed: $err";
        }

        if ($statefile && $statefile eq 'tcp') {
            print "migration listens on port $migrate_port\n";
        } elsif ($statefile) {
            unlink $statefile;
            # fixme: send resume - is that necessary ?
            eval { vm_monitor_command($vmid, "cont"); };
        }

        # always set migrate speed (overwrite kvm default of 32m)
        # we set a very high default of 8192m which is basically unlimited
        my $migrate_speed = $conf->{migrate_speed} || $defaults->{migrate_speed} || 8192;
        eval {
            vm_monitor_command($vmid, "migrate_set_speed ${migrate_speed}m");
        };

        my $migrate_downtime = $conf->{migrate_downtime} || $defaults->{migrate_downtime};
        if ($migrate_downtime) {
            eval { vm_monitor_command($vmid, "migrate_set_downtime ${migrate_downtime}"); };
        }

        vm_balloonset($vmid, $conf->{balloon}) if $conf->{balloon};
    });
}
2498
# Read from $fh until the data ends with the monitor prompt "(qemu) " or
# end-of-file is reached, waiting at most $timeout seconds for each chunk.
#
# Returns everything read so far; the prompt itself is stripped from the
# chunk it was found in. Dies with the system error text when sysread fails
# and with "monitor read timeout" when no data arrived within $timeout.
sub __read_avail {
    my ($fh, $timeout) = @_;

    my $select = IO::Select->new();
    $select->add($fh);

    my $output = '';
    my $chunk;

    my @ready;
    while (scalar(@ready = $select->can_read($timeout))) {

        my $nread = $fh->sysread($chunk, 8192);

        die "$!\n" if !defined($nread);

        last if !$nread; # end of file

        if ($chunk =~ /^(.*)\(qemu\) $/s) {
            $output .= $1;
            last;
        }

        $output .= $chunk;
    }

    # an empty @ready means can_read() gave up waiting
    die "monitor read timeout\n" if !scalar(@ready);

    return $output;
}
2530
# Send the single command $cmdstr to the monitor socket of VM $vmid and
# return the monitor's answer.
#
# $nocheck is passed through to check_running().
#
# The answer has its first line removed (the echoed command) unless that line
# starts with "unknown command", and is returned as "\n"-joined lines with a
# trailing newline. For the commands 'q' and 'quit' no answer is read and
# undef is returned. Any failure is logged to syslog and re-thrown.
sub vm_monitor_command {
    my ($vmid, $cmdstr, $nocheck) = @_;

    my $res;

    eval {
        die "VM $vmid not running\n" if !check_running($vmid, $nocheck);

        my $sname = monitor_socket($vmid);

        my $sock = IO::Socket::UNIX->new(Peer => $sname) ||
            die "unable to connect to VM $vmid socket - $!\n";

        # hack: migrate sometime blocks the monitor (when migrate_downtime
        # is set)
        my $is_migrate = ($cmdstr =~ m/^(info\s+migrate|migrate\s)/) ? 1 : 0;

        my $timeout = $is_migrate ? 60*60 : 3; # 1 hour for migrate commands

        # read banner;
        my $banner = __read_avail($sock, $timeout);

        die "got unexpected qemu monitor banner\n"
            if $banner !~ m/^QEMU\s+(\S+)\s+monitor\s/;

        my $select = IO::Select->new();
        $select->add($sock);

        my @writable = $select->can_write($timeout);
        die "monitor write error - timeout" if !scalar(@writable);

        my $fullcmd = "$cmdstr\r";

        # syslog('info', "VM $vmid monitor command: $cmdstr");

        my $written = $sock->syswrite($fullcmd);
        if (!$written || ($written != length($fullcmd))) {
            die "monitor write error - $!";
        }

        # the monitor goes away on quit, so there is no answer to wait for
        return if ($cmdstr eq 'q') || ($cmdstr eq 'quit');

        if ($is_migrate) {
            $timeout = 60*60; # 1 hour
        } elsif ($cmdstr =~ m/^(eject|change)/) {
            $timeout = 60; # note: cdrom mount command is slow
        } else {
            $timeout = 20;
        }

        if ($res = __read_avail($sock, $timeout)) {

            my @lines = split("\r?\n", $res);

            shift @lines if $lines[0] !~ m/^unknown command/; # skip echo

            $res = join("\n", @lines) . "\n";
        }
    };

    if (my $err = $@) {
        syslog("err", "VM $vmid monitor command failed - $err");
        die $err;
    }

    return $res;
}
2604
# Return the command built by config_to_command() for VM $vmid as a single
# string, with the individual arguments joined by one space (no quoting).
sub vm_commandline {
    my ($storecfg, $vmid) = @_;

    my $conf = load_config($vmid);
    my $defaults = load_defaults();

    # scalar context: we only want the command, not the volume list
    my $argv = config_to_command($storecfg, $vmid, $conf, $defaults);

    return join(' ', @$argv);
}
2616
# Send "system_reset" to the monitor of VM $vmid while holding the config
# lock. The 'lock' setting of the config is checked unless $skiplock is true.
sub vm_reset {
    my ($vmid, $skiplock) = @_;

    my $reset = sub {
        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        vm_monitor_command($vmid, "system_reset");
    };

    lock_config($vmid, $reset);
}
2629
# Collect the {file} values of all drives in $conf for which
# PVE::Storage::parse_volume_id() returns a storage id, skipping values that
# are empty or start with '/'. Returns an array reference.
sub get_vm_volumes {
    my ($conf) = @_;

    my $vollist = [];

    foreach_drive($conf, sub {
        my ($ds, $drive) = @_;

        my $volid = $drive->{file};

        my ($sid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        return if !$volid || $volid =~ m|^/|;

        push @$vollist, $volid;
    });

    return $vollist;
}
2648
# Clean up after VM $vmid has stopped: call fairsched_rmnod() and, unless
# $keepActive is true, deactivate the volumes returned by get_vm_volumes().
# Errors are only reported with warn, never propagated.
sub vm_stop_cleanup {
    my ($storecfg, $vmid, $conf, $keepActive) = @_;

    eval {
        fairsched_rmnod($vmid); # try to destroy group

        return if $keepActive;

        PVE::Storage::deactivate_volumes($storecfg, get_vm_volumes($conf));
    };
    warn $@ if $@; # avoid errors - just warn
}
2662
# Stop VM $vmid while holding its config lock.
#
# Note: use $nocheck to skip loading (and lock-checking) the VM configuration
# file. We need that when migrating VMs to other nodes (files already moved).
# Note: we set $keepActive in vzdump stop mode - volumes need to stay active.
#
# $timeout  - seconds to wait for the VM to exit (default 60)
# $shutdown - send "system_powerdown" instead of "quit"
# $force    - escalate to SIGTERM (and after 10 more seconds SIGKILL) instead
#             of dying when the VM does not stop; defaults to 1 when
#             $shutdown is not set
sub vm_stop {
    my ($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive) = @_;

    $timeout = 60 if !defined($timeout);

    $force = 1 if !defined($force) && !$shutdown;

    lock_config($vmid, sub {

        my $pid = check_running($vmid, $nocheck);
        return if !$pid;

        my $conf;
        if (!$nocheck) {
            $conf = load_config($vmid);
            check_lock($conf) if !$skiplock;
        }

        # Poll once per second while the VM is still running, for at most
        # $limit seconds. Returns the number of seconds waited.
        my $wait_for_exit = sub {
            my ($limit) = @_;

            my $waited = 0;
            while (($waited < $limit) && check_running($vmid, $nocheck)) {
                $waited++;
                sleep 1;
            }
            return $waited;
        };

        my $request = $shutdown ? "system_powerdown" : "quit";
        eval { vm_monitor_command($vmid, $request, $nocheck); };
        my $err = $@;

        if ($err) {
            die "VM quit/powerdown failed\n" if !$force;

            warn "VM quit/powerdown failed - terminating now with SIGTERM\n";
            kill 15, $pid;
        } elsif ($wait_for_exit->($timeout) < $timeout) {
            # the VM went away in time
            vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
            return;
        } else {
            die "VM quit/powerdown failed - got timeout\n" if !$force;

            warn "VM still running - terminating now with SIGTERM\n";
            kill 15, $pid;
        }

        # wait again
        my $grace = 10;

        if ($wait_for_exit->($grace) >= $grace) {
            warn "VM still running - terminating now with SIGKILL\n";
            kill 9, $pid;
            sleep 1;
        }

        vm_stop_cleanup($storecfg, $vmid, $conf, $keepActive) if $conf;
    });
}
2738
# Send "stop" to the monitor of VM $vmid while holding the config lock.
# The 'lock' setting of the config is checked unless $skiplock is true.
sub vm_suspend {
    my ($vmid, $skiplock) = @_;

    my $suspend = sub {
        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        vm_monitor_command($vmid, "stop");
    };

    lock_config($vmid, $suspend);
}
2751
# Send "cont" to the monitor of VM $vmid while holding the config lock.
# The 'lock' setting of the config is checked unless $skiplock is true.
sub vm_resume {
    my ($vmid, $skiplock) = @_;

    my $resume = sub {
        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        vm_monitor_command($vmid, "cont");
    };

    lock_config($vmid, $resume);
}
2764
5fdbe4f0
DM
# Send "sendkey $key" to the monitor of VM $vmid while holding the config
# lock. The configuration is loaded, but its 'lock' setting is not checked;
# $skiplock is accepted and currently unused.
sub vm_sendkey {
    my ($vmid, $skiplock, $key) = @_;

    my $sendkey = sub {
        my $conf = load_config($vmid);

        vm_monitor_command($vmid, "sendkey $key");
    };

    lock_config($vmid, $sendkey);
}
2775
# Destroy VM $vmid while holding its config lock: call fairsched_rmnod() and
# destroy_vm(). Dies if the VM is still running. The 'lock' setting of the
# config is checked unless $skiplock is true.
sub vm_destroy {
    my ($storecfg, $vmid, $skiplock) = @_;

    lock_config($vmid, sub {

        my $conf = load_config($vmid);

        check_lock($conf) if !$skiplock;

        die "VM $vmid is running - destroy failed\n" if check_running($vmid);

        fairsched_rmnod($vmid); # try to destroy group
        destroy_vm($storecfg, $vmid);
    });
}
2793
# Stop all VMs which vzlist() reports with a pid.
#
# Escalation: "system_powerdown" to every VM and wait up to $timeout seconds
# (default 3 minutes); then "quit" and wait up to 30 seconds; then SIGTERM.
# The VM list is re-read every 5 seconds while waiting. Finally
# vm_stop_cleanup() is called for every VM that was running at the start and
# has no pid any more. Failures of single VMs are only reported with warn.
sub vm_stopall {
    my ($storecfg, $timeout) = @_;

    $timeout = 3*60 if !$timeout;

    my $wt = 5; # seconds between two looks at the VM list

    my $vzlist = vzlist();

    # ids of all VMs in the current $vzlist which have a pid
    my $running_vmids = sub {
        return grep { $vzlist->{$_}->{pid} } keys %$vzlist;
    };

    # remember what was running at the start, so that we can clean up later
    my $cleanuphash = {};
    my $count = 0;
    foreach my $vmid ($running_vmids->()) {
        $count++;
        $cleanuphash->{$vmid} = 1;
    }

    return if !$count;

    # Re-read the VM list every $wt seconds until nothing is running any
    # more, or about $limit seconds have passed. Updates $vzlist and $count.
    my $wait_for_exit = sub {
        my ($limit) = @_;

        my $maxtries = int(($limit + $wt -1)/$wt);
        my $try = 0;
        while (($try < $maxtries) && $count) {
            $try++;
            sleep $wt;

            $vzlist = vzlist();
            $count = scalar(my @still_running = $running_vmids->());
            last if !$count;
        }
    };

    my $msg = "Stopping Qemu Server - sending shutdown requests to all VMs\n";
    syslog('info', $msg);
    warn $msg;

    foreach my $vmid ($running_vmids->()) {
        eval { vm_monitor_command($vmid, "system_powerdown"); };
        warn $@ if $@;
    }

    $wait_for_exit->($timeout);

    if ($count) {

        foreach my $vmid ($running_vmids->()) {
            warn "VM $vmid still running - sending stop now\n";
            eval { vm_monitor_command($vmid, "quit"); };
            warn $@ if $@;
        }

        $wait_for_exit->(30);

        if ($count) {

            foreach my $vmid ($running_vmids->()) {
                warn "VM $vmid still running - terminating now with SIGTERM\n";
                kill 15, $vzlist->{$vmid}->{pid};
            }
            sleep 1;
        }

        # this is called by system shutdown scripts, so remaining
        # processes get killed anyway (no need to send kill -9 here)
    }

    $vzlist = vzlist();
    foreach my $vmid (keys %$cleanuphash) {
        next if $vzlist->{$vmid}->{pid};
        eval {
            my $conf = load_config($vmid);
            vm_stop_cleanup($storecfg, $vmid, $conf);
        };
        warn $@ if $@;
    }

    $msg = "Qemu Server stopped\n";
    syslog('info', $msg);
    print $msg;
}
2892
2893# pci helpers
2894
# Write $buf to $filename (the file is opened in "w" mode).
#
# Returns a true value when the data was written, and a false value when the
# file could not be opened, print failed, or closing the handle failed.
sub file_write {
    my ($filename, $buf) = @_;

    my $fh = IO::File->new($filename, "w");
    return undef if !$fh;

    my $res = print $fh $buf;

    # print only fills perl's buffer - the real write happens when the handle
    # is flushed on close, so a write error only shows up in the result of
    # close() and must not be ignored
    $res = undef if !$fh->close();

    return $res;
}
2907
# Read basic information about PCI device $name from
# "$pcisysfs/devices/$name".
#
# $name must look like "dddd:bb:ss.f" (lower case hex digits). Returns undef
# when the name does not match, or when the irq, vendor or device file can
# not be read in the expected format. Otherwise returns a hash reference with
# the keys name, vendor, product (both without the leading "0x"), domain,
# bus, slot, func, irq and has_fl_reset (true when a "reset" file exists).
sub pci_device_info {
    my ($name) = @_;

    return undef if $name !~ m/^([a-f0-9]{4}):([a-f0-9]{2}):([a-f0-9]{2})\.([a-f0-9])$/;
    my ($domain, $bus, $slot, $func) = ($1, $2, $3, $4);

    my $irq = file_read_firstline("$pcisysfs/devices/$name/irq");
    return undef if !defined($irq) || $irq !~ m/^\d+$/;

    # note: the substitutions below also strip the "0x" prefix
    my $vendor = file_read_firstline("$pcisysfs/devices/$name/vendor");
    return undef if !defined($vendor) || $vendor !~ s/^0x//;

    my $product = file_read_firstline("$pcisysfs/devices/$name/device");
    return undef if !defined($product) || $product !~ s/^0x//;

    my $has_fl_reset = -f "$pcisysfs/devices/$name/reset" || 0;

    return {
        name => $name,
        vendor => $vendor,
        product => $product,
        domain => $domain,
        bus => $bus,
        slot => $slot,
        func => $func,
        irq => $irq,
        has_fl_reset => $has_fl_reset,
    };
}
2939
# Write "1" to the "reset" file of PCI device $dev (a hash reference with a
# {name} entry) below "$pcisysfs/devices". Returns the result of file_write().
sub pci_dev_reset {
    my ($dev) = @_;

    return file_write("$pcisysfs/devices/$dev->{name}/reset", "1");
}
2949
# Bind PCI device $dev (hash reference with name, vendor and product) to the
# pci-stub driver using the files below "$pcisysfs".
#
# Returns 1 when the device directory already exists below the pci-stub
# driver, undef when one of the required writes failed, and otherwise the
# result of testing for that directory after the bind.
sub pci_dev_bind_to_stub {
    my ($dev) = @_;

    my $name = $dev->{name};
    my $stubdir = "$pcisysfs/drivers/pci-stub";

    my $testdir = "$stubdir/$name";
    return 1 if -d $testdir;

    # register the vendor/product pair with pci-stub
    return undef if !file_write("$stubdir/new_id", "$dev->{vendor} $dev->{product}");

    # detach from the current driver; a failed write only counts as an error
    # when the unbind file exists
    my $unbind = "$pcisysfs/devices/$name/driver/unbind";
    return undef if !file_write($unbind, $name) && -f $unbind;

    # bind explicitly when the device did not show up below pci-stub yet
    return undef if !-d $testdir && !file_write("$stubdir/bind", $name);

    return -d $testdir;
}
2973
# Return the ",bus=pci.<bus>,addr=0x<hex addr>" suffix for the device with
# id $id, or an empty string when $id has no entry in the table below.
sub print_pci_addr {
    my ($id) = @_;

    my $devices = {
        #addr1 : ide,parallel,serial (motherboard)
        #addr2 : first videocard
        balloon0 => { bus => 0, addr => 3 },
        watchdog => { bus => 0, addr => 4 },
        lsi0 => { bus => 0, addr => 5 },
        lsi1 => { bus => 0, addr => 6 },
        ahci0 => { bus => 0, addr => 7 },
        virtio0 => { bus => 0, addr => 10 },
        virtio1 => { bus => 0, addr => 11 },
        virtio2 => { bus => 0, addr => 12 },
        virtio3 => { bus => 0, addr => 13 },
        virtio4 => { bus => 0, addr => 14 },
        virtio5 => { bus => 0, addr => 15 },
        hostpci0 => { bus => 0, addr => 16 },
        hostpci1 => { bus => 0, addr => 17 },
        net0 => { bus => 0, addr => 18 },
        net1 => { bus => 0, addr => 19 },
        net2 => { bus => 0, addr => 20 },
        net3 => { bus => 0, addr => 21 },
        net4 => { bus => 0, addr => 22 },
        net5 => { bus => 0, addr => 23 },
        #addr29 : usb-host (pve-usb.cfg)
    };

    my $slot = $devices->{$id};

    return '' if !$slot || !defined($slot->{bus}) || !defined($slot->{addr});

    return sprintf(",bus=pci.%s,addr=0x%x", $slot->{bus}, $slot->{addr});
}
3010
# Send "balloon $value" to the monitor of VM $vmid.
sub vm_balloonset {
    my ($vmid, $value) = @_;

    my $request = "balloon $value";

    vm_monitor_command($vmid, $request);
}
3016
3e16d5fc
DM
3017# vzdump restore implementation
3018
# Return the name of the first member of the tar archive $archive, as
# printed by "tar tf" (without the trailing newline).
#
# Dies when $archive is not a plain file, when tar can not be started, or
# when tar lists nothing.
sub archive_read_firstfile {
    my $archive = shift;

    die "ERROR: file '$archive' does not exist\n" if ! -f $archive;

    # try to detect archive type first
    # list-form pipe open: the file name is handed to tar as a single
    # argument and never passes through a shell, so quotes or other shell
    # meta characters in the name are harmless
    my $pid = open(my $tarfh, '-|', 'tar', 'tf', $archive) ||
        die "unable to open file '$archive'\n";
    my $firstfile = <$tarfh>;

    # we only need the first line - do not wait for tar to list the rest
    kill 15, $pid;
    close $tarfh;

    die "ERROR: archive contaions no data\n" if !$firstfile;
    chomp $firstfile;

    return $firstfile;
}
3036
# Remove the volumes recorded in $statfile after a failed restore.
#
# Every line is expected to end with "vzdump:<name>:<volid>". A <volid>
# starting with '/' is unlinked as a file, anything else is freed with
# PVE::Storage::vdisk_free(). The outcome for each volume is reported on
# STDERR; a failure does not abort the cleanup of the remaining volumes.
# Nothing is cleaned up when $statfile can not be opened.
sub restore_cleanup {
    my $statfile = shift;

    print STDERR "starting cleanup\n";

    if (my $fd = IO::File->new($statfile, "r")) {
        while (defined(my $line = <$fd>)) {
            if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                my $volid = $2;
                eval {
                    if ($volid =~ m|^/|) {
                        # the parens matter: "unlink $volid || die" would
                        # apply the || to $volid, not to the result of unlink
                        unlink($volid) || die "unlink failed - $!\n";
                    } else {
                        my $cfg = cfs_read_file('storage.cfg');
                        PVE::Storage::vdisk_free($cfg, $volid);
                    }
                    print STDERR "temporary volume '$volid' sucessfuly removed\n";
                };
                print STDERR "unable to cleanup '$volid' - $@" if $@;
            } else {
                print STDERR "unable to parse line in statfile - $line";
            }
        }
        $fd->close();
    }
}
3063
3064sub restore_archive {
a0d1b1a2 3065 my ($archive, $vmid, $user, $opts) = @_;
3e16d5fc 3066
9c502e26
DM
3067 if ($archive ne '-') {
3068 my $firstfile = archive_read_firstfile($archive);
3069 die "ERROR: file '$archive' dos not lock like a QemuServer vzdump backup\n"
3070 if $firstfile ne 'qemu-server.conf';
3071 }
3e16d5fc
DM
3072
3073 my $tocmd = "/usr/lib/qemu-server/qmextract";
3074
2415a446 3075 $tocmd .= " --storage " . PVE::Tools::shellquote($opts->{storage}) if $opts->{storage};
a0d1b1a2 3076 $tocmd .= " --pool " . PVE::Tools::shellquote($opts->{pool}) if $opts->{pool};
3e16d5fc
DM
3077 $tocmd .= ' --prealloc' if $opts->{prealloc};
3078 $tocmd .= ' --info' if $opts->{info};
3079
a0d1b1a2 3080 # tar option "xf" does not autodetect compression when read from STDIN,
9c502e26 3081 # so we pipe to zcat
2415a446
DM
3082 my $cmd = "zcat -f|tar xf " . PVE::Tools::shellquote($archive) . " " .
3083 PVE::Tools::shellquote("--to-command=$tocmd");
3e16d5fc
DM
3084
3085 my $tmpdir = "/var/tmp/vzdumptmp$$";
3086 mkpath $tmpdir;
3087
3088 local $ENV{VZDUMP_TMPDIR} = $tmpdir;
3089 local $ENV{VZDUMP_VMID} = $vmid;
a0d1b1a2 3090 local $ENV{VZDUMP_USER} = $user;
3e16d5fc
DM
3091
3092 my $conffile = PVE::QemuServer::config_file($vmid);
3093 my $tmpfn = "$conffile.$$.tmp";
3094
3095 # disable interrupts (always do cleanups)
3096 local $SIG{INT} = $SIG{TERM} = $SIG{QUIT} = $SIG{HUP} = sub {
3097 print STDERR "got interrupt - ignored\n";
3098 };
3099
afdb31d5 3100 eval {
3e16d5fc
DM
3101 # enable interrupts
3102 local $SIG{INT} = $SIG{TERM} = $SIG{QUIT} = $SIG{HUP} = $SIG{PIPE} = sub {
3103 die "interrupted by signal\n";
3104 };
3105
9c502e26
DM
3106 if ($archive eq '-') {
3107 print "extracting archive from STDIN\n";
3108 run_command($cmd, input => "<&STDIN");
3109 } else {
3110 print "extracting archive '$archive'\n";
3111 run_command($cmd);
3112 }
3e16d5fc
DM
3113
3114 return if $opts->{info};
3115
3116 # read new mapping
3117 my $map = {};
3118 my $statfile = "$tmpdir/qmrestore.stat";
3119 if (my $fd = IO::File->new($statfile, "r")) {
3120 while (defined (my $line = <$fd>)) {
3121 if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
3122 $map->{$1} = $2 if $1;
3123 } else {
3124 print STDERR "unable to parse line in statfile - $line\n";
3125 }
3126 }
3127 $fd->close();
3128 }
3129
3130 my $confsrc = "$tmpdir/qemu-server.conf";
3131
3132 my $srcfd = new IO::File($confsrc, "r") ||
3133 die "unable to open file '$confsrc'\n";
3134
3135 my $outfd = new IO::File ($tmpfn, "w") ||
3136 die "unable to write config for VM $vmid\n";
3137
51586c3a
DM
3138 my $netcount = 0;
3139
3e16d5fc
DM
3140 while (defined (my $line = <$srcfd>)) {
3141 next if $line =~ m/^\#vzdump\#/;
3142 next if $line =~ m/^lock:/;
3143 next if $line =~ m/^unused\d+:/;
3144
51586c3a
DM
3145 if (($line =~ m/^(vlan(\d+)):\s*(\S+)\s*$/)) {
3146 # try to convert old 1.X settings
3147 my ($id, $ind, $ethcfg) = ($1, $2, $3);
3148 foreach my $devconfig (PVE::Tools::split_list($ethcfg)) {
3149 my ($model, $macaddr) = split(/\=/, $devconfig);
3150 $macaddr = PVE::Tools::random_ether_addr() if !$macaddr || $opts->{unique};
3151 my $net = {
3152 model => $model,
3153 bridge => "vmbr$ind",
3154 macaddr => $macaddr,
3155 };
3156 my $netstr = print_net($net);
3157 print $outfd "net${netcount}: $netstr\n";
3158 $netcount++;
3159 }
3160 } elsif (($line =~ m/^(net\d+):\s*(\S+)\s*$/) && ($opts->{unique})) {
3161 my ($id, $netstr) = ($1, $2);
3162 my $net = parse_net($netstr);
3163 $net->{macaddr} = PVE::Tools::random_ether_addr() if $net->{macaddr};
3164 $netstr = print_net($net);
afdb31d5 3165 print $outfd "$id: $netstr\n";
51586c3a 3166 } elsif ($line =~ m/^((ide|scsi|virtio)\d+):\s*(\S+)\s*$/) {
3e16d5fc
DM
3167 my $virtdev = $1;
3168 my $value = $2;
3169 if ($line =~ m/backup=no/) {
3170 print $outfd "#$line";
3171 } elsif ($virtdev && $map->{$virtdev}) {
3172 my $di = PVE::QemuServer::parse_drive($virtdev, $value);
3173 $di->{file} = $map->{$virtdev};
3174 $value = PVE::QemuServer::print_drive($vmid, $di);
3175 print $outfd "$virtdev: $value\n";
3176 } else {
3177 print $outfd $line;
3178 }
3179 } else {
3180 print $outfd $line;
3181 }
3182 }
3183
3184 $srcfd->close();
3185 $outfd->close();
3186 };
3187 my $err = $@;
3188
afdb31d5 3189 if ($err) {
3e16d5fc
DM
3190
3191 unlink $tmpfn;
3192
3193 restore_cleanup("$tmpdir/qmrestore.stat") if !$opts->{info};
afdb31d5 3194
3e16d5fc 3195 die $err;
afdb31d5 3196 }
3e16d5fc
DM
3197
3198 rmtree $tmpdir;
3199
3200 rename $tmpfn, $conffile ||
3201 die "unable to commit configuration file '$conffile'\n";
3202};
3203
1e3baf05 32041;