1 package PVE
::QemuServer
;
11 use File
::Copy
qw(copy);
22 use List
::Util
qw(first);
25 use Storable
qw(dclone);
26 use Time
::HiRes
qw(gettimeofday usleep);
30 use PVE
::Cluster
qw(cfs_register_file cfs_read_file cfs_write_file);
33 use PVE
::DataCenterConfig
;
34 use PVE
::Exception
qw(raise raise_param_exc);
35 use PVE
::Format
qw(render_duration render_bytes);
36 use PVE
::GuestHelpers
qw(safe_string_ne safe_num_ne safe_boolean_ne);
38 use PVE
::JSONSchema
qw(get_standard_option parse_property_string);
41 use PVE
::RESTEnvironment
qw(log_warn);
42 use PVE
::RPCEnvironment
;
46 use PVE
::Tools
qw(run_command file_read_firstline file_get_contents dir_glob_foreach get_host_arch $IPV6RE);
50 use PVE
::QemuServer
::Helpers
qw(min_version config_aware_timeout windows_version);
51 use PVE
::QemuServer
::Cloudinit
;
52 use PVE
::QemuServer
::CGroup
;
53 use PVE
::QemuServer
::CPUConfig
qw(print_cpu_device get_cpu_options);
54 use PVE
::QemuServer
::Drive
qw(is_valid_drivename drive_is_cloudinit drive_is_cdrom drive_is_read_only parse_drive print_drive);
55 use PVE
::QemuServer
::Machine
;
56 use PVE
::QemuServer
::Memory
;
57 use PVE
::QemuServer
::Monitor
qw(mon_cmd);
58 use PVE
::QemuServer
::PCI
qw(print_pci_addr print_pcie_addr print_pcie_root_port parse_hostpci);
59 use PVE
::QemuServer
::USB
qw(parse_usb_device);
63 require PVE
::Network
::SDN
::Zones
;
67 my $EDK2_FW_BASE = '/usr/share/pve-edk2-firmware/';
71 "$EDK2_FW_BASE/OVMF_CODE_4M.fd",
72 "$EDK2_FW_BASE/OVMF_VARS_4M.fd",
75 "$EDK2_FW_BASE/OVMF_CODE_4M.fd",
76 "$EDK2_FW_BASE/OVMF_VARS_4M.ms.fd",
79 "$EDK2_FW_BASE/OVMF_CODE_4M.secboot.fd",
80 "$EDK2_FW_BASE/OVMF_VARS_4M.fd",
83 "$EDK2_FW_BASE/OVMF_CODE_4M.secboot.fd",
84 "$EDK2_FW_BASE/OVMF_VARS_4M.ms.fd",
87 "$EDK2_FW_BASE/OVMF_CODE.fd",
88 "$EDK2_FW_BASE/OVMF_VARS.fd",
93 "$EDK2_FW_BASE/AAVMF_CODE.fd",
94 "$EDK2_FW_BASE/AAVMF_VARS.fd",
99 my $cpuinfo = PVE
::ProcFSTools
::read_cpuinfo
();
101 # Note about locking: we use flock on the config file to protect against concurrent actions.
102 # Additionally, we have a 'lock' setting in the config file. This can be set to 'migrate',
103 # 'backup', 'snapshot' or 'rollback'. Most actions are not allowed when such a lock is set.
104 # But you can ignore this kind of lock with the --skiplock flag.
112 PVE
::JSONSchema
::register_standard_option
('pve-qm-stateuri', {
113 description
=> "Some command save/restore state from this location.",
119 PVE
::JSONSchema
::register_standard_option
('pve-qemu-machine', {
120 description
=> "Specifies the QEMU machine type.",
122 pattern
=> '(pc|pc(-i440fx)?-\d+(\.\d+)+(\+pve\d+)?(\.pxe)?|q35|pc-q35-\d+(\.\d+)+(\+pve\d+)?(\.pxe)?|virt(?:-\d+(\.\d+)+)?(\+pve\d+)?)',
127 # FIXME: remove in favor of just using the INotify one, it's cached there exactly the same way
130 $nodename_cache //= PVE
::INotify
::nodename
();
131 return $nodename_cache;
138 enum
=> [qw(i6300esb ib700)],
139 description
=> "Watchdog type to emulate.",
140 default => 'i6300esb',
145 enum
=> [qw(reset shutdown poweroff pause debug none)],
146 description
=> "The action to perform if after activation the guest fails to poll the watchdog in time.",
150 PVE
::JSONSchema
::register_format
('pve-qm-watchdog', $watchdog_fmt);
154 description
=> "Enable/disable communication with a QEMU Guest Agent (QGA) running in the VM.",
159 fstrim_cloned_disks
=> {
160 description
=> "Run fstrim after moving a disk or migrating the VM.",
166 description
=> "Select the agent type",
170 enum
=> [qw(virtio isa)],
176 description
=> "Select the VGA type.",
181 enum
=> [qw(cirrus qxl qxl2 qxl3 qxl4 none serial0 serial1 serial2 serial3 std virtio virtio-gl vmware)],
184 description
=> "Sets the VGA memory (in MiB). Has no effect with serial display.",
196 description
=> "The size of the file in MB.",
200 pattern
=> '[a-zA-Z0-9\-]+',
202 format_description
=> 'string',
203 description
=> "The name of the file. Will be prefixed with 'pve-shm-'. Default is the VMID. Will be deleted when the VM is stopped.",
210 enum
=> [qw(ich9-intel-hda intel-hda AC97)],
211 description
=> "Configure an audio device."
215 enum
=> ['spice', 'none'],
218 description
=> "Driver backend for the audio device."
222 my $spice_enhancements_fmt = {
227 description
=> "Enable folder sharing via SPICE. Needs Spice-WebDAV daemon installed in the VM."
231 enum
=> ['off', 'all', 'filter'],
234 description
=> "Enable video streaming. Uses compression for detected video streams."
241 enum
=> ['/dev/urandom', '/dev/random', '/dev/hwrng'],
243 description
=> "The file on the host to gather entropy from. In most cases '/dev/urandom'"
244 ." should be preferred over '/dev/random' to avoid entropy-starvation issues on the"
245 ." host. Using urandom does *not* decrease security in any meaningful way, as it's"
246 ." still seeded from real entropy, and the bytes provided will most likely be mixed"
247 ." with real entropy on the guest as well. '/dev/hwrng' can be used to pass through"
248 ." a hardware RNG from the host.",
252 description
=> "Maximum bytes of entropy allowed to get injected into the guest every"
253 ." 'period' milliseconds. Prefer a lower value when using '/dev/random' as source. Use"
254 ." `0` to disable limiting (potentially dangerous!).",
257 # default is 1 KiB/s, provides enough entropy to the guest to avoid boot-starvation issues
258 # (e.g. systemd etc...) while allowing no chance of overwhelming the host, provided we're
259 # reading from /dev/urandom
264 description
=> "Every 'period' milliseconds the entropy-injection quota is reset, allowing"
265 ." the guest to retrieve another 'max_bytes' of entropy.",
271 my $meta_info_fmt = {
274 description
=> "The guest creation timestamp as UNIX epoch time",
280 description
=> "The QEMU (machine) version from the time this VM was created.",
281 pattern
=> '\d+(\.\d+)+',
290 description
=> "Specifies whether a VM will be started during system bootup.",
296 description
=> "Automatic restart after crash (currently ignored).",
301 type
=> 'string', format
=> 'pve-hotplug-features',
302 description
=> "Selectively enable hotplug features. This is a comma separated list of"
303 ." hotplug features: 'network', 'disk', 'cpu', 'memory', 'usb' and 'cloudinit'. Use '0' to disable"
304 ." hotplug completely. Using '1' as value is an alias for the default `network,disk,usb`."
305 ." USB hotplugging is possible for guests with machine version >= 7.1 and ostype l26 or"
307 default => 'network,disk,usb',
312 description
=> "Allow reboot. If set to '0' the VM exit on reboot.",
318 description
=> "Lock/unlock the VM.",
319 enum
=> [qw(backup clone create migrate rollback snapshot snapshot-delete suspending suspended)],
324 description
=> "Limit of CPU usage.",
325 verbose_description
=> "Limit of CPU usage.\n\nNOTE: If the computer has 2 CPUs, it has"
326 ." total of '2' CPU time. Value '0' indicates no CPU limit.",
334 description
=> "CPU weight for a VM, will be clamped to [1, 10000] in cgroup v2.",
335 verbose_description
=> "CPU weight for a VM. Argument is used in the kernel fair scheduler."
336 ." The larger the number is, the more CPU time this VM gets. Number is relative to"
337 ." weights of all the other running VMs.",
340 default => 'cgroup v1: 1024, cgroup v2: 100',
345 description
=> "Amount of RAM for the VM in MB. This is the maximum available memory when"
346 ." you use the balloon device.",
353 description
=> "Amount of target RAM for the VM in MB. Using zero disables the ballon driver.",
359 description
=> "Amount of memory shares for auto-ballooning. The larger the number is, the"
360 ." more memory this VM gets. Number is relative to weights of all other running VMs."
361 ." Using zero disables auto-ballooning. Auto-ballooning is done by pvestatd.",
369 description
=> "Keyboard layout for VNC server. This option is generally not required and"
370 ." is often better handled from within the guest OS.",
371 enum
=> PVE
::Tools
::kvmkeymaplist
(),
376 type
=> 'string', format
=> 'dns-name',
377 description
=> "Set a name for the VM. Only used on the configuration web interface.",
382 description
=> "SCSI controller model",
383 enum
=> [qw(lsi lsi53c810 virtio-scsi-pci virtio-scsi-single megasas pvscsi)],
389 description
=> "Description for the VM. Shown in the web-interface VM's summary."
390 ." This is saved as comment inside the configuration file.",
391 maxLength
=> 1024 * 8,
396 enum
=> [qw(other wxp w2k w2k3 w2k8 wvista win7 win8 win10 win11 l24 l26 solaris)],
397 description
=> "Specify guest operating system.",
398 verbose_description
=> <<EODESC,
399 Specify guest operating system. This is used to enable special
400 optimization/features for specific operating systems:
403 other;; unspecified OS
404 wxp;; Microsoft Windows XP
405 w2k;; Microsoft Windows 2000
406 w2k3;; Microsoft Windows 2003
407 w2k8;; Microsoft Windows 2008
408 wvista;; Microsoft Windows Vista
409 win7;; Microsoft Windows 7
410 win8;; Microsoft Windows 8/2012/2012r2
411 win10;; Microsoft Windows 10/2016/2019
412 win11;; Microsoft Windows 11/2022
413 l24;; Linux 2.4 Kernel
414 l26;; Linux 2.6 - 5.X Kernel
415 solaris;; Solaris/OpenSolaris/OpenIndiania kernel
420 type
=> 'string', format
=> 'pve-qm-boot',
421 description
=> "Specify guest boot order. Use the 'order=' sub-property as usage with no"
422 ." key or 'legacy=' is deprecated.",
426 type
=> 'string', format
=> 'pve-qm-bootdisk',
427 description
=> "Enable booting from specified disk. Deprecated: Use 'boot: order=foo;bar' instead.",
428 pattern
=> '(ide|sata|scsi|virtio)\d+',
433 description
=> "The number of CPUs. Please use option -sockets instead.",
440 description
=> "The number of CPU sockets.",
447 description
=> "The number of cores per socket.",
454 description
=> "Enable/disable NUMA.",
460 description
=> "Enable/disable hugepages memory.",
461 enum
=> [qw(any 2 1024)],
467 description
=> "Use together with hugepages. If enabled, hugepages will not not be deleted"
468 ." after VM shutdown and can be used for subsequent starts.",
473 description
=> "Number of hotplugged vcpus.",
480 description
=> "Enable/disable ACPI.",
485 description
=> "Enable/disable communication with the QEMU Guest Agent and its properties.",
487 format
=> $agent_fmt,
492 description
=> "Enable/disable KVM hardware virtualization.",
498 description
=> "Enable/disable time drift fix.",
504 description
=> "Set the real time clock (RTC) to local time. This is enabled by default if"
505 ." the `ostype` indicates a Microsoft Windows OS.",
510 description
=> "Freeze CPU at startup (use 'c' monitor command to start execution).",
514 type
=> 'string', format
=> $vga_fmt,
515 description
=> "Configure the VGA hardware.",
516 verbose_description
=> "Configure the VGA Hardware. If you want to use high resolution"
517 ." modes (>= 1280x1024x16) you may need to increase the vga memory option. Since QEMU"
518 ." 2.9 the default VGA display type is 'std' for all OS types besides some Windows"
519 ." versions (XP and older) which use 'cirrus'. The 'qxl' option enables the SPICE"
520 ." display server. For win* OS you can select how many independent displays you want,"
521 ." Linux guests can add displays them self.\nYou can also run without any graphic card,"
522 ." using a serial device as terminal.",
526 type
=> 'string', format
=> 'pve-qm-watchdog',
527 description
=> "Create a virtual hardware watchdog device.",
528 verbose_description
=> "Create a virtual hardware watchdog device. Once enabled (by a guest"
529 ." action), the watchdog must be periodically polled by an agent inside the guest or"
530 ." else the watchdog will reset the guest (or execute the respective action specified)",
535 typetext
=> "(now | YYYY-MM-DD | YYYY-MM-DDTHH:MM:SS)",
536 description
=> "Set the initial date of the real time clock. Valid format for date are:"
537 ."'now' or '2006-06-17T16:01:21' or '2006-06-17'.",
538 pattern
=> '(now|\d{4}-\d{1,2}-\d{1,2}(T\d{1,2}:\d{1,2}:\d{1,2})?)',
541 startup
=> get_standard_option
('pve-startup-order'),
545 description
=> "Enable/disable Template.",
551 description
=> "Arbitrary arguments passed to kvm.",
552 verbose_description
=> <<EODESCR,
553 Arbitrary arguments passed to kvm, for example:
555 args: -no-reboot -no-hpet
557 NOTE: this option is for experts only.
564 description
=> "Enable/disable the USB tablet device.",
565 verbose_description
=> "Enable/disable the USB tablet device. This device is usually needed"
566 ." to allow absolute mouse positioning with VNC. Else the mouse runs out of sync with"
567 ." normal VNC clients. If you're running lots of console-only guests on one host, you"
568 ." may consider disabling this to save some context switches. This is turned off by"
569 ." default if you use spice (`qm set <vmid> --vga qxl`).",
574 description
=> "Set maximum speed (in MB/s) for migrations. Value 0 is no limit.",
578 migrate_downtime
=> {
581 description
=> "Set maximum tolerated downtime (in seconds) for migrations.",
587 type
=> 'string', format
=> 'pve-qm-ide',
588 typetext
=> '<volume>',
589 description
=> "This is an alias for option -ide2",
593 description
=> "Emulated CPU type.",
595 format
=> 'pve-vm-cpu-conf',
597 parent
=> get_standard_option
('pve-snapshot-name', {
599 description
=> "Parent snapshot name. This is used internally, and should not be modified.",
603 description
=> "Timestamp for snapshots.",
609 type
=> 'string', format
=> 'pve-volume-id',
610 description
=> "Reference to a volume which stores the VM state. This is used internally"
613 vmstatestorage
=> get_standard_option
('pve-storage-id', {
614 description
=> "Default storage for VM state volumes/files.",
617 runningmachine
=> get_standard_option
('pve-qemu-machine', {
618 description
=> "Specifies the QEMU machine type of the running vm. This is used internally"
622 description
=> "Specifies the QEMU '-cpu' parameter of the running vm. This is used"
623 ." internally for snapshots.",
626 pattern
=> $PVE::QemuServer
::CPUConfig
::qemu_cmdline_cpu_re
,
627 format_description
=> 'QEMU -cpu parameter'
629 machine
=> get_standard_option
('pve-qemu-machine'),
631 description
=> "Virtual processor architecture. Defaults to the host.",
634 enum
=> [qw(x86_64 aarch64)],
637 description
=> "Specify SMBIOS type 1 fields.",
638 type
=> 'string', format
=> 'pve-qm-smbios1',
645 description
=> "Sets the protection flag of the VM. This will disable the remove VM and"
646 ." remove disk operations.",
652 enum
=> [ qw(seabios ovmf) ],
653 description
=> "Select BIOS implementation.",
654 default => 'seabios',
658 pattern
=> '(?:[a-fA-F0-9]{8}(?:-[a-fA-F0-9]{4}){3}-[a-fA-F0-9]{12}|[01])',
659 format_description
=> 'UUID',
660 description
=> "Set VM Generation ID. Use '1' to autogenerate on create or update, pass '0'"
661 ." to disable explicitly.",
662 verbose_description
=> "The VM generation ID (vmgenid) device exposes a 128-bit integer"
663 ." value identifier to the guest OS. This allows to notify the guest operating system"
664 ." when the virtual machine is executed with a different configuration (e.g. snapshot"
665 ." execution or creation from a template). The guest operating system notices the"
666 ." change, and is then able to react as appropriate by marking its copies of"
667 ." distributed databases as dirty, re-initializing its random number generator, etc.\n"
668 ."Note that auto-creation only works when done through API/CLI create or update methods"
669 .", but not when manually editing the config file.",
670 default => "1 (autogenerated)",
675 format
=> 'pve-volume-id',
677 description
=> "Script that will be executed during various steps in the vms lifetime.",
681 format
=> $ivshmem_fmt,
682 description
=> "Inter-VM shared memory. Useful for direct communication between VMs, or to"
688 format
=> $audio_fmt,
689 description
=> "Configure a audio device, useful in combination with QXL/Spice.",
692 spice_enhancements
=> {
694 format
=> $spice_enhancements_fmt,
695 description
=> "Configure additional enhancements for SPICE.",
699 type
=> 'string', format
=> 'pve-tag-list',
700 description
=> 'Tags of the VM. This is only meta information.',
706 description
=> "Configure a VirtIO-based Random Number Generator.",
711 format
=> $meta_info_fmt,
712 description
=> "Some (read-only) meta-information about this guest.",
716 type
=> 'string', format
=> 'pve-cpuset',
717 description
=> "List of host cores used to execute guest processes, for example: 0,5,8-11",
726 description
=> 'Specify a custom file containing all meta data passed to the VM via"
727 ." cloud-init. This is provider specific meaning configdrive2 and nocloud differ.',
728 format
=> 'pve-volume-id',
729 format_description
=> 'volume',
734 description
=> 'Specify a custom file containing all network data passed to the VM via'
736 format
=> 'pve-volume-id',
737 format_description
=> 'volume',
742 description
=> 'Specify a custom file containing all user data passed to the VM via'
744 format
=> 'pve-volume-id',
745 format_description
=> 'volume',
750 description
=> 'Specify a custom file containing all vendor data passed to the VM via'
752 format
=> 'pve-volume-id',
753 format_description
=> 'volume',
756 PVE
::JSONSchema
::register_format
('pve-qm-cicustom', $cicustom_fmt);
758 my $confdesc_cloudinit = {
762 description
=> 'Specifies the cloud-init configuration format. The default depends on the'
763 .' configured operating system type (`ostype`. We use the `nocloud` format for Linux,'
764 .' and `configdrive2` for windows.',
765 enum
=> ['configdrive2', 'nocloud', 'opennebula'],
770 description
=> "cloud-init: User name to change ssh keys and password for instead of the"
771 ." image's configured default user.",
776 description
=> 'cloud-init: Password to assign the user. Using this is generally not'
777 .' recommended. Use ssh keys instead. Also note that older cloud-init versions do not'
778 .' support hashed passwords.',
783 description
=> 'cloud-init: Specify custom files to replace the automatically generated'
785 format
=> 'pve-qm-cicustom',
790 description
=> 'cloud-init: Sets DNS search domains for a container. Create will'
791 .' automatically use the setting from the host if neither searchdomain nor nameserver'
796 type
=> 'string', format
=> 'address-list',
797 description
=> 'cloud-init: Sets DNS server IP address for a container. Create will'
798 .' automatically use the setting from the host if neither searchdomain nor nameserver'
804 format
=> 'urlencoded',
805 description
=> "cloud-init: Setup public SSH keys (one key per line, OpenSSH format).",
809 # what about other qemu settings ?
811 #machine => 'string',
824 ##soundhw => 'string',
826 while (my ($k, $v) = each %$confdesc) {
827 PVE
::JSONSchema
::register_standard_option
("pve-qm-$k", $v);
830 my $MAX_USB_DEVICES = 14;
832 my $MAX_SERIAL_PORTS = 4;
833 my $MAX_PARALLEL_PORTS = 3;
839 pattern
=> qr/\d+(?:-\d+)?(?:;\d+(?:-\d+)?)*/,
840 description
=> "CPUs accessing this NUMA node.",
841 format_description
=> "id[-id];...",
845 description
=> "Amount of memory this NUMA node provides.",
850 pattern
=> qr/\d+(?:-\d+)?(?:;\d+(?:-\d+)?)*/,
851 description
=> "Host NUMA nodes to use.",
852 format_description
=> "id[-id];...",
857 enum
=> [qw(preferred bind interleave)],
858 description
=> "NUMA allocation policy.",
862 PVE
::JSONSchema
::register_format
('pve-qm-numanode', $numa_fmt);
865 type
=> 'string', format
=> $numa_fmt,
866 description
=> "NUMA topology.",
868 PVE
::JSONSchema
::register_standard_option
("pve-qm-numanode", $numadesc);
870 for (my $i = 0; $i < $MAX_NUMA; $i++) {
871 $confdesc->{"numa$i"} = $numadesc;
874 my $nic_model_list = [
890 my $nic_model_list_txt = join(' ', sort @$nic_model_list);
892 my $net_fmt_bridge_descr = <<__EOD__;
893 Bridge to attach the network device to. The Proxmox VE standard bridge
896 If you do not specify a bridge, we create a kvm user (NATed) network
897 device, which provides DHCP and DNS services. The following addresses
904 The DHCP server assign addresses to the guest starting from 10.0.2.15.
908 macaddr
=> get_standard_option
('mac-addr', {
909 description
=> "MAC address. That address must be unique withing your network. This is"
910 ." automatically generated if not specified.",
914 description
=> "Network Card Model. The 'virtio' model provides the best performance with"
915 ." very low CPU overhead. If your guest does not support this driver, it is usually"
916 ." best to use 'e1000'.",
917 enum
=> $nic_model_list,
920 (map { $_ => { keyAlias
=> 'model', alias
=> 'macaddr' }} @$nic_model_list),
921 bridge
=> get_standard_option
('pve-bridge-id', {
922 description
=> $net_fmt_bridge_descr,
927 minimum
=> 0, maximum
=> 64,
928 description
=> 'Number of packet queues to be used on the device.',
934 description
=> "Rate limit in mbps (megabytes per second) as floating point number.",
939 minimum
=> 1, maximum
=> 4094,
940 description
=> 'VLAN tag to apply to packets on this interface.',
945 pattern
=> qr/\d+(?:-\d+)?(?:;\d+(?:-\d+)?)*/,
946 description
=> 'VLAN trunks to pass through this interface.',
947 format_description
=> 'vlanid[;vlanid...]',
952 description
=> 'Whether this interface should be protected by the firewall.',
957 description
=> 'Whether this interface should be disconnected (like pulling the plug).',
962 minimum
=> 1, maximum
=> 65520,
963 description
=> "Force MTU, for VirtIO only. Set to '1' to use the bridge MTU",
970 type
=> 'string', format
=> $net_fmt,
971 description
=> "Specify network devices.",
974 PVE
::JSONSchema
::register_standard_option
("pve-qm-net", $netdesc);
979 format
=> 'pve-ipv4-config',
980 format_description
=> 'IPv4Format/CIDR',
981 description
=> 'IPv4 address in CIDR format.',
988 format_description
=> 'GatewayIPv4',
989 description
=> 'Default gateway for IPv4 traffic.',
995 format
=> 'pve-ipv6-config',
996 format_description
=> 'IPv6Format/CIDR',
997 description
=> 'IPv6 address in CIDR format.',
1004 format_description
=> 'GatewayIPv6',
1005 description
=> 'Default gateway for IPv6 traffic.',
1010 PVE
::JSONSchema
::register_format
('pve-qm-ipconfig', $ipconfig_fmt);
1011 my $ipconfigdesc = {
1013 type
=> 'string', format
=> 'pve-qm-ipconfig',
1014 description
=> <<'EODESCR',
1015 cloud-init: Specify IP addresses and gateways for the corresponding interface.
1017 IP addresses use CIDR notation, gateways are optional but need an IP of the same type specified.
1019 The special string 'dhcp' can be used for IP addresses to use DHCP, in which case no explicit
1020 gateway should be provided.
1021 For IPv6 the special string 'auto' can be used to use stateless autoconfiguration. This requires
1022 cloud-init 19.4 or newer.
1024 If cloud-init is enabled and neither an IPv4 nor an IPv6 address is specified, it defaults to using
# Register the cloud-init per-interface IP configuration as a standard option.
# This has to be the 'pve-qm-ipconfig' descriptor ($ipconfigdesc); $netdesc is
# the NIC descriptor, which is already registered under "pve-qm-net", so using
# it here would publish the wrong schema under the ipconfig name.
PVE::JSONSchema::register_standard_option("pve-qm-ipconfig", $ipconfigdesc);
1030 for (my $i = 0; $i < $MAX_NETS; $i++) {
1031 $confdesc->{"net$i"} = $netdesc;
1032 $confdesc_cloudinit->{"ipconfig$i"} = $ipconfigdesc;
1035 foreach my $key (keys %$confdesc_cloudinit) {
1036 $confdesc->{$key} = $confdesc_cloudinit->{$key};
1039 PVE
::JSONSchema
::register_format
('pve-cpuset', \
&pve_verify_cpuset
);
# Format verifier for 'pve-cpuset' values.
# Parses $set_text with PVE::CpuSet::parse_cpuset and returns the short_string()
# rendering of a PVE::CpuSet object built from the parsed members.
1040 sub pve_verify_cpuset
{
1041 my ($set_text, $noerr) = @_;
# the eval keeps an exception thrown by the parser from propagating directly
1043 my ($count, $members) = eval { PVE
::CpuSet
::parse_cpuset
($set_text) };
# NOTE(review): the condition guarding this die is not visible in this excerpt;
# presumably it only fires when parsing failed and $noerr is not set - confirm
1047 die "unable to parse cpuset option\n";
1050 return PVE
::CpuSet-
>new($members)->short_string();
1053 PVE
::JSONSchema
::register_format
('pve-volume-id-or-qm-path', \
&verify_volume_id_or_qm_path
);
# Format check behind 'pve-volume-id-or-qm-path'.
#
# The keywords 'none' and 'cdrom' are accepted verbatim. Every other value is
# handed to verify_volume_id_or_absolute_path() together with $noerr, and the
# result of that call is returned unchanged.
sub verify_volume_id_or_qm_path {
    my ($volid, $noerr) = @_;

    for my $keyword (qw(none cdrom)) {
        return $volid if $volid eq $keyword;
    }

    return verify_volume_id_or_absolute_path($volid, $noerr);
}
1062 PVE
::JSONSchema
::register_format
('pve-volume-id-or-absolute-path', \
&verify_volume_id_or_absolute_path
);
1063 sub verify_volume_id_or_absolute_path
{
1064 my ($volid, $noerr) = @_;
1066 return $volid if $volid =~ m
|^/|;
1068 $volid = eval { PVE
::JSONSchema
::check_format
('pve-volume-id', $volid, '') };
1079 type
=> 'string', format
=> 'pve-qm-usb-device',
1080 format_description
=> 'HOSTUSBDEVICE|spice',
1081 description
=> <<EODESCR,
1082 The Host USB device or port or the value 'spice'. HOSTUSBDEVICE syntax is:
1084 'bus-port(.port)*' (decimal numbers) or
1085 'vendor_id:product_id' (hexadeciaml numbers) or
1088 You can use the 'lsusb -t' command to list existing usb devices.
1090 NOTE: This option allows direct access to host hardware. So it is no longer possible to migrate such
1091 machines - use with special care.
1093 The value 'spice' can be used to add a usb redirection devices for spice.
1099 description
=> "Specifies whether if given host option is a USB3 device or port."
1100 ." For modern guests (machine version >= 7.1 and ostype l26 and windows > 7), this flag"
1101 ." is irrelevant (all devices are plugged into a xhci controller).",
1108 type
=> 'string', format
=> $usb_fmt,
1109 description
=> "Configure an USB device (n is 0 to 4, for machine version >= 7.1 and ostype"
1110 ." l26 or windows > 7, n can be up to 14).",
1112 PVE
::JSONSchema
::register_standard_option
("pve-qm-usb", $usbdesc);
1117 pattern
=> '(/dev/.+|socket)',
1118 description
=> "Create a serial device inside the VM (n is 0 to 3)",
1119 verbose_description
=> <<EODESCR,
1120 Create a serial device inside the VM (n is 0 to 3), and pass through a
1121 host serial device (i.e. /dev/ttyS0), or create a unix socket on the
1122 host side (use 'qm terminal' to open a terminal connection).
1124 NOTE: If you pass through a host serial device, it is no longer possible to migrate such machines -
1125 use with special care.
1127 CAUTION: Experimental! User reported problems with this option.
1134 pattern
=> '/dev/parport\d+|/dev/usb/lp\d+',
1135 description
=> "Map host parallel devices (n is 0 to 2).",
1136 verbose_description
=> <<EODESCR,
1137 Map host parallel devices (n is 0 to 2).
1139 NOTE: This option allows direct access to host hardware. So it is no longer possible to migrate such
1140 machines - use with special care.
1142 CAUTION: Experimental! User reported problems with this option.
1146 for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
1147 $confdesc->{"parallel$i"} = $paralleldesc;
1150 for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
1151 $confdesc->{"serial$i"} = $serialdesc;
1154 for (my $i = 0; $i < $PVE::QemuServer
::PCI
::MAX_HOSTPCI_DEVICES
; $i++) {
1155 $confdesc->{"hostpci$i"} = $PVE::QemuServer
::PCI
::hostpcidesc
;
1158 for my $key (keys %{$PVE::QemuServer
::Drive
::drivedesc_hash
}) {
1159 $confdesc->{$key} = $PVE::QemuServer
::Drive
::drivedesc_hash-
>{$key};
1162 for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
1163 $confdesc->{"usb$i"} = $usbdesc;
1171 description
=> "Boot on floppy (a), hard disk (c), CD-ROM (d), or network (n)."
1172 . " Deprecated, use 'order=' instead.",
1173 pattern
=> '[acdn]{1,4}',
1174 format_description
=> "[acdn]{1,4}",
1176 # note: this is also the fallback if boot: is not given at all
1182 format
=> 'pve-qm-bootdev-list',
1183 format_description
=> "device[;device...]",
1184 description
=> <<EODESC,
1185 The guest will attempt to boot from devices in the order they appear here.
1187 Disks, optical drives and passed-through storage USB devices will be directly
1188 booted from, NICs will load PXE, and PCIe devices will either behave like disks
1189 (e.g. NVMe) or load an option ROM (e.g. RAID controller, hardware NIC).
1191 Note that only devices in this list will be marked as bootable and thus loaded
1192 by the guest firmware (BIOS/UEFI). If you require multiple disks for booting
1193 (e.g. software-raid), you need to specify all of them here.
1195 Overrides the deprecated 'legacy=[acdn]*' value when given.
1199 PVE
::JSONSchema
::register_format
('pve-qm-boot', $boot_fmt);
1201 PVE
::JSONSchema
::register_format
('pve-qm-bootdev', \
&verify_bootdev
);
# Format verifier for a single boot device name ('pve-qm-bootdev').
# Returns $dev when it is accepted and dies with "invalid boot device" otherwise.
# NOTE(review): $noerr is unpacked but its handling is not visible in this
# excerpt - confirm how it suppresses the final die.
1202 sub verify_bootdev
{
1203 my ($dev, $noerr) = @_;
# efidisk* and tpmstate* names are flagged so they are not accepted as boot drives
1205 my $special = $dev =~ m/^efidisk/ || $dev =~ m/^tpmstate/;
1206 return $dev if PVE
::QemuServer
::Drive
::is_valid_drivename
($dev) && !$special;
# NOTE(review): the next two lines presumably form the body of the $check
# helper (its definition is not visible here): the name must be "<base><digits>"
# and must have an entry in $confdesc
1210 return 0 if $dev !~ m/^$base\d+$/;
1211 return 0 if !$confdesc->{$dev};
# besides drives, net, usb and hostpci entries are accepted as boot devices
1215 return $dev if $check->("net");
1216 return $dev if $check->("usb");
1217 return $dev if $check->("hostpci");
1220 die "invalid boot device '$dev'\n";
# Render a list of boot devices as a 'boot' property string.
# NOTE(review): $devs is presumably an array reference unpacked from @_ on a
# line that is not visible in this excerpt - confirm.
1223 sub print_bootorder
{
# an empty device list yields an empty string
1225 return "" if !@$devs;
# the devices are joined with ';' and stored under the 'order' key
1226 my $data = { order
=> join(';', @$devs) };
# serialize according to the boot format description ($boot_fmt)
1227 return PVE
::JSONSchema
::print_property_string
($data, $boot_fmt);
1230 my $kvm_api_version = 0;
1233 return $kvm_api_version if $kvm_api_version;
1235 open my $fh, '<', '/dev/kvm' or return;
1237 # 0xae00 => KVM_GET_API_VERSION
1238 $kvm_api_version = ioctl($fh, 0xae00, 0);
1241 return $kvm_api_version;
1244 my $kvm_user_version = {};
1247 sub kvm_user_version
{
1250 $binary //= get_command_for_arch
(get_host_arch
()); # get the native arch by default
1251 my $st = stat($binary);
1253 my $cachedmtime = $kvm_mtime->{$binary} // -1;
1254 return $kvm_user_version->{$binary} if $kvm_user_version->{$binary} &&
1255 $cachedmtime == $st->mtime;
1257 $kvm_user_version->{$binary} = 'unknown';
1258 $kvm_mtime->{$binary} = $st->mtime;
1262 if ($line =~ m/^QEMU( PC)? emulator version (\d+\.\d+(\.\d+)?)(\.\d+)?[,\s]/) {
1263 $kvm_user_version->{$binary} = $2;
1267 eval { run_command
([$binary, '--version'], outfunc
=> $code); };
1270 return $kvm_user_version->{$binary};
# Thin wrapper around PVE::QemuServer::Machine::extract_version().
#
# $machine_type is passed through as is. When the caller gives no $version,
# the version reported by kvm_user_version() is used instead.
my sub extract_version {
    my ($machine_type, $version) = @_;

    $version //= kvm_user_version();

    return PVE::QemuServer::Machine::extract_version($machine_type, $version);
}
# Tell whether the vhost-net device node is present on this host.
# Returns the result of the -c (character special file) test on '/dev/vhost-net'.
sub kernel_has_vhost_net {
    my $vhost_dev = '/dev/vhost-net';

    return -c $vhost_dev;
}
1285 return defined($confdesc->{$key});
# Look up the path of the host's physical CD-ROM device node.
# The result is kept in $cdrom_path (declared outside the visible lines), so
# the lookup is not repeated once a defined value is stored there.
1289 sub get_cdrom_path
{
1291 return $cdrom_path if defined($cdrom_path);
# take the first of /dev/cdrom, /dev/cdrom1, /dev/cdrom2 that is a symlink
1293 $cdrom_path = first
{ -l
$_ } map { "/dev/cdrom$_" } ('', '1', '2');
# none of the candidates exists as a symlink: emit a warning
# NOTE(review): the rest of this branch and the final return are not visible here
1295 if (!defined($cdrom_path)) {
1296 log_warn
("no physical CD-ROM available, ignoring");
1304 my ($storecfg, $vmid, $cdrom) = @_;
1306 if ($cdrom eq 'cdrom') {
1307 return get_cdrom_path
();
1308 } elsif ($cdrom eq 'none') {
1310 } elsif ($cdrom =~ m
|^/|) {
1313 return PVE
::Storage
::path
($storecfg, $cdrom);
1317 # try to convert old style file names to volume IDs
# Rewrite an old-style bare file name into a volume ID on the 'local' storage.
# Parameters: $vmid (used in the generated volume ID), $file (the value to
# convert) and $media (optional; 'cdrom' selects the iso location).
1318 sub filename_to_volume_id
{
1319 my ($vmid, $file, $media) = @_;
# 'none', 'cdrom', /dev/... paths and values already in "storage:volume" form
# are not rewritten
1321 if (!($file eq 'none' || $file eq 'cdrom' ||
1322 $file =~ m
|^/dev/.+| || $file =~ m/^([^:]+):(.+)$/)) {
# anything else containing a '/' cannot be converted: return nothing
1324 return if $file =~ m
|/|;
# cdrom media maps to "local:iso/<file>"
1326 if ($media && $media eq 'cdrom') {
1327 $file = "local:iso/$file";
# NOTE(review): presumably the else branch (not visible here) - other media map
# to "local:<vmid>/<file>"
1329 $file = "local:$vmid/$file";
# Check that the volume type $vtype matches what the drive's $media setting expects.
# Returns nothing when they match; otherwise raises a parameter exception keyed
# by the option name $opt.
1336 sub verify_media_type
{
1337 my ($opt, $vtype, $media) = @_;
# NOTE(review): the branches presumably set the expected type $etype for 'disk'
# and 'cdrom'; the assignments themselves are not visible in this excerpt
1342 if ($media eq 'disk') {
1344 } elsif ($media eq 'cdrom') {
# NOTE(review): presumably reached for any other media value - confirm
1347 die "internal error";
1350 return if ($vtype eq $etype);
1352 raise_param_exc
({ $opt => "unexpected media type ($vtype != $etype)" });
1355 sub cleanup_drive_path
{
1356 my ($opt, $storecfg, $drive) = @_;
1358 # try to convert filesystem paths to volume IDs
1360 if (($drive->{file
} !~ m/^(cdrom|none)$/) &&
1361 ($drive->{file
} !~ m
|^/dev/.+|) &&
1362 ($drive->{file
} !~ m/^([^:]+):(.+)$/) &&
1363 ($drive->{file
} !~ m/^\d+$/)) {
1364 my ($vtype, $volid) = PVE
::Storage
::path_to_volume_id
($storecfg, $drive->{file
});
1365 raise_param_exc
({ $opt => "unable to associate path '$drive->{file}' to any storage"})
1367 $drive->{media
} = 'cdrom' if !$drive->{media
} && $vtype eq 'iso';
1368 verify_media_type
($opt, $vtype, $drive->{media
});
1369 $drive->{file
} = $volid;
1372 $drive->{media
} = 'cdrom' if !$drive->{media
} && $drive->{file
} =~ m/^(cdrom|none)$/;
# Parse the value of the 'hotplug' option into $res.
# NOTE(review): the unpacking of $data and the setup and final return of $res
# are not visible in this excerpt.
1375 sub parse_hotplug_features
{
# '0' means no hotplug feature at all: return $res as it was initialised
1380 return $res if $data eq '0';
# '1' is replaced by the default declared for the 'hotplug' option in $confdesc
1382 $data = $confdesc->{hotplug
}->{default} if $data eq '1';
1384 foreach my $feature (PVE
::Tools
::split_list
($data)) {
# only these six feature names are recognised
1385 if ($feature =~ m/^(network|disk|cpu|memory|usb|cloudinit)$/) {
# NOTE(review): presumably the else branch for an unrecognised name - confirm
1388 die "invalid hotplug feature '$feature'\n";
1394 PVE
::JSONSchema
::register_format
('pve-hotplug-features', \
&pve_verify_hotplug_features
);
# Format verifier for 'pve-hotplug-features'.
# Returns $value unchanged when parse_hotplug_features() returns a true value for it.
1395 sub pve_verify_hotplug_features
{
1396 my ($value, $noerr) = @_;
1398 return $value if parse_hotplug_features
($value);
# NOTE(review): a guard using $noerr presumably sits before this die on a line
# not visible in this excerpt - confirm
1402 die "unable to parse hotplug option\n";
1406 my($fh, $noerr) = @_;
1409 my $SG_GET_VERSION_NUM = 0x2282;
1411 my $versionbuf = "\x00" x
8;
1412 my $ret = ioctl($fh, $SG_GET_VERSION_NUM, $versionbuf);
1414 die "scsi ioctl SG_GET_VERSION_NUM failoed - $!\n" if !$noerr;
1417 my $version = unpack("I", $versionbuf);
1418 if ($version < 30000) {
1419 die "scsi generic interface too old\n" if !$noerr;
1423 my $buf = "\x00" x
36;
1424 my $sensebuf = "\x00" x
8;
1425 my $cmd = pack("C x3 C x1", 0x12, 36);
1427 # see /usr/include/scsi/sg.h
1428 my $sg_io_hdr_t = "i i C C s I P P P I I i P C C C C S S i I I";
1431 $sg_io_hdr_t, ord('S'), -3, length($cmd), length($sensebuf), 0, length($buf), $buf, $cmd, $sensebuf, 6000
1434 $ret = ioctl($fh, $SG_IO, $packet);
1436 die "scsi ioctl SG_IO failed - $!\n" if !$noerr;
1440 my @res = unpack($sg_io_hdr_t, $packet);
1441 if ($res[17] || $res[18]) {
1442 die "scsi ioctl SG_IO status error - $!\n" if !$noerr;
1447 $res->@{qw(type removable vendor product revision)} = unpack("C C x6 A8 A16 A4", $buf);
1449 $res->{removable
} = $res->{removable
} & 128 ?
1 : 0;
1450 $res->{type
} &= 0x1F;
1458 my $fh = IO
::File-
>new("+<$path") || return;
1459 my $res = scsi_inquiry
($fh, 1);
# Build the QEMU device string for the USB tablet.
# The tablet always gets id 'tablet' and port 1; the USB bus name ($usbbus) is
# chosen from the machine type and the guest architecture.
1465 sub print_tabletdevice_full
{
1466 my ($conf, $arch) = @_;
1468 my $q35 = PVE
::QemuServer
::Machine
::machine_type_is_q35
($conf);
1470 # we use uhci for old VMs because tablet driver was buggy in older qemu
# NOTE(review): the assignments to $usbbus are not visible in this excerpt;
# q35 machines and aarch64 guests take the branch below
1472 if ($q35 || $arch eq 'aarch64') {
1478 return "usb-tablet,id=tablet,bus=$usbbus.0,port=1";
# Build the QEMU device string for an explicit USB keyboard.
#
# A keyboard device is only produced for aarch64 guests; for every other
# architecture nothing is returned. $conf is accepted but not consulted.
sub print_keyboarddevice_full {
    my ($conf, $arch) = @_;

    if ($arch eq 'aarch64') {
        return "usb-kbd,id=keyboard,bus=ehci.0,port=2";
    }

    return;
}
# Build a drive's identifier by concatenating its 'interface' and 'index'
# fields, e.g. interface 'virtio' with index 0 gives "virtio0".
# NOTE(review): $drive is presumably unpacked from @_ on a line that is not
# visible in this excerpt - confirm.
1489 my sub get_drive_id
{
1491 return "$drive->{interface}$drive->{index}";
1494 sub print_drivedevice_full
{
1495 my ($storecfg, $conf, $vmid, $drive, $bridges, $arch, $machine_type) = @_;
1500 my $drive_id = get_drive_id
($drive);
1501 if ($drive->{interface
} eq 'virtio') {
1502 my $pciaddr = print_pci_addr
("$drive_id", $bridges, $arch, $machine_type);
1503 $device = "virtio-blk-pci,drive=drive-$drive_id,id=${drive_id}${pciaddr}";
1504 $device .= ",iothread=iothread-$drive_id" if $drive->{iothread
};
1505 } elsif ($drive->{interface
} eq 'scsi') {
1507 my ($maxdev, $controller, $controller_prefix) = scsihw_infos
($conf, $drive);
1508 my $unit = $drive->{index} % $maxdev;
1509 my $devicetype = 'hd';
1511 if (drive_is_cdrom
($drive)) {
1514 if ($drive->{file
} =~ m
|^/|) {
1515 $path = $drive->{file
};
1516 if (my $info = path_is_scsi
($path)) {
1517 if ($info->{type
} == 0 && $drive->{scsiblock
}) {
1518 $devicetype = 'block';
1519 } elsif ($info->{type
} == 1) { # tape
1520 $devicetype = 'generic';
1524 $path = PVE
::Storage
::path
($storecfg, $drive->{file
});
1527 # for compatibility only, we prefer scsi-hd (#2408, #2355, #2380)
1528 my $version = extract_version
($machine_type, kvm_user_version
());
1529 if ($path =~ m/^iscsi\:\/\
// &&
1530 !min_version
($version, 4, 1)) {
1531 $devicetype = 'generic';
1535 if (!$conf->{scsihw
} || $conf->{scsihw
} =~ m/^lsi/ || $conf->{scsihw
} eq 'pvscsi') {
1536 $device = "scsi-$devicetype,bus=$controller_prefix$controller.0,scsi-id=$unit";
1538 $device = "scsi-$devicetype,bus=$controller_prefix$controller.0,channel=0,scsi-id=0"
1539 .",lun=$drive->{index}";
1541 $device .= ",drive=drive-$drive_id,id=$drive_id";
1543 if ($drive->{ssd
} && ($devicetype eq 'block' || $devicetype eq 'hd')) {
1544 $device .= ",rotation_rate=1";
1546 $device .= ",wwn=$drive->{wwn}" if $drive->{wwn
};
1548 } elsif ($drive->{interface
} eq 'ide' || $drive->{interface
} eq 'sata') {
1549 my $maxdev = ($drive->{interface
} eq 'sata') ?
$PVE::QemuServer
::Drive
::MAX_SATA_DISKS
: 2;
1550 my $controller = int($drive->{index} / $maxdev);
1551 my $unit = $drive->{index} % $maxdev;
1552 my $devicetype = ($drive->{media
} && $drive->{media
} eq 'cdrom') ?
"cd" : "hd";
1554 $device = "ide-$devicetype";
1555 if ($drive->{interface
} eq 'ide') {
1556 $device .= ",bus=ide.$controller,unit=$unit";
1558 $device .= ",bus=ahci$controller.$unit";
1560 $device .= ",drive=drive-$drive_id,id=$drive_id";
1562 if ($devicetype eq 'hd') {
1563 if (my $model = $drive->{model
}) {
1564 $model = URI
::Escape
::uri_unescape
($model);
1565 $device .= ",model=$model";
1567 if ($drive->{ssd
}) {
1568 $device .= ",rotation_rate=1";
1571 $device .= ",wwn=$drive->{wwn}" if $drive->{wwn
};
1572 } elsif ($drive->{interface
} eq 'usb') {
1574 # -device ide-drive,bus=ide.1,unit=0,drive=drive-ide0-1-0,id=ide0-1-0
1576 die "unsupported interface type";
1579 $device .= ",bootindex=$drive->{bootindex}" if $drive->{bootindex
};
1581 if (my $serial = $drive->{serial
}) {
1582 $serial = URI
::Escape
::uri_unescape
($serial);
1583 $device .= ",serial=$serial";
1590 sub get_initiator_name
{
1593 my $fh = IO
::File-
>new('/etc/iscsi/initiatorname.iscsi') || return;
1594 while (defined(my $line = <$fh>)) {
1595 next if $line !~ m/^\s*InitiatorName\s*=\s*([\.\-:\w]+)/;
1604 sub print_drive_commandline_full
{
1605 my ($storecfg, $vmid, $drive, $pbs_name, $io_uring) = @_;
1608 my $volid = $drive->{file
};
1609 my $format = $drive->{format
};
1610 my $drive_id = get_drive_id
($drive);
1612 my ($storeid, $volname) = PVE
::Storage
::parse_volume_id
($volid, 1);
1613 my $scfg = $storeid ? PVE
::Storage
::storage_config
($storecfg, $storeid) : undef;
1615 if (drive_is_cdrom
($drive)) {
1616 $path = get_iso_path
($storecfg, $vmid, $volid);
1617 die "$drive_id: cannot back cdrom drive with PBS snapshot\n" if $pbs_name;
1620 $path = PVE
::Storage
::path
($storecfg, $volid);
1621 $format //= qemu_img_format
($scfg, $volname);
1628 my $is_rbd = $path =~ m/^rbd:/;
1631 my @qemu_drive_options = qw(heads secs cyls trans media cache rerror werror aio discard);
1632 foreach my $o (@qemu_drive_options) {
1633 $opts .= ",$o=$drive->{$o}" if defined($drive->{$o});
1636 # snapshot only accepts on|off
1637 if (defined($drive->{snapshot
})) {
1638 my $v = $drive->{snapshot
} ?
'on' : 'off';
1639 $opts .= ",snapshot=$v";
1642 if (defined($drive->{ro
})) { # ro maps to QEMUs `readonly`, which accepts `on` or `off` only
1643 $opts .= ",readonly=" . ($drive->{ro
} ?
'on' : 'off');
1646 foreach my $type (['', '-total'], [_rd
=> '-read'], [_wr
=> '-write']) {
1647 my ($dir, $qmpname) = @$type;
1648 if (my $v = $drive->{"mbps$dir"}) {
1649 $opts .= ",throttling.bps$qmpname=".int($v*1024*1024);
1651 if (my $v = $drive->{"mbps${dir}_max"}) {
1652 $opts .= ",throttling.bps$qmpname-max=".int($v*1024*1024);
1654 if (my $v = $drive->{"bps${dir}_max_length"}) {
1655 $opts .= ",throttling.bps$qmpname-max-length=$v";
1657 if (my $v = $drive->{"iops${dir}"}) {
1658 $opts .= ",throttling.iops$qmpname=$v";
1660 if (my $v = $drive->{"iops${dir}_max"}) {
1661 $opts .= ",throttling.iops$qmpname-max=$v";
1663 if (my $v = $drive->{"iops${dir}_max_length"}) {
1664 $opts .= ",throttling.iops$qmpname-max-length=$v";
1669 $format = "rbd" if $is_rbd;
1670 die "$drive_id: Proxmox Backup Server backed drive cannot auto-detect the format\n"
1672 $opts .= ",format=alloc-track,file.driver=$format";
1674 $opts .= ",format=$format";
1677 my $cache_direct = 0;
1679 if (my $cache = $drive->{cache
}) {
1680 $cache_direct = $cache =~ /^(?:off|none|directsync)$/;
1681 } elsif (!drive_is_cdrom
($drive) && !($scfg && $scfg->{type
} eq 'btrfs' && !$scfg->{nocow
})) {
1682 $opts .= ",cache=none";
1686 # io_uring with cache mode writeback or writethrough on krbd will hang...
1687 my $rbd_no_io_uring = $scfg && $scfg->{type
} eq 'rbd' && $scfg->{krbd
} && !$cache_direct;
1689 # io_uring with cache mode writeback or writethrough on LVM will hang; without cache it only
1690 # hangs sometimes, so just plainly disable it for LVM...
1691 my $lvm_no_io_uring = $scfg && $scfg->{type
} eq 'lvm';
1693 # io_uring causes problems when used with CIFS since kernel 5.15
1694 # Some discussion: https://www.spinics.net/lists/linux-cifs/msg26734.html
1695 my $cifs_no_io_uring = $scfg && $scfg->{type
} eq 'cifs';
1697 if (!$drive->{aio
}) {
1698 if ($io_uring && !$rbd_no_io_uring && !$lvm_no_io_uring && !$cifs_no_io_uring) {
1699 # io_uring supports all cache modes
1700 $opts .= ",aio=io_uring";
1702 # aio native works only with O_DIRECT
1704 $opts .= ",aio=native";
1706 $opts .= ",aio=threads";
1711 if (!drive_is_cdrom
($drive)) {
1713 if (defined($drive->{detect_zeroes
}) && !$drive->{detect_zeroes
}) {
1714 $detectzeroes = 'off';
1715 } elsif ($drive->{discard
}) {
1716 $detectzeroes = $drive->{discard
} eq 'on' ?
'unmap' : 'on';
1718 # This used to be our default with discard not being specified:
1719 $detectzeroes = 'on';
1722 # note: 'detect-zeroes' works per blockdev and we want it to persist
1723 # after the alloc-track is removed, so put it on 'file' directly
1724 my $dz_param = $pbs_name ?
"file.detect-zeroes" : "detect-zeroes";
1725 $opts .= ",$dz_param=$detectzeroes" if $detectzeroes;
1729 $opts .= ",backing=$pbs_name";
1730 $opts .= ",auto-remove=on";
1733 # my $file_param = $pbs_name ? "file.file.filename" : "file";
1734 my $file_param = "file";
1736 # non-rbd drivers require the underlying file to be a separate block
1737 # node, so add a second .file indirection
1738 $file_param .= ".file" if !$is_rbd;
1739 $file_param .= ".filename";
1741 my $pathinfo = $path ?
"$file_param=$path," : '';
1743 return "${pathinfo}if=none,id=drive-$drive->{interface}$drive->{index}$opts";
1746 sub print_pbs_blockdev
{
1747 my ($pbs_conf, $pbs_name) = @_;
1748 my $blockdev = "driver=pbs,node-name=$pbs_name,read-only=on";
1749 $blockdev .= ",repository=$pbs_conf->{repository}";
1750 $blockdev .= ",namespace=$pbs_conf->{namespace}" if $pbs_conf->{namespace
};
1751 $blockdev .= ",snapshot=$pbs_conf->{snapshot}";
1752 $blockdev .= ",archive=$pbs_conf->{archive}";
1753 $blockdev .= ",keyfile=$pbs_conf->{keyfile}" if $pbs_conf->{keyfile
};
1757 sub print_netdevice_full
{
1758 my ($vmid, $conf, $net, $netid, $bridges, $use_old_bios_files, $arch, $machine_type, $machine_version) = @_;
1760 my $device = $net->{model
};
1761 if ($net->{model
} eq 'virtio') {
1762 $device = 'virtio-net-pci';
1765 my $pciaddr = print_pci_addr
("$netid", $bridges, $arch, $machine_type);
1766 my $tmpstr = "$device,mac=$net->{macaddr},netdev=$netid$pciaddr,id=$netid";
1767 if ($net->{queues
} && $net->{queues
} > 1 && $net->{model
} eq 'virtio'){
1768 # Consider we have N queues, the number of vectors needed is 2 * N + 2, i.e., one per in
1769 # and out of each queue plus one config interrupt and control vector queue
1770 my $vectors = $net->{queues
} * 2 + 2;
1771 $tmpstr .= ",vectors=$vectors,mq=on";
1772 if (min_version
($machine_version, 7, 1)) {
1773 $tmpstr .= ",packed=on";
1777 if (min_version
($machine_version, 7, 1) && $net->{model
} eq 'virtio'){
1778 $tmpstr .= ",rx_queue_size=1024,tx_queue_size=1024";
1781 $tmpstr .= ",bootindex=$net->{bootindex}" if $net->{bootindex
} ;
1783 if (my $mtu = $net->{mtu
}) {
1784 if ($net->{model
} eq 'virtio' && $net->{bridge
}) {
1785 my $bridge_mtu = PVE
::Network
::read_bridge_mtu
($net->{bridge
});
1788 } elsif ($mtu < 576) {
1789 die "netdev $netid: MTU '$mtu' is smaller than the IP minimum MTU '576'\n";
1790 } elsif ($mtu > $bridge_mtu) {
1791 die "netdev $netid: MTU '$mtu' is bigger than the bridge MTU '$bridge_mtu'\n";
1793 $tmpstr .= ",host_mtu=$mtu";
1795 warn "WARN: netdev $netid: ignoring MTU '$mtu', not using VirtIO or no bridge configured.\n";
1799 if ($use_old_bios_files) {
1801 if ($device eq 'virtio-net-pci') {
1802 $romfile = 'pxe-virtio.rom';
1803 } elsif ($device eq 'e1000') {
1804 $romfile = 'pxe-e1000.rom';
1805 } elsif ($device eq 'e1000e') {
1806 $romfile = 'pxe-e1000e.rom';
1807 } elsif ($device eq 'ne2k') {
1808 $romfile = 'pxe-ne2k_pci.rom';
1809 } elsif ($device eq 'pcnet') {
1810 $romfile = 'pxe-pcnet.rom';
1811 } elsif ($device eq 'rtl8139') {
1812 $romfile = 'pxe-rtl8139.rom';
1814 $tmpstr .= ",romfile=$romfile" if $romfile;
1820 sub print_netdev_full
{
1821 my ($vmid, $conf, $arch, $net, $netid, $hotplug) = @_;
1824 if ($netid =~ m/^net(\d+)$/) {
1828 die "got strange net id '$i'\n" if $i >= ${MAX_NETS
};
1830 my $ifname = "tap${vmid}i$i";
1832 # kvm uses TUNSETIFF ioctl, and that limits ifname length
1833 die "interface name '$ifname' is too long (max 15 character)\n"
1834 if length($ifname) >= 16;
1836 my $vhostparam = '';
1837 if (is_native
($arch)) {
1838 $vhostparam = ',vhost=on' if kernel_has_vhost_net
() && $net->{model
} eq 'virtio';
1841 my $vmname = $conf->{name
} || "vm$vmid";
1844 my $script = $hotplug ?
"pve-bridge-hotplug" : "pve-bridge";
1846 if ($net->{bridge
}) {
1847 $netdev = "type=tap,id=$netid,ifname=${ifname},script=/var/lib/qemu-server/$script"
1848 .",downscript=/var/lib/qemu-server/pve-bridgedown$vhostparam";
1850 $netdev = "type=user,id=$netid,hostname=$vmname";
1853 $netdev .= ",queues=$net->{queues}" if ($net->{queues
} && $net->{model
} eq 'virtio');
1859 'cirrus' => 'cirrus-vga',
1861 'vmware' => 'vmware-svga',
1862 'virtio' => 'virtio-vga',
1863 'virtio-gl' => 'virtio-vga-gl',
1866 sub print_vga_device
{
1867 my ($conf, $vga, $arch, $machine_version, $machine, $id, $qxlnum, $bridges) = @_;
1869 my $type = $vga_map->{$vga->{type
}};
1870 if ($arch eq 'aarch64' && defined($type) && $type eq 'virtio-vga') {
1871 $type = 'virtio-gpu';
1873 my $vgamem_mb = $vga->{memory
};
1875 my $max_outputs = '';
1877 $type = $id ?
'qxl' : 'qxl-vga';
1879 if (!$conf->{ostype
} || $conf->{ostype
} =~ m/^(?:l\d\d)|(?:other)$/) {
1880 # set max outputs so linux can have up to 4 qxl displays with one device
1881 if (min_version
($machine_version, 4, 1)) {
1882 $max_outputs = ",max_outputs=4";
1887 die "no devicetype for $vga->{type}\n" if !$type;
1891 if ($vga->{type
} =~ /^virtio/) {
1892 my $bytes = PVE
::Tools
::convert_size
($vgamem_mb, "mb" => "b");
1893 $memory = ",max_hostmem=$bytes";
1895 # from https://www.spice-space.org/multiple-monitors.html
1896 $memory = ",vgamem_mb=$vga->{memory}";
1897 my $ram = $vgamem_mb * 4;
1898 my $vram = $vgamem_mb * 2;
1899 $memory .= ",ram_size_mb=$ram,vram_size_mb=$vram";
1901 $memory = ",vgamem_mb=$vga->{memory}";
1903 } elsif ($qxlnum && $id) {
1904 $memory = ",ram_size=67108864,vram_size=33554432";
1908 if ($type eq 'VGA' && windows_version
($conf->{ostype
})) {
1909 $edidoff=",edid=off" if (!defined($conf->{bios
}) || $conf->{bios
} ne 'ovmf');
1912 my $q35 = PVE
::QemuServer
::Machine
::machine_type_is_q35
($conf);
1913 my $vgaid = "vga" . ($id // '');
1915 if ($q35 && $vgaid eq 'vga') {
1916 # the first display uses pcie.0 bus on q35 machines
1917 $pciaddr = print_pcie_addr
($vgaid, $bridges, $arch, $machine);
1919 $pciaddr = print_pci_addr
($vgaid, $bridges, $arch, $machine);
1922 if ($vga->{type
} eq 'virtio-gl') {
1923 my $base = '/usr/lib/x86_64-linux-gnu/lib';
1924 die "missing libraries for '$vga->{type}' detected! Please install 'libgl1' and 'libegl1'\n"
1925 if !-e
"${base}EGL.so.1" || !-e
"${base}GL.so.1";
1927 die "no DRM render node detected (/dev/dri/renderD*), no GPU? - needed for '$vga->{type}' display\n"
1928 if !PVE
::Tools
::dir_glob_regex
('/dev/dri/', "renderD.*");
1931 return "$type,id=${vgaid}${memory}${max_outputs}${pciaddr}${edidoff}";
1934 sub parse_number_sets
{
1937 foreach my $part (split(/;/, $set)) {
1938 if ($part =~ /^\s*(\d+)(?:-(\d+))?\s*$/) {
1939 die "invalid range: $part ($2 < $1)\n" if defined($2) && $2 < $1;
1940 push @$res, [ $1, $2 ];
1942 die "invalid range: $part\n";
1951 my $res = parse_property_string
($numa_fmt, $data);
1952 $res->{cpus
} = parse_number_sets
($res->{cpus
}) if defined($res->{cpus
});
1953 $res->{hostnodes
} = parse_number_sets
($res->{hostnodes
}) if defined($res->{hostnodes
});
1957 # netX: e1000=XX:XX:XX:XX:XX:XX,bridge=vmbr0,rate=<mbps>
1959 my ($data, $disable_mac_autogen) = @_;
1961 my $res = eval { parse_property_string
($net_fmt, $data) };
1966 if (!defined($res->{macaddr
}) && !$disable_mac_autogen) {
1967 my $dc = PVE
::Cluster
::cfs_read_file
('datacenter.cfg');
1968 $res->{macaddr
} = PVE
::Tools
::random_ether_addr
($dc->{mac_prefix
});
1973 # ipconfigX ip=cidr,gw=ip,ip6=cidr,gw6=ip
1974 sub parse_ipconfig
{
1977 my $res = eval { parse_property_string
($ipconfig_fmt, $data) };
1983 if ($res->{gw
} && !$res->{ip
}) {
1984 warn 'gateway specified without specifying an IP address';
1987 if ($res->{gw6
} && !$res->{ip6
}) {
1988 warn 'IPv6 gateway specified without specifying an IPv6 address';
1991 if ($res->{gw
} && $res->{ip
} eq 'dhcp') {
1992 warn 'gateway specified together with DHCP';
1995 if ($res->{gw6
} && $res->{ip6
} !~ /^$IPV6RE/) {
1997 warn "IPv6 gateway specified together with $res->{ip6} address";
2001 if (!$res->{ip
} && !$res->{ip6
}) {
2002 return { ip
=> 'dhcp', ip6
=> 'dhcp' };
2011 return PVE
::JSONSchema
::print_property_string
($net, $net_fmt);
2014 sub add_random_macs
{
2015 my ($settings) = @_;
2017 foreach my $opt (keys %$settings) {
2018 next if $opt !~ m/^net(\d+)$/;
2019 my $net = parse_net
($settings->{$opt});
2021 $settings->{$opt} = print_net
($net);
2025 sub vm_is_volid_owner
{
2026 my ($storecfg, $vmid, $volid) = @_;
2028 if ($volid !~ m
|^/|) {
2030 eval { ($path, $owner) = PVE
::Storage
::path
($storecfg, $volid); };
2031 if ($owner && ($owner == $vmid)) {
2039 sub vmconfig_register_unused_drive
{
2040 my ($storecfg, $vmid, $conf, $drive) = @_;
2042 if (drive_is_cloudinit
($drive)) {
2043 eval { PVE
::Storage
::vdisk_free
($storecfg, $drive->{file
}) };
2045 delete $conf->{cloudinit
};
2046 } elsif (!drive_is_cdrom
($drive)) {
2047 my $volid = $drive->{file
};
2048 if (vm_is_volid_owner
($storecfg, $vmid, $volid)) {
2049 PVE
::QemuConfig-
>add_unused_volume($conf, $volid, $vmid);
2054 # smbios: [manufacturer=str][,product=str][,version=str][,serial=str][,uuid=uuid][,sku=str][,family=str][,base64=bool]
2058 pattern
=> '[a-fA-F0-9]{8}(?:-[a-fA-F0-9]{4}){3}-[a-fA-F0-9]{12}',
2059 format_description
=> 'UUID',
2060 description
=> "Set SMBIOS1 UUID.",
2065 pattern
=> '[A-Za-z0-9+\/]+={0,2}',
2066 format_description
=> 'Base64 encoded string',
2067 description
=> "Set SMBIOS1 version.",
2072 pattern
=> '[A-Za-z0-9+\/]+={0,2}',
2073 format_description
=> 'Base64 encoded string',
2074 description
=> "Set SMBIOS1 serial number.",
2079 pattern
=> '[A-Za-z0-9+\/]+={0,2}',
2080 format_description
=> 'Base64 encoded string',
2081 description
=> "Set SMBIOS1 manufacturer.",
2086 pattern
=> '[A-Za-z0-9+\/]+={0,2}',
2087 format_description
=> 'Base64 encoded string',
2088 description
=> "Set SMBIOS1 product ID.",
2093 pattern
=> '[A-Za-z0-9+\/]+={0,2}',
2094 format_description
=> 'Base64 encoded string',
2095 description
=> "Set SMBIOS1 SKU string.",
2100 pattern
=> '[A-Za-z0-9+\/]+={0,2}',
2101 format_description
=> 'Base64 encoded string',
2102 description
=> "Set SMBIOS1 family string.",
2107 description
=> 'Flag to indicate that the SMBIOS values are base64 encoded',
2115 my $res = eval { parse_property_string
($smbios1_fmt, $data) };
2122 return PVE
::JSONSchema
::print_property_string
($smbios1, $smbios1_fmt);
2125 PVE
::JSONSchema
::register_format
('pve-qm-smbios1', $smbios1_fmt);
2127 sub parse_watchdog
{
2132 my $res = eval { parse_property_string
($watchdog_fmt, $value) };
2137 sub parse_guest_agent
{
2140 return {} if !defined($conf->{agent
});
2142 my $res = eval { parse_property_string
($agent_fmt, $conf->{agent
}) };
2145 # if the agent is disabled ignore the other potentially set properties
2146 return {} if !$res->{enabled
};
2151 my ($conf, $key) = @_;
2152 return undef if !defined($conf->{agent
});
2154 my $agent = parse_guest_agent
($conf);
2155 return $agent->{$key};
2161 return {} if !$value;
2162 my $res = eval { parse_property_string
($vga_fmt, $value) };
2172 my $res = eval { parse_property_string
($rng_fmt, $value) };
2177 sub parse_meta_info
{
2182 my $res = eval { parse_property_string
($meta_info_fmt, $value) };
2187 sub new_meta_info_string
{
2188 my () = @_; # for now do not allow to override any value
2190 return PVE
::JSONSchema
::print_property_string
(
2192 'creation-qemu' => kvm_user_version
(),
2193 ctime
=> "". int(time()),
2199 sub qemu_created_version_fixups
{
2200 my ($conf, $forcemachine, $kvmver) = @_;
2202 my $meta = parse_meta_info
($conf->{meta
}) // {};
2203 my $forced_vers = PVE
::QemuServer
::Machine
::extract_version
($forcemachine);
2205 # check if we need to apply some handling for VMs that always use the latest machine version but
2206 # had a machine version transition happen that affected HW such that, e.g., an OS config change
2207 # would be required (we do not want to pin machine version for non-windows OS type)
2209 (!defined($conf->{machine
}) || $conf->{machine
} =~ m/^(?:pc|q35|virt)$/) # non-versioned machine
2210 && (!defined($meta->{'creation-qemu'}) || !min_version
($meta->{'creation-qemu'}, 6, 1)) # created before 6.1
2211 && (!$forced_vers || min_version
($forced_vers, 6, 1)) # handle snapshot-rollback/migrations
2212 && min_version
($kvmver, 6, 1) # only need to apply the change since 6.1
2214 my $q35 = PVE
::QemuServer
::Machine
::machine_type_is_q35
($conf);
2215 if ($q35 && $conf->{ostype
} && $conf->{ostype
} eq 'l26') {
2216 # this changed to default-on in QEMU 6.1 for q35 machines, it will mess with PCI slot view
2217 # and thus with the predictable interface naming of systemd
2218 return ['-global', 'ICH9-LPC.acpi-pci-hotplug-with-bridge-support=off'];
2224 PVE
::JSONSchema
::register_format
('pve-qm-usb-device', \
&verify_usb_device
);
2225 sub verify_usb_device
{
2226 my ($value, $noerr) = @_;
2228 return $value if parse_usb_device
($value);
2232 die "unable to parse usb device\n";
2235 # add JSON properties for create and set function
2236 sub json_config_properties
{
2237 my ($prop, $with_disk_alloc) = @_;
2239 my $skip_json_config_opts = {
2243 runningmachine
=> 1,
2248 foreach my $opt (keys %$confdesc) {
2249 next if $skip_json_config_opts->{$opt};
2251 if ($with_disk_alloc && is_valid_drivename
($opt)) {
2252 $prop->{$opt} = $PVE::QemuServer
::Drive
::drivedesc_hash_with_alloc-
>{$opt};
2254 $prop->{$opt} = $confdesc->{$opt};
2261 # Properties that we can read from an OVF file
2262 sub json_ovf_properties
{
2265 for my $device (PVE
::QemuServer
::Drive
::valid_drive_names
()) {
2266 $prop->{$device} = {
2268 format
=> 'pve-volume-id-or-absolute-path',
2269 description
=> "Disk image that gets imported to $device",
2276 description
=> "The number of CPU cores.",
2281 description
=> "Amount of RAM for the VM in MB.",
2286 description
=> "Name of the VM.",
2293 # return copy of $confdesc_cloudinit to generate documentation
2294 sub cloudinit_config_properties
{
2296 return dclone
($confdesc_cloudinit);
2299 sub cloudinit_pending_properties
{
2301 map { $_ => 1 } keys $confdesc_cloudinit->%*,
2304 $p->{"net$_"} = 1 for 0..($MAX_NETS-1);
2309 my ($key, $value) = @_;
2311 die "unknown setting '$key'\n" if !$confdesc->{$key};
2313 my $type = $confdesc->{$key}->{type
};
2315 if (!defined($value)) {
2316 die "got undefined value\n";
2319 if ($value =~ m/[\n\r]/) {
2320 die "property contains a line feed\n";
2323 if ($type eq 'boolean') {
2324 return 1 if ($value eq '1') || ($value =~ m/^(on|yes|true)$/i);
2325 return 0 if ($value eq '0') || ($value =~ m/^(off|no|false)$/i);
2326 die "type check ('boolean') failed - got '$value'\n";
2327 } elsif ($type eq 'integer') {
2328 return int($1) if $value =~ m/^(\d+)$/;
2329 die "type check ('integer') failed - got '$value'\n";
2330 } elsif ($type eq 'number') {
2331 return $value if $value =~ m/^(\d+)(\.\d+)?$/;
2332 die "type check ('number') failed - got '$value'\n";
2333 } elsif ($type eq 'string') {
2334 if (my $fmt = $confdesc->{$key}->{format
}) {
2335 PVE
::JSONSchema
::check_format
($fmt, $value);
2338 $value =~ s/^\"(.*)\"$/$1/;
2341 die "internal error"
2346 my ($storecfg, $vmid, $skiplock, $replacement_conf, $purge_unreferenced) = @_;
2348 my $conf = PVE
::QemuConfig-
>load_config($vmid);
2350 if (!$skiplock && !PVE
::QemuConfig-
>has_lock($conf, 'suspended')) {
2351 PVE
::QemuConfig-
>check_lock($conf);
2354 if ($conf->{template
}) {
2355 # check if any base image is still used by a linked clone
2356 PVE
::QemuConfig-
>foreach_volume_full($conf, { include_unused
=> 1 }, sub {
2357 my ($ds, $drive) = @_;
2358 return if drive_is_cdrom
($drive);
2360 my $volid = $drive->{file
};
2361 return if !$volid || $volid =~ m
|^/|;
2363 die "base volume '$volid' is still in use by linked cloned\n"
2364 if PVE
::Storage
::volume_is_base_and_used
($storecfg, $volid);
2370 my $remove_owned_drive = sub {
2371 my ($ds, $drive) = @_;
2372 return if drive_is_cdrom
($drive, 1);
2374 my $volid = $drive->{file
};
2375 return if !$volid || $volid =~ m
|^/|;
2376 return if $volids->{$volid};
2378 my ($path, $owner) = PVE
::Storage
::path
($storecfg, $volid);
2379 return if !$path || !$owner || ($owner != $vmid);
2381 $volids->{$volid} = 1;
2382 eval { PVE
::Storage
::vdisk_free
($storecfg, $volid) };
2383 warn "Could not remove disk '$volid', check manually: $@" if $@;
2386 # only remove disks owned by this VM (referenced in the config)
2387 my $include_opts = {
2388 include_unused
=> 1,
2389 extra_keys
=> ['vmstate'],
2391 PVE
::QemuConfig-
>foreach_volume_full($conf, $include_opts, $remove_owned_drive);
2393 for my $snap (values %{$conf->{snapshots
}}) {
2394 next if !defined($snap->{vmstate
});
2395 my $drive = PVE
::QemuConfig-
>parse_volume('vmstate', $snap->{vmstate
}, 1);
2396 next if !defined($drive);
2397 $remove_owned_drive->('vmstate', $drive);
2400 PVE
::QemuConfig-
>foreach_volume_full($conf->{pending
}, $include_opts, $remove_owned_drive);
2402 if ($purge_unreferenced) { # also remove unreferenced disk
2403 my $vmdisks = PVE
::Storage
::vdisk_list
($storecfg, undef, $vmid, undef, 'images');
2404 PVE
::Storage
::foreach_volid
($vmdisks, sub {
2405 my ($volid, $sid, $volname, $d) = @_;
2406 eval { PVE
::Storage
::vdisk_free
($storecfg, $volid) };
2411 if (defined $replacement_conf) {
2412 PVE
::QemuConfig-
>write_config($vmid, $replacement_conf);
2414 PVE
::QemuConfig-
>destroy_config($vmid);
2418 sub parse_vm_config
{
2419 my ($filename, $raw, $strict) = @_;
2421 return if !defined($raw);
2424 digest
=> Digest
::SHA
::sha1_hex
($raw),
2430 my $handle_error = sub {
2440 $filename =~ m
|/qemu-server/(\d
+)\
.conf
$|
2441 || die "got strange filename '$filename'";
2447 my $finish_description = sub {
2448 if (defined($descr)) {
2450 $conf->{description
} = $descr;
2456 my @lines = split(/\n/, $raw);
2457 foreach my $line (@lines) {
2458 next if $line =~ m/^\s*$/;
2460 if ($line =~ m/^\[PENDING\]\s*$/i) {
2461 $section = 'pending';
2462 $finish_description->();
2463 $conf = $res->{$section} = {};
2465 } elsif ($line =~ m/^\[special:cloudinit\]\s*$/i) {
2466 $section = 'cloudinit';
2467 $finish_description->();
2468 $conf = $res->{$section} = {};
2471 } elsif ($line =~ m/^\[([a-z][a-z0-9_\-]+)\]\s*$/i) {
2473 $finish_description->();
2474 $conf = $res->{snapshots
}->{$section} = {};
2478 if ($line =~ m/^\#(.*)$/) {
2479 $descr = '' if !defined($descr);
2480 $descr .= PVE
::Tools
::decode_text
($1) . "\n";
2484 if ($line =~ m/^(description):\s*(.*\S)\s*$/) {
2485 $descr = '' if !defined($descr);
2486 $descr .= PVE
::Tools
::decode_text
($2);
2487 } elsif ($line =~ m/snapstate:\s*(prepare|delete)\s*$/) {
2488 $conf->{snapstate
} = $1;
2489 } elsif ($line =~ m/^(args):\s*(.*\S)\s*$/) {
2492 $conf->{$key} = $value;
2493 } elsif ($line =~ m/^delete:\s*(.*\S)\s*$/) {
2495 if ($section eq 'pending') {
2496 $conf->{delete} = $value; # we parse this later
2498 $handle_error->("vm $vmid - property 'delete' is only allowed in [PENDING]\n");
2500 } elsif ($line =~ m/^([a-z][a-z_]*\d*):\s*(.+?)\s*$/) {
2503 if ($section eq 'cloudinit') {
2504 # skip validation, this section is only used for informational purposes
2505 $conf->{$key} = $value;
2508 eval { $value = check_type
($key, $value); };
2510 $handle_error->("vm $vmid - unable to parse value of '$key' - $@");
2512 $key = 'ide2' if $key eq 'cdrom';
2513 my $fmt = $confdesc->{$key}->{format
};
2514 if ($fmt && $fmt =~ /^pve-qm-(?:ide|scsi|virtio|sata)$/) {
2515 my $v = parse_drive
($key, $value);
2516 if (my $volid = filename_to_volume_id
($vmid, $v->{file
}, $v->{media
})) {
2517 $v->{file
} = $volid;
2518 $value = print_drive
($v);
2520 $handle_error->("vm $vmid - unable to parse value of '$key'\n");
2525 $conf->{$key} = $value;
2528 $handle_error->("vm $vmid - unable to parse config: $line\n");
2532 $finish_description->();
2533 delete $res->{snapstate
}; # just to be sure
2538 sub write_vm_config
{
2539 my ($filename, $conf) = @_;
2541 delete $conf->{snapstate
}; # just to be sure
2543 if ($conf->{cdrom
}) {
2544 die "option ide2 conflicts with cdrom\n" if $conf->{ide2
};
2545 $conf->{ide2
} = $conf->{cdrom
};
2546 delete $conf->{cdrom
};
2549 # we do not use 'smp' any longer
2550 if ($conf->{sockets
}) {
2551 delete $conf->{smp
};
2552 } elsif ($conf->{smp
}) {
2553 $conf->{sockets
} = $conf->{smp
};
2554 delete $conf->{cores
};
2555 delete $conf->{smp
};
2558 my $used_volids = {};
2560 my $cleanup_config = sub {
2561 my ($cref, $pending, $snapname) = @_;
2563 foreach my $key (keys %$cref) {
2564 next if $key eq 'digest' || $key eq 'description' || $key eq 'snapshots' ||
2565 $key eq 'snapstate' || $key eq 'pending' || $key eq 'cloudinit';
2566 my $value = $cref->{$key};
2567 if ($key eq 'delete') {
2568 die "propertry 'delete' is only allowed in [PENDING]\n"
2570 # fixme: check syntax?
2573 eval { $value = check_type
($key, $value); };
2574 die "unable to parse value of '$key' - $@" if $@;
2576 $cref->{$key} = $value;
2578 if (!$snapname && is_valid_drivename
($key)) {
2579 my $drive = parse_drive
($key, $value);
2580 $used_volids->{$drive->{file
}} = 1 if $drive && $drive->{file
};
2585 &$cleanup_config($conf);
2587 &$cleanup_config($conf->{pending
}, 1);
2589 foreach my $snapname (keys %{$conf->{snapshots
}}) {
2590 die "internal error: snapshot name '$snapname' is forbidden" if lc($snapname) eq 'pending';
2591 &$cleanup_config($conf->{snapshots
}->{$snapname}, undef, $snapname);
2594 # remove 'unusedX' settings if we re-add a volume
2595 foreach my $key (keys %$conf) {
2596 my $value = $conf->{$key};
2597 if ($key =~ m/^unused/ && $used_volids->{$value}) {
2598 delete $conf->{$key};
2602 my $generate_raw_config = sub {
2603 my ($conf, $pending) = @_;
2607 # add description as comment to top of file
2608 if (defined(my $descr = $conf->{description
})) {
2610 foreach my $cl (split(/\n/, $descr)) {
2611 $raw .= '#' . PVE
::Tools
::encode_text
($cl) . "\n";
2614 $raw .= "#\n" if $pending;
2618 foreach my $key (sort keys %$conf) {
2619 next if $key =~ /^(digest|description|pending|cloudinit|snapshots)$/;
2620 $raw .= "$key: $conf->{$key}\n";
2625 my $raw = &$generate_raw_config($conf);
2627 if (scalar(keys %{$conf->{pending
}})){
2628 $raw .= "\n[PENDING]\n";
2629 $raw .= &$generate_raw_config($conf->{pending
}, 1);
2632 if (scalar(keys %{$conf->{cloudinit
}}) && PVE
::QemuConfig-
>has_cloudinit($conf)){
2633 $raw .= "\n[special:cloudinit]\n";
2634 $raw .= &$generate_raw_config($conf->{cloudinit
});
2637 foreach my $snapname (sort keys %{$conf->{snapshots
}}) {
2638 $raw .= "\n[$snapname]\n";
2639 $raw .= &$generate_raw_config($conf->{snapshots
}->{$snapname});
2649 # we use static defaults from our JSON schema configuration
2650 foreach my $key (keys %$confdesc) {
2651 if (defined(my $default = $confdesc->{$key}->{default})) {
2652 $res->{$key} = $default;
2660 my $vmlist = PVE
::Cluster
::get_vmlist
();
2662 return $res if !$vmlist || !$vmlist->{ids
};
2663 my $ids = $vmlist->{ids
};
2664 my $nodename = nodename
();
2666 foreach my $vmid (keys %$ids) {
2667 my $d = $ids->{$vmid};
2668 next if !$d->{node
} || $d->{node
} ne $nodename;
2669 next if !$d->{type
} || $d->{type
} ne 'qemu';
2670 $res->{$vmid}->{exists} = 1;
2675 # test if VM uses local resources (to prevent migration)
2676 sub check_local_resources
{
2677 my ($conf, $noerr) = @_;
2681 push @loc_res, "hostusb" if $conf->{hostusb
}; # old syntax
2682 push @loc_res, "hostpci" if $conf->{hostpci
}; # old syntax
2684 push @loc_res, "ivshmem" if $conf->{ivshmem
};
2686 foreach my $k (keys %$conf) {
2687 next if $k =~ m/^usb/ && ($conf->{$k} =~ m/^spice(?![^,])/);
2688 # sockets are safe: they will be recreated on the target side post-migrate
2689 next if $k =~ m/^serial/ && ($conf->{$k} eq 'socket');
2690 push @loc_res, $k if $k =~ m/^(usb|hostpci|serial|parallel)\d+$/;
2693 die "VM uses local resources\n" if scalar @loc_res && !$noerr;
2698 # check if used storages are available on all nodes (used by migrate)
2699 sub check_storage_availability
{
2700 my ($storecfg, $conf, $node) = @_;
2702 PVE
::QemuConfig-
>foreach_volume($conf, sub {
2703 my ($ds, $drive) = @_;
2705 my $volid = $drive->{file
};
2708 my ($sid, $volname) = PVE
::Storage
::parse_volume_id
($volid, 1);
2711 # check if storage is available on both nodes
2712 my $scfg = PVE
::Storage
::storage_check_enabled
($storecfg, $sid);
2713 PVE
::Storage
::storage_check_enabled
($storecfg, $sid, $node);
2715 my ($vtype) = PVE
::Storage
::parse_volname
($storecfg, $volid);
2717 die "$volid: content type '$vtype' is not available on storage '$sid'\n"
2718 if !$scfg->{content
}->{$vtype};
2722 # list nodes where all VM images are available (used by has_feature API)
2724 my ($conf, $storecfg) = @_;
2726 my $nodelist = PVE
::Cluster
::get_nodelist
();
2727 my $nodehash = { map { $_ => 1 } @$nodelist };
2728 my $nodename = nodename
();
2730 PVE
::QemuConfig-
>foreach_volume($conf, sub {
2731 my ($ds, $drive) = @_;
2733 my $volid = $drive->{file
};
2736 my ($storeid, $volname) = PVE
::Storage
::parse_volume_id
($volid, 1);
2738 my $scfg = PVE
::Storage
::storage_config
($storecfg, $storeid);
2739 if ($scfg->{disable
}) {
2741 } elsif (my $avail = $scfg->{nodes
}) {
2742 foreach my $node (keys %$nodehash) {
2743 delete $nodehash->{$node} if !$avail->{$node};
2745 } elsif (!$scfg->{shared
}) {
2746 foreach my $node (keys %$nodehash) {
2747 delete $nodehash->{$node} if $node ne $nodename
2756 sub check_local_storage_availability
{
2757 my ($conf, $storecfg) = @_;
2759 my $nodelist = PVE
::Cluster
::get_nodelist
();
2760 my $nodehash = { map { $_ => {} } @$nodelist };
2762 PVE
::QemuConfig-
>foreach_volume($conf, sub {
2763 my ($ds, $drive) = @_;
2765 my $volid = $drive->{file
};
2768 my ($storeid, $volname) = PVE
::Storage
::parse_volume_id
($volid, 1);
2770 my $scfg = PVE
::Storage
::storage_config
($storecfg, $storeid);
2772 if ($scfg->{disable
}) {
2773 foreach my $node (keys %$nodehash) {
2774 $nodehash->{$node}->{unavailable_storages
}->{$storeid} = 1;
2776 } elsif (my $avail = $scfg->{nodes
}) {
2777 foreach my $node (keys %$nodehash) {
2778 if (!$avail->{$node}) {
2779 $nodehash->{$node}->{unavailable_storages
}->{$storeid} = 1;
2786 foreach my $node (values %$nodehash) {
2787 if (my $unavail = $node->{unavailable_storages
}) {
2788 $node->{unavailable_storages
} = [ sort keys %$unavail ];
2795 # Compat only, use assert_config_exists_on_node and vm_running_locally where possible
#
# $vmid    - ID of the VM to check
# $nocheck - when true, skip asserting that the config exists on $node
# $node    - node passed on to assert_config_exists_on_node
#
# Returns whatever PVE::QemuServer::Helpers::vm_running_locally($vmid) returns;
# vzlist() stores a true result as the VM's PID.
2797 my ($vmid, $nocheck, $node) = @_;
2799 # $nocheck is set when called during a migration, in which case the config
2800 # file might still or already reside on the *other* node
2801 # - because rename has already happened, and current node is source
2802 # - because rename hasn't happened yet, and current node is target
2803 # - because rename has happened, current node is target, but hasn't yet
2805 PVE
::QemuConfig
::assert_config_exists_on_node
($vmid, $node) if !$nocheck;
2806 return PVE
::QemuServer
::Helpers
::vm_running_locally
($vmid);
# Starts from the result of config_list() and adds the PID of each running VM
# that has a pid file in the qemu-server run directory.
2811 my $vzlist = config_list
();
# if the run directory cannot be opened, return the list without PID info
2813 my $fd = IO
::Dir-
>new($PVE::QemuServer
::Helpers
::var_run_tmpdir
) || return $vzlist;
2815 while (defined(my $de = $fd->read)) {
# only "<digits>.pid" entries are of interest
2816 next if $de !~ m/^(\d+)\.pid$/;
# ignore pid files of VMs that are not in the config list
2818 next if !defined($vzlist->{$vmid});
2819 if (my $pid = check_running
($vmid)) {
2820 $vzlist->{$vmid}->{pid
} = $pid;
# Property descriptions (description, enum, renderer, ...) for the fields of a
# VM status entry. Declared with 'our', so it is a package variable.
# NOTE(review): presumably used as the return schema of the status API - confirm.
2827 our $vmstatus_return_properties = {
2828 vmid
=> get_standard_option
('pve-vmid'),
2830 description
=> "QEMU process status.",
2832 enum
=> ['stopped', 'running'],
2835 description
=> "Maximum memory in bytes.",
2838 renderer
=> 'bytes',
2841 description
=> "Root disk size in bytes.",
2844 renderer
=> 'bytes',
2847 description
=> "VM name.",
2852 description
=> "QEMU QMP agent status.",
2857 description
=> "PID of running qemu process.",
2862 description
=> "Uptime.",
2865 renderer
=> 'duration',
2868 description
=> "Maximum usable CPUs.",
2873 description
=> "The current config lock, if any.",
2878 description
=> "The current configured tags, if any",
2882 'running-machine' => {
2883 description
=> "The currently running machine type (if running).",
2888 description
=> "The currently running QEMU version (if running).",
# CPU accounting remembered per PID across calls; the previous sample is used
# below to compute CPU usage over the elapsed interval.
2894 my $last_proc_pid_stat;
2896 # get VM status information
2897 # This must be fast and should not block ($full == false)
2898 # We only query KVM using QMP if $full == true (this can be slow)
#
# $opt_vmid - when set, only this VM is processed
# $full     - when true, additionally query the running VMs via QMP
#
# Returns $res, a hash keyed by VMID with one status hash per VM.
2900 my ($opt_vmid, $full) = @_;
2904 my $storecfg = PVE
::Storage
::config
();
2906 my $list = vzlist
();
2907 my $defaults = load_defaults
();
2909 my ($uptime) = PVE
::ProcFSTools
::read_proc_uptime
(1);
2911 my $cpucount = $cpuinfo->{cpus
} || 1;
# first pass: static information taken from the VM configuration
2913 foreach my $vmid (keys %$list) {
2914 next if $opt_vmid && ($vmid ne $opt_vmid);
2916 my $conf = PVE
::QemuConfig-
>load_config($vmid);
2918 my $d = { vmid
=> int($vmid) };
2919 $d->{pid
} = int($list->{$vmid}->{pid
}) if $list->{$vmid}->{pid
};
2921 # fixme: better status?
2922 $d->{status
} = $list->{$vmid}->{pid
} ?
'running' : 'stopped';
2924 my $size = PVE
::QemuServer
::Drive
::bootdisk_size
($storecfg, $conf);
2925 if (defined($size)) {
2926 $d->{disk
} = 0; # no info available
2927 $d->{maxdisk
} = $size;
# sockets * cores, capped at the host CPU count; an explicit vcpus setting wins
2933 $d->{cpus
} = ($conf->{sockets
} || $defaults->{sockets
})
2934 * ($conf->{cores
} || $defaults->{cores
});
2935 $d->{cpus
} = $cpucount if $d->{cpus
} > $cpucount;
2936 $d->{cpus
} = $conf->{vcpus
} if $conf->{vcpus
};
2938 $d->{name
} = $conf->{name
} || "VM $vmid";
# the config value is multiplied by 1024*1024 (maxmem is described as bytes)
2939 $d->{maxmem
} = $conf->{memory
} ?
$conf->{memory
}*(1024*1024)
2940 : $defaults->{memory
}*(1024*1024);
2942 if ($conf->{balloon
}) {
2943 $d->{balloon_min
} = $conf->{balloon
}*(1024*1024);
2944 $d->{shares
} = defined($conf->{shares
}) ?
$conf->{shares
}
2945 : $defaults->{shares
};
2956 $d->{diskwrite
} = 0;
2958 $d->{template
} = 1 if PVE
::QemuConfig-
>is_template($conf);
2960 $d->{serial
} = 1 if conf_has_serial
($conf);
2961 $d->{lock} = $conf->{lock} if $conf->{lock};
2962 $d->{tags
} = $conf->{tags
} if defined($conf->{tags
});
# network counters: only devices named tap<N>i... are considered; what the
# host receives on the tap device is counted as the guest's outgoing traffic
# (netout), and what the host transmits as its incoming traffic (netin)
2967 my $netdev = PVE
::ProcFSTools
::read_proc_net_dev
();
2968 foreach my $dev (keys %$netdev) {
2969 next if $dev !~ m/^tap([1-9]\d*)i/;
2971 my $d = $res->{$vmid};
2974 $d->{netout
} += $netdev->{$dev}->{receive
};
2975 $d->{netin
} += $netdev->{$dev}->{transmit
};
2978 $d->{nics
}->{$dev}->{netout
} = int($netdev->{$dev}->{receive
});
2979 $d->{nics
}->{$dev}->{netin
} = int($netdev->{$dev}->{transmit
});
2984 my $ctime = gettimeofday
;
# per-process statistics (uptime, memory estimate, CPU usage) from /proc
2986 foreach my $vmid (keys %$list) {
2988 my $d = $res->{$vmid};
2989 my $pid = $d->{pid
};
2992 my $pstat = PVE
::ProcFSTools
::read_proc_pid_stat
($pid);
2993 next if !$pstat; # not running
2995 my $used = $pstat->{utime} + $pstat->{stime
};
2997 $d->{uptime
} = int(($uptime - $pstat->{starttime
})/$cpuinfo->{user_hz
});
# estimate used memory by scaling maxmem with the process' rss/vsize ratio
2999 if ($pstat->{vsize
}) {
3000 $d->{mem
} = int(($pstat->{rss
}/$pstat->{vsize
})*$d->{maxmem
});
3003 my $old = $last_proc_pid_stat->{$pid};
3005 $last_proc_pid_stat->{$pid} = {
# elapsed time since the previous sample, scaled by host CPU count and user_hz
3013 my $dtime = ($ctime - $old->{time}) * $cpucount * $cpuinfo->{user_hz
};
# only compute a new CPU value if the scaled interval is large enough,
# otherwise the previous value is reused
3015 if ($dtime > 1000) {
3016 my $dutime = $used - $old->{used
};
3018 $d->{cpu
} = (($dutime/$dtime)* $cpucount) / $d->{cpus
};
3019 $last_proc_pid_stat->{$pid} = {
3025 $d->{cpu
} = $old->{cpu
};
3029 return $res if !$full;
# everything below runs only for $full and talks to the VMs via QMP
3031 my $qmpclient = PVE
::QMPClient-
>new();
# callback for 'query-balloon': memory and balloon figures
3033 my $ballooncb = sub {
3034 my ($vmid, $resp) = @_;
3036 my $info = $resp->{'return'};
3037 return if !$info->{max_mem
};
3039 my $d = $res->{$vmid};
3041 # use memory assigned to VM
3042 $d->{maxmem
} = $info->{max_mem
};
3043 $d->{balloon
} = $info->{actual
};
3045 if (defined($info->{total_mem
}) && defined($info->{free_mem
})) {
3046 $d->{mem
} = $info->{total_mem
} - $info->{free_mem
};
3047 $d->{freemem
} = $info->{free_mem
};
3050 $d->{ballooninfo
} = $info;
# callback for 'query-blockstats': per-device stats plus read/write totals
3053 my $blockstatscb = sub {
3054 my ($vmid, $resp) = @_;
3055 my $data = $resp->{'return'} || [];
3056 my $totalrdbytes = 0;
3057 my $totalwrbytes = 0;
3059 for my $blockstat (@$data) {
3060 $totalrdbytes = $totalrdbytes + $blockstat->{stats
}->{rd_bytes
};
3061 $totalwrbytes = $totalwrbytes + $blockstat->{stats
}->{wr_bytes
};
# strip the "drive-" part so the stats are keyed by the plain drive name
3063 $blockstat->{device
} =~ s/drive-//;
3064 $res->{$vmid}->{blockstat
}->{$blockstat->{device
}} = $blockstat->{stats
};
3066 $res->{$vmid}->{diskread
} = $totalrdbytes;
3067 $res->{$vmid}->{diskwrite
} = $totalwrbytes;
# callback for 'query-machines': currently running machine type
3070 my $machinecb = sub {
3071 my ($vmid, $resp) = @_;
3072 my $data = $resp->{'return'} || [];
3074 $res->{$vmid}->{'running-machine'} =
3075 PVE
::QemuServer
::Machine
::current_from_query_machines
($data);
# callback for 'query-version': "major.minor.micro", or 'unknown'
3078 my $versioncb = sub {
3079 my ($vmid, $resp) = @_;
3080 my $data = $resp->{'return'} // {};
3081 my $version = 'unknown';
3083 if (my $v = $data->{qemu
}) {
3084 $version = $v->{major
} . "." . $v->{minor
} . "." . $v->{micro
};
3087 $res->{$vmid}->{'running-qemu'} = $version;
# callback for 'query-status': queues the follow-up queries and records the
# QMP status
3090 my $statuscb = sub {
3091 my ($vmid, $resp) = @_;
3093 $qmpclient->queue_cmd($vmid, $blockstatscb, 'query-blockstats');
3094 $qmpclient->queue_cmd($vmid, $machinecb, 'query-machines');
3095 $qmpclient->queue_cmd($vmid, $versioncb, 'query-version');
3096 # this fails if the balloon driver is not loaded, so this must be
3097 # the last command (following commands are aborted if this fails).
3098 $qmpclient->queue_cmd($vmid, $ballooncb, 'query-balloon');
3100 my $status = 'unknown';
3101 if (!defined($status = $resp->{'return'}->{status
})) {
3102 warn "unable to get VM status\n";
3106 $res->{$vmid}->{qmpstatus
} = $resp->{'return'}->{status
};
# queue the initial status query for every running VM
3109 foreach my $vmid (keys %$list) {
3110 next if $opt_vmid && ($vmid ne $opt_vmid);
3111 next if !$res->{$vmid}->{pid
}; # not running
3112 $qmpclient->queue_cmd($vmid, $statuscb, 'query-status');
3115 $qmpclient->queue_execute(undef, 2);
3117 foreach my $vmid (keys %$list) {
3118 next if $opt_vmid && ($vmid ne $opt_vmid);
3119 next if !$res->{$vmid}->{pid
}; #not running
3121 # we can't use the $qmpclient since it might have already aborted on
3122 # 'query-balloon', but this might also fail for older versions...
# a failed query is swallowed by eval and results in an empty hash
3123 my $qemu_support = eval { mon_cmd
($vmid, "query-proxmox-support") };
3124 $res->{$vmid}->{'proxmox-support'} = $qemu_support // {};
# fall back to the process status for VMs without a QMP status
3127 foreach my $vmid (keys %$list) {
3128 next if $opt_vmid && ($vmid ne $opt_vmid);
3129 $res->{$vmid}->{qmpstatus
} = $res->{$vmid}->{status
} if !$res->{$vmid}->{qmpstatus
};
# Checks the config for a set "serialN" entry, N in 0 .. $MAX_SERIAL_PORTS - 1.
# vmstatus() uses the result as a boolean.
# NOTE(review): presumably returns true on the first hit and false otherwise - confirm.
3135 sub conf_has_serial
{
3138 for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
3139 if ($conf->{"serial$i"}) {
# Parses the "audio$id" entry of a VM config into a description of the audio
# device and its backend.
#
# $conf - VM configuration
# $id   - index of the audio entry
#         NOTE(review): config_to_command calls this without $id, so a
#         default is presumably applied - confirm.
#
# Returns nothing (bare return) if the entry is not defined. Otherwise builds
# a hash with the keys dev, dev_id, backend and backend_id.
3147 sub conf_has_audio
{
3148 my ($conf, $id) = @_;
3151 my $audio = $conf->{"audio$id"};
3152 return if !defined($audio);
3154 my $audioproperties = parse_property_string
($audio_fmt, $audio);
# the backend driver defaults to 'spice' when none is configured
3155 my $audiodriver = $audioproperties->{driver
} // 'spice';
3158 dev
=> $audioproperties->{device
},
3159 dev_id
=> "audiodev$id",
3160 backend
=> $audiodriver,
3161 backend_id
=> "$audiodriver-backend${id}",
# Builds the QEMU command line arguments for one audio device.
#
# $audio           - hash with dev, dev_id, backend and backend_id
#                    (the keys conf_has_audio produces)
# $audiopciaddr    - PCI address suffix appended to the device string
# $machine_version - machine version; from 4.2 on, devices are linked to
#                    their backend via "audiodev="
#
# Dies for unknown device types.
# NOTE(review): presumably returns the $devs array reference - confirm.
3166 my ($audio, $audiopciaddr, $machine_version) = @_;
3170 my $id = $audio->{dev_id
};
3172 if (min_version
($machine_version, 4, 2)) {
3173 $audiodev = ",audiodev=$audio->{backend_id}";
3176 if ($audio->{dev
} eq 'AC97') {
3177 push @$devs, '-device', "AC97,id=${id}${audiopciaddr}$audiodev";
# intel-hda variants: one controller device plus two codecs on its bus
3178 } elsif ($audio->{dev
} =~ /intel\-hda$/) {
3179 push @$devs, '-device', "$audio->{dev},id=${id}${audiopciaddr}";
3180 push @$devs, '-device', "hda-micro,id=${id}-codec0,bus=${id}.0,cad=0$audiodev";
3181 push @$devs, '-device', "hda-duplex,id=${id}-codec1,bus=${id}.0,cad=1$audiodev";
3183 die "unkown audio device '$audio->{dev}', implement me!";
3186 push @$devs, '-audiodev', "$audio->{backend},id=$audio->{backend_id}";
# Per-VM runtime paths of the swtpm control socket and pid file, both under
# /var/run/qemu-server and named after $vmid.
3194 socket => "/var/run/qemu-server/$vmid.swtpm",
3195 pid
=> "/var/run/qemu-server/$vmid.swtpm.pid",
# Appends the QEMU arguments for an emulated TPM to @$devices.
#
# $vmid    - VM ID, used to look up the swtpm socket path
# $devices - array reference the arguments are pushed onto
# $conf    - VM configuration; nothing is added unless 'tpmstate0' is set
3199 sub add_tpm_device
{
3200 my ($vmid, $devices, $conf) = @_;
3202 return if !$conf->{tpmstate0
};
3204 my $paths = get_tpm_paths
($vmid);
# chardev on the swtpm socket -> emulator TPM backend -> tpm-tis device
3206 push @$devices, "-chardev", "socket,id=tpmchar,path=$paths->{socket}";
3207 push @$devices, "-tpmdev", "emulator,id=tpmdev,chardev=tpmchar";
3208 push @$devices, "-device", "tpm-tis,tpmdev=tpmdev";
# Sets up the TPM state (if needed) and starts the swtpm emulator for a VM.
#
# $storecfg  - storage configuration, used to map the state volume
# $vmid      - VM ID, determines the socket and pid file paths
# $tpmdrive  - 'tpmstate0' drive string; nothing is done if it is empty
# $migration - see the migration comment below
#
# Dies if the pid file does not show up in time.
3212 my ($storecfg, $vmid, $tpmdrive, $migration) = @_;
3214 return if !$tpmdrive;
3217 my $tpm = parse_drive
("tpmstate0", $tpmdrive);
3218 my ($storeid, $volname) = PVE
::Storage
::parse_volume_id
($tpm->{file
}, 1);
# $state is either the mapped storage volume or the configured file itself
3220 $state = PVE
::Storage
::map_volume
($storecfg, $tpm->{file
});
3222 $state = $tpm->{file
};
3225 my $paths = get_tpm_paths
($vmid);
3227 # during migration, we will get state from remote
3230 # run swtpm_setup to create a new TPM state if it doesn't exist yet
3237 "--create-platform-cert",
3240 "/etc/swtpm_setup.conf", # do not use XDG configs
3242 "0", # force creation as root, error if not possible
3243 "--not-overwrite", # ignore existing state, do not modify
3246 push @$setup_cmd, "--tpm2" if $tpm->{version
} eq 'v2.0';
3247 # TPM 2.0 supports ECC crypto, use if possible
3248 push @$setup_cmd, "--ecc" if $tpm->{version
} eq 'v2.0';
# NOTE(review): this output callback (and the one for the emulator below)
# prints $1 without a visible regex match instead of its argument - confirm
# that this is intended.
3250 run_command
($setup_cmd, outfunc
=> sub {
3251 print "swtpm_setup: $1\n";
3255 my $emulator_cmd = [
3259 "backend-uri=file://$state,mode=0600",
3261 "type=unixio,path=$paths->{socket},mode=0600",
3263 "file=$paths->{pid}",
3264 "--terminate", # terminate on QEMU disconnect
3267 push @$emulator_cmd, "--tpm2" if $tpm->{version
} eq 'v2.0';
3268 run_command
($emulator_cmd, outfunc
=> sub { print $1; });
3270 my $tries = 100; # swtpm may take a bit to start before daemonizing, wait up to 5s for pid
3271 while (! -e
$paths->{pid
}) {
3272 die "failed to start swtpm: pid file '$paths->{pid}' wasn't created.\n" if --$tries == 0;
3276 # return untainted PID of swtpm daemon so it can be killed on error
3277 file_read_firstline
($paths->{pid
}) =~ m/(\d+)/;
# Tells whether a 'vga' config value selects a SPICE (qxl) display.
# Returns 0 if no type is set or the type is not qxl, qxl2, qxl3 or qxl4.
# NOTE(review): config_to_command stores the result as $qxlnum and uses it as
# a display count, so the qxl case presumably returns that count - confirm.
3281 sub vga_conf_has_spice
{
3284 my $vgaconf = parse_vga
($vga);
3285 my $vgatype = $vgaconf->{type
};
3286 return 0 if !$vgatype || $vgatype !~ m/^qxl([234])?$/;
# true if $arch is the architecture of the host
3293 return get_host_arch
() eq $arch;
# architecture configured for the VM, defaulting to the host architecture
3298 return $conf->{arch
} // get_host_arch
();
# Default machine type per architecture; looked up by $arch in get_vm_machine
# and query_supported_cpu_flags.
3301 my $default_machines = {
# Extracts the leading "major.minor" part of a QEMU version string.
#
# $kvmversion - version string; when undefined, kvm_user_version() is used
#
# NOTE(review): presumably returns the captured "major.minor" - confirm.
3306 sub get_installed_machine_version
{
3307 my ($kvmversion) = @_;
3308 $kvmversion = kvm_user_version
() if !defined($kvmversion);
3309 $kvmversion =~ m/^(\d+\.\d+)/;
# Turns an unversioned machine type into a version-pinned one.
#
# $machine      - 'pc', 'q35', 'virt' or empty (treated like 'pc')
# $base_version - preferred version to pin to
# $kvmversion   - QEMU version used for the capability check and fallback
#
# If $base_version is undefined or cannot be run, the installed machine
# version is used instead. Unknown machine types only trigger a warning.
# NOTE(review): presumably returns the resulting $machine - confirm.
3313 sub windows_get_pinned_machine_version
{
3314 my ($machine, $base_version, $kvmversion) = @_;
3316 my $pin_version = $base_version;
3317 if (!defined($base_version) ||
3318 !PVE
::QemuServer
::Machine
::can_run_pve_machine_version
($base_version, $kvmversion)
3320 $pin_version = get_installed_machine_version
($kvmversion);
3322 if (!$machine || $machine eq 'pc') {
3323 $machine = "pc-i440fx-$pin_version";
3324 } elsif ($machine eq 'q35') {
3325 $machine = "pc-q35-$pin_version";
3326 } elsif ($machine eq 'virt') {
3327 $machine = "virt-$pin_version";
3329 warn "unknown machine type '$machine', not touching that!\n";
# Determines the machine type string to use for a VM.
#
# $conf            - VM configuration ('machine' and 'ostype' are read)
# $forcemachine    - overrides the configured machine type when set
# $arch            - architecture, selects the default machine type
# $add_pve_version - when true, ensure the type carries a "+pve<N>" suffix
# $kvmversion      - QEMU version; defaults to kvm_user_version() when the
#                    machine type is unset or unversioned
#
# NOTE(review): presumably returns the resulting $machine - confirm.
3335 sub get_vm_machine
{
3336 my ($conf, $forcemachine, $arch, $add_pve_version, $kvmversion) = @_;
3338 my $machine = $forcemachine || $conf->{machine
};
# no machine type or an unversioned one
3340 if (!$machine || $machine =~ m/^(?:pc|q35|virt)$/) {
3341 $kvmversion //= kvm_user_version
();
3342 # we must pin Windows VMs without a specific version to 5.1, as 5.2 fixed a bug in ACPI
3343 # layout which confuses windows quite a bit and may result in various regressions..
3344 # see: https://lists.gnu.org/archive/html/qemu-devel/2021-02/msg08484.html
3345 if (windows_version
($conf->{ostype
})) {
3346 $machine = windows_get_pinned_machine_version
($machine, '5.1', $kvmversion);
3349 $machine ||= $default_machines->{$arch};
3350 if ($add_pve_version) {
3351 my $pvever = PVE
::QemuServer
::Machine
::get_pve_version
($kvmversion);
3352 $machine .= "+pve$pvever";
# a pve version is wanted but the machine type has none yet; a trailing
# ".pxe" is taken off first and put back after the "+pve0" suffix
3356 if ($add_pve_version && $machine !~ m/\+pve\d+?(?:\.pxe)?$/) {
3357 my $is_pxe = $machine =~ m/^(.*?)\.pxe$/;
3358 $machine = $1 if $is_pxe;
3360 # for version-pinned machines that do not include a pve-version (e.g.
3361 # pc-q35-4.1), we assume 0 to keep them stable in case we bump
3362 $machine .= '+pve0';
3364 $machine .= '.pxe' if $is_pxe;
# Selects the firmware image list for a VM from $OVMF.
#
# $arch    - architecture, the first-level key into $OVMF
# $efidisk - parsed efidisk drive (may be undef); 'efitype' and
#            'pre-enrolled-keys' are read
# $smm     - for 4m EFI disks, selects "4m" (true) or "4m-no-smm" (false)
#
# Returns the elements of the list stored for the chosen type; the caller in
# this file unpacks them as ($ovmf_code, $ovmf_vars).
# Dies if no images are known for $arch.
3370 sub get_ovmf_files
($$$) {
3371 my ($arch, $efidisk, $smm) = @_;
3373 my $types = $OVMF->{$arch}
3374 or die "no OVMF images known for architecture '$arch'\n";
3376 my $type = 'default';
3377 if (defined($efidisk->{efitype
}) && $efidisk->{efitype
} eq '4m') {
3378 $type = $smm ?
"4m" : "4m-no-smm";
# pre-enrolled keys select the "-ms" variant of the type
3379 $type .= '-ms' if $efidisk->{'pre-enrolled-keys'};
3382 return $types->{$type}->@*;
# architecture name => QEMU system emulator binary
3386 aarch64
=> '/usr/bin/qemu-system-aarch64',
3387 x86_64
=> '/usr/bin/qemu-system-x86_64',
# Determines the binary used to run a VM of architecture $arch.
# For the host's own architecture this is /usr/bin/kvm; otherwise the binary
# is looked up in $Arch2Qemu. Dies for architectures not listed there.
# NOTE(review): presumably returns $cmd in the non-native case - confirm.
3389 sub get_command_for_arch
($) {
3391 return '/usr/bin/kvm' if is_native
($arch);
3393 my $cmd = $Arch2Qemu->{$arch}
3394 or die "don't know how to emulate architecture '$arch'\n";
3398 # To use query_supported_cpu_flags and query_understood_cpu_flags to get flags
3399 # to use in a QEMU command line (-cpu element), first array_intersect the result
3400 # of query_supported_ with query_understood_. This is necessary because:
3402 # a) query_understood_ returns flags the host cannot use and
3403 # b) query_supported_ (rather the QMP call) doesn't actually return CPU
3404 # flags, but CPU settings - with most of them being flags. Those settings
3405 # (and some flags, curiously) cannot be specified as a "-cpu" argument.
3407 # query_supported_ needs to start up to 2 temporary VMs and is therefore rather
3408 # expensive. If you need the value returned from this, you can get it much
3409 # cheaper from pmxcfs using PVE::Cluster::get_node_kv('cpuflags-$accel') with
3410 # $accel being 'kvm' or 'tcg'.
3412 # pvestatd calls this function on startup and whenever the QEMU/KVM version
3413 # changes, automatically populating pmxcfs.
3415 # Returns: { kvm => [ flagX, flagY, ... ], tcg => [ flag1, flag2, ... ] }
3416 # since kvm and tcg machines support different flags
3418 sub query_supported_cpu_flags
{
# $arch defaults to the host architecture
3421 $arch //= get_host_arch
();
3422 my $default_machine = $default_machines->{$arch};
3426 # FIXME: Once this is merged, the code below should work for ARM as well:
3427 # https://lists.nongnu.org/archive/html/qemu-devel/2019-06/msg04947.html
3428 die "QEMU/KVM cannot detect CPU flags on ARM (aarch64)\n" if
3431 my $kvm_supported = defined(kvm_version
());
3432 my $qemu_cmd = get_command_for_arch
($arch);
3434 my $pidfile = PVE
::QemuServer
::Helpers
::pidfile_name
($fakevmid);
3436 # Start a temporary (frozen) VM with vmid -1 to allow sending a QMP command
# The argument selects the accelerator (called with 1 for kvm and 0 for tcg
# below); the result is the sorted list of flag names.
3437 my $query_supported_run_qemu = sub {
3443 '-machine', $default_machine,
3445 '-chardev', "socket,id=qmp,path=/var/run/qemu-server/$fakevmid.qmp,server=on,wait=off",
3446 '-mon', 'chardev=qmp,mode=control',
3447 '-pidfile', $pidfile,
3452 push @$cmd, '-accel', 'tcg';
# noerr => 1: a non-zero exit code is returned instead of raising, and is
# turned into an explicit error below
3455 my $rc = run_command
($cmd, noerr
=> 1, quiet
=> 0);
3456 die "QEMU flag querying VM exited with code " . $rc if $rc;
# ask QEMU to expand the 'host' CPU model into its individual properties
3459 my $cmd_result = mon_cmd
(
3461 'query-cpu-model-expansion',
3463 model
=> { name
=> 'host' }
3466 my $props = $cmd_result->{model
}->{props
};
3467 foreach my $prop (keys %$props) {
# only properties whose value is '1' are treated as enabled flags
3468 next if $props->{$prop} ne '1';
3469 # QEMU returns some flags multiple times, with '_', '.' or '-'
3470 # (e.g. lahf_lm and lahf-lm; sse4.2, sse4-2 and sse4_2; ...).
3471 # We only keep those with underscores, to match /proc/cpuinfo
3472 $prop =~ s/\.|-/_/g;
3473 $flags->{$prop} = 1;
3478 # force stop with 10 sec timeout and 'nocheck', always stop, even if QMP failed
3479 vm_stop
(undef, $fakevmid, 1, 1, 10, 0, 1);
3483 return [ sort keys %$flags ];
3486 # We need to query QEMU twice, since KVM and TCG have different supported flags
# Both queries run under the config lock of the fake VMID; a failed query
# only produces a warning.
3487 PVE
::QemuConfig-
>lock_config($fakevmid, sub {
3488 $flags->{tcg
} = eval { $query_supported_run_qemu->(0) };
3489 warn "warning: failed querying supported tcg flags: $@\n" if $@;
3491 if ($kvm_supported) {
3492 $flags->{kvm
} = eval { $query_supported_run_qemu->(1) };
3493 warn "warning: failed querying supported kvm flags: $@\n" if $@;
3500 # Understood CPU flags are written to a file at 'pve-qemu' compile time
3501 my $understood_cpu_flag_dir = "/usr/share/kvm";
# Reads the CPU flags QEMU understands for the host architecture from
# "$understood_cpu_flag_dir/recognized-CPUID-flags-<arch>".
# Dies with a "file not found" message for architectures without such a file.
# NOTE(review): presumably returns the list of flags as an array reference - confirm.
3502 sub query_understood_cpu_flags
{
3503 my $arch = get_host_arch
();
3504 my $filepath = "$understood_cpu_flag_dir/recognized-CPUID-flags-$arch";
3506 die "Cannot query understood QEMU CPU flags for architecture: $arch (file not found)\n"
3509 my $raw = file_get_contents
($filepath);
# trim surrounding whitespace, then split on whitespace
3510 $raw =~ s/^\s+|\s+$//g;
3511 my @flags = split(/\s+/, $raw);
3516 # Since commit 277d33454f77ec1d1e0bc04e37621e4dd2424b67 in pve-qemu, smm is not off by default
3517 # anymore. But smm=off seems to be required when using SeaBIOS and serial display.
#
# $conf - VM configuration; an unset 'bios' counts as SeaBIOS here
# $vga  - parsed vga configuration
#
# Returns true if the BIOS is SeaBIOS and the display type is a serial
# terminal ("serialN") or 'none'.
3518 my sub should_disable_smm
{
3519 my ($conf, $vga) = @_;
3521 return (!defined($conf->{bios
}) || $conf->{bios
} eq 'seabios') &&
3522 $vga->{type
} && $vga->{type
} =~ m/^(serial\d+|none)$/;
# Builds the two '-drive' strings needed to boot a VM with OVMF firmware.
#
# $conf          - VM configuration ('efidisk0' is read)
# $storecfg      - storage configuration, used to resolve the EFI disk path
# $vmid          - VM ID, used to name the temporary efivars file
# $arch          - architecture, selects the firmware images
# $q35           - passed to get_ovmf_files as its $smm argument
# $version_guard - code reference called as $version_guard->(4, 1, 2) to
#                  decide whether the size option is added
#
# Returns (code drive string, vars drive string): the firmware code as a
# read-only raw pflash unit 0, and the EFI vars as pflash unit 1.
# Dies if the firmware code image does not exist or the EFI disk format is
# unknown.
3525 my sub print_ovmf_drive_commandlines
{
3526 my ($conf, $storecfg, $vmid, $arch, $q35, $version_guard) = @_;
3528 my $d = $conf->{efidisk0
} ? parse_drive
('efidisk0', $conf->{efidisk0
}) : undef;
3530 my ($ovmf_code, $ovmf_vars) = get_ovmf_files
($arch, $d, $q35);
3531 die "uefi base image '$ovmf_code' not found\n" if ! -f
$ovmf_code;
3533 my $var_drive_str = "if=pflash,unit=1,id=drive-efidisk0";
3535 my ($storeid, $volname) = PVE
::Storage
::parse_volume_id
($d->{file
}, 1);
3536 my ($path, $format) = $d->@{'file', 'format'};
3538 $path = PVE
::Storage
::path
($storecfg, $d->{file
});
# no explicit format on the drive: derive it from the storage
3539 if (!defined($format)) {
3540 my $scfg = PVE
::Storage
::storage_config
($storecfg, $storeid);
3541 $format = qemu_img_format
($scfg, $volname);
3543 } elsif (!defined($format)) {
3544 die "efidisk format must be specified\n";
3546 # SPI flash does lots of read-modify-write OPs, without writeback this gets really slow #3329
3547 if ($path =~ m/^rbd:/) {
3548 $var_drive_str .= ',cache=writeback';
3549 $path .= ':rbd_cache_policy=writeback'; # avoid write-around, we *need* to cache writes too
3551 $var_drive_str .= ",format=$format,file=$path";
# for raw disks, pass the size of the vars template image (if the guard allows)
3553 $var_drive_str .= ",size=" . (-s
$ovmf_vars) if $format eq 'raw' && $version_guard->(4, 1, 2);
3554 $var_drive_str .= ',readonly=on' if drive_is_read_only
($conf, $d);
# no efidisk configured: work on a copy of the vars template under /tmp
3556 log_warn
("no efidisk configured! Using temporary efivars disk.");
3557 my $path = "/tmp/$vmid-ovmf.fd";
3558 PVE
::Tools
::file_copy
($ovmf_vars, $path, -s
$ovmf_vars);
3559 $var_drive_str .= ",format=raw,file=$path";
3560 $var_drive_str .= ",size=" . (-s
$ovmf_vars) if $version_guard->(4, 1, 2);
3563 return ("if=pflash,unit=0,format=raw,readonly=on,file=$ovmf_code", $var_drive_str);
3566 sub config_to_command
{
3567 my ($storecfg, $vmid, $conf, $defaults, $forcemachine, $forcecpu,
3570 my ($globalFlags, $machineFlags, $rtcFlags) = ([], [], []);
3573 my $ostype = $conf->{ostype
};
3574 my $winversion = windows_version
($ostype);
3575 my $kvm = $conf->{kvm
};
3576 my $nodename = nodename
();
3578 my $arch = get_vm_arch
($conf);
3579 my $kvm_binary = get_command_for_arch
($arch);
3580 my $kvmver = kvm_user_version
($kvm_binary);
3582 if (!$kvmver || $kvmver !~ m/^(\d+)\.(\d+)/ || $1 < 3) {
3583 $kvmver //= "undefined";
3584 die "Detected old QEMU binary ('$kvmver', at least 3.0 is required)\n";
3587 my $add_pve_version = min_version
($kvmver, 4, 1);
3589 my $machine_type = get_vm_machine
($conf, $forcemachine, $arch, $add_pve_version);
3590 my $machine_version = extract_version
($machine_type, $kvmver);
3591 $kvm //= 1 if is_native
($arch);
3593 $machine_version =~ m/(\d+)\.(\d+)/;
3594 my ($machine_major, $machine_minor) = ($1, $2);
3596 if ($kvmver =~ m/^\d+\.\d+\.(\d+)/ && $1 >= 90) {
3597 warn "warning: Installed QEMU version ($kvmver) is a release candidate, ignoring version checks\n";
3598 } elsif (!min_version
($kvmver, $machine_major, $machine_minor)) {
3599 die "Installed QEMU version '$kvmver' is too old to run machine type '$machine_type',"
3600 ." please upgrade node '$nodename'\n"
3601 } elsif (!PVE
::QemuServer
::Machine
::can_run_pve_machine_version
($machine_version, $kvmver)) {
3602 my $max_pve_version = PVE
::QemuServer
::Machine
::get_pve_version
($machine_version);
3603 die "Installed qemu-server (max feature level for $machine_major.$machine_minor is"
3604 ." pve$max_pve_version) is too old to run machine type '$machine_type', please upgrade"
3605 ." node '$nodename'\n";
3608 # if a specific +pve version is required for a feature, use $version_guard
3609 # instead of min_version to allow machines to be run with the minimum
3611 my $required_pve_version = 0;
3612 my $version_guard = sub {
3613 my ($major, $minor, $pve) = @_;
3614 return 0 if !min_version
($machine_version, $major, $minor, $pve);
3615 my $max_pve = PVE
::QemuServer
::Machine
::get_pve_version
("$major.$minor");
3616 return 1 if min_version
($machine_version, $major, $minor, $max_pve+1);
3617 $required_pve_version = $pve if $pve && $pve > $required_pve_version;
3621 if ($kvm && !defined kvm_version
()) {
3622 die "KVM virtualisation configured, but not available. Either disable in VM configuration"
3623 ." or enable in BIOS.\n";
3626 my $q35 = PVE
::QemuServer
::Machine
::machine_type_is_q35
($conf);
3627 my $hotplug_features = parse_hotplug_features
(defined($conf->{hotplug
}) ?
$conf->{hotplug
} : '1');
3628 my $use_old_bios_files = undef;
3629 ($use_old_bios_files, $machine_type) = qemu_use_old_bios_files
($machine_type);
3632 if ($conf->{affinity
}) {
3633 push @$cmd, '/usr/bin/taskset', '--cpu-list', '--all-tasks', $conf->{affinity
};
3636 push @$cmd, $kvm_binary;
3638 push @$cmd, '-id', $vmid;
3640 my $vmname = $conf->{name
} || "vm$vmid";
3642 push @$cmd, '-name', "$vmname,debug-threads=on";
3644 push @$cmd, '-no-shutdown';
3648 my $qmpsocket = PVE
::QemuServer
::Helpers
::qmp_socket
($vmid);
3649 push @$cmd, '-chardev', "socket,id=qmp,path=$qmpsocket,server=on,wait=off";
3650 push @$cmd, '-mon', "chardev=qmp,mode=control";
3652 if (min_version
($machine_version, 2, 12)) {
3653 push @$cmd, '-chardev', "socket,id=qmp-event,path=/var/run/qmeventd.sock,reconnect=5";
3654 push @$cmd, '-mon', "chardev=qmp-event,mode=control";
3657 push @$cmd, '-pidfile' , PVE
::QemuServer
::Helpers
::pidfile_name
($vmid);
3659 push @$cmd, '-daemonize';
3661 if ($conf->{smbios1
}) {
3662 my $smbios_conf = parse_smbios1
($conf->{smbios1
});
3663 if ($smbios_conf->{base64
}) {
3664 # Do not pass base64 flag to qemu
3665 delete $smbios_conf->{base64
};
3666 my $smbios_string = "";
3667 foreach my $key (keys %$smbios_conf) {
3669 if ($key eq "uuid") {
3670 $value = $smbios_conf->{uuid
}
3672 $value = decode_base64
($smbios_conf->{$key});
3674 # qemu accepts any binary data, only commas need escaping by double comma
3676 $smbios_string .= "," . $key . "=" . $value if $value;
3678 push @$cmd, '-smbios', "type=1" . $smbios_string;
3680 push @$cmd, '-smbios', "type=1,$conf->{smbios1}";
3684 if ($conf->{bios
} && $conf->{bios
} eq 'ovmf') {
3685 my ($code_drive_str, $var_drive_str) =
3686 print_ovmf_drive_commandlines
($conf, $storecfg, $vmid, $arch, $q35, $version_guard);
3687 push $cmd->@*, '-drive', $code_drive_str;
3688 push $cmd->@*, '-drive', $var_drive_str;
3691 if ($q35) { # tell QEMU to load q35 config early
3692 # we use different pcie-port hardware for qemu >= 4.0 for passthrough
3693 if (min_version
($machine_version, 4, 0)) {
3694 push @$devices, '-readconfig', '/usr/share/qemu-server/pve-q35-4.0.cfg';
3696 push @$devices, '-readconfig', '/usr/share/qemu-server/pve-q35.cfg';
3700 if (defined(my $fixups = qemu_created_version_fixups
($conf, $forcemachine, $kvmver))) {
3701 push @$cmd, $fixups->@*;
3704 if ($conf->{vmgenid
}) {
3705 push @$devices, '-device', 'vmgenid,guid='.$conf->{vmgenid
};
3708 # add usb controllers
3709 my @usbcontrollers = PVE
::QemuServer
::USB
::get_usb_controllers
(
3710 $conf, $bridges, $arch, $machine_type, $usbdesc->{format
}, $MAX_USB_DEVICES, $machine_version);
3711 push @$devices, @usbcontrollers if @usbcontrollers;
3712 my $vga = parse_vga
($conf->{vga
});
3714 my $qxlnum = vga_conf_has_spice
($conf->{vga
});
3715 $vga->{type
} = 'qxl' if $qxlnum;
3717 if (!$vga->{type
}) {
3718 if ($arch eq 'aarch64') {
3719 $vga->{type
} = 'virtio';
3720 } elsif (min_version
($machine_version, 2, 9)) {
3721 $vga->{type
} = (!$winversion || $winversion >= 6) ?
'std' : 'cirrus';
3723 $vga->{type
} = ($winversion >= 6) ?
'std' : 'cirrus';
3727 # enable absolute mouse coordinates (needed by vnc)
3728 my $tablet = $conf->{tablet
};
3729 if (!defined($tablet)) {
3730 $tablet = $defaults->{tablet
};
3731 $tablet = 0 if $qxlnum; # disable for spice because it is not needed
3732 $tablet = 0 if $vga->{type
} =~ m/^serial\d+$/; # disable if we use serial terminal (no vga card)
3736 push @$devices, '-device', print_tabletdevice_full
($conf, $arch) if $tablet;
3737 my $kbd = print_keyboarddevice_full
($conf, $arch);
3738 push @$devices, '-device', $kbd if defined($kbd);
3741 my $bootorder = device_bootorder
($conf);
3743 # host pci device passthrough
3744 my ($kvm_off, $gpu_passthrough, $legacy_igd) = PVE
::QemuServer
::PCI
::print_hostpci_devices
(
3745 $vmid, $conf, $devices, $vga, $winversion, $q35, $bridges, $arch, $machine_type, $bootorder);
3748 my $usb_dev_features = {};
3749 $usb_dev_features->{spice_usb3
} = 1 if min_version
($machine_version, 4, 0);
3751 my @usbdevices = PVE
::QemuServer
::USB
::get_usb_devices
(
3752 $conf, $usbdesc->{format
}, $MAX_USB_DEVICES, $usb_dev_features, $bootorder, $machine_version);
3753 push @$devices, @usbdevices if @usbdevices;
3756 for (my $i = 0; $i < $MAX_SERIAL_PORTS; $i++) {
3757 my $path = $conf->{"serial$i"} or next;
3758 if ($path eq 'socket') {
3759 my $socket = "/var/run/qemu-server/${vmid}.serial$i";
3760 push @$devices, '-chardev', "socket,id=serial$i,path=$socket,server=on,wait=off";
3761 # On aarch64, serial0 is the UART device. QEMU only allows
3762 # connecting UART devices via the '-serial' command line, as
3763 # the device has a fixed slot on the hardware...
3764 if ($arch eq 'aarch64' && $i == 0) {
3765 push @$devices, '-serial', "chardev:serial$i";
3767 push @$devices, '-device', "isa-serial,chardev=serial$i";
3770 die "no such serial device\n" if ! -c
$path;
3771 push @$devices, '-chardev', "tty,id=serial$i,path=$path";
3772 push @$devices, '-device', "isa-serial,chardev=serial$i";
3777 for (my $i = 0; $i < $MAX_PARALLEL_PORTS; $i++) {
3778 if (my $path = $conf->{"parallel$i"}) {
3779 die "no such parallel device\n" if ! -c
$path;
3780 my $devtype = $path =~ m!^/dev/usb/lp! ?
'tty' : 'parport';
3781 push @$devices, '-chardev', "$devtype,id=parallel$i,path=$path";
3782 push @$devices, '-device', "isa-parallel,chardev=parallel$i";
3786 if (min_version
($machine_version, 4, 0) && (my $audio = conf_has_audio
($conf))) {
3787 my $audiopciaddr = print_pci_addr
("audio0", $bridges, $arch, $machine_type);
3788 my $audio_devs = audio_devs
($audio, $audiopciaddr, $machine_version);
3789 push @$devices, @$audio_devs;
3792 add_tpm_device
($vmid, $devices, $conf);
3795 $sockets = $conf->{smp
} if $conf->{smp
}; # old style - no longer iused
3796 $sockets = $conf->{sockets
} if $conf->{sockets
};
3798 my $cores = $conf->{cores
} || 1;
3800 my $maxcpus = $sockets * $cores;
3802 my $vcpus = $conf->{vcpus
} ?
$conf->{vcpus
} : $maxcpus;
3804 my $allowed_vcpus = $cpuinfo->{cpus
};
3806 die "MAX $allowed_vcpus vcpus allowed per VM on this node\n" if ($allowed_vcpus < $maxcpus);
3808 if ($hotplug_features->{cpu
} && min_version
($machine_version, 2, 7)) {
3809 push @$cmd, '-smp', "1,sockets=$sockets,cores=$cores,maxcpus=$maxcpus";
3810 for (my $i = 2; $i <= $vcpus; $i++) {
3811 my $cpustr = print_cpu_device
($conf,$i);
3812 push @$cmd, '-device', $cpustr;
3817 push @$cmd, '-smp', "$vcpus,sockets=$sockets,cores=$cores,maxcpus=$maxcpus";
3819 push @$cmd, '-nodefaults';
3821 push @$cmd, '-boot', "menu=on,strict=on,reboot-timeout=1000,splash=/usr/share/qemu-server/bootsplash.jpg";
3823 push @$cmd, '-no-acpi' if defined($conf->{acpi
}) && $conf->{acpi
} == 0;
3825 push @$cmd, '-no-reboot' if defined($conf->{reboot
}) && $conf->{reboot
} == 0;
3827 if ($vga->{type
} && $vga->{type
} !~ m/^serial\d+$/ && $vga->{type
} ne 'none'){
3828 push @$devices, '-device', print_vga_device
(
3829 $conf, $vga, $arch, $machine_version, $machine_type, undef, $qxlnum, $bridges);
3831 push @$cmd, '-display', 'egl-headless,gl=core' if $vga->{type
} eq 'virtio-gl'; # VIRGL
3833 my $socket = PVE
::QemuServer
::Helpers
::vnc_socket
($vmid);
3834 push @$cmd, '-vnc', "unix:$socket,password=on";
3836 push @$cmd, '-vga', 'none' if $vga->{type
} eq 'none';
3837 push @$cmd, '-nographic';
3841 my $tdf = defined($conf->{tdf
}) ?
$conf->{tdf
} : $defaults->{tdf
};
3842 my $useLocaltime = $conf->{localtime};
3844 if ($winversion >= 5) { # windows
3845 $useLocaltime = 1 if !defined($conf->{localtime});
3847 # use time drift fix when acpi is enabled
3848 if (!(defined($conf->{acpi
}) && $conf->{acpi
} == 0)) {
3849 $tdf = 1 if !defined($conf->{tdf
});
3853 if ($winversion >= 6) {
3854 push @$globalFlags, 'kvm-pit.lost_tick_policy=discard';
3855 push @$cmd, '-no-hpet';
3858 push @$rtcFlags, 'driftfix=slew' if $tdf;
3860 if ($conf->{startdate
} && $conf->{startdate
} ne 'now') {
3861 push @$rtcFlags, "base=$conf->{startdate}";
3862 } elsif ($useLocaltime) {
3863 push @$rtcFlags, 'base=localtime';
3867 push @$cmd, '-cpu', $forcecpu;
3869 push @$cmd, get_cpu_options
($conf, $arch, $kvm, $kvm_off, $machine_version, $winversion, $gpu_passthrough);
3872 PVE
::QemuServer
::Memory
::config
($conf, $vmid, $sockets, $cores, $defaults, $hotplug_features, $cmd);
3874 push @$cmd, '-S' if $conf->{freeze
};
3876 push @$cmd, '-k', $conf->{keyboard
} if defined($conf->{keyboard
});
3878 my $guest_agent = parse_guest_agent
($conf);
3880 if ($guest_agent->{enabled
}) {
3881 my $qgasocket = PVE
::QemuServer
::Helpers
::qmp_socket
($vmid, 1);
3882 push @$devices, '-chardev', "socket,path=$qgasocket,server=on,wait=off,id=qga0";
3884 if (!$guest_agent->{type
} || $guest_agent->{type
} eq 'virtio') {
3885 my $pciaddr = print_pci_addr
("qga0", $bridges, $arch, $machine_type);
3886 push @$devices, '-device', "virtio-serial,id=qga0$pciaddr";
3887 push @$devices, '-device', 'virtserialport,chardev=qga0,name=org.qemu.guest_agent.0';
3888 } elsif ($guest_agent->{type
} eq 'isa') {
3889 push @$devices, '-device', "isa-serial,chardev=qga0";
3893 my $rng = $conf->{rng0
} ? parse_rng
($conf->{rng0
}) : undef;
3894 if ($rng && $version_guard->(4, 1, 2)) {
3895 check_rng_source
($rng->{source
});
3897 my $max_bytes = $rng->{max_bytes
} // $rng_fmt->{max_bytes
}->{default};
3898 my $period = $rng->{period
} // $rng_fmt->{period
}->{default};
3899 my $limiter_str = "";
3901 $limiter_str = ",max-bytes=$max_bytes,period=$period";
3904 my $rng_addr = print_pci_addr
("rng0", $bridges, $arch, $machine_type);
3905 push @$devices, '-object', "rng-random,filename=$rng->{source},id=rng0";
3906 push @$devices, '-device', "virtio-rng-pci,rng=rng0$limiter_str$rng_addr";
3911 if ($qxlnum || $vga->{type
} =~ /^virtio/) {
3914 for (my $i = 1; $i < $qxlnum; $i++){
3915 push @$devices, '-device', print_vga_device
(
3916 $conf, $vga, $arch, $machine_version, $machine_type, $i, $qxlnum, $bridges);
3919 # assume other OS works like Linux
3920 my ($ram, $vram) = ("134217728", "67108864");
3921 if ($vga->{memory
}) {
3922 $ram = PVE
::Tools
::convert_size
($qxlnum*4*$vga->{memory
}, 'mb' => 'b');
3923 $vram = PVE
::Tools
::convert_size
($qxlnum*2*$vga->{memory
}, 'mb' => 'b');
3925 push @$cmd, '-global', "qxl-vga.ram_size=$ram";
3926 push @$cmd, '-global', "qxl-vga.vram_size=$vram";
3930 my $pciaddr = print_pci_addr
("spice", $bridges, $arch, $machine_type);
3932 my $pfamily = PVE
::Tools
::get_host_address_family
($nodename);
3933 my @nodeaddrs = PVE
::Tools
::getaddrinfo_all
('localhost', family
=> $pfamily);
3934 die "failed to get an ip address of type $pfamily for 'localhost'\n" if !@nodeaddrs;
3936 push @$devices, '-device', "virtio-serial,id=spice$pciaddr";
3937 push @$devices, '-chardev', "spicevmc,id=vdagent,name=vdagent";
3938 push @$devices, '-device', "virtserialport,chardev=vdagent,name=com.redhat.spice.0";
3940 my $localhost = PVE
::Network
::addr_to_ip
($nodeaddrs[0]->{addr
});
3941 $spice_port = PVE
::Tools
::next_spice_port
($pfamily, $localhost);
3943 my $spice_enhancement_str = $conf->{spice_enhancements
} // '';
3944 my $spice_enhancement = parse_property_string
($spice_enhancements_fmt, $spice_enhancement_str);
3945 if ($spice_enhancement->{foldersharing
}) {
3946 push @$devices, '-chardev', "spiceport,id=foldershare,name=org.spice-space.webdav.0";
3947 push @$devices, '-device', "virtserialport,chardev=foldershare,name=org.spice-space.webdav.0";
3950 my $spice_opts = "tls-port=${spice_port},addr=$localhost,tls-ciphers=HIGH,seamless-migration=on";
3951 $spice_opts .= ",streaming-video=$spice_enhancement->{videostreaming}"
3952 if $spice_enhancement->{videostreaming
};
3954 push @$devices, '-spice', "$spice_opts";
3957 # enable balloon by default, unless explicitly disabled
3958 if (!defined($conf->{balloon
}) || $conf->{balloon
}) {
3959 my $pciaddr = print_pci_addr
("balloon0", $bridges, $arch, $machine_type);
3960 my $ballooncmd = "virtio-balloon-pci,id=balloon0$pciaddr";
3961 $ballooncmd .= ",free-page-reporting=on" if min_version
($machine_version, 6, 2);
3962 push @$devices, '-device', $ballooncmd;
3965 if ($conf->{watchdog
}) {
3966 my $wdopts = parse_watchdog
($conf->{watchdog
});
3967 my $pciaddr = print_pci_addr
("watchdog", $bridges, $arch, $machine_type);
3968 my $watchdog = $wdopts->{model
} || 'i6300esb';
3969 push @$devices, '-device', "$watchdog$pciaddr";
3970 push @$devices, '-watchdog-action', $wdopts->{action
} if $wdopts->{action
};
3974 my $scsicontroller = {};
3975 my $ahcicontroller = {};
3976 my $scsihw = defined($conf->{scsihw
}) ?
$conf->{scsihw
} : $defaults->{scsihw
};
3978 # Add iscsi initiator name if available
3979 if (my $initiator = get_initiator_name
()) {
3980 push @$devices, '-iscsi', "initiator-name=$initiator";
3983 PVE
::QemuConfig-
>foreach_volume($conf, sub {
3984 my ($ds, $drive) = @_;
3986 if (PVE
::Storage
::parse_volume_id
($drive->{file
}, 1)) {
3987 check_volume_storage_type
($storecfg, $drive->{file
});
3988 push @$vollist, $drive->{file
};
3991 # ignore efidisk here, already added in bios/fw handling code above
3992 return if $drive->{interface
} eq 'efidisk';
3994 return if $drive->{interface
} eq 'tpmstate';
3996 $use_virtio = 1 if $ds =~ m/^virtio/;
3998 $drive->{bootindex
} = $bootorder->{$ds} if $bootorder->{$ds};
4000 if ($drive->{interface
} eq 'virtio'){
4001 push @$cmd, '-object', "iothread,id=iothread-$ds" if $drive->{iothread
};
4004 if ($drive->{interface
} eq 'scsi') {
4006 my ($maxdev, $controller, $controller_prefix) = scsihw_infos
($conf, $drive);
4008 die "scsi$drive->{index}: machine version 4.1~pve2 or higher is required to use more than 14 SCSI disks\n"
4009 if $drive->{index} > 13 && !&$version_guard(4, 1, 2);
4011 my $pciaddr = print_pci_addr
("$controller_prefix$controller", $bridges, $arch, $machine_type);
4012 my $scsihw_type = $scsihw =~ m/^virtio-scsi-single/ ?
"virtio-scsi-pci" : $scsihw;
4015 if($conf->{scsihw
} && $conf->{scsihw
} eq "virtio-scsi-single" && $drive->{iothread
}){
4016 $iothread .= ",iothread=iothread-$controller_prefix$controller";
4017 push @$cmd, '-object', "iothread,id=iothread-$controller_prefix$controller";
4018 } elsif ($drive->{iothread
}) {
4020 "iothread is only valid with virtio disk or virtio-scsi-single controller, ignoring\n"
4025 if($conf->{scsihw
} && $conf->{scsihw
} eq "virtio-scsi-single" && $drive->{queues
}){
4026 $queues = ",num_queues=$drive->{queues}";
4029 push @$devices, '-device', "$scsihw_type,id=$controller_prefix$controller$pciaddr$iothread$queues"
4030 if !$scsicontroller->{$controller};
4031 $scsicontroller->{$controller}=1;
4034 if ($drive->{interface
} eq 'sata') {
4035 my $controller = int($drive->{index} / $PVE::QemuServer
::Drive
::MAX_SATA_DISKS
);
4036 my $pciaddr = print_pci_addr
("ahci$controller", $bridges, $arch, $machine_type);
4037 push @$devices, '-device', "ahci,id=ahci$controller,multifunction=on$pciaddr"
4038 if !$ahcicontroller->{$controller};
4039 $ahcicontroller->{$controller}=1;
4042 my $pbs_conf = $pbs_backing->{$ds};
4043 my $pbs_name = undef;
4045 $pbs_name = "drive-$ds-pbs";
4046 push @$devices, '-blockdev', print_pbs_blockdev
($pbs_conf, $pbs_name);
4049 my $drive_cmd = print_drive_commandline_full
(
4050 $storecfg, $vmid, $drive, $pbs_name, min_version
($kvmver, 6, 0));
4052 # extra protection for templates, but SATA and IDE don't support it..
4053 $drive_cmd .= ',readonly=on' if drive_is_read_only
($conf, $drive);
4055 push @$devices, '-drive',$drive_cmd;
4056 push @$devices, '-device', print_drivedevice_full
(
4057 $storecfg, $conf, $vmid, $drive, $bridges, $arch, $machine_type);
4060 for (my $i = 0; $i < $MAX_NETS; $i++) {
4061 my $netname = "net$i";
4063 next if !$conf->{$netname};
4064 my $d = parse_net
($conf->{$netname});
4066 # save the MAC addr here (could be auto-gen. in some odd setups) for FDB registering later?
4068 $use_virtio = 1 if $d->{model
} eq 'virtio';
4070 $d->{bootindex
} = $bootorder->{$netname} if $bootorder->{$netname};
4072 my $netdevfull = print_netdev_full
($vmid, $conf, $arch, $d, $netname);
4073 push @$devices, '-netdev', $netdevfull;
4075 my $netdevicefull = print_netdevice_full
(
4076 $vmid, $conf, $d, $netname, $bridges, $use_old_bios_files, $arch, $machine_type, $machine_version);
4078 push @$devices, '-device', $netdevicefull;
4081 if ($conf->{ivshmem
}) {
4082 my $ivshmem = parse_property_string
($ivshmem_fmt, $conf->{ivshmem
});
4086 $bus = print_pcie_addr
("ivshmem");
4088 $bus = print_pci_addr
("ivshmem", $bridges, $arch, $machine_type);
4091 my $ivshmem_name = $ivshmem->{name
} // $vmid;
4092 my $path = '/dev/shm/pve-shm-' . $ivshmem_name;
4094 push @$devices, '-device', "ivshmem-plain,memdev=ivshmem$bus,";
4095 push @$devices, '-object', "memory-backend-file,id=ivshmem,share=on,mem-path=$path"
4096 .",size=$ivshmem->{size}M";
4099 # pci.4 is nested in pci.1
4100 $bridges->{1} = 1 if $bridges->{4};
4102 if (!$q35) { # add pci bridges
4103 if (min_version
($machine_version, 2, 3)) {
4107 $bridges->{3} = 1 if $scsihw =~ m/^virtio-scsi-single/;
4110 for my $k (sort {$b cmp $a} keys %$bridges) {
4111 next if $q35 && $k < 4; # q35.cfg already includes bridges up to 3
4114 if ($k == 2 && $legacy_igd) {
4117 my $pciaddr = print_pci_addr
("pci.$k_name", undef, $arch, $machine_type);
4118 my $devstr = "pci-bridge,id=pci.$k,chassis_nr=$k$pciaddr";
4120 if ($q35) { # add after -readconfig pve-q35.cfg
4121 splice @$devices, 2, 0, '-device', $devstr;
4123 unshift @$devices, '-device', $devstr if $k > 0;
4128 push @$machineFlags, 'accel=tcg';
4131 push @$machineFlags, 'smm=off' if should_disable_smm
($conf, $vga);
4133 my $machine_type_min = $machine_type;
4134 if ($add_pve_version) {
4135 $machine_type_min =~ s/\+pve\d+$//;
4136 $machine_type_min .= "+pve$required_pve_version";
4138 push @$machineFlags, "type=${machine_type_min}";
4140 push @$cmd, @$devices;
4141 push @$cmd, '-rtc', join(',', @$rtcFlags) if scalar(@$rtcFlags);
4142 push @$cmd, '-machine', join(',', @$machineFlags) if scalar(@$machineFlags);
4143 push @$cmd, '-global', join(',', @$globalFlags) if scalar(@$globalFlags);
4145 if (my $vmstate = $conf->{vmstate
}) {
4146 my $statepath = PVE
::Storage
::path
($storecfg, $vmstate);
4147 push @$vollist, $vmstate;
4148 push @$cmd, '-loadstate', $statepath;
4149 print "activating and using '$vmstate' as vmstate\n";
4152 if (PVE
::QemuConfig-
>is_template($conf)) {
4153 # needed to workaround base volumes being read-only
4154 push @$cmd, '-snapshot';
4158 if ($conf->{args
}) {
4159 my $aa = PVE
::Tools
::split_args
($conf->{args
});
4163 return wantarray ?
($cmd, $vollist, $spice_port) : $cmd;
# Sanity-check the host RNG source before a VirtIO RNG device is created.
# Dies with a descriptive message when the source is unusable; in particular
# '/dev/hwrng' is rejected while the kernel's hw_random 'rng_current' file
# reads 'none'.
# NOTE(review): the parameter unpacking and the condition guarding the first
# die are not visible in this excerpt - presumably an existence check on
# $source; confirm against the full file.
4166 sub check_rng_source
{
4169 # mostly relevant for /dev/hwrng, but doesn't hurt to check others too
4170 die "cannot create VirtIO RNG device: source file '$source' doesn't exist\n"
4173 my $rng_current = '/sys/devices/virtual/misc/hw_random/rng_current';
4174 if ($source eq '/dev/hwrng' && file_read_firstline
($rng_current) eq 'none') {
4175 # Needs to abort, otherwise QEMU crashes on first rng access. Note that rng_current cannot
4176 # be changed to 'none' manually, so once the VM is past this point, it's no longer an issue.
4177 die "Cannot start VM with passed-through RNG device: '/dev/hwrng' exists, but"
4178 ." '$rng_current' is set to 'none'. Ensure that a compatible hardware-RNG is attached"
# Ask the running VM (QMP 'query-spice') for its SPICE port: prefers
# 'tls-port', falls back to 'port', and dies with "no spice port" if neither
# is set.
# NOTE(review): the enclosing sub header is not visible in this excerpt.
4186 my $res = mon_cmd
($vmid, 'query-spice');
4188 return $res->{'tls-port'} || $res->{'port'} || die "no spice port\n";
# Build a hash of the device ids currently present in a running VM.
#
# Information is gathered through several QMP queries:
#   - 'query-pci':   every device with a 'qdev_id' is recorded; bridges are
#                    descended into level by level, and a bridge's entry
#                    additionally has the number of devices behind it added.
#   - 'query-block': entries whose device name matches 'drive-<id>'.
#   - 'query-mice':  a 'QEMU HID Tablet' is recorded under the key 'tablet'.
#   - 'qom-list' on /machine/peripheral: usbN / usbredirdevN entries.
#
# NOTE(review): parameter unpacking, the handling of matched block devices and
# the return statement are not visible in this excerpt - presumably the
# collected $devices hash reference is returned.
4191 sub vm_devices_list
{
4194 my $res = mon_cmd
($vmid, 'query-pci');
4195 my $devices_to_check = [];
4197 foreach my $pcibus (@$res) {
4198 push @$devices_to_check, @{$pcibus->{devices
}},
4201 while (@$devices_to_check) {
4203 for my $d (@$devices_to_check) {
4204 $devices->{$d->{'qdev_id'}} = 1 if $d->{'qdev_id'};
4205 next if !$d->{'pci_bridge'} || !$d->{'pci_bridge'}->{devices
};
4207 $devices->{$d->{'qdev_id'}} += scalar(@{$d->{'pci_bridge'}->{devices
}});
4208 push @$to_check, @{$d->{'pci_bridge'}->{devices
}};
4210 $devices_to_check = $to_check;
4213 my $resblock = mon_cmd
($vmid, 'query-block');
4214 foreach my $block (@$resblock) {
4215 if($block->{device
} =~ m/^drive-(\S+)/){
4220 my $resmice = mon_cmd
($vmid, 'query-mice');
4221 foreach my $mice (@$resmice) {
4222 if ($mice->{name
} eq 'QEMU HID Tablet') {
4223 $devices->{tablet
} = 1;
4228 # for usb devices there is no query-usb
4229 # but we can iterate over the entries in
4230 # qom-list path=/machine/peripheral
4231 my $resperipheral = mon_cmd
($vmid, 'qom-list', path
=> '/machine/peripheral');
4232 foreach my $per (@$resperipheral) {
4233 if ($per->{name
} =~ m/^usb(?:redirdev)?\d+$/) {
4234 $devices->{$per->{name
}} = 1;
# Hot-plug dispatcher for a running VM (presumably the body of vm_deviceplug:
# the sub header is not visible in this excerpt, but other subs in this file
# call vm_deviceplug with this exact seven-element parameter list).
#
# Parameters: $storecfg, $conf, $vmid, $deviceid (e.g. 'tablet', 'virtio0',
# 'scsi1', 'net0', 'pci.1'), $device (parsed device hash, used by the drive,
# usb, controller and net branches), $arch, $machine_type.
#
# Behaviour visible here:
#   - returns 1 right away if $deviceid is already listed by vm_devices_list()
#   - asks qemu_add_pci_bridge() to add a PCI bridge if the device needs one
#   - dispatches on $deviceid: tablet, keyboard, usbredirdevN, usbN, virtioN,
#     virtioscsiN/scsihwN, scsiN, netN and - on non-q35 machines only - pci.N
#   - any other id dies with "can't hotplug device '<id>'"
# The eval-wrapped qemu_drivedel/qemu_netdevdel calls are presumably the
# rollback on a failed add; the surrounding error checks are not visible here.
4242 my ($storecfg, $conf, $vmid, $deviceid, $device, $arch, $machine_type) = @_;
4244 my $q35 = PVE
::QemuServer
::Machine
::machine_type_is_q35
($conf);
4246 my $devices_list = vm_devices_list
($vmid);
4247 return 1 if defined($devices_list->{$deviceid});
4249 # add PCI bridge if we need it for the device
4250 qemu_add_pci_bridge
($storecfg, $conf, $vmid, $deviceid, $arch, $machine_type);
4252 if ($deviceid eq 'tablet') {
4253 qemu_deviceadd
($vmid, print_tabletdevice_full
($conf, $arch));
4254 } elsif ($deviceid eq 'keyboard') {
4255 qemu_deviceadd
($vmid, print_keyboarddevice_full
($conf, $arch));
4256 } elsif ($deviceid =~ m/^usbredirdev(\d+)$/) {
4258 qemu_spice_usbredir_chardev_add
($vmid, "usbredirchardev$id");
4259 qemu_deviceadd
($vmid, PVE
::QemuServer
::USB
::print_spice_usbdevice
($id, "xhci", $id + 1));
4260 } elsif ($deviceid =~ m/^usb(\d+)$/) {
4261 qemu_deviceadd
($vmid, PVE
::QemuServer
::USB
::print_usbdevice_full
($conf, $deviceid, $device, {}, $1 + 1));
4262 } elsif ($deviceid =~ m/^(virtio)(\d+)$/) {
4263 qemu_iothread_add
($vmid, $deviceid, $device);
4265 qemu_driveadd
($storecfg, $vmid, $device);
4266 my $devicefull = print_drivedevice_full
($storecfg, $conf, $vmid, $device, undef, $arch, $machine_type);
4268 qemu_deviceadd
($vmid, $devicefull);
4269 eval { qemu_deviceaddverify
($vmid, $deviceid); };
4271 eval { qemu_drivedel
($vmid, $deviceid); };
4275 } elsif ($deviceid =~ m/^(virtioscsi|scsihw)(\d+)$/) {
4276 my $scsihw = defined($conf->{scsihw
}) ?
$conf->{scsihw
} : "lsi";
4277 my $pciaddr = print_pci_addr
($deviceid, undef, $arch, $machine_type);
4278 my $scsihw_type = $scsihw eq 'virtio-scsi-single' ?
"virtio-scsi-pci" : $scsihw;
4280 my $devicefull = "$scsihw_type,id=$deviceid$pciaddr";
4282 if($deviceid =~ m/^virtioscsi(\d+)$/ && $device->{iothread
}) {
4283 qemu_iothread_add
($vmid, $deviceid, $device);
4284 $devicefull .= ",iothread=iothread-$deviceid";
4287 if($deviceid =~ m/^virtioscsi(\d+)$/ && $device->{queues
}) {
4288 $devicefull .= ",num_queues=$device->{queues}";
4291 qemu_deviceadd
($vmid, $devicefull);
4292 qemu_deviceaddverify
($vmid, $deviceid);
4293 } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {
4294 qemu_findorcreatescsihw
($storecfg,$conf, $vmid, $device, $arch, $machine_type);
4295 qemu_driveadd
($storecfg, $vmid, $device);
4297 my $devicefull = print_drivedevice_full
($storecfg, $conf, $vmid, $device, undef, $arch, $machine_type);
4298 eval { qemu_deviceadd
($vmid, $devicefull); };
4300 eval { qemu_drivedel
($vmid, $deviceid); };
4304 } elsif ($deviceid =~ m/^(net)(\d+)$/) {
4305 return if !qemu_netdevadd
($vmid, $conf, $arch, $device, $deviceid);
4307 my $machine_type = PVE
::QemuServer
::Machine
::qemu_machine_pxe
($vmid, $conf);
4308 my $machine_version = PVE
::QemuServer
::Machine
::extract_version
($machine_type);
4309 my $use_old_bios_files = undef;
4310 ($use_old_bios_files, $machine_type) = qemu_use_old_bios_files
($machine_type);
4312 my $netdevicefull = print_netdevice_full
(
4313 $vmid, $conf, $device, $deviceid, undef, $use_old_bios_files, $arch, $machine_type, $machine_version);
4314 qemu_deviceadd
($vmid, $netdevicefull);
4316 qemu_deviceaddverify
($vmid, $deviceid);
4317 qemu_set_link_status
($vmid, $deviceid, !$device->{link_down
});
4320 eval { qemu_netdevdel
($vmid, $deviceid); };
4324 } elsif (!$q35 && $deviceid =~ m/^(pci\.)(\d+)$/) {
4326 my $pciaddr = print_pci_addr
($deviceid, undef, $arch, $machine_type);
4327 my $devicefull = "pci-bridge,id=pci.$bridgeid,chassis_nr=$bridgeid$pciaddr";
4329 qemu_deviceadd
($vmid, $devicefull);
4330 qemu_deviceaddverify
($vmid, $deviceid);
4332 die "can't hotplug device '$deviceid'\n";
# Hot-unplug device $deviceid from running VM $vmid.
#
# Returns 1 immediately if the device is not listed by vm_devices_list(), and
# dies if $deviceid is one of the boot disks of $conf. Otherwise dispatches on
# the device id:
#   - tablet / keyboard / xhci: plain device_del
#   - usbredirdevN, usbN, virtioscsiN / scsihwN: device_del + removal check
#   - virtioN: device_del + check, then drive and iothread object removal
#   - scsiN:   as virtioN, plus removal of the SCSI controller and (for
#              'virtio-scsi-single') the per-disk controller iothread
#   - netN:    device_del + check, then netdev removal
# Any other id dies with "can't unplug device '<id>'".
4338 # fixme: this should raise exceptions on error!
4339 sub vm_deviceunplug
{
4340 my ($vmid, $conf, $deviceid) = @_;
4342 my $devices_list = vm_devices_list
($vmid);
4343 return 1 if !defined($devices_list->{$deviceid});
4345 my $bootdisks = PVE
::QemuServer
::Drive
::get_bootdisks
($conf);
4346 die "can't unplug bootdisk '$deviceid'\n" if grep {$_ eq $deviceid} @$bootdisks;
4348 if ($deviceid eq 'tablet' || $deviceid eq 'keyboard' || $deviceid eq 'xhci') {
4349 qemu_devicedel
($vmid, $deviceid);
4350 } elsif ($deviceid =~ m/^usbredirdev\d+$/) {
4351 qemu_devicedel
($vmid, $deviceid);
4352 qemu_devicedelverify
($vmid, $deviceid);
4353 } elsif ($deviceid =~ m/^usb\d+$/) {
4354 qemu_devicedel
($vmid, $deviceid);
4355 qemu_devicedelverify
($vmid, $deviceid);
4356 } elsif ($deviceid =~ m/^(virtio)(\d+)$/) {
4357 my $device = parse_drive
($deviceid, $conf->{$deviceid});
4359 qemu_devicedel
($vmid, $deviceid);
4360 qemu_devicedelverify
($vmid, $deviceid);
4361 qemu_drivedel
($vmid, $deviceid);
4362 qemu_iothread_del
($vmid, $deviceid, $device);
4363 } elsif ($deviceid =~ m/^(virtioscsi|scsihw)(\d+)$/) {
4364 qemu_devicedel
($vmid, $deviceid);
4365 qemu_devicedelverify
($vmid, $deviceid);
4366 } elsif ($deviceid =~ m/^(scsi)(\d+)$/) {
4367 my $device = parse_drive
($deviceid, $conf->{$deviceid});
4369 qemu_devicedel
($vmid, $deviceid);
4370 qemu_devicedelverify
($vmid, $deviceid);
4371 qemu_drivedel
($vmid, $deviceid);
4372 qemu_deletescsihw
($conf, $vmid, $deviceid);
4374 qemu_iothread_del
($vmid, "virtioscsi$device->{index}", $device)
4375 if $conf->{scsihw
} && ($conf->{scsihw
} eq 'virtio-scsi-single');
4376 } elsif ($deviceid =~ m/^(net)(\d+)$/) {
4377 qemu_devicedel
($vmid, $deviceid);
4378 qemu_devicedelverify
($vmid, $deviceid);
4379 qemu_netdevdel
($vmid, $deviceid);
4381 die "can't unplug device '$deviceid'\n";
# Issue the QMP 'chardev-add' command for VM $vmid, presumably creating the
# character device named $id.
# NOTE(review): the arguments of the call are cut off in this excerpt; going
# by the sub name the backend is presumably a SPICE usbredir channel - confirm
# against the full file.
4387 sub qemu_spice_usbredir_chardev_add
{
4388 my ($vmid, $id) = @_;
4390 mon_cmd
($vmid, "chardev-add" , (
# Hot-add a device to running VM $vmid through the QMP 'device_add' command.
#
# $devicefull is a QEMU '-device' style string: "<driver>,key=value,...".
# It is turned into the QMP argument hash, with the leading driver name sent
# as the 'driver' argument. Returns whatever mon_cmd() returns.
sub qemu_deviceadd {
    my ($vmid, $devicefull) = @_;

    # Split into comma-separated elements first and then only on the FIRST
    # '=' of each element: a value that itself contains '=' must not shift
    # every following key/value pair.
    my %options = map { split(/=/, $_, 2) } split(/,/, "driver=$devicefull");

    mon_cmd($vmid, "device_add", %options);
}
# Request removal of device $deviceid from running VM $vmid via the QMP
# 'device_del' command. The monitor reply is returned as a scalar.
sub qemu_devicedel {
    my ($vmid, $deviceid) = @_;

    my %request = (id => $deviceid);
    my $reply = mon_cmd($vmid, "device_del", %request);

    return $reply;
}
# Create the iothread object "iothread-<deviceid>" in VM $vmid when $device
# has its 'iothread' flag set and no object with that id exists yet.
sub qemu_iothread_add {
    my ($vmid, $deviceid, $device) = @_;

    if ($device->{iothread}) {
        my $object_id = "iothread-$deviceid";
        my $existing = vm_iothreads_list($vmid);
        qemu_objectadd($vmid, $object_id, "iothread") if !$existing->{$object_id};
    }
}
# Delete the iothread object "iothread-<deviceid>" from VM $vmid when $device
# has its 'iothread' flag set and the object currently exists.
sub qemu_iothread_del {
    my ($vmid, $deviceid, $device) = @_;

    if ($device->{iothread}) {
        my $object_id = "iothread-$deviceid";
        my $existing = vm_iothreads_list($vmid);
        qemu_objectdel($vmid, $object_id) if $existing->{$object_id};
    }
}
# Create a QOM object in VM $vmid via the QMP 'object-add' command, using
# $objectid as its id and $qomtype as its 'qom-type'.
# NOTE(review): the end of the sub (and therefore its return value) is not
# visible in this excerpt.
4434 sub qemu_objectadd
{
4435 my ($vmid, $objectid, $qomtype) = @_;
4437 mon_cmd
($vmid, "object-add", id
=> $objectid, "qom-type" => $qomtype);
# Delete the QOM object with id $objectid from VM $vmid via the QMP
# 'object-del' command.
# NOTE(review): the end of the sub (and therefore its return value) is not
# visible in this excerpt.
4442 sub qemu_objectdel
{
4443 my ($vmid, $objectid) = @_;
4445 mon_cmd
($vmid, "object-del", id
=> $objectid);
# Attach a drive backend to running VM $vmid through the HMP 'drive_add'
# command (presumably the body of qemu_driveadd - the sub header is not
# visible in this excerpt).
#
# The drive command line comes from print_drive_commandline_full(); its last
# argument is true only when the running QEMU is at least version 6.0.
# Backslashes are doubled before the string is embedded in the quoted HMP
# command. Returns 1 if the monitor output contains "OK", otherwise dies with
# the monitor output.
4451 my ($storecfg, $vmid, $device) = @_;
4453 my $kvmver = get_running_qemu_version
($vmid);
4454 my $io_uring = min_version
($kvmver, 6, 0);
4455 my $drive = print_drive_commandline_full
($storecfg, $vmid, $device, undef, $io_uring);
4456 $drive =~ s/\\/\\\\/g;
4457 my $ret = PVE
::QemuServer
::Monitor
::hmp_cmd
($vmid, "drive_add auto \"$drive\"");
4459 # If the command succeeds qemu prints: "OK
"
4460 return 1 if $ret =~ m/OK/s;
4462 die "adding drive failed
: $ret\n";
# Remove the drive backend named after $deviceid from VM $vmid through the HMP
# 'drive_del' command (presumably the body of qemu_drivedel - the sub header
# is not visible in this excerpt).
#
# Returns 1 when the monitor prints nothing, and also when it reports that the
# device was not found; any other output is fatal.
4466 my ($vmid, $deviceid) = @_;
4468 my $ret = PVE::QemuServer::Monitor::hmp_cmd($vmid, "drive_del drive-
$deviceid");
4471 return 1 if $ret eq "";
4473 # NB: device not found errors mean the drive was auto-deleted and we ignore the error
4474 return 1 if $ret =~ m/Device \'.*?\' not found/s;
4476 die "deleting drive
$deviceid failed
: $ret\n";
# Verify that a hot-plugged device really showed up in the VM.
# Checks vm_devices_list() up to six times and returns 1 as soon as $deviceid
# is listed; dies if it never appears.
# NOTE(review): the end of the loop body is not visible in this excerpt, so
# any delay between attempts cannot be confirmed from here.
4479 sub qemu_deviceaddverify {
4480 my ($vmid, $deviceid) = @_;
4482 for (my $i = 0; $i <= 5; $i++) {
4483 my $devices_list = vm_devices_list($vmid);
4484 return 1 if defined($devices_list->{$deviceid});
4488 die "error on hotplug device
'$deviceid'\n";
# Verify that a hot-unplugged device really disappeared from the VM.
# Checks vm_devices_list() up to six times and returns 1 as soon as $deviceid
# is no longer listed; dies if it is still present after the last attempt.
# NOTE(review): the end of the loop body is not visible in this excerpt, so
# any delay between attempts cannot be confirmed from here.
4492 sub qemu_devicedelverify {
4493 my ($vmid, $deviceid) = @_;
4495 # need to verify that the device is correctly removed as device_del
4496 # is async and empty return is not reliable
4498 for (my $i = 0; $i <= 5; $i++) {
4499 my $devices_list = vm_devices_list($vmid);
4500 return 1 if !defined($devices_list->{$deviceid});
4504 die "error on hot-unplugging device
'$deviceid'\n";
# Make sure the SCSI controller that drive $device belongs to exists in the
# running VM: the controller id is "<prefix><controller>" as reported by
# scsihw_infos(), and the controller is hot-plugged through vm_deviceplug()
# when vm_devices_list() does not list it yet.
# NOTE(review): the end of the sub (and its return value) is not visible in
# this excerpt.
4507 sub qemu_findorcreatescsihw {
4508 my ($storecfg, $conf, $vmid, $device, $arch, $machine_type) = @_;
4510 my ($maxdev, $controller, $controller_prefix) = scsihw_infos($conf, $device);
4512 my $scsihwid="$controller_prefix$controller";
4513 my $devices_list = vm_devices_list($vmid);
4515 if (!defined($devices_list->{$scsihwid})) {
4516 vm_deviceplug($storecfg, $conf, $vmid, $scsihwid, $device, $arch, $machine_type);
# Remove the SCSI controller that served drive $opt after the drive itself
# has been unplugged.
#
# With scsihw 'virtio-scsi-single' the per-disk controller named after the
# drive index is unplugged. Otherwise the devices still present in the VM are
# scanned for SCSI drives (index compared against the controller's range) and
# the "scsihw<controller>" controller is unplugged.
# NOTE(review): the statements between these steps are not visible in this
# excerpt - presumably early returns that keep a shared controller while
# other disks still use it; confirm against the full file.
4522 sub qemu_deletescsihw {
4523 my ($conf, $vmid, $opt) = @_;
4525 my $device = parse_drive($opt, $conf->{$opt});
4527 if ($conf->{scsihw} && ($conf->{scsihw} eq 'virtio-scsi-single')) {
4528 vm_deviceunplug($vmid, $conf, "virtioscsi
$device->{index}");
4532 my ($maxdev, $controller, $controller_prefix) = scsihw_infos($conf, $device);
4534 my $devices_list = vm_devices_list($vmid);
4535 foreach my $opt (keys %{$devices_list}) {
4536 if (is_valid_drivename($opt)) {
4537 my $drive = parse_drive($opt, $conf->{$opt});
4538 if ($drive->{interface} eq 'scsi' && $drive->{index} < (($maxdev-1)*($controller+1))) {
4544 my $scsihwid="scsihw
$controller";
4546 vm_deviceunplug($vmid, $conf, $scsihwid);
# Hot-plug the PCI bridge that device id $device sits behind, if it needs one
# and the bridge is not present in the running VM yet.
#
# print_pci_addr() records the bridge a device needs in the hash passed as its
# second argument; the bridge is then plugged as device "pci.<bridgeid>".
# Bridge ids below 1 (or no bridge at all) need no action.
# Always returns 1.
sub qemu_add_pci_bridge {
    my ($storecfg, $conf, $vmid, $device, $arch, $machine_type) = @_;

    # only called for its side effect of filling in $bridges
    my $bridges = {};
    print_pci_addr($device, $bridges, $arch, $machine_type);

    my $bridgeid;
    while (my ($k, $v) = each %$bridges) {
        $bridgeid = $k;
    }
    return 1 if !defined($bridgeid) || $bridgeid < 1;

    my $bridge = "pci.$bridgeid";
    my $devices_list = vm_devices_list($vmid);

    if (!defined($devices_list->{$bridge})) {
        # vm_deviceplug() takes the parsed device as its fifth argument. A
        # bridge has none, but the slot must still be filled - otherwise
        # $arch is taken as the device and $machine_type ends up undefined.
        vm_deviceplug($storecfg, $conf, $vmid, $bridge, {}, $arch, $machine_type);
    }

    return 1;
}
# Set the link state of network device $device in VM $vmid via the QMP
# 'set_link' command. $up is interpreted as a boolean and sent as a JSON
# true/false value.
sub qemu_set_link_status {
    my ($vmid, $device, $up) = @_;

    my $link_state = $up ? JSON::true : JSON::false;

    # the command name must be exactly 'set_link' - no embedded line break
    mon_cmd($vmid, "set_link", name => $device, up => $link_state);
}
# Add the host-side network backend for $deviceid to VM $vmid via the QMP
# 'netdev_add' command.
#
# The netdev string produced by print_netdev_full() is split on '=' and ','
# into an option hash. Before sending, 'vhost' is converted to a JSON boolean
# and 'queues' to a number, so that both are typed correctly in the request.
# NOTE(review): the end of the sub is not visible in this excerpt; a caller in
# this file tests the return value for truth, so confirm what is returned.
4582 sub qemu_netdevadd {
4583 my ($vmid, $conf, $arch, $device, $deviceid) = @_;
4585 my $netdev = print_netdev_full($vmid, $conf, $arch, $device, $deviceid, 1);
4586 my %options = split(/[=,]/, $netdev);
4588 if (defined(my $vhost = $options{vhost})) {
4589 $options{vhost} = JSON::boolean(PVE::JSONSchema::parse_boolean($vhost));
4592 if (defined(my $queues = $options{queues})) {
4593 $options{queues} = $queues + 0;
4596 mon_cmd($vmid, "netdev_add
", %options);
# Remove the host-side network backend with id $deviceid from VM $vmid via
# the QMP 'netdev_del' command. Returns whatever mon_cmd() returns.
sub qemu_netdevdel {
    my ($vmid, $deviceid) = @_;

    # the command name must be exactly 'netdev_del' - no embedded line break
    mon_cmd($vmid, "netdev_del", id => $deviceid);
}
# Replace USB device $deviceid in a running VM.
#
# Steps visible here: unplug the currently attached device, add an xhci
# controller if vm_devices_list() does not report one, re-parse the host
# specification from $device->{host} (carrying over the 'usb3' flag) and plug
# the resulting device through vm_deviceplug().
# NOTE(review): a few lines of this sub are not visible in this excerpt.
4606 sub qemu_usb_hotplug {
4607 my ($storecfg, $conf, $vmid, $deviceid, $device, $arch, $machine_type) = @_;
4611 # remove the old one first
4612 vm_deviceunplug($vmid, $conf, $deviceid);
4614 # check if xhci controller is necessary and available
4615 my $devicelist = vm_devices_list($vmid);
4617 if (!$devicelist->{xhci}) {
4618 my $pciaddr = print_pci_addr("xhci
", undef, $arch, $machine_type);
4619 qemu_deviceadd($vmid, PVE::QemuServer::USB::print_qemu_xhci_controller($pciaddr));
4622 # print_usbdevice_full expects the parsed device
4623 my $d = parse_usb_device($device->{host});
4624 $d->{usb3} = $device->{usb3};
4627 vm_deviceplug($storecfg, $conf, $vmid, $deviceid, $d, $arch, $machine_type);
# Bring the number of vCPUs of running VM $vmid to $vcpus.
#
# The upper bound is sockets * cores from $conf; a false $vcpus means "use the
# maximum", and asking for more than the maximum is fatal. The current count
# is $conf->{vcpus}, falling back to the maximum.
#
# Unplug path ($vcpus below the current count): requires machine version 2.7
# or newer; removes the "cpu<i>" devices one at a time from the highest index
# down, polls 'query-cpus-fast' until the count dropped, and writes the new
# count to the VM config after every single CPU.
#
# Plug path: first checks that the running vCPU count matches the config, then
# (machine version 2.7 or newer) adds CPU devices one by one, again polling
# 'query-cpus-fast' and persisting the count after each step. The final loop
# uses the 'cpu-add' QMP command - presumably the path for older machine
# versions; the branch structure around it is not visible in this excerpt.
4630 sub qemu_cpu_hotplug {
4631 my ($vmid, $conf, $vcpus) = @_;
4633 my $machine_type = PVE::QemuServer::Machine::get_current_qemu_machine($vmid);
4636 $sockets = $conf->{smp} if $conf->{smp}; # old style - no longer used
4637 $sockets = $conf->{sockets} if $conf->{sockets};
4638 my $cores = $conf->{cores} || 1;
4639 my $maxcpus = $sockets * $cores;
4641 $vcpus = $maxcpus if !$vcpus;
4643 die "you can
't add more vcpus than maxcpus\n"
4644 if $vcpus > $maxcpus;
4646 my $currentvcpus = $conf->{vcpus} || $maxcpus;
4648 if ($vcpus < $currentvcpus) {
4650 if (PVE::QemuServer::Machine::machine_version($machine_type, 2, 7)) {
4652 for (my $i = $currentvcpus; $i > $vcpus; $i--) {
4653 qemu_devicedel($vmid, "cpu$i");
4655 my $currentrunningvcpus = undef;
4657 $currentrunningvcpus = mon_cmd($vmid, "query-cpus-fast");
4658 last if scalar(@{$currentrunningvcpus}) == $i-1;
4659 raise_param_exc({ vcpus => "error unplugging cpu$i" }) if $retry > 5;
4663 # update conf after each successful cpu unplug
4664 $conf->{vcpus} = scalar(@{$currentrunningvcpus});
4665 PVE::QemuConfig->write_config($vmid, $conf);
4668 die "cpu hot-unplugging requires qemu version 2.7 or higher\n";
4674 my $currentrunningvcpus = mon_cmd($vmid, "query-cpus-fast");
4675 die "vcpus in running vm does not match its configuration\n"
4676 if scalar(@{$currentrunningvcpus}) != $currentvcpus;
4678 if (PVE::QemuServer::Machine::machine_version($machine_type, 2, 7)) {
4680 for (my $i = $currentvcpus+1; $i <= $vcpus; $i++) {
4681 my $cpustr = print_cpu_device($conf, $i);
4682 qemu_deviceadd($vmid, $cpustr);
4685 my $currentrunningvcpus = undef;
4687 $currentrunningvcpus = mon_cmd($vmid, "query-cpus-fast");
4688 last if scalar(@{$currentrunningvcpus}) == $i;
4689 raise_param_exc({ vcpus => "error hotplugging cpu$i" }) if $retry > 10;
4693 # update conf after each successful cpu hotplug
4694 $conf->{vcpus} = scalar(@{$currentrunningvcpus});
4695 PVE::QemuConfig->write_config($vmid, $conf);
4699 for (my $i = $currentvcpus; $i < $vcpus; $i++) {
4700 mon_cmd($vmid, "cpu-add", id => int($i));
# Apply I/O throttling limits to block device $deviceid of VM $vmid through
# the QMP 'block_set_io_throttle' command.
#
# Takes the bandwidth (bps*) and operation (iops*) limits as positional
# arguments: the base limits, their *_max burst values and the *_max_length
# burst durations. Does nothing (plain return) when the VM is not running.
# Every value is passed through int() so it is sent as a number.
4705 sub qemu_block_set_io_throttle {
4706 my ($vmid, $deviceid,
4707 $bps, $bps_rd, $bps_wr, $iops, $iops_rd, $iops_wr,
4708 $bps_max, $bps_rd_max, $bps_wr_max, $iops_max, $iops_rd_max, $iops_wr_max,
4709 $bps_max_length, $bps_rd_max_length, $bps_wr_max_length,
4710 $iops_max_length, $iops_rd_max_length, $iops_wr_max_length) = @_;
4712 return if !check_running($vmid) ;
4714 mon_cmd($vmid, "block_set_io_throttle", device => $deviceid,
4716 bps_rd => int($bps_rd),
4717 bps_wr => int($bps_wr),
4719 iops_rd => int($iops_rd),
4720 iops_wr => int($iops_wr),
4721 bps_max => int($bps_max),
4722 bps_rd_max => int($bps_rd_max),
4723 bps_wr_max => int($bps_wr_max),
4724 iops_max => int($iops_max),
4725 iops_rd_max => int($iops_rd_max),
4726 iops_wr_max => int($iops_wr_max),
4727 bps_max_length => int($bps_max_length),
4728 bps_rd_max_length => int($bps_rd_max_length),
4729 bps_wr_max_length => int($bps_wr_max_length),
4730 iops_max_length => int($iops_max_length),
4731 iops_rd_max_length => int($iops_rd_max_length),
4732 iops_wr_max_length => int($iops_wr_max_length),
# Resize volume $volid to $size.
#
# The storage layer is always asked to resize (it is told whether the VM is
# running); if that call returns false, $size is reset to 0. For a stopped VM
# nothing else happens. For a running VM the size is rounded up to the next
# multiple of 1024 before the monitor call that targets $deviceid.
# NOTE(review): the monitor call itself is only partly visible in this excerpt.
4737 sub qemu_block_resize {
4738 my ($vmid, $deviceid, $storecfg, $volid, $size) = @_;
4740 my $running = check_running($vmid);
4742 $size = 0 if !PVE::Storage::volume_resize($storecfg, $volid, $size, $running);
4744 return if !$running;
4746 my $padding = (1024 - $size % 1024) % 1024;
4747 $size = $size + $padding;
4752 device => $deviceid,
# Create snapshot $snap of volume $volid.
#
# When the VM is running and do_snapshots_with_qemu() says QEMU handles
# snapshots for this volume, an internal snapshot is taken through the
# monitor; the storage layer's volume_snapshot() is the other path.
# NOTE(review): the line joining the two paths is not visible in this excerpt;
# presumably they are mutually exclusive (if/else) - confirm.
4758 sub qemu_volume_snapshot {
4759 my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;
4761 my $running = check_running($vmid);
4763 if ($running && do_snapshots_with_qemu($storecfg, $volid, $deviceid)) {
4764 mon_cmd($vmid, 'blockdev-snapshot-internal-sync
', device => $deviceid, name => $snap);
4766 PVE::Storage::volume_snapshot($storecfg, $volid, $snap);
# Delete snapshot $snap of volume $volid.
#
# The VM config is loaded and $running is forced to 1 when one of its drives
# references $volid. When $running is set and do_snapshots_with_qemu() says
# QEMU handles snapshots for this volume, the internal snapshot is deleted
# through the monitor; the storage layer's volume_snapshot_delete() is the
# other path.
# NOTE(review): the condition around the config lookup and the line joining
# the two delete paths are not visible in this excerpt.
4770 sub qemu_volume_snapshot_delete {
4771 my ($vmid, $deviceid, $storecfg, $volid, $snap) = @_;
4773 my $running = check_running($vmid);
4778 my $conf = PVE::QemuConfig->load_config($vmid);
4779 PVE::QemuConfig->foreach_volume($conf, sub {
4780 my ($ds, $drive) = @_;
4781 $running = 1 if $drive->{file} eq $volid;
4785 if ($running && do_snapshots_with_qemu($storecfg, $volid, $deviceid)) {
4786 mon_cmd($vmid, 'blockdev-snapshot-delete-internal-sync
', device => $deviceid, name => $snap);
4788 PVE::Storage::volume_snapshot_delete($storecfg, $volid, $snap, $running);
# Configure the migration capabilities of VM $vmid.
#
# 'query-proxmox-support' is asked (inside eval, so a failure simply leaves
# the feature off) whether dirty-bitmap support is available; $savevm selects
# which support property is consulted. Every capability reported by
# 'query-migrate-capabilities' is then set to true or false according to the
# local table of enabled capabilities and sent in a single
# 'migrate-set-capabilities' command.
# NOTE(review): only part of the capability table is visible in this excerpt.
4792 sub set_migration_caps {
4793 my ($vmid, $savevm) = @_;
4795 my $qemu_support = eval { mon_cmd($vmid, "query-proxmox-support") };
4797 my $bitmap_prop = $savevm ? 'pbs-dirty-bitmap-savevm
' : 'pbs-dirty-bitmap-migration
';
4798 my $dirty_bitmaps = $qemu_support->{$bitmap_prop} ? 1 : 0;
4803 "auto-converge" => 1,
4805 "x-rdma-pin-all" => 0,
4808 "dirty-bitmaps" => $dirty_bitmaps,
4811 my $supported_capabilities = mon_cmd($vmid, "query-migrate-capabilities");
4813 for my $supported_capability (@$supported_capabilities) {
4815 capability => $supported_capability->{capability},
4816 state => $enabled_cap->{$supported_capability->{capability}} ? JSON::true : JSON::false,
4820 mon_cmd($vmid, "migrate-set-capabilities", capabilities => $cap_ref);
# Call $func once for every distinct volume referenced by a VM config
# (presumably the body of foreach_volid - the sub header is not visible in
# this excerpt).
#
# The current config and every snapshot section are walked, including unused
# volumes and the 'vmstate' key. Per volume id an attribute hash is built up:
#   cdrom                  - 1 only if every reference is a CD-ROM drive
#   replicate              - 1 if any reference has replication enabled
#                            (a drive's 'replicate' defaults to 1)
#   shared                 - 1 if any reference is marked shared
#   referenced_in_config   - 1 if referenced outside of snapshots
#   referenced_in_snapshot - hash of snapshot names referencing the volume
#   size                   - first non-zero size seen
#   is_vmstate / is_tpmstate / is_unused - derived from the config key
#   drivename              - the config key, when it is a valid drive name
# Finally $func->($volid, $attributes, @param) is invoked for each volume.
4824 my ($conf, $func, @param) = @_;
4828 my $test_volid = sub {
4829 my ($key, $drive, $snapname) = @_;
4831 my $volid = $drive->{file};
4834 $volhash->{$volid}->{cdrom} //= 1;
4835 $volhash->{$volid}->{cdrom} = 0 if !drive_is_cdrom($drive);
4837 my $replicate = $drive->{replicate} // 1;
4838 $volhash->{$volid}->{replicate} //= 0;
4839 $volhash->{$volid}->{replicate} = 1 if $replicate;
4841 $volhash->{$volid}->{shared} //= 0;
4842 $volhash->{$volid}->{shared} = 1 if $drive->{shared};
4844 $volhash->{$volid}->{referenced_in_config} //= 0;
4845 $volhash->{$volid}->{referenced_in_config} = 1 if !defined($snapname);
4847 $volhash->{$volid}->{referenced_in_snapshot}->{$snapname} = 1
4848 if defined($snapname);
4850 my $size = $drive->{size};
4851 $volhash->{$volid}->{size} //= $size if $size;
4853 $volhash->{$volid}->{is_vmstate} //= 0;
4854 $volhash->{$volid}->{is_vmstate} = 1 if $key eq 'vmstate
';
4856 $volhash->{$volid}->{is_tpmstate} //= 0;
4857 $volhash->{$volid}->{is_tpmstate} = 1 if $key eq 'tpmstate0
';
4859 $volhash->{$volid}->{is_unused} //= 0;
4860 $volhash->{$volid}->{is_unused} = 1 if $key =~ /^unused\d+$/;
4862 $volhash->{$volid}->{drivename} = $key if is_valid_drivename($key);
4865 my $include_opts = {
4866 extra_keys => ['vmstate
'],
4867 include_unused => 1,
4870 PVE::QemuConfig->foreach_volume_full($conf, $include_opts, $test_volid);
4871 foreach my $snapname (keys %{$conf->{snapshots}}) {
4872 my $snap = $conf->{snapshots}->{$snapname};
4873 PVE::QemuConfig->foreach_volume_full($snap, $include_opts, $test_volid, $snapname);
4876 foreach my $volid (keys %$volhash) {
4877 &$func($volid, $volhash->{$volid}, @param);
# Table of config options that the pending-changes code commits straight from
# the pending section into the live config, without any hotplug action.
# Every cloud-init option from $confdesc_cloudinit is added to the table.
# NOTE(review): most of the literal entries are not visible in this excerpt.
4881 my $fast_plug_option = {
4889 'vmstatestorage
' => 1,
4894 for my $opt (keys %$confdesc_cloudinit) {
4895 $fast_plug_option->{$opt} = 1;
4898 # hotplug changes in [PENDING]
4899 # $selection hash can be used to only apply specified options, for
4900 # example: { cores => 1 } (only apply changed 'cores')
4901 # $errors ref is used to return error messages
4902 sub vmconfig_hotplug_pending {
4903 my ($vmid, $conf, $storecfg, $selection, $errors) = @_;
4905 my $defaults = load_defaults();
4906 my $arch = get_vm_arch($conf);
4907 my $machine_type = get_vm_machine($conf, undef, $arch);
4909 # commit values which do not have any impact on running VM first
4910 # Note: those option cannot raise errors, we we do not care about
4911 # $selection and always apply them.
4913 my $add_error = sub {
4914 my ($opt, $msg) = @_;
4915 $errors->{$opt} = "hotplug problem - $msg";
4918 my $cloudinit_pending_properties = PVE::QemuServer::cloudinit_pending_properties();
4920 my $cloudinit_record_changed = sub {
4921 my ($conf, $opt, $old, $new) = @_;
4922 return if !$cloudinit_pending_properties->{$opt};
4924 my $ci = ($conf->{cloudinit} //= {});
4926 my $recorded = $ci->{$opt};
4927 my %added = map { $_ => 1 } PVE::Tools::split_list(delete($ci->{added}) // '');
4929 if (defined($new)) {
4930 if (defined($old)) {
4931 # an existing value is being modified
4932 if (defined($recorded)) {
4933 # the value was already not in sync
4934 if ($new eq $recorded) {
4935 # a value is being reverted to the cloud-init state:
4937 delete $added{$opt};
4939 # the value was changed multiple times, do nothing
4941 } elsif ($added{$opt}) {
4942 # the value had been marked as added and is being changed, do nothing
4944 # the value is new, record it:
4948 # a new value is being added
4949 if (defined($recorded)) {
4950 # it was already not in sync
4951 if ($new eq $recorded) {
4952 # a value is being reverted to the cloud-init state:
4954 delete $added{$opt};
4956 # the value had temporarily been removed, do nothing
4958 } elsif ($added{$opt}) {
4959 # the value had been marked as added already, do nothing
4961 # the value is new, add it
4965 } elsif (!defined($old)) {
4966 # a non-existent value is being removed? ignore...
4968 # a value is being deleted
4969 if (defined($recorded)) {
4970 # a value was already recorded, just keep it
4971 } elsif ($added{$opt}) {
4972 # the value was marked as added, remove it
4973 delete $added{$opt};
4975 # a previously unrecorded value is being removed, record the old value:
4980 my $added = join(',', sort keys %added);
4981 $ci->{added} = $added if length($added);
4985 foreach my $opt (keys %{$conf->{pending}}) { # add/change
4986 if ($fast_plug_option->{$opt}) {
4987 my $new = delete $conf->{pending}->{$opt};
4988 $cloudinit_record_changed->($conf, $opt, $conf->{$opt}, $new);
4989 $conf->{$opt} = $new;
4995 PVE::QemuConfig->write_config($vmid, $conf);
4998 my $ostype = $conf->{ostype};
4999 my $version = extract_version($machine_type, get_running_qemu_version($vmid));
5000 my $hotplug_features = parse_hotplug_features(defined($conf->{hotplug}) ? $conf->{hotplug} : '1');
5001 my $usb_hotplug = $hotplug_features->{usb}
5002 && min_version($version, 7, 1)
5003 && defined($ostype) && ($ostype eq 'l26
' || windows_version($ostype) > 7);
5005 my $cgroup = PVE::QemuServer::CGroup->new($vmid);
5006 my $pending_delete_hash = PVE::QemuConfig->parse_pending_delete($conf->{pending}->{delete});
5008 foreach my $opt (sort keys %$pending_delete_hash) {
5009 next if $selection && !$selection->{$opt};
5010 my $force = $pending_delete_hash->{$opt}->{force};
5012 if ($opt eq 'hotplug
') {
5013 die "skip\n" if ($conf->{hotplug} =~ /memory/);
5014 } elsif ($opt eq 'tablet
') {
5015 die "skip\n" if !$hotplug_features->{usb};
5016 if ($defaults->{tablet}) {
5017 vm_deviceplug($storecfg, $conf, $vmid, 'tablet
', $arch, $machine_type);
5018 vm_deviceplug($storecfg, $conf, $vmid, 'keyboard
', $arch, $machine_type)
5019 if $arch eq 'aarch64
';
5021 vm_deviceunplug($vmid, $conf, 'tablet
');
5022 vm_deviceunplug($vmid, $conf, 'keyboard
') if $arch eq 'aarch64
';
5024 } elsif ($opt =~ m/^usb(\d+)$/) {
5026 die "skip\n" if !$usb_hotplug;
5027 vm_deviceunplug($vmid, $conf, "usbredirdev$index"); # if it's a spice port
5028 vm_deviceunplug
($vmid, $conf, $opt);
5029 } elsif ($opt eq 'vcpus') {
5030 die "skip\n" if !$hotplug_features->{cpu
};
5031 qemu_cpu_hotplug
($vmid, $conf, undef);
5032 } elsif ($opt eq 'balloon') {
5033 # enable balloon device is not hotpluggable
5034 die "skip\n" if defined($conf->{balloon
}) && $conf->{balloon
} == 0;
5035 # here we reset the ballooning value to memory
5036 my $balloon = $conf->{memory
} || $defaults->{memory
};
5037 mon_cmd
($vmid, "balloon", value
=> $balloon*1024*1024);
5038 } elsif ($fast_plug_option->{$opt}) {
5040 } elsif ($opt =~ m/^net(\d+)$/) {
5041 die "skip\n" if !$hotplug_features->{network
};
5042 vm_deviceunplug
($vmid, $conf, $opt);
5043 } elsif (is_valid_drivename
($opt)) {
5044 die "skip\n" if !$hotplug_features->{disk
} || $opt =~ m/(ide|sata)(\d+)/;
5045 vm_deviceunplug
($vmid, $conf, $opt);
5046 vmconfig_delete_or_detach_drive
($vmid, $storecfg, $conf, $opt, $force);
5047 } elsif ($opt =~ m/^memory$/) {
5048 die "skip\n" if !$hotplug_features->{memory
};
5049 PVE
::QemuServer
::Memory
::qemu_memory_hotplug
($vmid, $conf, $defaults, $opt);
5050 } elsif ($opt eq 'cpuunits') {
5051 $cgroup->change_cpu_shares(undef);
5052 } elsif ($opt eq 'cpulimit') {
5053 $cgroup->change_cpu_quota(undef, undef); # reset, cgroup module can better decide values
5059 &$add_error($opt, $err) if $err ne "skip\n";
5061 my $old = delete $conf->{$opt};
5062 $cloudinit_record_changed->($conf, $opt, $old, undef);
5063 PVE
::QemuConfig-
>remove_from_pending_delete($conf, $opt);
5068 foreach my $opt (keys %{$conf->{pending
}}) {
5069 next if $selection && !$selection->{$opt};
5070 my $value = $conf->{pending
}->{$opt};
5072 if ($opt eq 'hotplug') {
5073 die "skip\n" if ($value =~ /memory/) || ($value !~ /memory/ && $conf->{hotplug
} =~ /memory/);
5074 } elsif ($opt eq 'tablet') {
5075 die "skip\n" if !$hotplug_features->{usb
};
5077 vm_deviceplug
($storecfg, $conf, $vmid, 'tablet', $arch, $machine_type);
5078 vm_deviceplug
($storecfg, $conf, $vmid, 'keyboard', $arch, $machine_type)
5079 if $arch eq 'aarch64';
5080 } elsif ($value == 0) {
5081 vm_deviceunplug
($vmid, $conf, 'tablet');
5082 vm_deviceunplug
($vmid, $conf, 'keyboard') if $arch eq 'aarch64';
5084 } elsif ($opt =~ m/^usb(\d+)$/) {
5086 die "skip\n" if !$usb_hotplug;
5087 my $d = eval { parse_property_string
($usbdesc->{format
}, $value) };
5089 if ($d->{host
} eq 'spice') {
5090 $id = "usbredirdev$index";
5092 qemu_usb_hotplug
($storecfg, $conf, $vmid, $id, $d, $arch, $machine_type);
5093 } elsif ($opt eq 'vcpus') {
5094 die "skip\n" if !$hotplug_features->{cpu
};
5095 qemu_cpu_hotplug
($vmid, $conf, $value);
5096 } elsif ($opt eq 'balloon') {
5097 # enabling/disabling the ballooning device is not hotpluggable
5098 my $old_balloon_enabled = !!(!defined($conf->{balloon
}) || $conf->{balloon
});
5099 my $new_balloon_enabled = !!(!defined($conf->{pending
}->{balloon
}) || $conf->{pending
}->{balloon
});
5100 die "skip\n" if $old_balloon_enabled != $new_balloon_enabled;
5102 # allow manual ballooning if shares is set to zero
5103 if ((defined($conf->{shares
}) && ($conf->{shares
} == 0))) {
5104 my $balloon = $conf->{pending
}->{balloon
} || $conf->{memory
} || $defaults->{memory
};
5105 mon_cmd
($vmid, "balloon", value
=> $balloon*1024*1024);
5107 } elsif ($opt =~ m/^net(\d+)$/) {
5108 # some changes can be done without hotplug
5109 vmconfig_update_net
($storecfg, $conf, $hotplug_features->{network
},
5110 $vmid, $opt, $value, $arch, $machine_type);
5111 } elsif (is_valid_drivename
($opt)) {
5112 die "skip\n" if $opt eq 'efidisk0' || $opt eq 'tpmstate0';
5113 # some changes can be done without hotplug
5114 my $drive = parse_drive
($opt, $value);
5115 if (drive_is_cloudinit
($drive)) {
5116 $cloudinit_opt = [$opt, $drive];
5117 # apply all the other changes first, then generate the cloudinit disk
5120 vmconfig_update_disk
($storecfg, $conf, $hotplug_features->{disk
},
5121 $vmid, $opt, $value, $arch, $machine_type);
5122 } elsif ($opt =~ m/^memory$/) { #dimms
5123 die "skip\n" if !$hotplug_features->{memory
};
5124 $value = PVE
::QemuServer
::Memory
::qemu_memory_hotplug
($vmid, $conf, $defaults, $opt, $value);
5125 } elsif ($opt eq 'cpuunits') {
5126 my $new_cpuunits = PVE
::CGroup
::clamp_cpu_shares
($conf->{pending
}->{$opt}); #clamp
5127 $cgroup->change_cpu_shares($new_cpuunits);
5128 } elsif ($opt eq 'cpulimit') {
5129 my $cpulimit = $conf->{pending
}->{$opt} == 0 ?
-1 : int($conf->{pending
}->{$opt} * 100000);
5130 $cgroup->change_cpu_quota($cpulimit, 100000);
5131 } elsif ($opt eq 'agent') {
5132 vmconfig_update_agent
($conf, $opt, $value);
5134 die "skip\n"; # skip non-hot-pluggable options
5138 &$add_error($opt, $err) if $err ne "skip\n";
5140 $cloudinit_record_changed->($conf, $opt, $conf->{$opt}, $value);
5141 $conf->{$opt} = $value;
5142 delete $conf->{pending
}->{$opt};
5146 if (defined($cloudinit_opt)) {
5147 my ($opt, $drive) = @$cloudinit_opt;
5148 my $value = $conf->{pending
}->{$opt};
5150 my $temp = {%$conf, $opt => $value};
5151 PVE
::QemuServer
::Cloudinit
::apply_cloudinit_config
($temp, $vmid);
5152 vmconfig_update_disk
($storecfg, $conf, $hotplug_features->{disk
},
5153 $vmid, $opt, $value, $arch, $machine_type);
5156 &$add_error($opt, $err) if $err ne "skip\n";
5158 $conf->{$opt} = $value;
5159 delete $conf->{pending
}->{$opt};
5163 # unplug xhci controller if no usb device is left
5166 for (my $i = 0; $i < $MAX_USB_DEVICES; $i++) {
5167 next if !defined($conf->{"usb$i"});
5172 vm_deviceunplug
($vmid, $conf, 'xhci');
5176 PVE
::QemuConfig-
>write_config($vmid, $conf);
5178 if ($hotplug_features->{cloudinit
} && PVE
::QemuServer
::Cloudinit
::has_changes
($conf)) {
5179 PVE
::QemuServer
::vmconfig_update_cloudinit_drive
($storecfg, $conf, $vmid);
# Frees the volume backing $drive when removal is forced ($force) or $key matches /^unused/,
# provided drive_is_cdrom($drive, 1) is false.
#
# If vm_is_volid_owner() confirms that the guest owns the volume, $authuser needs the
# 'Datastore.AllocateSpace' privilege on /storage/<storeid>, and the call dies when
# is_volume_in_use() reports the volume as still referenced. Otherwise the volume is released
# with PVE::Storage::vdisk_free().
# NOTE(review): the return values of the individual branches are not visible here - confirm
# what callers may rely on.
5183 sub try_deallocate_drive
{
5184 my ($storecfg, $vmid, $conf, $key, $drive, $rpcenv, $authuser, $force) = @_;
5186 if (($force || $key =~ /^unused/) && !drive_is_cdrom
($drive, 1)) {
5187 my $volid = $drive->{file
};
5188 if (vm_is_volid_owner
($storecfg, $vmid, $volid)) {
5189 my $sid = PVE
::Storage
::parse_volume_id
($volid);
# permission check happens before anything is freed
5190 $rpcenv->check($authuser, "/storage/$sid", ['Datastore.AllocateSpace']);
5192 # check if the disk is really unused
5193 die "unable to delete '$volid' - volume is still in use (snapshot?)\n"
5194 if PVE
::QemuServer
::Drive
::is_volume_in_use
($storecfg, $conf, $key, $volid);
5195 PVE
::Storage
::vdisk_free
($storecfg, $volid);
5198 # If vm is not owner of this disk remove from config
# Removes drive option $opt from a VM, either by deallocating its volume or by keeping the
# volume around as an unused disk.
#
# The drive is parsed from $conf->{$opt}; user and permission checks go through the current
# PVE::RPCEnvironment. The deallocation path requires 'VM.Config.Disk' on the VM and then
# delegates to try_deallocate_drive(); the other path calls vmconfig_register_unused_drive().
# NOTE(review): the condition selecting between the two paths is not visible here -
# presumably it is keyed on $force; confirm.
5206 sub vmconfig_delete_or_detach_drive
{
5207 my ($vmid, $storecfg, $conf, $opt, $force) = @_;
5209 my $drive = parse_drive
($opt, $conf->{$opt});
5211 my $rpcenv = PVE
::RPCEnvironment
::get
();
5212 my $authuser = $rpcenv->get_user();
5215 $rpcenv->check_vm_perm($authuser, $vmid, undef, ['VM.Config.Disk']);
5216 try_deallocate_drive
($storecfg, $vmid, $conf, $opt, $drive, $rpcenv, $authuser, $force);
5218 vmconfig_register_unused_drive
($storecfg, $vmid, $conf, $drive);
# Moves all pending changes of $conf into the active configuration and writes it out.
#
# Parameters:
#   $vmid, $conf, $storecfg - guest ID, its parsed config and the storage config
#   $errors          - hash ref; failures are stored as $errors->{$opt} with the message
#                      "unable to apply pending change $opt : <reason>"
#   $skip_cloud_init - when true, the cloud-init config is never regenerated by this call
#
# Returns early when $conf->{pending} has no keys. Pending deletes are handled first (drives
# go through vmconfig_delete_or_detach_drive(); 'unused*' keys are an internal error), then
# the remaining pending values replace the current ones, with a replaced drive being
# registered as unused beforehand.
# NOTE(review): where $err originates (presumably eval blocks around the drive calls) is not
# visible here - confirm.
5224 sub vmconfig_apply_pending
{
5225 my ($vmid, $conf, $storecfg, $errors, $skip_cloud_init) = @_;
5227 return if !scalar(keys %{$conf->{pending
}});
5229 my $add_apply_error = sub {
5230 my ($opt, $msg) = @_;
5231 my $err_msg = "unable to apply pending change $opt : $msg";
5232 $errors->{$opt} = $err_msg;
5238 my $pending_delete_hash = PVE
::QemuConfig-
>parse_pending_delete($conf->{pending
}->{delete});
5239 foreach my $opt (sort keys %$pending_delete_hash) {
5240 my $force = $pending_delete_hash->{$opt}->{force
};
5242 if ($opt =~ m/^unused/) {
5243 die "internal error";
5244 } elsif (defined($conf->{$opt}) && is_valid_drivename
($opt)) {
5245 vmconfig_delete_or_detach_drive
($vmid, $storecfg, $conf, $opt, $force);
5249 $add_apply_error->($opt, $err);
5251 PVE
::QemuConfig-
>remove_from_pending_delete($conf, $opt);
5252 delete $conf->{$opt};
5256 PVE
::QemuConfig-
>cleanup_pending($conf);
# 0 = regeneration explicitly disabled, undef = not decided yet; the '//= 1' further down can
# only turn an undecided state into 1, so a true $skip_cloud_init always wins
5258 my $generate_cloudinit = $skip_cloud_init ?
0 : undef;
5260 foreach my $opt (keys %{$conf->{pending
}}) { # add/change
5261 next if $opt eq 'delete'; # just to be sure
5263 if (defined($conf->{$opt}) && is_valid_drivename
($opt)) {
5264 vmconfig_register_unused_drive
($storecfg, $vmid, $conf, parse_drive
($opt, $conf->{$opt}))
5268 $add_apply_error->($opt, $err);
5271 if (is_valid_drivename
($opt)) {
5272 my $drive = parse_drive
($opt, $conf->{pending
}->{$opt});
5273 $generate_cloudinit //= 1 if drive_is_cloudinit
($drive);
5276 $conf->{$opt} = delete $conf->{pending
}->{$opt};
5280 # write all changes at once to avoid unnecessary i/o
5281 PVE
::QemuConfig-
>write_config($vmid, $conf);
5282 if ($generate_cloudinit) {
5283 if (PVE
::QemuServer
::Cloudinit
::apply_cloudinit_config
($conf, $vmid)) {
5284 # After successful generation and if there were changes to be applied, update the
5285 # config to drop the {cloudinit} entry.
5286 PVE
::QemuConfig-
>write_config($vmid, $conf);
# Applies a changed network device option $opt (new property string $value) to a VM.
#
# When $conf already holds $opt, the old and new settings (both run through parse_net()) are
# compared:
#  - a difference in model, macaddr or queues, or a bridge missing on either side, leads to
#    unplugging the device; this dies with "skip\n" unless $hotplug is set
#  - a difference in bridge, tag, trunks or firewall leads to tap_unplug()/tap_plug() calls on
#    the "tap${vmid}i<N>" interface, N being the number taken from $opt
#  - a difference in rate alone is handled by tap_rate_limit()
#  - a difference in link_down is forwarded to qemu_set_link_status()
# vm_deviceplug() is called with the parsed new settings to plug the device.
# NOTE(review): which tap_plug() variant (PVE::Network::SDN::Zones vs. PVE::Network) is chosen,
# and on which paths the sub returns before reaching vm_deviceplug(), is not visible here -
# confirm.
5291 sub vmconfig_update_net
{
5292 my ($storecfg, $conf, $hotplug, $vmid, $opt, $value, $arch, $machine_type) = @_;
5294 my $newnet = parse_net
($value);
5296 if ($conf->{$opt}) {
5297 my $oldnet = parse_net
($conf->{$opt});
5299 if (safe_string_ne
($oldnet->{model
}, $newnet->{model
}) ||
5300 safe_string_ne
($oldnet->{macaddr
}, $newnet->{macaddr
}) ||
5301 safe_num_ne
($oldnet->{queues
}, $newnet->{queues
}) ||
5302 !($newnet->{bridge
} && $oldnet->{bridge
})) { # bridge/nat mode change
5304 # for non online change, we try to hot-unplug
5305 die "skip\n" if !$hotplug;
5306 vm_deviceunplug
($vmid, $conf, $opt);
# the capture group of this match supplies $1 for the interface name below
5309 die "internal error" if $opt !~ m/net(\d+)/;
5310 my $iface = "tap${vmid}i$1";
5312 if (safe_string_ne
($oldnet->{bridge
}, $newnet->{bridge
}) ||
5313 safe_num_ne
($oldnet->{tag
}, $newnet->{tag
}) ||
5314 safe_string_ne
($oldnet->{trunks
}, $newnet->{trunks
}) ||
5315 safe_num_ne
($oldnet->{firewall
}, $newnet->{firewall
})) {
5316 PVE
::Network
::tap_unplug
($iface);
5319 PVE
::Network
::SDN
::Zones
::tap_plug
($iface, $newnet->{bridge
}, $newnet->{tag
}, $newnet->{firewall
}, $newnet->{trunks
}, $newnet->{rate
});
5321 PVE
::Network
::tap_plug
($iface, $newnet->{bridge
}, $newnet->{tag
}, $newnet->{firewall
}, $newnet->{trunks
}, $newnet->{rate
});
5323 } elsif (safe_num_ne
($oldnet->{rate
}, $newnet->{rate
})) {
5324 # Rate can be applied on its own but any change above needs to
5325 # include the rate in tap_plug since OVS resets everything.
5326 PVE
::Network
::tap_rate_limit
($iface, $newnet->{rate
});
5329 if (safe_string_ne
($oldnet->{link_down
}, $newnet->{link_down
})) {
# the status passed on is the negation of link_down, i.e. true means "link up"
5330 qemu_set_link_status
($vmid, $opt, !$newnet->{link_down
});
5338 vm_deviceplug
($storecfg, $conf, $vmid, $opt, $newnet, $arch, $machine_type);
# Checks whether a changed guest agent option ($opt => $value) only touches hotpluggable
# sub-options.
#
# Dies with "skip\n" when $conf has no true value for $opt, or when any sub-option not listed
# in $hotplug_options differs (per safe_string_ne) between the current config and $value.
# The comparison runs in both directions so that added, changed and removed sub-options are
# all caught. Returns nothing when the change is acceptable.
5344 sub vmconfig_update_agent
{
5345 my ($conf, $opt, $value) = @_;
5347 die "skip\n" if !$conf->{$opt};
# sub-options that may change without triggering a "skip"
5349 my $hotplug_options = { fstrim_cloned_disks
=> 1 };
5351 my $old_agent = parse_guest_agent
($conf);
5352 my $agent = parse_guest_agent
({$opt => $value});
5354 for my $option (keys %$agent) { # added/changed options
5355 next if defined($hotplug_options->{$option});
5356 die "skip\n" if safe_string_ne
($agent->{$option}, $old_agent->{$option});
5359 for my $option (keys %$old_agent) { # removed options
5360 next if defined($hotplug_options->{$option});
5361 die "skip\n" if safe_string_ne
($old_agent->{$option}, $agent->{$option});
5364 return; # either no actual change (e.g., format string reordered) or just hotpluggable changes
# Applies a changed drive option $opt (new property string $value) to a VM.
#
# When $conf->{$opt} exists and parses as a drive:
#  - dies with "unable to change media type\n" if the media type (treated as 'disk' when
#    unset) differs between the old and the new drive
#  - for a non-CD-ROM old drive with a different 'file', the old device is unplugged and its
#    volume registered as unused; this dies with "skip\n" unless $hotplug is set
#  - differences in any of the I/O throttle properties are pushed to the VM with
#    qemu_block_set_io_throttle()
#  - a 'file' of 'none' ejects the medium; any other value is resolved with get_iso_path()
#    and inserted via the "blockdev-change-medium" monitor command
# The final vm_deviceplug() path dies with "skip\n" without $hotplug or for ide/sata drives.
# NOTE(review): several branch, else and return lines are not visible here. In particular the
# action taken when discard/iothread/queues/cache/ssd/ro differ (presumably a "skip"), and the
# assumption that the eject/change-medium part is the CD-ROM branch, need to be confirmed.
5367 sub vmconfig_update_disk
{
5368 my ($storecfg, $conf, $hotplug, $vmid, $opt, $value, $arch, $machine_type) = @_;
5370 my $drive = parse_drive
($opt, $value);
5372 if ($conf->{$opt} && (my $old_drive = parse_drive
($opt, $conf->{$opt}))) {
5373 my $media = $drive->{media
} || 'disk';
5374 my $oldmedia = $old_drive->{media
} || 'disk';
5375 die "unable to change media type\n" if $media ne $oldmedia;
5377 if (!drive_is_cdrom
($old_drive)) {
5379 if ($drive->{file
} ne $old_drive->{file
}) {
5381 die "skip\n" if !$hotplug;
5383 # unplug and register as unused
5384 vm_deviceunplug
($vmid, $conf, $opt);
5385 vmconfig_register_unused_drive
($storecfg, $vmid, $conf, $old_drive)
5388 # update existing disk
5390 # skip non hotpluggable value
5391 if (safe_string_ne
($drive->{discard
}, $old_drive->{discard
}) ||
5392 safe_string_ne
($drive->{iothread
}, $old_drive->{iothread
}) ||
5393 safe_string_ne
($drive->{queues
}, $old_drive->{queues
}) ||
5394 safe_string_ne
($drive->{cache
}, $old_drive->{cache
}) ||
5395 safe_string_ne
($drive->{ssd
}, $old_drive->{ssd
}) ||
5396 safe_string_ne
($drive->{ro
}, $old_drive->{ro
})) {
5401 if (safe_num_ne
($drive->{mbps
}, $old_drive->{mbps
}) ||
5402 safe_num_ne
($drive->{mbps_rd
}, $old_drive->{mbps_rd
}) ||
5403 safe_num_ne
($drive->{mbps_wr
}, $old_drive->{mbps_wr
}) ||
5404 safe_num_ne
($drive->{iops
}, $old_drive->{iops
}) ||
5405 safe_num_ne
($drive->{iops_rd
}, $old_drive->{iops_rd
}) ||
5406 safe_num_ne
($drive->{iops_wr
}, $old_drive->{iops_wr
}) ||
5407 safe_num_ne
($drive->{mbps_max
}, $old_drive->{mbps_max
}) ||
5408 safe_num_ne
($drive->{mbps_rd_max
}, $old_drive->{mbps_rd_max
}) ||
5409 safe_num_ne
($drive->{mbps_wr_max
}, $old_drive->{mbps_wr_max
}) ||
5410 safe_num_ne
($drive->{iops_max
}, $old_drive->{iops_max
}) ||
5411 safe_num_ne
($drive->{iops_rd_max
}, $old_drive->{iops_rd_max
}) ||
5412 safe_num_ne
($drive->{iops_wr_max
}, $old_drive->{iops_wr_max
}) ||
5413 safe_num_ne
($drive->{bps_max_length
}, $old_drive->{bps_max_length
}) ||
5414 safe_num_ne
($drive->{bps_rd_max_length
}, $old_drive->{bps_rd_max_length
}) ||
5415 safe_num_ne
($drive->{bps_wr_max_length
}, $old_drive->{bps_wr_max_length
}) ||
5416 safe_num_ne
($drive->{iops_max_length
}, $old_drive->{iops_max_length
}) ||
5417 safe_num_ne
($drive->{iops_rd_max_length
}, $old_drive->{iops_rd_max_length
}) ||
5418 safe_num_ne
($drive->{iops_wr_max_length
}, $old_drive->{iops_wr_max_length
})) {
# mbps* values are multiplied by 1024*1024 before being passed on; unset rate limits fall
# back to 0 and unset *_max_length values fall back to 1
5420 qemu_block_set_io_throttle
(
5422 ($drive->{mbps
} || 0)*1024*1024,
5423 ($drive->{mbps_rd
} || 0)*1024*1024,
5424 ($drive->{mbps_wr
} || 0)*1024*1024,
5425 $drive->{iops
} || 0,
5426 $drive->{iops_rd
} || 0,
5427 $drive->{iops_wr
} || 0,
5428 ($drive->{mbps_max
} || 0)*1024*1024,
5429 ($drive->{mbps_rd_max
} || 0)*1024*1024,
5430 ($drive->{mbps_wr_max
} || 0)*1024*1024,
5431 $drive->{iops_max
} || 0,
5432 $drive->{iops_rd_max
} || 0,
5433 $drive->{iops_wr_max
} || 0,
5434 $drive->{bps_max_length
} || 1,
5435 $drive->{bps_rd_max_length
} || 1,
5436 $drive->{bps_wr_max_length
} || 1,
5437 $drive->{iops_max_length
} || 1,
5438 $drive->{iops_rd_max_length
} || 1,
5439 $drive->{iops_wr_max_length
} || 1,
5449 if ($drive->{file
} eq 'none') {
5450 mon_cmd
($vmid, "eject", force
=> JSON
::true
, id
=> "$opt");
5451 if (drive_is_cloudinit
($old_drive)) {
5452 vmconfig_register_unused_drive
($storecfg, $vmid, $conf, $old_drive);
5455 my $path = get_iso_path
($storecfg, $vmid, $drive->{file
});
5457 # force eject if locked
5458 mon_cmd
($vmid, "eject", force
=> JSON
::true
, id
=> "$opt");
5461 mon_cmd
($vmid, "blockdev-change-medium",
5462 id
=> "$opt", filename
=> "$path");
# drives whose name contains ide<N> or sata<N> are never plugged on this path
5470 die "skip\n" if !$hotplug || $opt =~ m/(ide|sata)(\d+)/;
# files given as a path below /dev/ are not handed to activate_volumes()
5472 PVE
::Storage
::activate_volumes
($storecfg, [$drive->{file
}]) if $drive->{file
} !~ m
|^/dev/.+|;
5473 vm_deviceplug
($storecfg, $conf, $vmid, $opt, $drive, $arch, $machine_type);
# Regenerates the cloud-init data of a VM and swaps the result into its cloud-init drive.
#
# The drive is located by walking all volumes of $conf; if more than one volume satisfies
# drive_is_cloudinit(), the one visited last is used. Returns without doing anything when no
# such drive exists. The config is written back when apply_cloudinit_config() returns true.
# The medium is then ejected and re-inserted from the storage path of the drive via the
# "eject" and "blockdev-change-medium" monitor commands.
# NOTE(review): $running is computed below, but the condition guarding the monitor commands is
# not visible here - presumably they are only issued for a running VM; confirm.
5476 sub vmconfig_update_cloudinit_drive
{
5477 my ($storecfg, $conf, $vmid) = @_;
5479 my $cloudinit_ds = undef;
5480 my $cloudinit_drive = undef;
5482 PVE
::QemuConfig-
>foreach_volume($conf, sub {
5483 my ($ds, $drive) = @_;
5484 if (PVE
::QemuServer
::drive_is_cloudinit
($drive)) {
5485 $cloudinit_ds = $ds;
5486 $cloudinit_drive = $drive;
5490 return if !$cloudinit_drive;
5492 if (PVE
::QemuServer
::Cloudinit
::apply_cloudinit_config
($conf, $vmid)) {
5493 PVE
::QemuConfig-
>write_config($vmid, $conf);
5496 my $running = PVE
::QemuServer
::check_running
($vmid);
5499 my $path = PVE
::Storage
::path
($storecfg, $cloudinit_drive->{file
});
5501 mon_cmd
($vmid, "eject", force
=> JSON
::true
, id
=> "$cloudinit_ds");
5502 mon_cmd
($vmid, "blockdev-change-medium", id
=> "$cloudinit_ds", filename
=> "$path");
5507 # called in locked context by incoming migration
#
# Collects the volumes of $conf that are neither CD-ROMs, nor the 'tpmstate0' drive, nor
# located on a storage whose config has 'shared' set.
#
# Returns a hash ref mapping the drive key to
#   [$volid, $storeid, $volname, $drive, $use_existing]
# where $use_existing is 1 if $replicated_volumes holds a true value for the volid, else 0.
# NOTE(review): lines between reading $volid and parsing it are not visible here; additional
# filters may exist - confirm.
5508 sub vm_migrate_get_nbd_disks
{
5509 my ($storecfg, $conf, $replicated_volumes) = @_;
5511 my $local_volumes = {};
5512 PVE
::QemuConfig-
>foreach_volume($conf, sub {
5513 my ($ds, $drive) = @_;
5515 return if drive_is_cdrom
($drive);
5516 return if $ds eq 'tpmstate0';
5518 my $volid = $drive->{file
};
5522 my ($storeid, $volname) = PVE
::Storage
::parse_volume_id
($volid);
5524 my $scfg = PVE
::Storage
::storage_config
($storecfg, $storeid);
5525 return if $scfg->{shared
};
5527 # replicated disks re-use existing state via bitmap
5528 my $use_existing = $replicated_volumes->{$volid} ?
1 : 0;
5529 $local_volumes->{$ds} = [$volid, $storeid, $volname, $drive, $use_existing];
5531 return $local_volumes;
5534 # called in locked context by incoming migration
#
# Prepares the target volumes for the drives listed in $source_volumes; each entry is an
# array ref of [$volid, $storeid, $volname, $drive, $use_existing, $format].
#
# Entries with $use_existing set are recorded as-is and flagged 'replicated'. For the others
# a new volume is allocated with PVE::Storage::vdisk_alloc() on the storage picked via
# $storagemap (unless $storagemap->{identity} is set), using $drive->{size} / 1024 as size.
# Per drive key, $nbd receives 'drivestr' (print_drive() output) and 'volid'.
# NOTE(review): the declaration of $nbd, the branch separating the replicated from the
# allocating path, and the return statement are not visible here - confirm.
5535 sub vm_migrate_alloc_nbd_disks
{
5536 my ($storecfg, $vmid, $source_volumes, $storagemap) = @_;
5539 foreach my $opt (sort keys %$source_volumes) {
5540 my ($volid, $storeid, $volname, $drive, $use_existing, $format) = @{$source_volumes->{$opt}};
5542 if ($use_existing) {
5543 $nbd->{$opt}->{drivestr
} = print_drive
($drive);
5544 $nbd->{$opt}->{volid
} = $volid;
5545 $nbd->{$opt}->{replicated
} = 1;
5549 # storage mapping + volname = regular migration
5550 # storage mapping + format = remote migration
5551 # order of precedence, filtered by whether storage supports it:
5552 # 1. explicit requested format
5553 # 2. format of current volume
5554 # 3. default format of storage
5555 if (!$storagemap->{identity
}) {
5556 $storeid = PVE
::JSONSchema
::map_id
($storagemap, $storeid);
5557 my ($defFormat, $validFormats) = PVE
::Storage
::storage_default_format
($storecfg, $storeid);
5558 if (!$format || !grep { $format eq $_ } @$validFormats) {
5560 my $scfg = PVE
::Storage
::storage_config
($storecfg, $storeid);
5561 my $fileFormat = qemu_img_format
($scfg, $volname);
5562 $format = $fileFormat
5563 if grep { $fileFormat eq $_ } @$validFormats;
5565 $format //= $defFormat;
5568 # can't happen for remote migration, so $volname is always defined
5569 my $scfg = PVE
::Storage
::storage_config
($storecfg, $storeid);
5570 $format = qemu_img_format
($scfg, $volname);
5573 my $size = $drive->{size
} / 1024;
5574 my $newvolid = PVE
::Storage
::vdisk_alloc
($storecfg, $storeid, $vmid, $format, undef, $size);
# $newdrive is the same hash reference as $drive, so the two assignments below also change
# the drive hash stored in $source_volumes
5575 my $newdrive = $drive;
5576 $newdrive->{format
} = $format;
5577 $newdrive->{file
} = $newvolid;
5578 my $drivestr = print_drive
($newdrive);
5579 $nbd->{$opt}->{drivestr
} = $drivestr;
5580 $nbd->{$opt}->{volid
} = $newvolid;
5586 # see vm_start_nolock for parameters, additionally:
5588 # storagemap = parsed storage map for allocating NBD disks
5590 my ($storecfg, $vmid, $params, $migrate_opts) = @_;
5592 return PVE
::QemuConfig-
>lock_config($vmid, sub {
5593 my $conf = PVE
::QemuConfig-
>load_config($vmid, $migrate_opts->{migratedfrom
});
5595 die "you can't start a vm if it's a template\n"
5596 if !$params->{skiptemplate
} && PVE
::QemuConfig-
>is_template($conf);
5598 my $has_suspended_lock = PVE
::QemuConfig-
>has_lock($conf, 'suspended');
5599 my $has_backup_lock = PVE
::QemuConfig-
>has_lock($conf, 'backup');
5601 my $running = check_running
($vmid, undef, $migrate_opts->{migratedfrom
});
5603 if ($has_backup_lock && $running) {
5604 # a backup is currently running, attempt to start the guest in the
5605 # existing QEMU instance
5606 return vm_resume
($vmid);
5609 PVE
::QemuConfig-
>check_lock($conf)
5610 if !($params->{skiplock
} || $has_suspended_lock);
5612 $params->{resume
} = $has_suspended_lock || defined($conf->{vmstate
});
5614 die "VM $vmid already running\n" if $running;
5616 if (my $storagemap = $migrate_opts->{storagemap
}) {
5617 my $replicated = $migrate_opts->{replicated_volumes
};
5618 my $disks = vm_migrate_get_nbd_disks
($storecfg, $conf, $replicated);
5619 $migrate_opts->{nbd
} = vm_migrate_alloc_nbd_disks
($storecfg, $vmid, $disks, $storagemap);
5621 foreach my $opt (keys %{$migrate_opts->{nbd
}}) {
5622 $conf->{$opt} = $migrate_opts->{nbd
}->{$opt}->{drivestr
};
5626 return vm_start_nolock
($storecfg, $vmid, $conf, $params, $migrate_opts);
5632 # statefile => 'tcp', 'unix' for migration or path/volid for RAM state
5633 # skiplock => 0/1, skip checking for config lock
5634 # skiptemplate => 0/1, skip checking whether VM is template
5635 # forcemachine => to force QEMU machine (rollback/migration)
5636 # forcecpu => a QEMU '-cpu' argument string to override get_cpu_options
5637 # timeout => in seconds
5638 # paused => start VM in paused state (backup)
5639 # resume => resume from hibernation
5650 # nbd => volumes for NBD exports (vm_migrate_alloc_nbd_disks)
5651 # migratedfrom => source node
5652 # spice_ticket => used for spice migration, passed via tunnel/stdin
5653 # network => CIDR of migration network
5654 # type => secure/insecure - tunnel over encrypted connection or plain-text
5655 # nbd_proto_version => int, 0 for TCP, 1 for UNIX
5656 # replicated_volumes => which volids should be re-used with bitmaps for nbd migration
5657 # offline_volumes => new volids of offline migrated disks like tpmstate and cloudinit, not yet
5658 # contained in config
5659 sub vm_start_nolock
{
5660 my ($storecfg, $vmid, $conf, $params, $migrate_opts) = @_;
5662 my $statefile = $params->{statefile
};
5663 my $resume = $params->{resume
};
5665 my $migratedfrom = $migrate_opts->{migratedfrom
};
5666 my $migration_type = $migrate_opts->{type
};
5670 # clean up leftover reboot request files
5671 eval { clear_reboot_request
($vmid); };
5674 if (!$statefile && scalar(keys %{$conf->{pending
}})) {
5675 vmconfig_apply_pending
($vmid, $conf, $storecfg);
5676 $conf = PVE
::QemuConfig-
>load_config($vmid); # update/reload
5679 # don't regenerate the ISO if the VM is started as part of a live migration
5680 # this way we can reuse the old ISO with the correct config
5681 if (!$migratedfrom) {
5682 if (PVE
::QemuServer
::Cloudinit
::apply_cloudinit_config
($conf, $vmid)) {
5683 # FIXME: apply_cloudinit_config updates $conf in this case, and it would only drop
5684 # $conf->{cloudinit}, so we could just not do this?
5685 # But we do it above, so for now let's be consistent.
5686 $conf = PVE
::QemuConfig-
>load_config($vmid); # update/reload
5690 # override offline migrated volumes, conf is out of date still
5691 if (my $offline_volumes = $migrate_opts->{offline_volumes
}) {
5692 for my $key (sort keys $offline_volumes->%*) {
5693 my $parsed = parse_drive
($key, $conf->{$key});
5694 $parsed->{file
} = $offline_volumes->{$key};
5695 $conf->{$key} = print_drive
($parsed);
5699 my $defaults = load_defaults
();
5701 # set environment variable useful inside network script
5702 # for remote migration the config is available on the target node!
5703 if (!$migrate_opts->{remote_node
}) {
5704 $ENV{PVE_MIGRATED_FROM
} = $migratedfrom;
5707 PVE
::GuestHelpers
::exec_hookscript
($conf, $vmid, 'pre-start', 1);
5709 my $forcemachine = $params->{forcemachine
};
5710 my $forcecpu = $params->{forcecpu
};
5712 # enforce machine and CPU type on suspended vm to ensure HW compatibility
5713 $forcemachine = $conf->{runningmachine
};
5714 $forcecpu = $conf->{runningcpu
};
5715 print "Resuming suspended VM\n";
5718 my ($cmd, $vollist, $spice_port) = config_to_command
($storecfg, $vmid,
5719 $conf, $defaults, $forcemachine, $forcecpu, $params->{'pbs-backing'});
5722 my $get_migration_ip = sub {
5723 my ($nodename) = @_;
5725 return $migration_ip if defined($migration_ip);
5727 my $cidr = $migrate_opts->{network
};
5729 if (!defined($cidr)) {
5730 my $dc_conf = PVE
::Cluster
::cfs_read_file
('datacenter.cfg');
5731 $cidr = $dc_conf->{migration
}->{network
};
5734 if (defined($cidr)) {
5735 my $ips = PVE
::Network
::get_local_ip_from_cidr
($cidr);
5737 die "could not get IP: no address configured on local " .
5738 "node for network '$cidr'\n" if scalar(@$ips) == 0;
5740 die "could not get IP: multiple addresses configured on local " .
5741 "node for network '$cidr'\n" if scalar(@$ips) > 1;
5743 $migration_ip = @$ips[0];
5746 $migration_ip = PVE
::Cluster
::remote_node_ip
($nodename, 1)
5747 if !defined($migration_ip);
5749 return $migration_ip;
5753 if ($statefile eq 'tcp') {
5754 my $migrate = $res->{migrate
} = { proto
=> 'tcp' };
5755 $migrate->{addr
} = "localhost";
5756 my $datacenterconf = PVE
::Cluster
::cfs_read_file
('datacenter.cfg');
5757 my $nodename = nodename
();
5759 if (!defined($migration_type)) {
5760 if (defined($datacenterconf->{migration
}->{type
})) {
5761 $migration_type = $datacenterconf->{migration
}->{type
};
5763 $migration_type = 'secure';
5767 if ($migration_type eq 'insecure') {
5768 $migrate->{addr
} = $get_migration_ip->($nodename);
5769 $migrate->{addr
} = "[$migrate->{addr}]" if Net
::IP
::ip_is_ipv6
($migrate->{addr
});
5772 my $pfamily = PVE
::Tools
::get_host_address_family
($nodename);
5773 $migrate->{port
} = PVE
::Tools
::next_migrate_port
($pfamily);
5774 $migrate->{uri
} = "tcp:$migrate->{addr}:$migrate->{port}";
5775 push @$cmd, '-incoming', $migrate->{uri
};
5778 } elsif ($statefile eq 'unix') {
5779 # should be default for secure migrations as a ssh TCP forward
5780 # tunnel is not reliably ready within a deterministic time and regularly fails
5781 # to set up in time, so use UNIX socket forwards
5782 my $migrate = $res->{migrate
} = { proto
=> 'unix' };
5783 $migrate->{addr
} = "/run/qemu-server/$vmid.migrate";
5784 unlink $migrate->{addr
};
5786 $migrate->{uri
} = "unix:$migrate->{addr}";
5787 push @$cmd, '-incoming', $migrate->{uri
};
5790 } elsif (-e
$statefile) {
5791 push @$cmd, '-loadstate', $statefile;
5793 my $statepath = PVE
::Storage
::path
($storecfg, $statefile);
5794 push @$vollist, $statefile;
5795 push @$cmd, '-loadstate', $statepath;
5797 } elsif ($params->{paused
}) {
5801 my $start_timeout = $params->{timeout
} // config_aware_timeout
($conf, $resume);
5803 my $pci_devices = {}; # host pci devices
5804 for (my $i = 0; $i < $PVE::QemuServer
::PCI
::MAX_HOSTPCI_DEVICES
; $i++) {
5805 my $dev = $conf->{"hostpci$i"} or next;
5806 $pci_devices->{$i} = parse_hostpci
($dev);
5809 # do not reserve pciid for mediated devices, sysfs will error out for duplicate assignment
5810 my $real_pci_devices = [ grep { !(defined($_->{mdev
}) && scalar($_->{pciid
}->@*) == 1) } values $pci_devices->%* ];
5812 # map to a flat list of pci ids
5813 my $pci_id_list = [ map { $_->{id
} } map { $_->{pciid
}->@* } $real_pci_devices->@* ];
5815 # reserve all PCI IDs before actually doing anything with them
5816 PVE
::QemuServer
::PCI
::reserve_pci_usage
($pci_id_list, $vmid, $start_timeout);
5820 for my $id (sort keys %$pci_devices) {
5821 my $d = $pci_devices->{$id};
5822 for my $dev ($d->{pciid
}->@*) {
5823 my $info = PVE
::QemuServer
::PCI
::prepare_pci_device
($vmid, $dev->{id
}, $id, $d->{mdev
});
5825 # nvidia grid needs the uuid of the mdev as qemu parameter
5826 if ($d->{mdev
} && !defined($uuid) && $info->{vendor
} eq '10de') {
5827 $uuid = PVE
::QemuServer
::PCI
::generate_mdev_uuid
($vmid, $id);
5831 push @$cmd, '-uuid', $uuid if defined($uuid);
5834 eval { cleanup_pci_devices
($vmid, $conf) };
5839 PVE
::Storage
::activate_volumes
($storecfg, $vollist);
5842 run_command
(['/bin/systemctl', 'stop', "$vmid.scope"], outfunc
=> sub{}, errfunc
=> sub{});
5844 # Issues with the above 'stop' not being fully completed are extremely rare, a very low
5845 # timeout should be more than enough here...
5846 PVE
::Systemd
::wait_for_unit_removed
("$vmid.scope", 20);
5848 my $cpuunits = PVE
::CGroup
::clamp_cpu_shares
($conf->{cpuunits
});
5851 timeout
=> $statefile ?
undef : $start_timeout,
5856 # when migrating, prefix QEMU output so other side can pick up any
5857 # errors that might occur and show the user
5858 if ($migratedfrom) {
5859 $run_params{quiet
} = 1;
5860 $run_params{logfunc
} = sub { print "QEMU: $_[0]\n" };
5863 my %systemd_properties = (
5864 Slice
=> 'qemu.slice',
5865 KillMode
=> 'process',
5867 TimeoutStopUSec
=> ULONG_MAX
, # infinity
5870 if (PVE
::CGroup
::cgroup_mode
() == 2) {
5871 $systemd_properties{CPUWeight
} = $cpuunits;
5873 $systemd_properties{CPUShares
} = $cpuunits;
5876 if (my $cpulimit = $conf->{cpulimit
}) {
5877 $systemd_properties{CPUQuota
} = int($cpulimit * 100);
5879 $systemd_properties{timeout
} = 10 if $statefile; # setting up the scope shoul be quick
5881 my $run_qemu = sub {
5882 PVE
::Tools
::run_fork
sub {
5883 PVE
::Systemd
::enter_systemd_scope
($vmid, "Proxmox VE VM $vmid", %systemd_properties);
5886 if (my $tpm = $conf->{tpmstate0
}) {
5887 # start the TPM emulator so QEMU can connect on start
5888 $tpmpid = start_swtpm
($storecfg, $vmid, $tpm, $migratedfrom);
5891 my $exitcode = run_command
($cmd, %run_params);
5894 warn "stopping swtpm instance (pid $tpmpid) due to QEMU startup error\n";
5895 kill 'TERM', $tpmpid;
5897 die "QEMU exited with code $exitcode\n";
5902 if ($conf->{hugepages
}) {
5905 my $hugepages_topology = PVE
::QemuServer
::Memory
::hugepages_topology
($conf);
5906 my $hugepages_host_topology = PVE
::QemuServer
::Memory
::hugepages_host_topology
();
5908 PVE
::QemuServer
::Memory
::hugepages_mount
();
5909 PVE
::QemuServer
::Memory
::hugepages_allocate
($hugepages_topology, $hugepages_host_topology);
5911 eval { $run_qemu->() };
5913 PVE
::QemuServer
::Memory
::hugepages_reset
($hugepages_host_topology)
5914 if !$conf->{keephugepages
};
5918 PVE
::QemuServer
::Memory
::hugepages_pre_deallocate
($hugepages_topology)
5919 if !$conf->{keephugepages
};
5921 eval { PVE
::QemuServer
::Memory
::hugepages_update_locked
($code); };
5924 eval { $run_qemu->() };
5928 # deactivate volumes if start fails
5929 eval { PVE
::Storage
::deactivate_volumes
($storecfg, $vollist); };
5931 eval { cleanup_pci_devices
($vmid, $conf) };
5934 die "start failed: $err";
5937 # re-reserve all PCI IDs now that we can know the actual VM PID
5938 my $pid = PVE
::QemuServer
::Helpers
::vm_running_locally
($vmid);
5939 eval { PVE
::QemuServer
::PCI
::reserve_pci_usage
($pci_id_list, $vmid, undef, $pid) };
5942 if (defined($res->{migrate
})) {
5943 print "migration listens on $res->{migrate}->{uri}\n";
5944 } elsif ($statefile) {
5945 eval { mon_cmd
($vmid, "cont"); };
5949 #start nbd server for storage migration
5950 if (my $nbd = $migrate_opts->{nbd
}) {
5951 my $nbd_protocol_version = $migrate_opts->{nbd_proto_version
} // 0;
5953 my $migrate_storage_uri;
5954 # nbd_protocol_version > 0 for unix socket support
5955 if ($nbd_protocol_version > 0 && ($migration_type eq 'secure' || $migration_type eq 'websocket')) {
5956 my $socket_path = "/run/qemu-server/$vmid\_nbd.migrate";
5957 mon_cmd
($vmid, "nbd-server-start", addr
=> { type
=> 'unix', data
=> { path
=> $socket_path } } );
5958 $migrate_storage_uri = "nbd:unix:$socket_path";
5959 $res->{migrate
}->{unix_sockets
} = [$socket_path];
5961 my $nodename = nodename
();
5962 my $localip = $get_migration_ip->($nodename);
5963 my $pfamily = PVE
::Tools
::get_host_address_family
($nodename);
5964 my $storage_migrate_port = PVE
::Tools
::next_migrate_port
($pfamily);
5966 mon_cmd
($vmid, "nbd-server-start", addr
=> {
5969 host
=> "${localip}",
5970 port
=> "${storage_migrate_port}",
5973 $localip = "[$localip]" if Net
::IP
::ip_is_ipv6
($localip);
5974 $migrate_storage_uri = "nbd:${localip}:${storage_migrate_port}";
5977 foreach my $opt (sort keys %$nbd) {
5978 my $drivestr = $nbd->{$opt}->{drivestr
};
5979 my $volid = $nbd->{$opt}->{volid
};
5980 mon_cmd
($vmid, "nbd-server-add", device
=> "drive-$opt", writable
=> JSON
::true
);
5981 my $nbd_uri = "$migrate_storage_uri:exportname=drive-$opt";
5982 print "storage migration listens on $nbd_uri volume:$drivestr\n";
5983 print "re-using replicated volume: $opt - $volid\n"
5984 if $nbd->{$opt}->{replicated
};
5986 $res->{drives
}->{$opt} = $nbd->{$opt};
5987 $res->{drives
}->{$opt}->{nbd_uri
} = $nbd_uri;
5991 if ($migratedfrom) {
5993 set_migration_caps
($vmid);
5998 print "spice listens on port $spice_port\n";
5999 $res->{spice_port
} = $spice_port;
6000 if ($migrate_opts->{spice_ticket
}) {
6001 mon_cmd
($vmid, "set_password", protocol
=> 'spice', password
=>
6002 $migrate_opts->{spice_ticket
});
6003 mon_cmd
($vmid, "expire_password", protocol
=> 'spice', time => "+30");
6008 mon_cmd
($vmid, "balloon", value
=> $conf->{balloon
}*1024*1024)
6009 if !$statefile && $conf->{balloon
};
6011 foreach my $opt (keys %$conf) {
6012 next if $opt !~ m/^net\d+$/;
6013 my $nicconf = parse_net
($conf->{$opt});
6014 qemu_set_link_status
($vmid, $opt, 0) if $nicconf->{link_down
};
6016 add_nets_bridge_fdb
($conf, $vmid);
6019 mon_cmd
($vmid, 'qom-set',
6020 path
=> "machine/peripheral/balloon0",
6021 property
=> "guest-stats-polling-interval",
6022 value
=> 2) if (!defined($conf->{balloon
}) || $conf->{balloon
});
6025 print "Resumed VM, removing state\n";
6026 if (my $vmstate = $conf->{vmstate
}) {
6027 PVE
::Storage
::deactivate_volumes
($storecfg, [$vmstate]);
6028 PVE
::Storage
::vdisk_free
($storecfg, $vmstate);
6030 delete $conf->@{qw(lock vmstate runningmachine runningcpu)};
6031 PVE
::QemuConfig-
>write_config($vmid, $conf);
6034 PVE
::GuestHelpers
::exec_hookscript
($conf, $vmid, 'post-start');
# Build the QEMU command line for a VM and return it as one string.
#
# $storecfg: storage configuration, forwarded to config_to_command()
# $vmid:     ID of the VM whose configuration is loaded
# $snapname: snapshot name looked up in $conf->{snapshots}
#
# Dies with "snapshot '<name>' does not exist" when the lookup yields undef.
# NOTE(review): the lines that guard the snapshot handling are not visible in
# this extract; presumably it only runs when $snapname is set - confirm.
6039 sub vm_commandline
{
6040 my ($storecfg, $vmid, $snapname) = @_;
6042 my $conf = PVE
::QemuConfig-
>load_config($vmid);
6044 my ($forcemachine, $forcecpu);
6046 my $snapshot = $conf->{snapshots
}->{$snapname};
6047 die "snapshot '$snapname' does not exist\n" if !defined($snapshot);
6049 # check for machine or CPU overrides in snapshot
6050 $forcemachine = $snapshot->{runningmachine
};
6051 $forcecpu = $snapshot->{runningcpu
};
6053 $snapshot->{digest
} = $conf->{digest
}; # keep file digest for API
6058 my $defaults = load_defaults
();
# the forced machine/CPU values (if any) are passed on as overrides
6060 my $cmd = config_to_command
($storecfg, $vmid, $conf, $defaults, $forcemachine, $forcecpu);
# flatten the command array into a single printable string
6062 return PVE
::Tools
::cmd2string
($cmd);
# NOTE(review): the `sub` header line is not visible in this extract;
# presumably this is the body of vm_reset - confirm.
#
# Takes the config lock of $vmid, loads the config, verifies that no lock is
# set in it (skipped when $skiplock is true) and then sends the
# "system_reset" monitor command to the VM.
6066 my ($vmid, $skiplock) = @_;
6068 PVE
::QemuConfig-
>lock_config($vmid, sub {
6070 my $conf = PVE
::QemuConfig-
>load_config($vmid);
6072 PVE
::QemuConfig-
>check_lock($conf) if !$skiplock;
6074 mon_cmd
($vmid, "system_reset");
# Collect the volume IDs referenced by a VM configuration.
#
# Walks $conf with foreach_volid() and pushes each volume ID onto $vollist.
# Volume IDs that start with '/' (absolute paths) are skipped.
# NOTE(review): the argument unpacking, the declaration of $vollist and the
# return statement are not visible in this extract.
6078 sub get_vm_volumes
{
6082 foreach_volid
($conf, sub {
6083 my ($volid, $attr) = @_;
# absolute paths are not storage-managed volumes
6085 return if $volid =~ m
|^/|;
# second argument 1: presumably "no error" mode, so unparsable IDs do not die - confirm
6087 my ($sid, $volname) = PVE
::Storage
::parse_volume_id
($volid, 1);
6090 push @$vollist, $volid;
# Release host PCI resources associated with a VM.
#
# $vmid: VM ID
# $conf: VM configuration; only keys of the form hostpci<N> are examined
#
# For every hostpci<N> entry the matching mediated-device UUID is derived from
# ($vmid, N) and, if the device still exists in sysfs, it is removed by
# writing "1" to its `remove` file. Finally the PCI reservation of the VM is
# dropped.
6096 sub cleanup_pci_devices
{
6097 my ($vmid, $conf) = @_;
6099 foreach my $key (keys %$conf) {
6100 next if $key !~ m/^hostpci(\d+)$/;
6101 my $hostpciindex = $1;
6102 my $uuid = PVE
::SysFSTools
::generate_mdev_uuid
($vmid, $hostpciindex);
# NOTE(review): how $d is used is not visible in this extract
6103 my $d = parse_hostpci
($conf->{$key});
6105 # NOTE: avoid PVE::SysFSTools::pci_cleanup_mdev_device as it requires PCI ID and we
6106 # don't want to break ABI just for this two liner
6107 my $dev_sysfs_dir = "/sys/bus/mdev/devices/$uuid";
6108 PVE
::SysFSTools
::file_write
("$dev_sysfs_dir/remove", "1") if -e
$dev_sysfs_dir;
6111 PVE
::QemuServer
::PCI
::remove_pci_reservation
($vmid);
# Clean up host-side resources after a VM has stopped.
#
# $storecfg:              storage configuration
# $vmid:                  VM ID
# $conf:                  VM configuration
# $keepActive:            NOTE(review) its use is not visible in this extract;
#                         presumably volumes stay activated when true - confirm
# $apply_pending_changes: when true, pending config changes are applied
#
# Errors are only reported with `warn` (see the last visible line), so the
# cleanup is best effort. NOTE(review): the surrounding eval is not visible.
6114 sub vm_stop_cleanup
{
6115 my ($storecfg, $vmid, $conf, $keepActive, $apply_pending_changes) = @_;
6120 my $vollist = get_vm_volumes
($conf);
6121 PVE
::Storage
::deactivate_volumes
($storecfg, $vollist);
# the TPM state volume is unmapped separately
6123 if (my $tpmdrive = $conf->{tpmstate0
}) {
6124 my $tpm = parse_drive
("tpmstate0", $tpmdrive);
6125 my ($storeid, $volname) = PVE
::Storage
::parse_volume_id
($tpm->{file
}, 1);
6127 PVE
::Storage
::unmap_volume
($storecfg, $tpm->{file
});
# remove the per-VM runtime files (sockets, pid file)
6132 foreach my $ext (qw(mon qmp pid vnc qga)) {
6133 unlink "/var/run/qemu-server/${vmid}.$ext";
6136 if ($conf->{ivshmem
}) {
6137 my $ivshmem = parse_property_string
($ivshmem_fmt, $conf->{ivshmem
});
6138 # just delete it for now; VMs which already have this open are not
6139 # affected, but new VMs will get a separate one. If this
6140 # becomes an issue we either add some sort of ref-counting or just
6141 # add a "don't delete on stop" flag to the ivshmem format.
6142 unlink '/dev/shm/pve-shm-' . ($ivshmem->{name
} // $vmid);
6145 cleanup_pci_devices
($vmid, $conf);
6147 vmconfig_apply_pending
($vmid, $conf, $storecfg) if $apply_pending_changes;
6149 warn $@ if $@; # avoid errors - just warn
6152 # call only in locked context
# NOTE(review): the `sub` header line is not visible in this extract; the call
# sites below pass the same argument list to _do_vm_stop.
#
# Stops or shuts down a running VM and cleans up afterwards.
#
# $storecfg:   storage configuration, used for the cleanup
# $vmid:       VM ID
# $skiplock:   skip the config lock check
# $nocheck:    forwarded to check_running()
# $timeout:    seconds to wait; falls back to the `down` value of the VM's
#              startup option (shutdown only) and finally to 60
# $shutdown:   NOTE(review) presumably selects a guest shutdown
#              (guest-shutdown / system_powerdown) instead of "quit" - confirm
# $force:      NOTE(review) presumably allows escalating to signals when the
#              timeout is hit - confirm, the branch lines are not visible
# $keepActive: forwarded to vm_stop_cleanup()
6154 my ($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive) = @_;
6156 my $pid = check_running
($vmid, $nocheck);
6161 $conf = PVE
::QemuConfig-
>load_config($vmid);
6162 PVE
::QemuConfig-
>check_lock($conf) if !$skiplock;
# no explicit timeout: use the shutdown timeout from the startup order option
6163 if (!defined($timeout) && $shutdown && $conf->{startup
}) {
6164 my $opts = PVE
::JSONSchema
::pve_parse_startup_order
($conf->{startup
});
6165 $timeout = $opts->{down
} if $opts->{down
};
6167 PVE
::GuestHelpers
::exec_hookscript
($conf, $vmid, 'pre-stop');
# use the guest agent for the shutdown when it is enabled in the config
6172 if (defined($conf) && get_qga_key
($conf, 'enabled')) {
6173 mon_cmd
($vmid, "guest-shutdown", timeout
=> $timeout);
6175 mon_cmd
($vmid, "system_powerdown");
6178 mon_cmd
($vmid, "quit");
6184 $timeout = 60 if !defined($timeout);
# wait until the VM is gone or the timeout is reached
6187 while (($count < $timeout) && check_running
($vmid, $nocheck)) {
6192 if ($count >= $timeout) {
6194 warn "VM still running - terminating now with SIGTERM\n";
6197 die "VM quit/powerdown failed - got timeout\n";
6200 vm_stop_cleanup
($storecfg, $vmid, $conf, $keepActive, 1) if $conf;
6204 if (!check_running
($vmid, $nocheck)) {
6205 warn "Unexpected: VM shutdown command failed, but VM not running anymore..\n";
6209 warn "VM quit/powerdown failed - terminating now with SIGTERM\n";
6212 die "VM quit/powerdown failed\n";
# second wait loop; afterwards the process is reported as killed with SIGKILL
6220 while (($count < $timeout) && check_running
($vmid, $nocheck)) {
6225 if ($count >= $timeout) {
6226 warn "VM still running - terminating now with SIGKILL\n";
6231 vm_stop_cleanup
($storecfg, $vmid, $conf, $keepActive, 1) if $conf;
6234 # Note: use $nocheck to skip tests if VM configuration file exists.
6235 # We need that when migrating VMs to other nodes (files already moved)
6236 # Note: we set $keepActive in vzdump stop mode - volumes need to stay active
# NOTE(review): the `sub` header line is not visible in this extract;
# presumably this is vm_stop - confirm.
#
# $force defaults to 1 when it is undefined and no shutdown was requested.
# Two paths are visible: one sends signal 15 (SIGTERM) to the running process
# and runs vm_stop_cleanup() on the config loaded via $migratedfrom, the other
# calls _do_vm_stop() under the config lock. NOTE(review): the condition
# selecting between them is not visible; presumably it is $migratedfrom.
6238 my ($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive, $migratedfrom) = @_;
6240 $force = 1 if !defined($force) && !$shutdown;
6243 my $pid = check_running
($vmid, $nocheck, $migratedfrom);
6244 kill 15, $pid if $pid;
6245 my $conf = PVE
::QemuConfig-
>load_config($vmid, $migratedfrom);
# last argument 0: do not apply pending changes
6246 vm_stop_cleanup
($storecfg, $vmid, $conf, $keepActive, 0);
6250 PVE
::QemuConfig-
>lock_config($vmid, sub {
6251 _do_vm_stop
($storecfg, $vmid, $skiplock, $nocheck, $timeout, $shutdown, $force, $keepActive);
# NOTE(review): the `sub` header line is not visible in this extract;
# presumably this is vm_reboot - confirm.
#
# Under the config lock of $vmid: if the VM is running, record a reboot
# request and shut the VM down via _do_vm_stop() with $timeout and the
# shutdown flag set. The reboot request is cleared again on a later line.
# NOTE(review): the condition under which clear_reboot_request() runs is not
# visible; presumably it is the error path - confirm.
6256 my ($vmid, $timeout) = @_;
6258 PVE
::QemuConfig-
>lock_config($vmid, sub {
6261 # only reboot if running, as qmeventd starts it again on a stop event
6262 return if !check_running
($vmid);
6264 create_reboot_request
($vmid);
6266 my $storecfg = PVE
::Storage
::config
();
# skiplock and nocheck are left undef, shutdown flag is 1
6267 _do_vm_stop
($storecfg, $vmid, undef, undef, $timeout, 1);
6271 # avoid that the next normal shutdown will be confused for a reboot
6272 clear_reboot_request
($vmid);
6278 # note: if using the statestorage parameter, the caller has to check privileges
# NOTE(review): the `sub` header line is not visible in this extract;
# presumably this is vm_suspend - confirm.
#
# $vmid:         VM ID
# $skiplock:     skip the config lock check
# $includestate: when true, the VM state is saved to a state volume
# $statestorage: storage for the state volume; when not given it is chosen by
#                find_vmstate_storage() and, unless called from the CLI, the
#                'Datastore.AllocateSpace' privilege on it is checked
#
# Dies with "cannot suspend to disk during backup" when a backup lock is held
# and $includestate is set.
6280 my ($vmid, $skiplock, $includestate, $statestorage) = @_;
6287 PVE
::QemuConfig-
>lock_config($vmid, sub {
6289 $conf = PVE
::QemuConfig-
>load_config($vmid);
# a 'backup' lock does not block the lock check here
6291 my $is_backing_up = PVE
::QemuConfig-
>has_lock($conf, 'backup');
6292 PVE
::QemuConfig-
>check_lock($conf)
6293 if !($skiplock || $is_backing_up);
6295 die "cannot suspend to disk during backup\n"
6296 if $is_backing_up && $includestate;
6298 if ($includestate) {
6299 $conf->{lock} = 'suspending';
# the current date becomes part of the state volume name ("suspend-<date>")
6300 my $date = strftime
("%Y-%m-%d", localtime(time()));
6301 $storecfg = PVE
::Storage
::config
();
6302 if (!$statestorage) {
6303 $statestorage = find_vmstate_storage
($conf, $storecfg);
6304 # check permissions for the storage
6305 my $rpcenv = PVE
::RPCEnvironment
::get
();
6306 if ($rpcenv->{type
} ne 'cli') {
6307 my $authuser = $rpcenv->get_user();
6308 $rpcenv->check($authuser, "/storage/$statestorage", ['Datastore.AllocateSpace']);
6313 $vmstate = PVE
::QemuConfig-
>__snapshot_save_vmstate(
6314 $vmid, $conf, "suspend-$date", $storecfg, $statestorage, 1);
6315 $path = PVE
::Storage
::path
($storecfg, $vmstate);
6316 PVE
::QemuConfig-
>write_config($vmid, $conf);
# NOTE(review): presumably the branch without $includestate - confirm
6318 mon_cmd
($vmid, "stop");
6322 if ($includestate) {
6324 PVE
::Storage
::activate_volumes
($storecfg, [$vmstate]);
6327 set_migration_caps
($vmid, 1);
6328 mon_cmd
($vmid, "savevm-start", statefile
=> $path);
# evaluate the status reported by query-savevm
# NOTE(review): the enclosing loop is not visible in this extract
6330 my $state = mon_cmd
($vmid, "query-savevm");
6331 if (!$state->{status
}) {
6332 die "savevm not active\n";
6333 } elsif ($state->{status
} eq 'active') {
6336 } elsif ($state->{status
} eq 'completed') {
6337 print "State saved, quitting\n";
6339 } elsif ($state->{status
} eq 'failed' && $state->{error
}) {
6340 die "query-savevm failed with error '$state->{error}'\n"
6342 die "query-savevm returned status '$state->{status}'\n";
6348 PVE
::QemuConfig-
>lock_config($vmid, sub {
6349 $conf = PVE
::QemuConfig-
>load_config($vmid);
6351 # cleanup, but leave suspending lock, to indicate something went wrong
6353 mon_cmd
($vmid, "savevm-end");
6354 PVE
::Storage
::deactivate_volumes
($storecfg, [$vmstate]);
6355 PVE
::Storage
::vdisk_free
($storecfg, $vmstate);
6356 delete $conf->@{qw(vmstate runningmachine runningcpu)};
6357 PVE
::QemuConfig-
>write_config($vmid, $conf);
# guard against the config having been modified while the state was saved
6363 die "lock changed unexpectedly\n"
6364 if !PVE
::QemuConfig-
>has_lock($conf, 'suspending');
6366 mon_cmd
($vmid, "quit");
6367 $conf->{lock} = 'suspended';
6368 PVE
::QemuConfig-
>write_config($vmid, $conf);
6373 # $nocheck is set when called as part of a migration - in this context the
6374 # location of the config file (source or target node) is not deterministic,
6375 # since migration cannot wait for pmxcfs to process the rename
# NOTE(review): the `sub` header line is not visible in this extract;
# presumably this is vm_resume - confirm.
#
# Under the config lock of $vmid: query the VM status and resume it. Nothing
# is done when the VM is already 'running'; a 'suspended' VM is woken with
# `system_wakeup` instead of `cont`; for status 'shutdown' a reset flag is set.
6377 my ($vmid, $skiplock, $nocheck) = @_;
6379 PVE
::QemuConfig-
>lock_config($vmid, sub {
6380 my $res = mon_cmd
($vmid, 'query-status');
6381 my $resume_cmd = 'cont';
# the config may still live on the source node, so several locations are tried
# NOTE(review): the conditions between the attempts are not visible
6385 $conf = eval { PVE
::QemuConfig-
>load_config($vmid) }; # try on target node
6387 my $vmlist = PVE
::Cluster
::get_vmlist
();
6388 if (exists($vmlist->{ids
}->{$vmid})) {
6389 my $node = $vmlist->{ids
}->{$vmid}->{node
};
6390 $conf = eval { PVE
::QemuConfig-
>load_config($vmid, $node) }; # try on source node
6393 PVE
::Cluster
::cfs_update
(); # vmlist was wrong, invalidate cache
6394 $conf = PVE
::QemuConfig-
>load_config($vmid); # last try on target node again
6398 $conf = PVE
::QemuConfig-
>load_config($vmid);
6401 if ($res->{status
}) {
6402 return if $res->{status
} eq 'running'; # job done, go home
6403 $resume_cmd = 'system_wakeup' if $res->{status
} eq 'suspended';
6404 $reset = 1 if $res->{status
} eq 'shutdown';
# a 'backup' lock does not prevent resuming
6408 PVE
::QemuConfig-
>check_lock($conf)
6409 if !($skiplock || PVE
::QemuConfig-
>has_lock($conf, 'backup'));
6413 # required if a VM shuts down during a backup and we get a resume
6414 # request before the backup finishes for example
6415 mon_cmd
($vmid, "system_reset");
6418 add_nets_bridge_fdb
($conf, $vmid) if $resume_cmd eq 'cont';
6420 mon_cmd
($vmid, $resume_cmd);
# NOTE(review): the `sub` header line is not visible in this extract;
# presumably this is vm_sendkey - confirm.
#
# Sends the key (combination) $key to the VM using the human monitor command
# "sendkey", under the config lock of $vmid. Any non-empty reply of the
# monitor is treated as an error and raised with `die`.
# NOTE(review): $skiplock is unpacked, but no use of it is visible here.
6425 my ($vmid, $skiplock, $key) = @_;
6427 PVE
::QemuConfig-
>lock_config($vmid, sub {
6429 my $conf = PVE
::QemuConfig-
>load_config($vmid);
6431 # there is no qmp command, so we use the human monitor command
6432 my $res = PVE
::QemuServer
::Monitor
::hmp_cmd
($vmid, "sendkey $key");
6433 die $res if $res ne '';
6437 # vzdump restore implementation
# Read the name of the first member of a tar archive.
#
# $archive: path of the archive; must be a plain file, otherwise the sub dies
#
# The listing is produced by running `tar tf <archive>` through a pipe (list
# form of open, so no shell is involved) and only the first line is read.
# Dies when the pipe cannot be opened or when the first line is empty.
# NOTE(review): the lines that close the pipe and return the value are not
# visible in this extract.
6439 sub tar_archive_read_firstfile
{
6440 my $archive = shift;
6442 die "ERROR: file '$archive' does not exist\n" if ! -f
$archive;
6444 # try to detect archive type first
6445 my $pid = open (my $fh, '-|', 'tar', 'tf', $archive) ||
6446 die "unable to open file '$archive'\n";
6447 my $firstfile = <$fh>;
6451 die "ERROR: archive contaions no data\n" if !$firstfile;
# Remove the temporary volumes recorded in a restore stat file.
#
# $storecfg: storage configuration, passed through to PVE::Storage::vdisk_free
# $statfile: path of a file containing lines of the form
#            "vzdump:<storeid>:<volid>"
#
# For every matching line the named volume is removed: absolute paths are
# unlinked directly, everything else is freed through the storage layer.
# A failure for one volume is reported on STDERR and does not stop the
# cleanup of the remaining ones. Lines that do not match are reported as
# unparsable. Nothing is done when the stat file cannot be opened.
sub tar_restore_cleanup {
    my ($storecfg, $statfile) = @_;

    print STDERR "starting cleanup\n";

    if (my $fd = IO::File->new($statfile, "r")) {
        while (defined(my $line = <$fd>)) {
            if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
                my $volid = $2;
                eval {
                    if ($volid =~ m|^/|) {
                        # `unlink $volid || die ...` parses as
                        # `unlink($volid || die ...)`, which never notices a
                        # failed unlink - use the low-precedence `or` instead.
                        unlink($volid) or die "unlink failed - $!\n";
                    } else {
                        PVE::Storage::vdisk_free($storecfg, $volid);
                    }
                    print STDERR "temporary volume '$volid' sucessfuly removed\n";
                };
                # best effort: report the problem and continue with the next line
                print STDERR "unable to cleanup '$volid' - $@" if $@;
            } else {
                print STDERR "unable to parse line in statfile - $line";
            }
        }
        $fd->close();
    }
}
# Restore a VM from a backup archive, dispatching on the archive format.
#
# $archive: archive to restore
# $vmid:    ID of the VM to create
# $user:    user on whose behalf the restore runs
# $opts:    restore options; $opts->{format} overrides the detected format
#
# Format 'tar' is handled by restore_tar_archive(); the remaining visible call
# hands the archive to restore_vma_archive() together with the compression
# detected by PVE::Storage::archive_info().
# NOTE(review): the condition attached to the first restore_vma_archive() call
# is not visible in this extract.
6483 sub restore_file_archive
{
6484 my ($archive, $vmid, $user, $opts) = @_;
6486 return restore_vma_archive
($archive, $vmid, $user, $opts)
6489 my $info = PVE
::Storage
::archive_info
($archive);
# an explicitly requested format wins over the detected one
6490 my $format = $opts->{format
} // $info->{format
};
6491 my $comp = $info->{compression
};
6493 # try to detect archive format
6494 if ($format eq 'tar') {
6495 return restore_tar_archive
($archive, $vmid, $user, $opts);
6497 return restore_vma_archive
($archive, $vmid, $user, $opts, $comp);
6501 # helper to remove disks that will not be used after restore
#
# $storecfg:     storage configuration
# $vmid:         VM ID; only volumes owned by this VM are touched
# $oldconf:      configuration of the VM that is being overwritten
# $virtdev_hash: drives contained in the backup, keyed by drive name
#
# Frees the old volume of every drive that is going to be restored, records
# the remaining volumes in $kept_disks, and frees the vmstate volumes of the
# old snapshots. Deletions are wrapped in eval, so they are best effort.
6502 my $restore_cleanup_oldconf = sub {
6503 my ($storecfg, $vmid, $oldconf, $virtdev_hash) = @_;
6505 my $kept_disks = {};
6507 PVE
::QemuConfig-
>foreach_volume($oldconf, sub {
6508 my ($ds, $drive) = @_;
6510 return if drive_is_cdrom
($drive, 1);
6512 my $volid = $drive->{file
};
# skip empty entries and absolute paths
6513 return if !$volid || $volid =~ m
|^/|;
# never touch volumes that belong to another VM
6515 my ($path, $owner) = PVE
::Storage
::path
($storecfg, $volid);
6516 return if !$path || !$owner || ($owner != $vmid);
6518 # Note: only delete disk we want to restore
6519 # other volumes will become unused
6520 if ($virtdev_hash->{$ds}) {
6521 eval { PVE
::Storage
::vdisk_free
($storecfg, $volid); };
6526 $kept_disks->{$volid} = 1;
6530 # after the restore we have no snapshots anymore
6531 for my $snapname (keys $oldconf->{snapshots
}->%*) {
6532 my $snap = $oldconf->{snapshots
}->{$snapname};
6533 if ($snap->{vmstate
}) {
6534 eval { PVE
::Storage
::vdisk_free
($storecfg, $snap->{vmstate
}); };
# also drop this snapshot from every volume that was kept
6540 for my $volid (keys $kept_disks->%*) {
6541 eval { PVE
::Storage
::volume_snapshot_delete
($storecfg, $volid, $snapname); };
6547 # Helper to parse vzdump backup device hints
6549 # $rpcenv: Environment, used to check storage permissions
6550 # $user: User ID, to check storage permissions
6551 # $storecfg: Storage configuration
6552 # $fh: the file handle for reading the configuration
6553 # $devinfo: should contain device sizes for all backed-up devices
6554 # $options: backup options (pool, default storage)
6556 # Return: $virtdev_hash, updates $devinfo (add devname, virtdev, format, storeid)
6557 my $parse_backup_hints = sub {
6558 my ($rpcenv, $user, $storecfg, $fh, $devinfo, $options) = @_;
# dies unless the storage allows 'images' content and, for every user other
# than root@pam, unless the user holds 'Datastore.AllocateSpace' on it
6560 my $check_storage = sub { # assert if an image can be allocate
6561 my ($storeid, $scfg) = @_;
6562 die "Content type 'images' is not available on storage '$storeid'\n"
6563 if !$scfg->{content
}->{images
};
6564 $rpcenv->check($user, "/storage/$storeid", ['Datastore.AllocateSpace'])
6565 if $user ne 'root@pam';
6568 my $virtdev_hash = {};
6569 while (defined(my $line = <$fh>)) {
# hint line format: #qmdump#map:<virtdev>:<devname>:<storeid>:<format>:
6570 if ($line =~ m/^\#qmdump\#map:(\S+):(\S+):(\S*):(\S*):$/) {
6571 my ($virtdev, $devname, $storeid, $format) = ($1, $2, $3, $4);
6572 die "archive does not contain data for drive '$virtdev'\n"
6573 if !$devinfo->{$devname};
# an explicitly requested target storage overrides the one from the hint
6575 if (defined($options->{storage
})) {
6576 $storeid = $options->{storage
} || 'local';
6577 } elsif (!$storeid) {
6580 $format = 'raw' if !$format;
6581 $devinfo->{$devname}->{devname
} = $devname;
6582 $devinfo->{$devname}->{virtdev
} = $virtdev;
6583 $devinfo->{$devname}->{format
} = $format;
6584 $devinfo->{$devname}->{storeid
} = $storeid;
6586 my $scfg = PVE
::Storage
::storage_config
($storecfg, $storeid);
6587 $check_storage->($storeid, $scfg); # permission and content type check
6589 $virtdev_hash->{$virtdev} = $devinfo->{$devname};
# regular drive lines are only of interest for cloud-init drives
6590 } elsif ($line =~ m/^((?:ide|sata|scsi)\d+):\s*(.*)\s*$/) {
6592 my $drive = parse_drive
($virtdev, $2);
6594 if (drive_is_cloudinit
($drive)) {
6595 my ($storeid, $volname) = PVE
::Storage
::parse_volume_id
($drive->{file
});
6596 $storeid = $options->{storage
} if defined ($options->{storage
});
6597 my $scfg = PVE
::Storage
::storage_config
($storecfg, $storeid);
6598 my $format = qemu_img_format
($scfg, $volname); # has 'raw' fallback
6600 $check_storage->($storeid, $scfg); # permission and content type check
6602 $virtdev_hash->{$virtdev} = {
6604 storeid
=> $storeid,
6605 size
=> PVE
::QemuServer
::Cloudinit
::CLOUDINIT_DISK_SIZE
,
6612 return $virtdev_hash;
6615 # Helper to allocate and activate all volumes required for a restore
6617 # $storecfg: Storage configuration
6618 # $virtdev_hash: as returned by parse_backup_hints()
6620 # Returns: { $virtdev => $volid }
#
# Side effects visible here: each entry of $virtdev_hash gets its `volid` set
# and its `format` replaced by the storage default when the requested format
# is not supported by the target storage.
6621 my $restore_allocate_devices = sub {
6622 my ($storecfg, $virtdev_hash, $vmid) = @_;
6625 foreach my $virtdev (sort keys %$virtdev_hash) {
6626 my $d = $virtdev_hash->{$virtdev};
# divide by 1024, rounding up
# NOTE(review): presumably converts bytes to KiB for vdisk_alloc - confirm
6627 my $alloc_size = int(($d->{size
} + 1024 - 1)/1024);
6628 my $storeid = $d->{storeid
};
6629 my $scfg = PVE
::Storage
::storage_config
($storecfg, $storeid);
6631 # test if requested format is supported
6632 my ($defFormat, $validFormats) = PVE
::Storage
::storage_default_format
($storecfg, $storeid);
6633 my $supported = grep { $_ eq $d->{format
} } @$validFormats;
6634 $d->{format
} = $defFormat if !$supported;
# cloud-init drives get a fixed name; storages with a `path` setting
# additionally get the format as file extension
6637 if ($d->{is_cloudinit
}) {
6638 $name = "vm-$vmid-cloudinit";
6639 my $scfg = PVE
::Storage
::storage_config
($storecfg, $storeid);
6640 if ($scfg->{path
}) {
6641 $name .= ".$d->{format}";
6645 my $volid = PVE
::Storage
::vdisk_alloc
(
6646 $storecfg, $storeid, $vmid, $d->{format
}, $name, $alloc_size);
6648 print STDERR
"new volume ID is '$volid'\n";
6649 $d->{volid
} = $volid;
6651 PVE
::Storage
::activate_volumes
($storecfg, [$volid]);
6653 $map->{$virtdev} = $volid;
# Translate one line of a backed-up VM configuration for the restored VM.
#
# $cookie: state shared between calls; `netcount` numbers the net<N> entries
#          generated from old vlan<N> lines
# $map:    { $virtdev => $volid } of newly allocated volumes
# $line:   the configuration line to process
# $unique: when true, MAC addresses and the SMBIOS UUID are regenerated
#
# Backup hint lines ("#qmdump#", "#vzdump#") and the `lock`, `unused<N>` and
# `parent` entries are dropped by returning an empty string.
# NOTE(review): the declaration of $res, the fall-through branch and the final
# return are not visible in this extract.
6659 sub restore_update_config_line
{
6660 my ($cookie, $map, $line, $unique) = @_;
6662 return '' if $line =~ m/^\#qmdump\#/;
6663 return '' if $line =~ m/^\#vzdump\#/;
6664 return '' if $line =~ m/^lock:/;
6665 return '' if $line =~ m/^unused\d+:/;
6666 return '' if $line =~ m/^parent:/;
# the datacenter config provides the MAC prefix for generated addresses
6670 my $dc = PVE
::Cluster
::cfs_read_file
('datacenter.cfg');
6671 if (($line =~ m/^(vlan(\d+)):\s*(\S+)\s*$/)) {
6672 # try to convert old 1.X settings
6673 my ($id, $ind, $ethcfg) = ($1, $2, $3);
6674 foreach my $devconfig (PVE
::Tools
::split_list
($ethcfg)) {
6675 my ($model, $macaddr) = split(/\=/, $devconfig);
6676 $macaddr = PVE
::Tools
::random_ether_addr
($dc->{mac_prefix
}) if !$macaddr || $unique;
6679 bridge
=> "vmbr$ind",
6680 macaddr
=> $macaddr,
6682 my $netstr = print_net
($net);
6684 $res .= "net$cookie->{netcount}: $netstr\n";
6685 $cookie->{netcount
}++;
# only replace a MAC address that is already set
6687 } elsif (($line =~ m/^(net\d+):\s*(\S+)\s*$/) && $unique) {
6688 my ($id, $netstr) = ($1, $2);
6689 my $net = parse_net
($netstr);
6690 $net->{macaddr
} = PVE
::Tools
::random_ether_addr
($dc->{mac_prefix
}) if $net->{macaddr
};
6691 $netstr = print_net
($net);
6692 $res .= "$id: $netstr\n";
6693 } elsif ($line =~ m/^((ide|scsi|virtio|sata|efidisk|tpmstate)\d+):\s*(\S+)\s*$/) {
6696 my $di = parse_drive
($virtdev, $value);
# drives explicitly excluded from backup (backup=0) are handled separately
# NOTE(review): the body of this branch is not visible
6697 if (defined($di->{backup
}) && !$di->{backup
}) {
6699 } elsif ($map->{$virtdev}) {
6700 delete $di->{format
}; # format can change on restore
6701 $di->{file
} = $map->{$virtdev};
6702 $value = print_drive
($di);
6703 $res .= "$virtdev: $value\n";
6707 } elsif (($line =~ m/^vmgenid: (.*)/)) {
6709 if ($vmgenid ne '0') {
6710 # always generate a new vmgenid if there was a valid one setup
6711 $vmgenid = generate_uuid
();
6713 $res .= "vmgenid: $vmgenid\n";
6714 } elsif (($line =~ m/^(smbios1: )(.*)/) && $unique) {
6715 my ($uuid, $uuid_str);
6716 UUID
::generate
($uuid);
6717 UUID
::unparse
($uuid, $uuid_str);
6718 my $smbios1 = parse_smbios1
($2);
6719 $smbios1->{uuid
} = $uuid_str;
6720 $res .= $1.print_smbios1
($smbios1)."\n";
# Deactivate all volumes that were allocated for a restore.
#
# $storecfg:     storage configuration
# $virtdev_hash: drive info; entries without a `volid` are ignored
#
# Errors from the storage layer are printed to STDERR and not propagated.
# NOTE(review): the declaration of $vollist is not visible in this extract.
6728 my $restore_deactivate_volumes = sub {
6729 my ($storecfg, $virtdev_hash) = @_;
6732 for my $dev (values $virtdev_hash->%*) {
6733 push $vollist->@*, $dev->{volid
} if $dev->{volid
};
6736 eval { PVE
::Storage
::deactivate_volumes
($storecfg, $vollist); };
6737 print STDERR
$@ if $@;
# Free all volumes that were allocated for a restore.
#
# $storecfg:     storage configuration
# $virtdev_hash: drive info; entries without a `volid` are skipped
#
# Success and failure are both reported on STDERR, per volume.
# NOTE(review): the eval around vdisk_free is not visible in this extract; the
# `$@` check below suggests that one exists - confirm.
6740 my $restore_destroy_volumes = sub {
6741 my ($storecfg, $virtdev_hash) = @_;
6743 for my $dev (values $virtdev_hash->%*) {
6744 my $volid = $dev->{volid
} or next;
6746 PVE
::Storage
::vdisk_free
($storecfg, $volid);
6747 print STDERR
"temporary volume '$volid' sucessfuly removed\n";
6749 print STDERR
"unable to cleanup '$volid' - $@" if $@;
# Combine the configuration stored in a backup with caller-supplied overrides.
#
# $filename:        passed unchanged to parse_vm_config()
# $backup_conf_raw: raw configuration text from the backup
# $override_conf:   hash of settings that replace the parsed values
#
# Returns the parsed configuration with every override applied on top.
my $restore_merge_config = sub {
    my ($filename, $backup_conf_raw, $override_conf) = @_;

    my $merged = parse_vm_config($filename, $backup_conf_raw);

    # overrides always win over what the backup contained
    $merged->{$_} = $override_conf->{$_} for keys $override_conf->%*;

    return $merged;
};
# NOTE(review): the `sub` header line is not visible in this extract;
# presumably this is scan_volids, which is called with ($cfg, $vmid) further
# down - confirm.
#
# Lists the 'images' volumes known to the storage layer for $vmid and indexes
# them by volume ID. Entries without a volid or with a false size are skipped;
# each kept entry additionally gets its `path` resolved.
# NOTE(review): the return statement is not visible in this extract.
6765 my ($cfg, $vmid) = @_;
6767 my $info = PVE
::Storage
::vdisk_list
($cfg, undef, $vmid, undef, 'images');
6769 my $volid_hash = {};
6770 foreach my $storeid (keys %$info) {
6771 foreach my $item (@{$info->{$storeid}}) {
6772 next if !($item->{volid
} && $item->{size
});
6773 $item->{path
} = PVE
::Storage
::path
($cfg, $item->{volid
});
6774 $volid_hash->{$item->{volid
}} = $item;
# Synchronize the disk entries of a VM configuration with the volumes that
# actually exist.
#
# $vmid:       VM ID, used for messages and to recognize state volumes
# $conf:       VM configuration, modified in place
# $volid_hash: { $volid => { path => ..., size => ... } } of existing volumes
#
# Three passes are visible: drive sizes are refreshed, `unused<N>` entries
# whose volume is referenced elsewhere are removed, and existing volumes that
# are referenced nowhere are added as unused (state volumes excepted).
# NOTE(review): the change tracking and the return value are not visible here.
6781 sub update_disk_config
{
6782 my ($vmid, $conf, $volid_hash) = @_;
6785 my $prefix = "VM $vmid";
6787 # used and unused disks
6788 my $referenced = {};
6790 # Note: it is allowed to define multiple storages with same path (alias), so
6791 # we need to check both 'volid' and real 'path' (two different volid can point
6792 # to the same path).
6794 my $referencedpath = {};
# pass 1: mark configured drives as referenced and refresh their size
6797 PVE
::QemuConfig-
>foreach_volume($conf, sub {
6798 my ($opt, $drive) = @_;
6800 my $volid = $drive->{file
};
6802 my $volume = $volid_hash->{$volid};
6804 # mark volid as "in-use" for next step
6805 $referenced->{$volid} = 1;
6806 if ($volume && (my $path = $volume->{path
})) {
6807 $referencedpath->{$path} = 1;
6810 return if drive_is_cdrom
($drive);
6813 my ($updated, $msg) = PVE
::QemuServer
::Drive
::update_disksize
($drive, $volume->{size
});
6814 if (defined($updated)) {
6816 $conf->{$opt} = print_drive
($updated);
6817 print "$prefix ($opt): $msg\n";
6821 # remove 'unusedX' entry if volume is used
6822 PVE
::QemuConfig-
>foreach_unused_volume($conf, sub {
6823 my ($opt, $drive) = @_;
6825 my $volid = $drive->{file
};
6829 $path = $volid_hash->{$volid}->{path
} if $volid_hash->{$volid};
6830 if ($referenced->{$volid} || ($path && $referencedpath->{$path})) {
6831 print "$prefix remove entry '$opt', its volume '$volid' is in use\n";
6833 delete $conf->{$opt};
6836 $referenced->{$volid} = 1;
6837 $referencedpath->{$path} = 1 if $path;
# pass 3: add existing but unreferenced volumes as unused entries
6840 foreach my $volid (sort keys %$volid_hash) {
6841 next if $volid =~ m/vm-$vmid-state-/;
6842 next if $referenced->{$volid};
6843 my $path = $volid_hash->{$volid}->{path
};
6844 next if !$path; # just to be sure
6845 next if $referencedpath->{$path};
6847 my $key = PVE
::QemuConfig-
>add_unused_volume($conf, $volid);
6848 print "$prefix add unreferenced volume '$volid' as '$key' to config\n";
6849 $referencedpath->{$path} = 1; # avoid to add more than once (aliases)
# NOTE(review): the `sub` header line is not visible in this extract; the
# restore code below calls this as rescan($vmid, 1).
#
# Rescans the storages and updates the disk entries of one VM, or of every VM
# from config_list() when $vmid is undefined.
#
# $vmid:   VM ID, or undef for all VMs
# $nolock: NOTE(review) its use is not visible in this extract; presumably the
#          update then runs without taking the config lock - confirm
# $dryrun: when true, the changed configuration is not written back
6856 my ($vmid, $nolock, $dryrun) = @_;
6858 my $cfg = PVE
::Storage
::config
();
6860 print "rescan volumes...\n";
6861 my $volid_hash = scan_volids
($cfg, $vmid);
6863 my $updatefn = sub {
6866 my $conf = PVE
::QemuConfig-
>load_config($vmid);
6868 PVE
::QemuConfig-
>check_lock($conf);
# restrict the scan result to the volumes owned by this VM
6871 foreach my $volid (keys %$volid_hash) {
6872 my $info = $volid_hash->{$volid};
6873 $vm_volids->{$volid} = $info if $info->{vmid
} && $info->{vmid
} == $vmid;
6876 my $changes = update_disk_config
($vmid, $conf, $vm_volids);
6878 PVE
::QemuConfig-
>write_config($vmid, $conf) if $changes && !$dryrun;
6881 if (defined($vmid)) {
6885 PVE
::QemuConfig-
>lock_config($vmid, $updatefn, $vmid);
6888 my $vmlist = config_list
();
6889 foreach my $vmid (keys %$vmlist) {
6893 PVE
::QemuConfig-
>lock_config($vmid, $updatefn, $vmid);
# Restore a VM from a Proxmox Backup Server snapshot.
#
# $archive: volume ID of the backup; must be of type 'backup' with format
#           'pbs-vm', otherwise the sub dies
# $vmid:    ID of the VM to create or overwrite
# $user:    user on whose behalf storage permissions are checked
# $options: restore options; the keys read in the visible code are `storage`
#           (through the hint parser), `live`, `override_conf` and `pool`
#
# Visible steps: fetch index.json, qemu-server.conf and (if present) fw.conf
# from the backup, parse the device hints, allocate the target volumes,
# restore each image with `pbs-restore`, rewrite the configuration and write
# it, rescan the volumes and optionally add the VM to a pool. With
# $options->{live} only the EFI disk and TPM state are restored up front and
# the remaining drives are handed to pbs_live_restore().
# NOTE(review): the eval/error-handling structure around these steps is not
# visible in this extract.
6899 sub restore_proxmox_backup_archive
{
6900 my ($archive, $vmid, $user, $options) = @_;
6902 my $storecfg = PVE
::Storage
::config
();
6904 my ($storeid, $volname) = PVE
::Storage
::parse_volume_id
($archive);
6905 my $scfg = PVE
::Storage
::storage_config
($storecfg, $storeid);
6907 my $fingerprint = $scfg->{fingerprint
};
6908 my $keyfile = PVE
::Storage
::PBSPlugin
::pbs_encryption_key_file_name
($storecfg, $storeid);
6910 my $repo = PVE
::PBSClient
::get_repository
($scfg);
6911 my $namespace = $scfg->{namespace
};
6913 # This is only used for `pbs-restore` and the QEMU PBS driver (live-restore)
6914 my $password = PVE
::Storage
::PBSPlugin
::pbs_get_password
($scfg, $storeid);
# `local` limits the credentials in the environment to this call and its children
6915 local $ENV{PBS_PASSWORD
} = $password;
6916 local $ENV{PBS_FINGERPRINT
} = $fingerprint if defined($fingerprint);
6918 my ($vtype, $pbs_backup_name, undef, undef, undef, undef, $format) =
6919 PVE
::Storage
::parse_volname
($storecfg, $archive);
6921 die "got unexpected vtype '$vtype'\n" if $vtype ne 'backup';
6923 die "got unexpected backup format '$format'\n" if $format ne 'pbs-vm';
# per-process temporary directory ($$ is the current PID)
6925 my $tmpdir = "/var/tmp/vzdumptmp$$";
6929 my $conffile = PVE
::QemuConfig-
>config_file($vmid);
6930 # disable interrupts (always do cleanups)
6934 local $SIG{HUP
} = sub { print STDERR
"got interrupt - ignored\n"; };
6936 # Note: $oldconf is undef if VM does not exists
6937 my $cfs_path = PVE
::QemuConfig-
>cfs_config_path($vmid);
6938 my $oldconf = PVE
::Cluster
::cfs_read_file
($cfs_path);
6939 my $new_conf_raw = '';
6941 my $rpcenv = PVE
::RPCEnvironment
::get
();
6942 my $devinfo = {}; # info about drives included in backup
6943 my $virtdev_hash = {}; # info about allocated drives
6951 local $SIG{PIPE
} = sub { die "interrupted by signal\n"; };
6953 my $cfgfn = "$tmpdir/qemu-server.conf";
6954 my $firewall_config_fn = "$tmpdir/fw.conf";
6955 my $index_fn = "$tmpdir/index.json";
6957 my $cmd = "restore";
# fetch and decode the backup index to learn which files the snapshot contains
6959 my $param = [$pbs_backup_name, "index.json", $index_fn];
6960 PVE
::Storage
::PBSPlugin
::run_raw_client_cmd
($scfg, $storeid, $cmd, $param);
6961 my $index = PVE
::Tools
::file_get_contents
($index_fn);
6962 $index = decode_json
($index);
# record the size of every drive image listed in the index
6964 foreach my $info (@{$index->{files
}}) {
6965 if ($info->{filename
} =~ m/^(drive-\S+).img.fidx$/) {
6967 if ($info->{size
} =~ m/^(\d+)$/) { # untaint size
6968 $devinfo->{$devname}->{size
} = $1;
6970 die "unable to parse file size in 'index.json' - got '$info->{size}'\n";
6975 my $is_qemu_server_backup = scalar(
6976 grep { $_->{filename
} eq 'qemu-server.conf.blob' } @{$index->{files
}}
6978 if (!$is_qemu_server_backup) {
6979 die "backup does not look like a qemu-server backup (missing 'qemu-server.conf' file)\n";
6981 my $has_firewall_config = scalar(grep { $_->{filename
} eq 'fw.conf.blob' } @{$index->{files
}});
6983 $param = [$pbs_backup_name, "qemu-server.conf", $cfgfn];
6984 PVE
::Storage
::PBSPlugin
::run_raw_client_cmd
($scfg, $storeid, $cmd, $param);
6986 if ($has_firewall_config) {
6987 $param = [$pbs_backup_name, "fw.conf", $firewall_config_fn];
6988 PVE
::Storage
::PBSPlugin
::run_raw_client_cmd
($scfg, $storeid, $cmd, $param);
6990 my $pve_firewall_dir = '/etc/pve/firewall';
6991 mkdir $pve_firewall_dir; # make sure the dir exists
6992 PVE
::Tools
::file_copy
($firewall_config_fn, "${pve_firewall_dir}/$vmid.fw");
6995 my $fh = IO
::File-
>new($cfgfn, "r") ||
6996 die "unable to read qemu-server.conf - $!\n";
6998 $virtdev_hash = $parse_backup_hints->($rpcenv, $user, $storecfg, $fh, $devinfo, $options);
7000 # fixme: rate limit?
7002 # create empty/temp config
7003 PVE
::Tools
::file_set_contents
($conffile, "memory: 128\nlock: create");
7005 $restore_cleanup_oldconf->($storecfg, $vmid, $oldconf, $virtdev_hash) if $oldconf;
7008 my $map = $restore_allocate_devices->($storecfg, $virtdev_hash, $vmid);
7010 foreach my $virtdev (sort keys %$virtdev_hash) {
7011 my $d = $virtdev_hash->{$virtdev};
7012 next if $d->{is_cloudinit
}; # no need to restore cloudinit
7014 # this fails if storage is unavailable
7015 my $volid = $d->{volid
};
7016 my $path = PVE
::Storage
::path
($storecfg, $volid);
7018 # for live-restore we only want to preload the efidisk and TPM state
7019 next if $options->{live
} && $virtdev ne 'efidisk0' && $virtdev ne 'tpmstate0';
7022 if (defined(my $ns = $scfg->{namespace
})) {
7023 @ns_arg = ('--ns', $ns);
7026 my $pbs_restore_cmd = [
7027 '/usr/bin/pbs-restore',
7028 '--repository', $repo,
7031 "$d->{devname}.img.fidx",
7036 push @$pbs_restore_cmd, '--format', $d->{format
} if $d->{format
};
# only pass a key file that actually exists
7037 push @$pbs_restore_cmd, '--keyfile', $keyfile if -e
$keyfile;
7039 if (PVE
::Storage
::volume_has_feature
($storecfg, 'sparseinit', $volid)) {
7040 push @$pbs_restore_cmd, '--skip-zero';
7043 my $dbg_cmdstring = PVE
::Tools
::cmd2string
($pbs_restore_cmd);
7044 print "restore proxmox backup image: $dbg_cmdstring\n";
7045 run_command
($pbs_restore_cmd);
# rewind the config file: it is read a second time to build the new config
7048 $fh->seek(0, 0) || die "seek failed - $!\n";
7050 my $cookie = { netcount
=> 0 };
7051 while (defined(my $line = <$fh>)) {
7052 $new_conf_raw .= restore_update_config_line
(
7064 if ($err || !$options->{live
}) {
7065 $restore_deactivate_volumes->($storecfg, $virtdev_hash);
7071 $restore_destroy_volumes->($storecfg, $virtdev_hash);
7075 if ($options->{live
}) {
7076 # keep lock during live-restore
7077 $new_conf_raw .= "\nlock: create";
7080 my $new_conf = $restore_merge_config->($conffile, $new_conf_raw, $options->{override_conf
});
7081 PVE
::QemuConfig-
>write_config($vmid, $new_conf);
7083 eval { rescan
($vmid, 1); };
7086 PVE
::AccessControl
::add_vm_to_pool
($vmid, $options->{pool
}) if $options->{pool
};
7088 if ($options->{live
}) {
7094 local $SIG{PIPE
} = sub { die "got signal ($!) - abort\n"; };
7096 my $conf = PVE
::QemuConfig-
>load_config($vmid);
7097 die "cannot do live-restore for template\n" if PVE
::QemuConfig-
>is_template($conf);
7099 # these special drives are already restored before start
7100 delete $devinfo->{'drive-efidisk0'};
7101 delete $devinfo->{'drive-tpmstate0-backup'};
7105 keyfile
=> $keyfile,
7106 snapshot
=> $pbs_backup_name,
7107 namespace
=> $namespace,
7109 pbs_live_restore
($vmid, $conf, $storecfg, $devinfo, $pbs_opts);
# the 'create' lock was kept for the duration of the live-restore
7111 PVE
::QemuConfig-
>remove_lock($vmid, "create");
# Start a VM directly from a Proxmox Backup Server snapshot and copy the disk
# contents to the target volumes while it runs.
#
# $vmid:           VM ID
# $conf:           VM configuration
# $storecfg:       storage configuration
# $restored_disks: hash keyed by "drive-<name>"; one stream job is started per key
# $opts:           the keys read here are `repo`, `snapshot`, `keyfile` and
#                  `namespace`
#
# On failure a warning is printed, the VM is stopped via _do_vm_stop() and the
# sub dies with "live-restore failed".
# NOTE(review): the eval that separates the success path from the error path
# is not visible in this extract.
7115 sub pbs_live_restore
{
7116 my ($vmid, $conf, $storecfg, $restored_disks, $opts) = @_;
7118 print "starting VM for live-restore\n";
7119 print "repository: '$opts->{repo}', snapshot: '$opts->{snapshot}'\n";
# describe the PBS backing image for every drive that is to be restored
7121 my $pbs_backing = {};
7122 for my $ds (keys %$restored_disks) {
# NOTE(review): the match result is not checked in the visible lines
7123 $ds =~ m/^drive-(.*)$/;
7125 $pbs_backing->{$confname} = {
7126 repository
=> $opts->{repo
},
7127 snapshot
=> $opts->{snapshot
},
7128 archive
=> "$ds.img.fidx",
7130 $pbs_backing->{$confname}->{keyfile
} = $opts->{keyfile
} if -e
$opts->{keyfile
};
7131 $pbs_backing->{$confname}->{namespace
} = $opts->{namespace
} if defined($opts->{namespace
});
7133 my $drive = parse_drive
($confname, $conf->{$confname});
7134 print "restoring '$ds' to '$drive->{file}'\n";
7137 my $drives_streamed = 0;
7139 # make sure HA doesn't interrupt our restore by stopping the VM
7140 if (PVE
::HA
::Config
::vm_is_ha_managed
($vmid)) {
7141 run_command
(['ha-manager', 'set', "vm:$vmid", '--state', 'started']);
7144 # start VM with backing chain pointing to PBS backup, environment vars for PBS driver
7145 # in QEMU (PBS_PASSWORD and PBS_FINGERPRINT) are already set by our caller
7146 vm_start_nolock
($storecfg, $vmid, $conf, {paused
=> 1, 'pbs-backing' => $pbs_backing}, {});
7148 my $qmeventd_fd = register_qmeventd_handle
($vmid);
7150 # begin streaming, i.e. data copy from PBS to target disk for every vol,
7151 # this will effectively collapse the backing image chain consisting of
7152 # [target <- alloc-track -> PBS snapshot] to just [target] (alloc-track
7153 # removes itself once all backing images vanish with 'auto-remove=on')
7155 for my $ds (sort keys %$restored_disks) {
7156 my $job_id = "restore-$ds";
7157 mon_cmd
($vmid, 'block-stream',
7158 'job-id' => $job_id,
7161 $jobs->{$job_id} = {};
# the VM was started paused; resume it, then wait for the stream jobs
7164 mon_cmd
($vmid, 'cont');
7165 qemu_drive_mirror_monitor
($vmid, undef, $jobs, 'auto', 0, 'stream');
7167 print "restore-drive jobs finished successfully, removing all tracking block devices"
7168 ." to disconnect from Proxmox Backup Server\n";
7170 for my $ds (sort keys %$restored_disks) {
7171 mon_cmd
($vmid, 'blockdev-del', 'node-name' => "$ds-pbs");
7174 close($qmeventd_fd);
7180 warn "An error occurred during live-restore: $err\n";
# positional args: skiplock=1, nocheck=1, timeout=10, shutdown=0, force=1
7181 _do_vm_stop
($storecfg, $vmid, 1, 1, 10, 0, 1);
7182 die "live-restore failed\n";
7186 sub restore_vma_archive
{
7187 my ($archive, $vmid, $user, $opts, $comp) = @_;
7189 my $readfrom = $archive;
7191 my $cfg = PVE
::Storage
::config
();
7193 my $bwlimit = $opts->{bwlimit
};
7195 my $dbg_cmdstring = '';
7196 my $add_pipe = sub {
7198 push @$commands, $cmd;
7199 $dbg_cmdstring .= ' | ' if length($dbg_cmdstring);
7200 $dbg_cmdstring .= PVE
::Tools
::cmd2string
($cmd);
7205 if ($archive eq '-') {
7208 # If we use a backup from a PVE defined storage we also consider that
7209 # storage's rate limit:
7210 my (undef, $volid) = PVE
::Storage
::path_to_volume_id
($cfg, $archive);
7211 if (defined($volid)) {
7212 my ($sid, undef) = PVE
::Storage
::parse_volume_id
($volid);
7213 my $readlimit = PVE
::Storage
::get_bandwidth_limit
('restore', [$sid], $bwlimit);
7215 print STDERR
"applying read rate limit: $readlimit\n";
7216 my $cstream = ['cstream', '-t', $readlimit*1024, '--', $readfrom];
7217 $add_pipe->($cstream);
7223 my $info = PVE
::Storage
::decompressor_info
('vma', $comp);
7224 my $cmd = $info->{decompressor
};
7225 push @$cmd, $readfrom;
7229 my $tmpdir = "/var/tmp/vzdumptmp$$";
7232 # disable interrupts (always do cleanups)
7236 local $SIG{HUP
} = sub { warn "got interrupt - ignored\n"; };
7238 my $mapfifo = "/var/tmp/vzdumptmp$$.fifo";
7239 POSIX
::mkfifo
($mapfifo, 0600);
7241 my $openfifo = sub { open($fifofh, '>', $mapfifo) or die $! };
7243 $add_pipe->(['vma', 'extract', '-v', '-r', $mapfifo, $readfrom, $tmpdir]);
7248 my $devinfo = {}; # info about drives included in backup
7249 my $virtdev_hash = {}; # info about allocated drives
7251 my $rpcenv = PVE
::RPCEnvironment
::get
();
7253 my $conffile = PVE
::QemuConfig-
>config_file($vmid);
7255 # Note: $oldconf is undef if VM does not exist
7256 my $cfs_path = PVE
::QemuConfig-
>cfs_config_path($vmid);
7257 my $oldconf = PVE
::Cluster
::cfs_read_file
($cfs_path);
7258 my $new_conf_raw = '';
7262 my $print_devmap = sub {
7263 my $cfgfn = "$tmpdir/qemu-server.conf";
7265 # we can read the config - that is already extracted
7266 my $fh = IO
::File-
>new($cfgfn, "r") ||
7267 die "unable to read qemu-server.conf - $!\n";
7269 my $fwcfgfn = "$tmpdir/qemu-server.fw";
7271 my $pve_firewall_dir = '/etc/pve/firewall';
7272 mkdir $pve_firewall_dir; # make sure the dir exists
7273 PVE
::Tools
::file_copy
($fwcfgfn, "${pve_firewall_dir}/$vmid.fw");
7276 $virtdev_hash = $parse_backup_hints->($rpcenv, $user, $cfg, $fh, $devinfo, $opts);
7278 foreach my $info (values %{$virtdev_hash}) {
7279 my $storeid = $info->{storeid
};
7280 next if defined($storage_limits{$storeid});
7282 my $limit = PVE
::Storage
::get_bandwidth_limit
('restore', [$storeid], $bwlimit) // 0;
7283 print STDERR
"rate limit for storage $storeid: $limit KiB/s\n" if $limit;
7284 $storage_limits{$storeid} = $limit * 1024;
7287 foreach my $devname (keys %$devinfo) {
7288 die "found no device mapping information for device '$devname'\n"
7289 if !$devinfo->{$devname}->{virtdev
};
7292 # create empty/temp config
7294 PVE
::Tools
::file_set_contents
($conffile, "memory: 128\n");
7295 $restore_cleanup_oldconf->($cfg, $vmid, $oldconf, $virtdev_hash);
7299 my $map = $restore_allocate_devices->($cfg, $virtdev_hash, $vmid);
7301 # print restore information to $fifofh
7302 foreach my $virtdev (sort keys %$virtdev_hash) {
7303 my $d = $virtdev_hash->{$virtdev};
7304 next if $d->{is_cloudinit
}; # no need to restore cloudinit
7306 my $storeid = $d->{storeid
};
7307 my $volid = $d->{volid
};
7310 if (my $limit = $storage_limits{$storeid}) {
7311 $map_opts .= "throttling.bps=$limit:throttling.group=$storeid:";
7314 my $write_zeros = 1;
7315 if (PVE
::Storage
::volume_has_feature
($cfg, 'sparseinit', $volid)) {
7319 my $path = PVE
::Storage
::path
($cfg, $volid);
7321 print $fifofh "${map_opts}format=$d->{format}:${write_zeros}:$d->{devname}=$path\n";
7323 print "map '$d->{devname}' to '$path' (write zeros = ${write_zeros})\n";
7326 $fh->seek(0, 0) || die "seek failed - $!\n";
7328 my $cookie = { netcount
=> 0 };
7329 while (defined(my $line = <$fh>)) {
7330 $new_conf_raw .= restore_update_config_line
(
7347 local $SIG{PIPE
} = sub { die "interrupted by signal\n"; };
7348 local $SIG{ALRM
} = sub { die "got timeout\n"; };
7350 $oldtimeout = alarm($timeout);
7357 if ($line =~ m/^DEV:\sdev_id=(\d+)\ssize:\s(\d+)\sdevname:\s(\S+)$/) {
7358 my ($dev_id, $size, $devname) = ($1, $2, $3);
7359 $devinfo->{$devname} = { size
=> $size, dev_id
=> $dev_id };
7360 } elsif ($line =~ m/^CTIME: /) {
7361 # we correctly received the vma config, so we can disable
7362 # the timeout now for disk allocation (set to 10 minutes, so
7363 # that we always timeout if something goes wrong)
7366 print $fifofh "done\n";
7367 my $tmp = $oldtimeout || 0;
7368 $oldtimeout = undef;
7375 print "restore vma archive: $dbg_cmdstring\n";
7376 run_command
($commands, input
=> $input, outfunc
=> $parser, afterfork
=> $openfifo);
7380 alarm($oldtimeout) if $oldtimeout;
7382 $restore_deactivate_volumes->($cfg, $virtdev_hash);
7384 close($fifofh) if $fifofh;
7389 $restore_destroy_volumes->($cfg, $virtdev_hash);
7393 my $new_conf = $restore_merge_config->($conffile, $new_conf_raw, $opts->{override_conf
});
7394 PVE
::QemuConfig-
>write_config($vmid, $new_conf);
7396 eval { rescan
($vmid, 1); };
7399 PVE
::AccessControl
::add_vm_to_pool
($vmid, $opts->{pool
}) if $opts->{pool
};
7402 sub restore_tar_archive
{
7403 my ($archive, $vmid, $user, $opts) = @_;
7405 if (scalar(keys $opts->{override_conf
}->%*) > 0) {
7406 my $keystring = join(' ', keys $opts->{override_conf
}->%*);
7407 die "cannot pass along options ($keystring) when restoring from tar archive\n";
7410 if ($archive ne '-') {
7411 my $firstfile = tar_archive_read_firstfile
($archive);
7412 die "ERROR: file '$archive' does not look like a QemuServer vzdump backup\n"
7413 if $firstfile ne 'qemu-server.conf';
7416 my $storecfg = PVE
::Storage
::config
();
7418 # avoid zombie disks when restoring over an existing VM -> cleanup first
7419 # pass keep_empty_config=1 to keep the config (thus VMID) reserved for us
7420 # skiplock=1 because qmrestore has set the 'create' lock itself already
7421 my $vmcfgfn = PVE
::QemuConfig-
>config_file($vmid);
7422 destroy_vm
($storecfg, $vmid, 1, { lock => 'restore' }) if -f
$vmcfgfn;
7424 my $tocmd = "/usr/lib/qemu-server/qmextract";
7426 $tocmd .= " --storage " . PVE
::Tools
::shellquote
($opts->{storage
}) if $opts->{storage
};
7427 $tocmd .= " --pool " . PVE
::Tools
::shellquote
($opts->{pool
}) if $opts->{pool
};
7428 $tocmd .= ' --prealloc' if $opts->{prealloc
};
7429 $tocmd .= ' --info' if $opts->{info
};
7431 # tar option "xf" does not autodetect compression when read from STDIN,
7432 # so we pipe to zcat
7433 my $cmd = "zcat -f|tar xf " . PVE
::Tools
::shellquote
($archive) . " " .
7434 PVE
::Tools
::shellquote
("--to-command=$tocmd");
7436 my $tmpdir = "/var/tmp/vzdumptmp$$";
7439 local $ENV{VZDUMP_TMPDIR
} = $tmpdir;
7440 local $ENV{VZDUMP_VMID
} = $vmid;
7441 local $ENV{VZDUMP_USER
} = $user;
7443 my $conffile = PVE
::QemuConfig-
>config_file($vmid);
7444 my $new_conf_raw = '';
7446 # disable interrupts (always do cleanups)
7450 local $SIG{HUP
} = sub { print STDERR
"got interrupt - ignored\n"; };
7458 local $SIG{PIPE
} = sub { die "interrupted by signal\n"; };
7460 if ($archive eq '-') {
7461 print "extracting archive from STDIN\n";
7462 run_command
($cmd, input
=> "<&STDIN");
7464 print "extracting archive '$archive'\n";
7468 return if $opts->{info
};
7472 my $statfile = "$tmpdir/qmrestore.stat";
7473 if (my $fd = IO
::File-
>new($statfile, "r")) {
7474 while (defined (my $line = <$fd>)) {
7475 if ($line =~ m/vzdump:([^\s:]*):(\S+)$/) {
7476 $map->{$1} = $2 if $1;
7478 print STDERR
"unable to parse line in statfile - $line\n";
7484 my $confsrc = "$tmpdir/qemu-server.conf";
7486 my $srcfd = IO
::File-
>new($confsrc, "r") || die "unable to open file '$confsrc'\n";
7488 my $cookie = { netcount
=> 0 };
7489 while (defined (my $line = <$srcfd>)) {
7490 $new_conf_raw .= restore_update_config_line
(
7501 tar_restore_cleanup
($storecfg, "$tmpdir/qmrestore.stat") if !$opts->{info
};
7507 PVE
::Tools
::file_set_contents
($conffile, $new_conf_raw);
7509 PVE
::Cluster
::cfs_update
(); # make sure we read new file
7511 eval { rescan
($vmid, 1); };
7515 sub foreach_storage_used_by_vm
{
7516 my ($conf, $func) = @_;
7520 PVE
::QemuConfig-
>foreach_volume($conf, sub {
7521 my ($ds, $drive) = @_;
7522 return if drive_is_cdrom
($drive);
7524 my $volid = $drive->{file
};
7526 my ($sid, $volname) = PVE
::Storage
::parse_volume_id
($volid, 1);
7527 $sidhash->{$sid} = $sid if $sid;
7530 foreach my $sid (sort keys %$sidhash) {
7535 my $qemu_snap_storage = {
7538 sub do_snapshots_with_qemu
{
7539 my ($storecfg, $volid, $deviceid) = @_;
7541 return if $deviceid =~ m/tpmstate0/;
7543 my $storage_name = PVE
::Storage
::parse_volume_id
($volid);
7544 my $scfg = $storecfg->{ids
}->{$storage_name};
7545 die "could not find storage '$storage_name'\n" if !defined($scfg);
7547 if ($qemu_snap_storage->{$scfg->{type
}} && !$scfg->{krbd
}){
7551 if ($volid =~ m/\.(qcow2|qed)$/){
7558 sub qga_check_running
{
7559 my ($vmid, $nowarn) = @_;
7561 eval { mon_cmd
($vmid, "guest-ping", timeout
=> 3); };
7563 warn "QEMU Guest Agent is not running - $@" if !$nowarn;
7569 sub template_create
{
7570 my ($vmid, $conf, $disk) = @_;
7572 my $storecfg = PVE
::Storage
::config
();
7574 PVE
::QemuConfig-
>foreach_volume($conf, sub {
7575 my ($ds, $drive) = @_;
7577 return if drive_is_cdrom
($drive);
7578 return if $disk && $ds ne $disk;
7580 my $volid = $drive->{file
};
7581 return if !PVE
::Storage
::volume_has_feature
($storecfg, 'template', $volid);
7583 my $voliddst = PVE
::Storage
::vdisk_create_base
($storecfg, $volid);
7584 $drive->{file
} = $voliddst;
7585 $conf->{$ds} = print_drive
($drive);
7586 PVE
::QemuConfig-
>write_config($vmid, $conf);
7590 sub convert_iscsi_path
{
7593 if ($path =~ m
|^iscsi
://([^/]+)/([^/]+)/(.+)$|) {
7598 my $initiator_name = get_initiator_name
();
7600 return "file.driver=iscsi,file.transport=tcp,file.initiator-name=$initiator_name,".
7601 "file.portal=$portal,file.target=$target,file.lun=$lun,driver=raw";
7604 die "cannot convert iscsi path '$path', unkown format\n";
7607 sub qemu_img_convert
{
7608 my ($src_volid, $dst_volid, $size, $snapname, $is_zero_initialized) = @_;
7610 my $storecfg = PVE
::Storage
::config
();
7611 my ($src_storeid, $src_volname) = PVE
::Storage
::parse_volume_id
($src_volid, 1);
7612 my ($dst_storeid, $dst_volname) = PVE
::Storage
::parse_volume_id
($dst_volid, 1);
7614 die "destination '$dst_volid' is not a valid volid form qemu-img convert\n" if !$dst_storeid;
7618 my $src_is_iscsi = 0;
7622 PVE
::Storage
::activate_volumes
($storecfg, [$src_volid], $snapname);
7623 my $src_scfg = PVE
::Storage
::storage_config
($storecfg, $src_storeid);
7624 $src_format = qemu_img_format
($src_scfg, $src_volname);
7625 $src_path = PVE
::Storage
::path
($storecfg, $src_volid, $snapname);
7626 $src_is_iscsi = ($src_path =~ m
|^iscsi
://|);
7627 $cachemode = 'none' if $src_scfg->{type
} eq 'zfspool';
7628 } elsif (-f
$src_volid || -b
$src_volid) {
7629 $src_path = $src_volid;
7630 if ($src_path =~ m/\.($PVE::QemuServer::Drive::QEMU_FORMAT_RE)$/) {
7635 die "source '$src_volid' is not a valid volid nor path for qemu-img convert\n" if !$src_path;
7637 my $dst_scfg = PVE
::Storage
::storage_config
($storecfg, $dst_storeid);
7638 my $dst_format = qemu_img_format
($dst_scfg, $dst_volname);
7639 my $dst_path = PVE
::Storage
::path
($storecfg, $dst_volid);
7640 my $dst_is_iscsi = ($dst_path =~ m
|^iscsi
://|);
7643 push @$cmd, '/usr/bin/qemu-img', 'convert', '-p', '-n';
7644 push @$cmd, '-l', "snapshot.name=$snapname"
7645 if $snapname && $src_format && $src_format eq "qcow2";
7646 push @$cmd, '-t', 'none' if $dst_scfg->{type
} eq 'zfspool';
7647 push @$cmd, '-T', $cachemode if defined($cachemode);
7649 if ($src_is_iscsi) {
7650 push @$cmd, '--image-opts';
7651 $src_path = convert_iscsi_path
($src_path);
7652 } elsif ($src_format) {
7653 push @$cmd, '-f', $src_format;
7656 if ($dst_is_iscsi) {
7657 push @$cmd, '--target-image-opts';
7658 $dst_path = convert_iscsi_path
($dst_path);
7660 push @$cmd, '-O', $dst_format;
7663 push @$cmd, $src_path;
7665 if (!$dst_is_iscsi && $is_zero_initialized) {
7666 push @$cmd, "zeroinit:$dst_path";
7668 push @$cmd, $dst_path;
7673 if($line =~ m/\((\S+)\/100\
%\)/){
7675 my $transferred = int($size * $percent / 100);
7676 my $total_h = render_bytes
($size, 1);
7677 my $transferred_h = render_bytes
($transferred, 1);
7679 print "transferred $transferred_h of $total_h ($percent%)\n";
7684 eval { run_command
($cmd, timeout
=> undef, outfunc
=> $parser); };
7686 die "copy failed: $err" if $err;
7689 sub qemu_img_format
{
7690 my ($scfg, $volname) = @_;
7692 if ($scfg->{path
} && $volname =~ m/\.($PVE::QemuServer::Drive::QEMU_FORMAT_RE)$/) {
7699 sub qemu_drive_mirror
{
7700 my ($vmid, $drive, $dst_volid, $vmiddst, $is_zero_initialized, $jobs, $completion, $qga, $bwlimit, $src_bitmap) = @_;
7702 $jobs = {} if !$jobs;
7706 $jobs->{"drive-$drive"} = {};
7708 if ($dst_volid =~ /^nbd:/) {
7709 $qemu_target = $dst_volid;
7712 my $storecfg = PVE
::Storage
::config
();
7713 my ($dst_storeid, $dst_volname) = PVE
::Storage
::parse_volume_id
($dst_volid);
7715 my $dst_scfg = PVE
::Storage
::storage_config
($storecfg, $dst_storeid);
7717 $format = qemu_img_format
($dst_scfg, $dst_volname);
7719 my $dst_path = PVE
::Storage
::path
($storecfg, $dst_volid);
7721 $qemu_target = $is_zero_initialized ?
"zeroinit:$dst_path" : $dst_path;
7724 my $opts = { timeout
=> 10, device
=> "drive-$drive", mode
=> "existing", sync
=> "full", target
=> $qemu_target };
7725 $opts->{format
} = $format if $format;
7727 if (defined($src_bitmap)) {
7728 $opts->{sync
} = 'incremental';
7729 $opts->{bitmap
} = $src_bitmap;
7730 print "drive mirror re-using dirty bitmap '$src_bitmap'\n";
7733 if (defined($bwlimit)) {
7734 $opts->{speed
} = $bwlimit * 1024;
7735 print "drive mirror is starting for drive-$drive with bandwidth limit: ${bwlimit} KB/s\n";
7737 print "drive mirror is starting for drive-$drive\n";
7740 # if a job already runs for this device we get an error, catch it for cleanup
7741 eval { mon_cmd
($vmid, "drive-mirror", %$opts); };
7743 eval { PVE
::QemuServer
::qemu_blockjobs_cancel
($vmid, $jobs) };
7745 die "mirroring error: $err\n";
7748 qemu_drive_mirror_monitor
($vmid, $vmiddst, $jobs, $completion, $qga);
7751 # $completion can be either
7752 # 'complete': wait until all jobs are ready, block-job-complete them (default)
7753 # 'cancel': wait until all jobs are ready, block-job-cancel them
7754 # 'skip': wait until all jobs are ready, return with block jobs in ready state
7755 # 'auto': wait until all jobs disappear, only use for jobs which complete automatically
7756 sub qemu_drive_mirror_monitor
{
7757 my ($vmid, $vmiddst, $jobs, $completion, $qga, $op) = @_;
7759 $completion //= 'complete';
7763 my $err_complete = 0;
7765 my $starttime = time ();
7767 die "block job ('$op') timed out\n" if $err_complete > 300;
7769 my $stats = mon_cmd
($vmid, "query-block-jobs");
7772 my $running_jobs = {};
7773 for my $stat (@$stats) {
7774 next if $stat->{type
} ne $op;
7775 $running_jobs->{$stat->{device
}} = $stat;
7778 my $readycounter = 0;
7780 for my $job_id (sort keys %$jobs) {
7781 my $job = $running_jobs->{$job_id};
7783 my $vanished = !defined($job);
7784 my $complete = defined($jobs->{$job_id}->{complete
}) && $vanished;
7785 if($complete || ($vanished && $completion eq 'auto')) {
7786 print "$job_id: $op-job finished\n";
7787 delete $jobs->{$job_id};
7791 die "$job_id: '$op' has been cancelled\n" if !defined($job);
7793 my $busy = $job->{busy
};
7794 my $ready = $job->{ready
};
7795 if (my $total = $job->{len
}) {
7796 my $transferred = $job->{offset
} || 0;
7797 my $remaining = $total - $transferred;
7798 my $percent = sprintf "%.2f", ($transferred * 100 / $total);
7800 my $duration = $ctime - $starttime;
7801 my $total_h = render_bytes
($total, 1);
7802 my $transferred_h = render_bytes
($transferred, 1);
7804 my $status = sprintf(
7805 "transferred $transferred_h of $total_h ($percent%%) in %s",
7806 render_duration
($duration),
7811 $status .= ", still busy"; # shouldn't even happen? but mirror is weird
7813 $status .= ", ready";
7816 print "$job_id: $status\n" if !$jobs->{$job_id}->{ready
};
7817 $jobs->{$job_id}->{ready
} = $ready;
7820 $readycounter++ if $job->{ready
};
7823 last if scalar(keys %$jobs) == 0;
7825 if ($readycounter == scalar(keys %$jobs)) {
7826 print "all '$op' jobs are ready\n";
7828 # do the complete later (or has already been done)
7829 last if $completion eq 'skip' || $completion eq 'auto';
7831 if ($vmiddst && $vmiddst != $vmid) {
7832 my $agent_running = $qga && qga_check_running
($vmid);
7833 if ($agent_running) {
7834 print "freeze filesystem\n";
7835 eval { mon_cmd
($vmid, "guest-fsfreeze-freeze"); };
7838 print "suspend vm\n";
7839 eval { PVE
::QemuServer
::vm_suspend
($vmid, 1); };
7843 # if we clone a disk for a new target vm, we don't switch the disk
7844 PVE
::QemuServer
::qemu_blockjobs_cancel
($vmid, $jobs);
7846 if ($agent_running) {
7847 print "unfreeze filesystem\n";
7848 eval { mon_cmd
($vmid, "guest-fsfreeze-thaw"); };
7851 print "resume vm\n";
7852 eval { PVE
::QemuServer
::vm_resume
($vmid, 1, 1); };
7859 for my $job_id (sort keys %$jobs) {
7860 # try to switch the disk if source and destination are on the same guest
7861 print "$job_id: Completing block job_id...\n";
7864 if ($completion eq 'complete') {
7865 $op = 'block-job-complete';
7866 } elsif ($completion eq 'cancel') {
7867 $op = 'block-job-cancel';
7869 die "invalid completion value: $completion\n";
7871 eval { mon_cmd
($vmid, $op, device
=> $job_id) };
7872 if ($@ =~ m/cannot be completed/) {
7873 print "$job_id: block job cannot be completed, trying again.\n";
7876 print "$job_id: Completed successfully.\n";
7877 $jobs->{$job_id}->{complete
} = 1;
7888 eval { PVE
::QemuServer
::qemu_blockjobs_cancel
($vmid, $jobs) };
7889 die "block job ($op) error: $err";
7893 sub qemu_blockjobs_cancel
{
7894 my ($vmid, $jobs) = @_;
7896 foreach my $job (keys %$jobs) {
7897 print "$job: Cancelling block job\n";
7898 eval { mon_cmd
($vmid, "block-job-cancel", device
=> $job); };
7899 $jobs->{$job}->{cancel
} = 1;
7903 my $stats = mon_cmd
($vmid, "query-block-jobs");
7905 my $running_jobs = {};
7906 foreach my $stat (@$stats) {
7907 $running_jobs->{$stat->{device
}} = $stat;
7910 foreach my $job (keys %$jobs) {
7912 if (defined($jobs->{$job}->{cancel
}) && !defined($running_jobs->{$job})) {
7913 print "$job: Done.\n";
7914 delete $jobs->{$job};
7918 last if scalar(keys %$jobs) == 0;
7925 my ($storecfg, $source, $dest, $full, $newvollist, $jobs, $completion, $qga, $bwlimit) = @_;
7927 my ($vmid, $running) = $source->@{qw(vmid running)};
7928 my ($src_drivename, $drive, $snapname) = $source->@{qw(drivename drive snapname)};
7930 my ($newvmid, $dst_drivename, $efisize) = $dest->@{qw(vmid drivename efisize)};
7931 my ($storage, $format) = $dest->@{qw(storage format)};
7933 my $use_drive_mirror = $full && $running && $src_drivename && !$snapname;
7935 if ($src_drivename && $dst_drivename && $src_drivename ne $dst_drivename) {
7936 die "cloning from/to EFI disk requires EFI disk\n"
7937 if $src_drivename eq 'efidisk0' || $dst_drivename eq 'efidisk0';
7938 die "cloning from/to TPM state requires TPM state\n"
7939 if $src_drivename eq 'tpmstate0' || $dst_drivename eq 'tpmstate0';
7941 # This would lead to two device nodes in QEMU pointing to the same backing image!
7942 die "cannot change drive name when cloning disk from/to the same VM\n"
7943 if $use_drive_mirror && $vmid == $newvmid;
7946 die "cannot move TPM state while VM is running\n"
7947 if $use_drive_mirror && $src_drivename eq 'tpmstate0';
7951 print "create " . ($full ?
'full' : 'linked') . " clone of drive ";
7952 print "$src_drivename " if $src_drivename;
7953 print "($drive->{file})\n";
7956 $newvolid = PVE
::Storage
::vdisk_clone
($storecfg, $drive->{file
}, $newvmid, $snapname);
7957 push @$newvollist, $newvolid;
7960 my ($storeid, $volname) = PVE
::Storage
::parse_volume_id
($drive->{file
});
7961 $storeid = $storage if $storage;
7963 my $dst_format = resolve_dst_disk_format
($storecfg, $storeid, $volname, $format);
7967 if (drive_is_cloudinit
($drive)) {
7968 $name = "vm-$newvmid-cloudinit";
7969 my $scfg = PVE
::Storage
::storage_config
($storecfg, $storeid);
7970 if ($scfg->{path
}) {
7971 $name .= ".$dst_format";
7974 $size = PVE
::QemuServer
::Cloudinit
::CLOUDINIT_DISK_SIZE
;
7975 } elsif ($dst_drivename eq 'efidisk0') {
7976 $size = $efisize or die "internal error - need to specify EFI disk size\n";
7977 } elsif ($dst_drivename eq 'tpmstate0') {
7978 $dst_format = 'raw';
7979 $size = PVE
::QemuServer
::Drive
::TPMSTATE_DISK_SIZE
;
7981 ($size) = PVE
::Storage
::volume_size_info
($storecfg, $drive->{file
}, 10);
7983 $newvolid = PVE
::Storage
::vdisk_alloc
(
7984 $storecfg, $storeid, $newvmid, $dst_format, $name, ($size/1024)
7986 push @$newvollist, $newvolid;
7988 PVE
::Storage
::activate_volumes
($storecfg, [$newvolid]);
7990 if (drive_is_cloudinit
($drive)) {
7991 # when cloning multiple disks (e.g. during clone_vm) it might be the last disk
7992 # if this is the case, we have to complete any block-jobs still there from
7993 # previous drive-mirrors
7994 if (($completion eq 'complete') && (scalar(keys %$jobs) > 0)) {
7995 qemu_drive_mirror_monitor
($vmid, $newvmid, $jobs, $completion, $qga);
8000 my $sparseinit = PVE
::Storage
::volume_has_feature
($storecfg, 'sparseinit', $newvolid);
8001 if ($use_drive_mirror) {
8002 qemu_drive_mirror
($vmid, $src_drivename, $newvolid, $newvmid, $sparseinit, $jobs,
8003 $completion, $qga, $bwlimit);
8005 # TODO: handle bwlimits
8006 if ($dst_drivename eq 'efidisk0') {
8007 # the relevant data on the efidisk may be smaller than the source
8008 # e.g. on RBD/ZFS, so we use dd to copy only the amount
8009 # that is given by the OVMF_VARS.fd
8010 my $src_path = PVE
::Storage
::path
($storecfg, $drive->{file
}, $snapname);
8011 my $dst_path = PVE
::Storage
::path
($storecfg, $newvolid);
8013 my $src_format = (PVE
::Storage
::parse_volname
($storecfg, $drive->{file
}))[6];
8015 # better for Ceph if block size is not too small, see bug #3324
8018 my $cmd = ['qemu-img', 'dd', '-n', '-O', $dst_format];
8020 if ($src_format eq 'qcow2' && $snapname) {
8021 die "cannot clone qcow2 EFI disk snapshot - requires QEMU >= 6.2\n"
8022 if !min_version
(kvm_user_version
(), 6, 2);
8023 push $cmd->@*, '-l', $snapname;
8025 push $cmd->@*, "bs=$bs", "osize=$size", "if=$src_path", "of=$dst_path";
8028 qemu_img_convert
($drive->{file
}, $newvolid, $size, $snapname, $sparseinit);
8034 my ($size) = eval { PVE
::Storage
::volume_size_info
($storecfg, $newvolid, 10) };
8036 my $disk = dclone
($drive);
8037 delete $disk->{format
};
8038 $disk->{file
} = $newvolid;
8039 $disk->{size
} = $size if defined($size);
8044 sub get_running_qemu_version
{
8046 my $res = mon_cmd
($vmid, "query-version");
8047 return "$res->{qemu}->{major}.$res->{qemu}->{minor}";
8050 sub qemu_use_old_bios_files
{
8051 my ($machine_type) = @_;
8053 return if !$machine_type;
8055 my $use_old_bios_files = undef;
8057 if ($machine_type =~ m/^(\S+)\.pxe$/) {
8059 $use_old_bios_files = 1;
8061 my $version = extract_version
($machine_type, kvm_user_version
());
8062 # Note: kvm version < 2.4 use non-efi pxe files, and have problems when we
8063 # load new efi bios files on migration. So this hack is required to allow
8064 # live migration from qemu-2.2 to qemu-2.4, which is sometimes used when
8065 # upgrading from proxmox-ve-3.X to proxmox-ve 4.0
8066 $use_old_bios_files = !min_version
($version, 2, 4);
8069 return ($use_old_bios_files, $machine_type);
8072 sub get_efivars_size
{
8073 my ($conf, $efidisk) = @_;
8075 my $arch = get_vm_arch
($conf);
8076 $efidisk //= $conf->{efidisk0
} ? parse_drive
('efidisk0', $conf->{efidisk0
}) : undef;
8077 my $smm = PVE
::QemuServer
::Machine
::machine_type_is_q35
($conf);
8078 my (undef, $ovmf_vars) = get_ovmf_files
($arch, $efidisk, $smm);
8079 die "uefi vars image '$ovmf_vars' not found\n" if ! -f
$ovmf_vars;
8080 return -s
$ovmf_vars;
8083 sub update_efidisk_size
{
8086 return if !defined($conf->{efidisk0
});
8088 my $disk = PVE
::QemuServer
::parse_drive
('efidisk0', $conf->{efidisk0
});
8089 $disk->{size
} = get_efivars_size
($conf);
8090 $conf->{efidisk0
} = print_drive
($disk);
8095 sub update_tpmstate_size
{
8098 my $disk = PVE
::QemuServer
::parse_drive
('tpmstate0', $conf->{tpmstate0
});
8099 $disk->{size
} = PVE
::QemuServer
::Drive
::TPMSTATE_DISK_SIZE
;
8100 $conf->{tpmstate0
} = print_drive
($disk);
8103 sub create_efidisk
($$$$$$$) {
8104 my ($storecfg, $storeid, $vmid, $fmt, $arch, $efidisk, $smm) = @_;
8106 my (undef, $ovmf_vars) = get_ovmf_files
($arch, $efidisk, $smm);
8107 die "EFI vars default image not found\n" if ! -f
$ovmf_vars;
8109 my $vars_size_b = -s
$ovmf_vars;
8110 my $vars_size = PVE
::Tools
::convert_size
($vars_size_b, 'b' => 'kb');
8111 my $volid = PVE
::Storage
::vdisk_alloc
($storecfg, $storeid, $vmid, $fmt, undef, $vars_size);
8112 PVE
::Storage
::activate_volumes
($storecfg, [$volid]);
8114 qemu_img_convert
($ovmf_vars, $volid, $vars_size_b, undef, 0);
8115 my ($size) = PVE
::Storage
::volume_size_info
($storecfg, $volid, 3);
8117 return ($volid, $size/1024);
8120 sub vm_iothreads_list
{
8123 my $res = mon_cmd
($vmid, 'query-iothreads');
8126 foreach my $iothread (@$res) {
8127 $iothreads->{ $iothread->{id
} } = $iothread->{"thread-id"};
8134 my ($conf, $drive) = @_;
8138 if (!$conf->{scsihw
} || ($conf->{scsihw
} =~ m/^lsi/)) {
8140 } elsif ($conf->{scsihw
} && ($conf->{scsihw
} eq 'virtio-scsi-single')) {
8146 my $controller = int($drive->{index} / $maxdev);
8147 my $controller_prefix = ($conf->{scsihw
} && $conf->{scsihw
} eq 'virtio-scsi-single')
8151 return ($maxdev, $controller, $controller_prefix);
8154 sub resolve_dst_disk_format
{
8155 my ($storecfg, $storeid, $src_volname, $format) = @_;
8156 my ($defFormat, $validFormats) = PVE
::Storage
::storage_default_format
($storecfg, $storeid);
8159 # if no target format is specified, use the source disk format as hint
8161 my $scfg = PVE
::Storage
::storage_config
($storecfg, $storeid);
8162 $format = qemu_img_format
($scfg, $src_volname);
8168 # test if requested format is supported - else use default
8169 my $supported = grep { $_ eq $format } @$validFormats;
8170 $format = $defFormat if !$supported;
8174 # NOTE: if this logic changes, please update docs & possibly gui logic
8175 sub find_vmstate_storage
{
8176 my ($conf, $storecfg) = @_;
8178 # first, return storage from conf if set
8179 return $conf->{vmstatestorage
} if $conf->{vmstatestorage
};
8181 my ($target, $shared, $local);
8183 foreach_storage_used_by_vm
($conf, sub {
8185 my $scfg = PVE
::Storage
::storage_config
($storecfg, $sid);
8186 my $dst = $scfg->{shared
} ? \
$shared : \
$local;
8187 $$dst = $sid if !$$dst || $scfg->{path
}; # prefer file based storage
8190 # second, use shared storage where VM has at least one disk
8191 # third, use local storage where VM has at least one disk
8192 # fall back to local storage
8193 $target = $shared // $local // 'local';
8199 my ($uuid, $uuid_str);
8200 UUID
::generate
($uuid);
8201 UUID
::unparse
($uuid, $uuid_str);
8205 sub generate_smbios1_uuid
{
8206 return "uuid=".generate_uuid
();
8212 mon_cmd
($vmid, 'nbd-server-stop');
8215 sub create_reboot_request
{
8217 open(my $fh, '>', "/run/qemu-server/$vmid.reboot")
8218 or die "failed to create reboot trigger file: $!\n";
8222 sub clear_reboot_request
{
8224 my $path = "/run/qemu-server/$vmid.reboot";
8227 $res = unlink($path);
8228 die "could not remove reboot request for $vmid: $!"
8229 if !$res && $! != POSIX
::ENOENT
;
8234 sub bootorder_from_legacy
{
8235 my ($conf, $bootcfg) = @_;
8237 my $boot = $bootcfg->{legacy
} || $boot_fmt->{legacy
}->{default};
8238 my $bootindex_hash = {};
8240 foreach my $o (split(//, $boot)) {
8241 $bootindex_hash->{$o} = $i*100;
8247 PVE
::QemuConfig-
>foreach_volume($conf, sub {
8248 my ($ds, $drive) = @_;
8250 if (drive_is_cdrom
($drive, 1)) {
8251 if ($bootindex_hash->{d
}) {
8252 $bootorder->{$ds} = $bootindex_hash->{d
};
8253 $bootindex_hash->{d
} += 1;
8255 } elsif ($bootindex_hash->{c
}) {
8256 $bootorder->{$ds} = $bootindex_hash->{c
}
8257 if $conf->{bootdisk
} && $conf->{bootdisk
} eq $ds;
8258 $bootindex_hash->{c
} += 1;
8262 if ($bootindex_hash->{n
}) {
8263 for (my $i = 0; $i < $MAX_NETS; $i++) {
8264 my $netname = "net$i";
8265 next if !$conf->{$netname};
8266 $bootorder->{$netname} = $bootindex_hash->{n
};
8267 $bootindex_hash->{n
} += 1;
8274 # Generate default device list for 'boot: order=' property. Matches legacy
8275 # default boot order, but with explicit device names. This is important, since
8276 # the fallback for when neither 'order' nor the old format is specified relies
8277 # on 'bootorder_from_legacy' above, and it would be confusing if this diverges.
8278 sub get_default_bootdevices
{
8284 my $first = PVE
::QemuServer
::Drive
::resolve_first_disk
($conf, 0);
8285 push @ret, $first if $first;
8288 $first = PVE
::QemuServer
::Drive
::resolve_first_disk
($conf, 1);
8289 push @ret, $first if $first;
8292 for (my $i = 0; $i < $MAX_NETS; $i++) {
8293 my $netname = "net$i";
8294 next if !$conf->{$netname};
8295 push @ret, $netname;
8302 sub device_bootorder
{
8305 return bootorder_from_legacy
($conf) if !defined($conf->{boot
});
8307 my $boot = parse_property_string
($boot_fmt, $conf->{boot
});
8310 if (!defined($boot) || $boot->{legacy
}) {
8311 $bootorder = bootorder_from_legacy
($conf, $boot);
8312 } elsif ($boot->{order
}) {
8313 my $i = 100; # start at 100 to allow user to insert devices before us with -args
8314 for my $dev (PVE
::Tools
::split_list
($boot->{order
})) {
8315 $bootorder->{$dev} = $i++;
# Opens a connection to the qmeventd UNIX socket and announces VM $vmid with a
# JSON handshake of the form {"vzdump": {"vmid": "<vmid>"}}.
# Dies with "unable to connect to qmeventd socket ..." either on a connect
# error other than EINTR/EAGAIN or once the retry limit is hit.
# NOTE(review): the retry loop itself (counter handling, limit, delay) and the
# return statement are not visible here; per the comment at the end, the
# socket handle is what gets returned - confirm.
8322 sub register_qmeventd_handle
{
8326 my $peer = "/var/run/qmeventd.sock";
# Non-blocking connect attempt with a one second timeout.
8331 $fh = IO
::Socket
::UNIX-
>new(Peer
=> $peer, Blocking
=> 0, Timeout
=> 1);
# EINTR and EAGAIN are treated as transient; any other errno is fatal.
8333 if ($! != EINTR
&& $! != EAGAIN
) {
8334 die "unable to connect to qmeventd socket (vmid: $vmid) - $!\n";
# Fatal path for exhausted retries; $count is the number of attempts made.
8337 die "unable to connect to qmeventd socket (vmid: $vmid) - timeout "
8338 . "after $count retries\n";
8343 # send handshake to mark VM as backing up
# The vmid is stringified ("$vmid") before being encoded.
8344 print $fh to_json
({vzdump
=> {vmid
=> "$vmid"}});
8346 # return handle to be closed later when inhibit is no longer required
8350 # bash completion helper
# Completion callback that collects volume IDs of backup archives into $res.
#   $cmdname, $pname - not used by the statements visible here
#   $cvalue          - value being completed; checked for a leading "<prefix>:"
# NOTE(review): the declarations of $storeid and $res, the body of the prefix
# check and the return statement are not visible here.
8352 sub complete_backup_archives
{
8353 my ($cmdname, $pname, $cvalue) = @_;
8355 my $cfg = PVE
::Storage
::config
();
# A non-empty run of non-colon characters followed by ':' is captured;
# presumably it becomes $storeid to narrow the listing - confirm.
8359 if ($cvalue =~ m/^([^:]+):/) {
# List content of type 'backup'; the result is a hash whose values are array
# references of item hashes (see the nested loops below).
8363 my $data = PVE
::Storage
::template_list
($cfg, $storeid, 'backup');
8366 foreach my $id (keys %$data) {
8367 foreach my $item (@{$data->{$id}}) {
# Keep only items whose format is "vma." followed by a suffix matching
# PVE::Storage::Plugin::COMPRESSOR_RE; everything else is skipped.
8368 next if $item->{format
} !~ m/^vma\.(${\PVE::Storage::Plugin::COMPRESSOR_RE})$/;
# Items without a volid are ignored.
8369 push @$res, $item->{volid
} if defined($item->{volid
});
# Shared helper for the VMID completion subs: walks the hash returned by
# vmstatus() and optionally filters its entries by run state via $running.
# NOTE(review): how $running is obtained (presumably the closure's first
# argument) and what is collected and returned are not visible here.
8376 my $complete_vmid_full = sub {
8379 my $idlist = vmstatus
();
8383 foreach my $id (keys %$idlist) {
8384 my $d = $idlist->{$id};
# Filtering is applied only when a run-state selector is defined.
8385 if (defined($running)) {
# With a selector, entries flagged as template are always skipped.
8386 next if $d->{template
};
# True selector: keep only entries whose status is 'running'.
8387 next if $running && $d->{status
} ne 'running';
# False (but defined) selector: keep only entries that are not 'running'.
8388 next if !$running && $d->{status
} eq 'running';
# NOTE(review): the header of the sub containing the next statement is not
# visible here. The helper is called without arguments, which presumably leaves
# $running undefined and therefore disables the run-state filter - confirm.
8397 return &$complete_vmid_full();
# Completion helper: returns whatever $complete_vmid_full yields when called
# with 0. Presumably 0 becomes its run-state selector, which drops templates
# and entries whose status is 'running' - confirm.
8400 sub complete_vmid_stopped
{
# NOTE(review): '&$code(...)' is the older call syntax for a code reference.
8401 return &$complete_vmid_full(0);
# Completion helper: returns whatever $complete_vmid_full yields when called
# with 1. Presumably 1 becomes its run-state selector, which drops templates
# and entries whose status is not 'running' - confirm.
8404 sub complete_vmid_running
{
# NOTE(review): '&$code(...)' is the older call syntax for a code reference.
8405 return &$complete_vmid_full(1);
# Completion helper over the configured storages: iterates all storage IDs and
# skips those that fail storage_check_enabled() or that are not configured for
# 'images' content.
# NOTE(review): argument unpacking, the result collection and the return
# statement are not visible here.
8408 sub complete_storage
{
8410 my $cfg = PVE
::Storage
::config
();
8411 my $ids = $cfg->{ids
};
8414 foreach my $sid (keys %$ids) {
# The node argument is undef here (presumably meaning the local node) and the
# trailing 1 presumably makes the check return false instead of dying - confirm
# against PVE::Storage::storage_check_enabled.
8415 next if !PVE
::Storage
::storage_check_enabled
($cfg, $sid, undef, 1);
# Only storages that list 'images' in their content map are of interest.
8416 next if !$ids->{$sid}->{content
}->{images
};
# Completion helper like complete_storage, but the enabled-check is done
# against a target node taken from the already-entered arguments.
#   $cmd, $param, $current_value - not used by the statements visible here
#   $all_args                    - array reference; index 1 is used as target node
# NOTE(review): the result collection and the return statement are not visible here.
8423 sub complete_migration_storage
{
8424 my ($cmd, $param, $current_value, $all_args) = @_;
# One-element array slice of @$all_args; in scalar assignment it yields the
# element at index 1 (same value as $all_args->[1]).
8426 my $targetnode = @$all_args[1];
8428 my $cfg = PVE
::Storage
::config
();
8429 my $ids = $cfg->{ids
};
8432 foreach my $sid (keys %$ids) {
# Skip storages for which the check against $targetnode fails; the trailing 1
# presumably suppresses the exception - confirm.
8433 next if !PVE
::Storage
::storage_check_enabled
($cfg, $sid, $targetnode, 1);
# Only storages that list 'images' in their content map are of interest.
8434 next if !$ids->{$sid}->{content
}->{images
};
# NOTE(review): the header of the enclosing sub is not visible here.
# Ask the VM's monitor for its status. Both calls run inside a block eval, so
# a die from either one leaves $qmpstatus undefined instead of propagating.
# NOTE(review): any handling of $@ after the eval is not visible here.
8443 my $qmpstatus = eval {
8444 PVE
::QemuConfig
::assert_config_exists_on_node
($vmid);
8445 mon_cmd
($vmid, "query-status");
# True only if a status was obtained and it is exactly "paused".
8448 return $qmpstatus && $qmpstatus->{status
} eq "paused";
# Dies unless the storage holding volume $vol is configured for the content
# type that parse_volname() reports for that volume.
#   $storecfg - storage configuration, handed to the PVE::Storage helpers
#   $vol      - volume ID; split into storage ID and volume name below
# NOTE(review): the return value on success is not visible here.
8451 sub check_volume_storage_type
{
8452 my ($storecfg, $vol) = @_;
# $volname is unpacked here but not used by the statements visible below.
8454 my ($storeid, $volname) = PVE
::Storage
::parse_volume_id
($vol);
8455 my $scfg = PVE
::Storage
::storage_config
($storecfg, $storeid);
# List assignment: only the first element returned by parse_volname is kept.
8456 my ($vtype) = PVE
::Storage
::parse_volname
($storecfg, $vol);
8458 die "storage '$storeid' does not support content-type '$vtype'\n"
8459 if !$scfg->{content
}->{$vtype};
# Walks the netN entries of a VM config and registers each vNIC's MAC address
# in the bridge forwarding DB through one of the add_bridge_fdb() helpers.
#   $conf - VM config hash; only keys matching /^net(\d+)$/ are considered
#   $vmid - VM ID, used to build the tap interface name
8464 sub add_nets_bridge_fdb
{
8465 my ($conf, $vmid) = @_;
8467 for my $opt (keys %$conf) {
8468 next if $opt !~ m/^net(\d+)$/;
# Interface name is "tap<vmid>i<N>", N being the index captured above.
8469 my $iface = "tap${vmid}i$1";
8470 # NOTE: expect setups with learning off to *not* use auto-random-generation of MAC on start
# Entries for which parse_net() returns a false value are skipped.
8471 my $net = parse_net
($conf->{$opt}, 1) or next;
8473 my $mac = $net->{macaddr
};
# The warning fires only if the first line of the port's 'learning' attribute
# is false in Perl terms (e.g. "0" or unreadable).
# NOTE(review): the guard around this statement (presumably "no MAC set") is
# not visible here.
8475 log_warn
("MAC learning disabled, but vNIC '$iface' has no static MAC to add to forwarding DB!")
8476 if !file_read_firstline
("/sys/class/net/$iface/brport/learning");
8480 my $bridge = $net->{bridge
};
# NOTE(review): the condition selecting this SDN branch is not visible here.
# The SDN variant additionally receives the bridge name.
8482 PVE
::Network
::SDN
::Zones
::add_bridge_fdb
($iface, $mac, $bridge, $net->{firewall
});
8483 } elsif (-d
"/sys/class/net/$bridge/bridge") { # avoid fdb management with OVS for now
8484 PVE
::Network
::add_bridge_fdb
($iface, $mac, $net->{firewall
});
# Counterpart of add_nets_bridge_fdb: walks the netN entries of a VM config
# and removes each vNIC's MAC address from the bridge forwarding DB through
# one of the del_bridge_fdb() helpers.
#   $conf - VM config hash; only keys matching /^net(\d+)$/ are considered
#   $vmid - VM ID, used to build the tap interface name
# NOTE(review): the end of this definition is not visible here.
8489 sub del_nets_bridge_fdb
{
8490 my ($conf, $vmid) = @_;
8492 for my $opt (keys %$conf) {
8493 next if $opt !~ m/^net(\d+)$/;
# Interface name is "tap<vmid>i<N>", N being the index captured above.
8494 my $iface = "tap${vmid}i$1";
# Entries that do not parse, or that carry no MAC address, are skipped.
8496 my $net = parse_net
($conf->{$opt}) or next;
8497 my $mac = $net->{macaddr
} or next;
8499 my $bridge = $net->{bridge
};
# NOTE(review): the condition selecting this SDN branch is not visible here.
# The SDN variant additionally receives the bridge name.
8501 PVE
::Network
::SDN
::Zones
::del_bridge_fdb
($iface, $mac, $bridge, $net->{firewall
});
8502 } elsif (-d
"/sys/class/net/$bridge/bridge") { # avoid fdb management with OVS for now
8503 PVE
::Network
::del_bridge_fdb
($iface, $mac, $net->{firewall
});