git.proxmox.com Git - qemu-server.git/blobdiff - PVE/QemuMigrate.pm
migrate: cleanup forwarding code
[qemu-server.git] / PVE / QemuMigrate.pm
index 26d33a0f47462b13a7146c744d0345955db1c218..b729940b24955f03f82825d490f656e2ea2740c7 100644 (file)
@@ -17,6 +17,8 @@ use PVE::ReplicationState;
 use PVE::Storage;
 use PVE::Tools;
 
+use PVE::QemuConfig;
+use PVE::QemuServer::CPUConfig;
 use PVE::QemuServer::Drive;
 use PVE::QemuServer::Helpers qw(min_version);
 use PVE::QemuServer::Machine;
@@ -144,10 +146,10 @@ sub write_tunnel {
 }
 
 sub fork_tunnel {
-    my ($self, $tunnel_addr) = @_;
+    my ($self, $ssh_forward_info) = @_;
 
     my @localtunnelinfo = ();
-    foreach my $addr (@$tunnel_addr) {
+    foreach my $addr (@$ssh_forward_info) {
        push @localtunnelinfo, '-L', $addr;
     }
 
@@ -189,9 +191,9 @@ sub finish_tunnel {
 
     $self->finish_command_pipe($tunnel, 30);
 
-    if ($tunnel->{sock_addr}) {
+    if (my $unix_sockets = $tunnel->{unix_sockets}) {
        # ssh does not clean up on local host
-       my $cmd = ['rm', '-f', @{$tunnel->{sock_addr}}]; #
+       my $cmd = ['rm', '-f', @$unix_sockets];
        PVE::Tools::run_command($cmd);
 
        # .. and just to be sure check on remote side
@@ -227,7 +229,17 @@ sub prepare {
 
        $self->{forcemachine} = PVE::QemuServer::Machine::qemu_machine_pxe($vmid, $conf);
 
+       # To support custom CPU types, we keep QEMU's "-cpu" parameter intact.
+       # Since the parameter itself contains no reference to a custom model,
+       # this makes migration independent of changes to "cpu-models.conf".
+       if ($conf->{cpu}) {
+           my $cpuconf = PVE::QemuServer::CPUConfig::parse_cpu_conf_basic($conf->{cpu});
+           if ($cpuconf && PVE::QemuServer::CPUConfig::is_custom_model($cpuconf->{cputype})) {
+               $self->{forcecpu} = PVE::QemuServer::CPUConfig::get_cpu_from_running_vm($pid);
+           }
+       }
     }
+
     my $loc_res = PVE::QemuServer::check_local_resources($conf, 1);
     if (scalar @$loc_res) {
        if ($self->{running} || !$self->{opts}->{force}) {
@@ -278,7 +290,9 @@ sub sync_disks {
     my $conf = $self->{vmconf};
 
     # local volumes which have been copied
+    # and their old_id => new_id pairs
     $self->{volumes} = [];
+    $self->{volume_map} = {};
 
     my $storecfg = $self->{storecfg};
     eval {
@@ -374,6 +388,9 @@ sub sync_disks {
            return if $scfg->{shared};
 
            $local_volumes->{$volid}->{ref} = $attr->{referenced_in_config} ? 'config' : 'snapshot';
+           $local_volumes->{$volid}->{ref} = 'storage' if $attr->{is_unused};
+
+           $local_volumes->{$volid}->{is_vmstate} = $attr->{is_vmstate} ? 1 : 0;
 
            if ($attr->{cdrom}) {
                if ($volid =~ /vm-\d+-cloudinit/) {
@@ -388,6 +405,8 @@ sub sync_disks {
            die "owned by other VM (owner = VM $owner)\n"
                if !$owner || ($owner != $vmid);
 
+           return if $attr->{is_vmstate};
+
            if (defined($snaprefs)) {
                $local_volumes->{$volid}->{snapshots} = 1;
 
@@ -466,7 +485,7 @@ sub sync_disks {
                }
 
                my $live_replicatable_volumes = {};
-               PVE::QemuServer::foreach_drive($conf, sub {
+               PVE::QemuConfig->foreach_volume($conf, sub {
                    my ($ds, $drive) = @_;
 
                    my $volid = $drive->{file};
@@ -497,8 +516,11 @@ sub sync_disks {
        # sizes in config have to be accurate for remote node to correctly
        # allocate disks, rescan to be sure
        my $volid_hash = PVE::QemuServer::scan_volids($storecfg, $vmid);
-       PVE::QemuServer::foreach_drive($conf, sub {
+       PVE::QemuConfig->foreach_volume($conf, sub {
            my ($key, $drive) = @_;
+           return if $key eq 'efidisk0'; # skip efidisk, will be handled later
+           return if !defined($local_volumes->{$key}); # only update sizes for local volumes
+
            my ($updated, $old_size, $new_size) = PVE::QemuServer::Drive::update_disksize($drive, $volid_hash);
            if (defined($updated)) {
                $conf->{$key} = PVE::QemuServer::print_drive($updated);
@@ -529,15 +551,29 @@ sub sync_disks {
                next if $self->{replicated_volumes}->{$volid};
                push @{$self->{volumes}}, $volid;
                my $opts = $self->{opts};
-               my $insecure = $opts->{migration_type} eq 'insecure';
-               my $with_snapshots = $local_volumes->{$volid}->{snapshots};
                # use 'migration' limit for transfer to other node
                my $bwlimit = PVE::Storage::get_bandwidth_limit('migration', [$targetsid, $sid], $opts->{bwlimit});
                # JSONSchema and get_bandwidth_limit use kbps - storage_migrate bps
                $bwlimit = $bwlimit * 1024 if defined($bwlimit);
 
-               PVE::Storage::storage_migrate($storecfg, $volid, $self->{ssh_info}, $targetsid,
-                                             undef, undef, undef, $bwlimit, $insecure, $with_snapshots);
+               my $storage_migrate_opts = {
+                   'bwlimit' => $bwlimit,
+                   'insecure' => $opts->{migration_type} eq 'insecure',
+                   'with_snapshots' => $local_volumes->{$volid}->{snapshots},
+                   'allow_rename' => !$local_volumes->{$volid}->{is_vmstate},
+               };
+
+               my $logfunc = sub { $self->log('info', $_[0]); };
+               my $new_volid = eval {
+                   PVE::Storage::storage_migrate($storecfg, $volid, $self->{ssh_info},
+                                                 $targetsid, $storage_migrate_opts, $logfunc);
+               };
+               if (my $err = $@) {
+                   die "storage migration for '$volid' to storage '$targetsid' failed - $err\n";
+               }
+
+               $self->{volume_map}->{$volid} = $new_volid;
+               $self->log('info', "volume '$volid' is '$new_volid' on the target\n");
            }
        }
     };
@@ -662,20 +698,31 @@ sub phase2 {
        push @$cmd, '--machine', $self->{forcemachine};
     }
 
+    if ($self->{forcecpu}) {
+       push @$cmd, '--force-cpu', $self->{forcecpu};
+    }
+
     if ($self->{online_local_volumes}) {
        push @$cmd, '--targetstorage', ($self->{opts}->{targetstorage} // '1');
     }
 
     my $spice_port;
-    my $tunnel_addr = [];
-    my $sock_addr = [];
+    my $unix_socket_info = {};
     # version > 0 for unix socket support
     my $nbd_protocol_version = 1;
     # TODO change to 'spice_ticket: <ticket>\n' in 7.0
     my $input = $spice_ticket ? "$spice_ticket\n" : "\n";
     $input .= "nbd_protocol_version: $nbd_protocol_version\n";
-    foreach my $volid (keys %{$self->{replicated_volumes}}) {
-       $input .= "replicated_volume: $volid\n";
+
+    my $number_of_online_replicated_volumes = 0;
+
+    # prevent auto-vivification
+    if ($self->{online_local_volumes}) {
+       foreach my $volid (@{$self->{online_local_volumes}}) {
+           next if !$self->{replicated_volumes}->{$volid};
+           $number_of_online_replicated_volumes++;
+           $input .= "replicated_volume: $volid\n";
+       }
     }
 
     my $target_replicated_volumes = {};
@@ -709,6 +756,7 @@ sub phase2 {
            my $targetdrive = $3;
            $targetdrive =~ s/drive-//g;
 
+           $self->{stopnbd} = 1;
            $self->{target_drive}->{$targetdrive}->{drivestr} = $drivestr;
            $self->{target_drive}->{$targetdrive}->{nbd_uri} = $nbd_uri;
        } elsif ($line =~ m!^storage migration listens on nbd:unix:(/run/qemu-server/(\d+)_nbd\.migrate):exportname=(\S+) volume:(\S+)$!) {
@@ -719,10 +767,10 @@ sub phase2 {
            my $targetdrive = $3;
            $targetdrive =~ s/drive-//g;
 
+           $self->{stopnbd} = 1;
            $self->{target_drive}->{$targetdrive}->{drivestr} = $drivestr;
            $self->{target_drive}->{$targetdrive}->{nbd_uri} = $nbd_uri;
-           push @$tunnel_addr, "$nbd_unix_addr:$nbd_unix_addr";
-           push @$sock_addr, $nbd_unix_addr;
+           $unix_socket_info->{$nbd_unix_addr} = 1;
        } elsif ($line =~ m/^re-using replicated volume: (\S+) - (.*)$/) {
            my $drive = $1;
            my $volid = $2;
@@ -739,7 +787,7 @@ sub phase2 {
 
     die "unable to detect remote migration address\n" if !$raddr;
 
-    if (scalar(keys %$target_replicated_volumes) != scalar(keys %{$self->{replicated_volumes}})) {
+    if (scalar(keys %$target_replicated_volumes) != $number_of_online_replicated_volumes) {
        die "number of replicated disks on source and target node do not match - target node too old?\n"
     }
 
@@ -748,22 +796,28 @@ sub phase2 {
     if ($migration_type eq 'secure') {
 
        if ($ruri =~ /^unix:/) {
-           unlink $raddr;
-           push @$tunnel_addr, "$raddr:$raddr";
-           $self->{tunnel} = $self->fork_tunnel($tunnel_addr);
-           push @$sock_addr, $raddr;
+           my $ssh_forward_info = ["$raddr:$raddr"];
+           $unix_socket_info->{$raddr} = 1;
+
+           my $unix_sockets = [ keys %$unix_socket_info ];
+           for my $sock (@$unix_sockets) {
+               push @$ssh_forward_info, "$sock:$sock";
+               unlink $sock;
+           }
+
+           $self->{tunnel} = $self->fork_tunnel($ssh_forward_info);
 
            my $unix_socket_try = 0; # wait for the socket to become ready
            while ($unix_socket_try <= 100) {
                $unix_socket_try++;
                my $available = 0;
-               foreach my $sock (@$sock_addr) {
+               foreach my $sock (@$unix_sockets) {
                    if (-S $sock) {
                        $available++;
                    }
                }
 
-               if ($available == @$sock_addr) {
+               if ($available == @$unix_sockets) {
                    last;
                }
 
@@ -774,17 +828,18 @@ sub phase2 {
                $self->finish_tunnel($self->{tunnel});
                die "Timeout, migration socket $ruri did not get ready";
            }
+           $self->{tunnel}->{unix_sockets} = $unix_sockets if (@$unix_sockets);
 
        } elsif ($ruri =~ /^tcp:/) {
-           my $tunnel_addr;
+           my $ssh_forward_info = [];
            if ($raddr eq "localhost") {
                # for backwards compatibility with older qemu-server versions
                my $pfamily = PVE::Tools::get_host_address_family($nodename);
                my $lport = PVE::Tools::next_migrate_port($pfamily);
-               $tunnel_addr = "$lport:localhost:$rport";
+               push @$ssh_forward_info, "$lport:localhost:$rport";
            }
 
-           $self->{tunnel} = $self->fork_tunnel($tunnel_addr);
+           $self->{tunnel} = $self->fork_tunnel($ssh_forward_info);
 
        } else {
            die "unsupported protocol in migration URI: $ruri\n";
@@ -793,8 +848,6 @@ sub phase2 {
        #fork tunnel for insecure migration, to send faster commands like resume
        $self->{tunnel} = $self->fork_tunnel();
     }
-    $self->{tunnel}->{sock_addr} = $sock_addr if (@$sock_addr);
-
     my $start = time();
 
     my $opt_bwlimit = $self->{opts}->{bwlimit};
@@ -813,14 +866,20 @@ sub phase2 {
            my $source_drive = PVE::QemuServer::parse_drive($drive, $conf->{$drive});
            my $target_drive = PVE::QemuServer::parse_drive($drive, $target->{drivestr});
 
-           my $source_sid = PVE::Storage::Plugin::parse_volume_id($source_drive->{file});
-           my $target_sid = PVE::Storage::Plugin::parse_volume_id($target_drive->{file});
+           my $source_volid = $source_drive->{file};
+           my $target_volid = $target_drive->{file};
+
+           my $source_sid = PVE::Storage::Plugin::parse_volume_id($source_volid);
+           my $target_sid = PVE::Storage::Plugin::parse_volume_id($target_volid);
 
            my $bwlimit = PVE::Storage::get_bandwidth_limit('migration', [$source_sid, $target_sid], $opt_bwlimit);
            my $bitmap = $target->{bitmap};
 
            $self->log('info', "$drive: start migration to $nbd_uri");
            PVE::QemuServer::qemu_drive_mirror($vmid, $drive, $nbd_uri, $vmid, undef, $self->{storage_migration_jobs}, 'skip', undef, $bwlimit, $bitmap);
+
+           $self->{volume_map}->{$source_volid} = $target_volid;
+           $self->log('info', "volume '$source_volid' is '$target_volid' on the target\n");
        }
     }
 
@@ -1099,15 +1158,24 @@ sub phase3_cleanup {
            eval { PVE::QemuServer::qemu_blockjobs_cancel($vmid, $self->{storage_migration_jobs}) };
            eval { PVE::QemuMigrate::cleanup_remotedisks($self) };
            die "Failed to complete storage migration: $err\n";
-       } else {
-           foreach my $target_drive (keys %{$self->{target_drive}}) {
-               my $drive = PVE::QemuServer::parse_drive($target_drive, $self->{target_drive}->{$target_drive}->{drivestr});
-               $conf->{$target_drive} = PVE::QemuServer::print_drive($drive);
-               PVE::QemuConfig->write_config($vmid, $conf);
-           }
        }
     }
 
+    if ($self->{volume_map}) {
+       my $target_drives = $self->{target_drive};
+
+       # FIXME: for NBD storage migration we now only update the volid, and
+       # not the full drivestr from the target node. Work around that until we
+       # have a real rescan, to avoid things like a wrong format in the drive
+       delete $conf->{$_} for keys %$target_drives;
+       PVE::QemuConfig->update_volume_ids($conf, $self->{volume_map});
+
+       for my $drive (keys %$target_drives) {
+           $conf->{$drive} = $target_drives->{$drive}->{drivestr};
+       }
+       PVE::QemuConfig->write_config($vmid, $conf);
+    }
+
     # transfer replication state before move config
     $self->transfer_replication_state() if $self->{replicated_volumes};
 
@@ -1121,7 +1189,8 @@ sub phase3_cleanup {
     $self->switch_replication_job_target() if $self->{replicated_volumes};
 
     if ($self->{livemigration}) {
-       if ($self->{storage_migration}) {
+       if ($self->{stopnbd}) {
+           $self->log('info', "stopping NBD storage migration server on target.");
            # stop nbd server on remote vm - requirement for resume since 2.9
            my $cmd = [@{$self->{rem_ssh}}, 'qm', 'nbdstop', $vmid];