]>
git.proxmox.com Git - pve-storage.git/blob - PVE/Storage/RBDPlugin.pm
10b54e5fd08e2867b90363c433a413c13684433a
1 package PVE
::Storage
::RBDPlugin
;
11 use PVE
::JSONSchema
qw(get_standard_option);
14 use PVE
::Storage
::Plugin
;
15 use PVE
::Tools
qw(run_command trim);
17 use base
qw(PVE::Storage::Plugin);
# Format a parent descriptor (hash ref) as "<image>@<snapshot>".
# Returns undef when the descriptor is false/undefined.
# NOTE(review): the declaration of $parent is not among the lines shown here
# (presumably unpacked from @_) - confirm against the full file.
19 my $get_parent_image_name = sub {
21 return undef if !$parent;
# Joins the 'image' and 'snapshot' entries of the hash ref with a literal "@".
22 return $parent->{image
} . "@" . $parent->{snapshot
};
# Helper taking the storage config ($scfg) and a disk/image name ($disk).
25 my $add_pool_to_disk = sub {
26 my ($scfg, $disk) = @_;
# Use the configured pool, falling back to 'rbd' when $scfg->{pool} is unset or false.
28 my $pool = $scfg->{pool
} ?
$scfg->{pool
} : 'rbd';
# NOTE(review): the return expression is not visible here; callers pass the result
# as an image argument to 'rbd rename' and 'rbd clone', so presumably "$pool/$disk" - confirm.
34 my ($binary, $scfg, $storeid, $op, @options) = @_;
36 my $cmd_option = PVE
::CephConfig
::ceph_connect_option
($scfg, $storeid);
37 my $pool = $scfg->{pool
} ?
$scfg->{pool
} : 'rbd';
39 my $cmd = [$binary, '-p', $pool];
41 push @$cmd, '-c', $cmd_option->{ceph_conf
} if ($cmd_option->{ceph_conf
});
42 push @$cmd, '-m', $cmd_option->{mon_host
} if ($cmd_option->{mon_host
});
43 push @$cmd, '--auth_supported', $cmd_option->{auth_supported
} if ($cmd_option->{auth_supported
});
44 push @$cmd, '-n', "client.$cmd_option->{userid}" if ($cmd_option->{userid
});
45 push @$cmd, '--keyring', $cmd_option->{keyring
} if ($cmd_option->{keyring
});
49 push @$cmd, @options if scalar(@options);
55 my ($scfg, $storeid, $op, @options) = @_;
57 return $build_cmd->('/usr/bin/rbd', $scfg, $storeid, $op, @options);
61 my ($scfg, $storeid, $op, @options) = @_;
63 return $build_cmd->('/usr/bin/rados', $scfg, $storeid, $op, @options);
# Create a PVE::RADOS handle for the given storage.
# Arguments: storage config, storage id, and $options (not used in the lines shown here).
66 my $librados_connect = sub {
67 my ($scfg, $storeid, $options) = @_;
# Connection settings come from PVE::CephConfig::ceph_connect_option.
69 my $librados_config = PVE
::CephConfig
::ceph_connect_option
($scfg, $storeid);
# The settings hash is flattened into key/value arguments for the constructor.
71 my $rados = PVE
::RADOS-
>new(%$librados_config);
# NOTE(review): the return statement is not visible here; the caller assigns the
# result and calls ->mon_command on it, so presumably $rados is returned - confirm.
# Adjust the feature set of RBD image $name before it is mapped through the kernel driver.
# Arguments: storage config, storage id, image name.
# Collects one list of features to disable and one to enable, compares both with the
# image's currently active features, and issues 'rbd feature disable' / 'rbd feature enable'
# for the differences.
76 # needed for volumes created using ceph jewel (or higher)
77 my $krbd_feature_update = sub {
78 my ($scfg, $storeid, $name) = @_;
# The first version part is compared against 10; nothing to do below that.
80 my ($versionparts) = ceph_version
();
81 return 1 if $versionparts->[0] < 10;
83 my (@disable, @enable);
84 my ($kmajor, $kminor) = PVE
::ProcFSTools
::kernel_version
();
# '&&' binds tighter than '||': true for a major version above 5, or for 5.x with x >= 3.
86 if ($kmajor > 5 || $kmajor == 5 && $kminor >= 3) {
87 # 'deep-flatten' can only be disabled, not enabled after image creation
88 push @enable, 'fast-diff', 'object-map';
# NOTE(review): the branch separator is not visible here; presumably the next push is
# the else-branch taken for older kernels - confirm.
90 push @disable, 'fast-diff', 'object-map', 'deep-flatten';
# NOTE(review): the condition choosing between enabling and disabling 'exclusive-lock'
# is not visible here - confirm.
94 push @enable, 'exclusive-lock';
96 push @disable, 'exclusive-lock';
# Index 4 of rbd_volume_info's return list is the image's 'features' entry.
99 my $active_features_list = (rbd_volume_info
($scfg, $storeid, $name))[4];
# Lookup hash: feature name => 1.
100 my $active_features = { map { $_ => 1 } @$active_features_list };
# Disable only what is currently active; enable only what is currently inactive.
102 my $to_disable = join(',', grep { $active_features->{$_} } @disable);
103 my $to_enable = join(',', grep { !$active_features->{$_} } @enable );
# NOTE(review): presumably each of the two sections below only runs when the respective
# list is non-empty; the guards and the command invocations are not visible here - confirm.
106 print "disable RBD image features this kernel RBD drivers is not compatible with: $to_disable\n";
107 my $cmd = $rbd_cmd->($scfg, $storeid, 'feature', 'disable', $name, $to_disable);
110 errmsg
=> "could not disable krbd-incompatible image features '$to_disable' for rbd image: $name",
114 print "enable RBD image features this kernel RBD drivers supports: $to_enable\n";
116 my $cmd = $rbd_cmd->($scfg, $storeid, 'feature', 'enable', $name, $to_enable);
119 errmsg
=> "could not enable krbd-compatible image features '$to_enable' for rbd image: $name",
# Parse a version line as printed by 'ceph --version'.
# On a match returns the list (array ref of version parts, version string, build commit);
# otherwise a warning containing the unparsable input is emitted.
126 my $ceph_version_parser = sub {
127 my $ceph_version = shift;
128 # FIXME this is the same as pve-manager PVE::Ceph::Tools get_local_version
# Capture 1: dotted version with an optional '-pveN' suffix.
# Capture 2: optional alphanumeric token in parentheses (undef when absent).
129 if ($ceph_version =~ /^ceph.*\s(\d+(?:\.\d+)+(?:-pve\d+)?)\s+(?:\(([a-zA-Z0-9]+)\))?/) {
130 my ($version, $buildcommit) = ($1, $2);
# Split on '.' and '-', so a '-pveN' suffix becomes its own list element.
131 my $subversions = [ split(/\.|-/, $version) ];
133 return ($subversions, $version, $buildcommit);
135 warn "Could not parse Ceph version: '$ceph_version'\n";
141 my $version_string = $cache;
142 if (!defined($version_string)) {
143 run_command
('ceph --version', outfunc
=> sub {
144 $version_string = shift;
147 return undef if !defined($version_string);
148 # subversion is an array ref. with the version parts from major to minor
149 # version is the filtered version string
150 my ($subversions, $version) = $ceph_version_parser->($version_string);
152 return wantarray ?
($subversions, $version) : $version;
# Run a command through run_command and die with a cleaned-up message on failure.
# Arguments:
#   $cmd  - command, handed to run_command unchanged
#   %args - options handed to run_command; 'errmsg' is also used as prefix of the
#           error text, and 'errfunc' may be supplied by the caller
155 sub run_rbd_command
{
156 my ($cmd, %args) = @_;
# NOTE(review): '.' binds tighter than '||', so this parses as
# ($args{errmsg} . ": ") || "". The left operand is never false, which makes the ""
# fallback dead code: a missing errmsg yields the prefix ": " (and an 'uninitialized'
# warning under 'use warnings'). Likely intended:
#   defined($args{errmsg}) ? "$args{errmsg}: " : ""
159 my $errmsg = $args{errmsg
} . ": " || "";
# Install a default stderr handler only when the caller did not pass one.
160 if (!exists($args{errfunc
})) {
161 # ' error: 2014-02-06 11:51:59.839135 7f09f94d0760 -1 librbd: snap_unprotect: can't unprotect;
162 # at least 1 child(ren) in pool cephstor1
163 $args{errfunc
} = sub {
# Matches "<date> <time> <hex id> <number> librbd: <message>" and captures <message>.
165 if ($line =~ m/^\d{4}-\d{2}-\d{2} \d{2}:\d{2}:\d{2}\.\d+ [0-9a-f]+ [\-\d]+ librbd: (.*)$/) {
170 print STDERR
$lasterr;
# Failures of run_command are trapped so the text collected in $lasterr can be reported.
175 eval { run_command
($cmd, %args); };
# NOTE(review): the declarations/assignments of $lasterr and $line are not visible
# here - confirm against the full file.
177 die $errmsg . $lasterr if length($lasterr);
185 my ($scfg, $storeid) = @_;
187 my $cmd = &$rbd_cmd($scfg, $storeid, 'ls', '-l', '--format', 'json');
188 my $pool = $scfg->{pool
} ?
$scfg->{pool
} : 'rbd';
191 my $parser = sub { $raw .= shift };
194 run_rbd_command
($cmd, errmsg
=> "rbd error", errfunc
=> sub {}, outfunc
=> $parser);
198 die $err if $err && $err !~ m/doesn't contain rbd images/ ;
203 } elsif ($raw =~ m/^(\[.*\])$/s) { # untaint
204 $result = JSON
::decode_json
($1);
206 die "got unexpected data from rbd ls: '$raw'\n";
211 foreach my $el (@$result) {
212 next if defined($el->{snapshot
});
214 my $image = $el->{image
};
216 my ($owner) = $image =~ m/^(?:vm|base)-(\d+)-/;
217 next if !defined($owner);
219 $list->{$pool}->{$image} = {
222 parent
=> $get_parent_image_name->($el->{parent
}),
# Query 'rbd info --format json' for an image, optionally for one of its snapshots.
# Arguments: storage config, storage id, image name, optional snapshot name.
# Returns the list (size, parent, format, protected, features) from the decoded JSON,
# with 'parent' and 'protected' post-processed as described below.
# Dies when the command output is not a single JSON object.
230 sub rbd_volume_info
{
231 my ($scfg, $storeid, $volname, $snap) = @_;
235 my @options = ('info', $volname, '--format', 'json');
# NOTE(review): presumably guarded by a check on $snap that is not visible here - confirm.
237 push @options, '--snap', $snap;
240 $cmd = &$rbd_cmd($scfg, $storeid, @options);
# Output is accumulated into $raw; the error handler passed below is a no-op.
243 my $parser = sub { $raw .= shift };
245 run_rbd_command
($cmd, errmsg
=> "rbd error", errfunc
=> sub {}, outfunc
=> $parser);
# Accept only text that is entirely one {...} block; /s lets '.' span newlines.
250 } elsif ($raw =~ m/^(\{.*\})$/s) { # untaint
251 $volume = JSON
::decode_json
($1);
253 die "got unexpected data from rbd info: '$raw'\n";
# Replace the parent structure with its "image@snapshot" string (undef without parent).
256 $volume->{parent
} = $get_parent_image_name->($volume->{parent
});
# '&&' binds tighter than '?:': the string "true" becomes 1, anything else undef.
257 $volume->{protected
} = defined($volume->{protected
}) && $volume->{protected
} eq "true" ?
1 : undef;
# Hash slice in postfix-dereference syntax; callers depend on this element order.
259 return $volume->@{qw(size parent format protected features)};
270 content
=> [ {images
=> 1, rootdir
=> 1}, { images
=> 1 }],
277 description
=> "IP addresses of monitors (for external clusters).",
278 type
=> 'string', format
=> 'pve-storage-portal-dns-list',
281 description
=> "Pool.",
285 description
=> "RBD Id.",
289 description
=> "Authsupported.",
293 description
=> "Always access rbd through krbd kernel module.",
301 nodes
=> { optional
=> 1 },
302 disable
=> { optional
=> 1 },
303 monhost
=> { optional
=> 1},
304 pool
=> { optional
=> 1 },
305 username
=> { optional
=> 1 },
306 content
=> { optional
=> 1 },
307 krbd
=> { optional
=> 1 },
308 bwlimit
=> { optional
=> 1 },
312 # Storage implementation
315 my ($class, $storeid, $scfg, %param) = @_;
317 return if defined($scfg->{monhost
}); # nothing to do if not pve managed ceph
319 PVE
::CephConfig
::ceph_create_keyfile
($scfg->{type
}, $storeid);
323 my ($class, $storeid, $scfg) = @_;
325 return if defined($scfg->{monhost
}); # nothing to do if not pve managed ceph
327 PVE
::CephConfig
::ceph_remove_keyfile
($scfg->{type
}, $storeid);
331 my ($class, $volname) = @_;
333 if ($volname =~ m/^((base-(\d+)-\S+)\/)?
((base
)?
(vm
)?
-(\d
+)-\S
+)$/) {
334 return ('images', $4, $7, $2, $3, $5, 'raw');
337 die "unable to parse rbd volume name '$volname'\n";
341 my ($class, $scfg, $volname, $storeid, $snapname) = @_;
343 my $cmd_option = PVE
::CephConfig
::ceph_connect_option
($scfg, $storeid);
344 my ($vtype, $name, $vmid) = $class->parse_volname($volname);
345 $name .= '@'.$snapname if $snapname;
347 my $pool = $scfg->{pool
} ?
$scfg->{pool
} : 'rbd';
348 return ("/dev/rbd/$pool/$name", $vmid, $vtype) if $scfg->{krbd
};
350 my $path = "rbd:$pool/$name";
352 $path .= ":conf=$cmd_option->{ceph_conf}" if $cmd_option->{ceph_conf
};
353 if (defined($scfg->{monhost
})) {
354 my $monhost = PVE
::CephConfig
::hostlist
($scfg->{monhost
}, ';');
355 $monhost =~ s/:/\\:/g;
356 $path .= ":mon_host=$monhost";
357 $path .= ":auth_supported=$cmd_option->{auth_supported}";
360 $path .= ":id=$cmd_option->{userid}:keyring=$cmd_option->{keyring}" if ($cmd_option->{keyring
});
362 return ($path, $vmid, $vtype);
# Determine an unused disk name for guest $vmid on this storage.
# Lists the images with 'rbd ls' and passes that list to
# PVE::Storage::Plugin::get_next_vm_diskname, whose result is returned.
# Arguments: storage id, storage config, guest id.
365 my $find_free_diskname = sub {
366 my ($storeid, $scfg, $vmid) = @_;
368 my $cmd = &$rbd_cmd($scfg, $storeid, 'ls');
# The catch-all capture untaints each line before it is stored in the list.
373 if ($line =~ m/^(.*)$/) { # untaint
374 push @$disk_list, $1;
# The error handler passed here is a no-op.
379 run_rbd_command
($cmd, errmsg
=> "rbd error", errfunc
=> sub {}, outfunc
=> $parser);
# An error mentioning "doesn't contain rbd images" is tolerated; other errors are fatal.
# NOTE(review): where $err is set is not visible here - confirm.
383 die $err if $err && $err !~ m/doesn't contain rbd images/;
385 return PVE
::Storage
::Plugin
::get_next_vm_diskname
($disk_list, $storeid, $vmid, undef, $scfg);
389 my ($class, $storeid, $scfg, $volname) = @_;
391 my $snap = '__base__';
393 my ($vtype, $name, $vmid, $basename, $basevmid, $isBase) =
394 $class->parse_volname($volname);
396 die "create_base not possible with base image\n" if $isBase;
398 my ($size, $parent, $format, undef) = rbd_volume_info
($scfg, $storeid, $name);
399 die "rbd volume info on '$name' failed\n" if !($size);
401 die "rbd image must be at format V2" if $format ne "2";
403 die "volname '$volname' contains wrong information about parent $parent $basename\n"
404 if $basename && (!$parent || $parent ne $basename."@".$snap);
407 $newname =~ s/^vm-/base-/;
409 my $newvolname = $basename ?
"$basename/$newname" : "$newname";
411 my $cmd = &$rbd_cmd($scfg, $storeid, 'rename', &$add_pool_to_disk($scfg, $name), &$add_pool_to_disk($scfg, $newname));
412 run_rbd_command
($cmd, errmsg
=> "rbd rename '$name' error");
414 my $running = undef; #fixme : is create_base always offline ?
416 $class->volume_snapshot($scfg, $storeid, $newname, $snap, $running);
418 my (undef, undef, undef, $protected) = rbd_volume_info
($scfg, $storeid, $newname, $snap);
421 my $cmd = &$rbd_cmd($scfg, $storeid, 'snap', 'protect', $newname, '--snap', $snap);
422 run_rbd_command
($cmd, errmsg
=> "rbd protect $newname snap '$snap' error");
430 my ($class, $scfg, $storeid, $volname, $vmid, $snapname) = @_;
432 my $snap = '__base__';
433 $snap = $snapname if length $snapname;
435 my ($vtype, $basename, $basevmid, undef, undef, $isBase) =
436 $class->parse_volname($volname);
438 die "$volname is not a base image and snapname is not provided\n"
439 if !$isBase && !length($snapname);
441 my $name = $find_free_diskname->($storeid, $scfg, $vmid);
443 warn "clone $volname: $basename snapname $snap to $name\n";
445 if (length($snapname)) {
446 my (undef, undef, undef, $protected) = rbd_volume_info
($scfg, $storeid, $volname, $snapname);
449 my $cmd = &$rbd_cmd($scfg, $storeid, 'snap', 'protect', $volname, '--snap', $snapname);
450 run_rbd_command
($cmd, errmsg
=> "rbd protect $volname snap $snapname error");
454 my $newvol = "$basename/$name";
455 $newvol = $name if length($snapname);
457 my $cmd = &$rbd_cmd($scfg, $storeid, 'clone', &$add_pool_to_disk($scfg, $basename),
458 '--snap', $snap, &$add_pool_to_disk($scfg, $name));
460 run_rbd_command
($cmd, errmsg
=> "rbd clone '$basename' error");
466 my ($class, $storeid, $scfg, $vmid, $fmt, $name, $size) = @_;
469 die "illegal name '$name' - should be 'vm-$vmid-*'\n"
470 if $name && $name !~ m/^vm-$vmid-/;
472 $name = $find_free_diskname->($storeid, $scfg, $vmid) if !$name;
474 my $cmd = &$rbd_cmd($scfg, $storeid, 'create', '--image-format' , 2, '--size', int(($size+1023)/1024), $name);
475 run_rbd_command
($cmd, errmsg
=> "rbd create $name' error");
481 my ($class, $storeid, $scfg, $volname, $isBase) = @_;
483 my ($vtype, $name, $vmid, undef, undef, undef) =
484 $class->parse_volname($volname);
487 my $snap = '__base__';
488 my (undef, undef, undef, $protected) = rbd_volume_info
($scfg, $storeid, $name, $snap);
490 my $cmd = &$rbd_cmd($scfg, $storeid, 'snap', 'unprotect', $name, '--snap', $snap);
491 run_rbd_command
($cmd, errmsg
=> "rbd unprotect $name snap '$snap' error");
495 $class->deactivate_volume($storeid, $scfg, $volname);
497 my $cmd = &$rbd_cmd($scfg, $storeid, 'snap', 'purge', $name);
498 run_rbd_command
($cmd, errmsg
=> "rbd snap purge '$volname' error");
500 $cmd = &$rbd_cmd($scfg, $storeid, 'rm', $name);
501 run_rbd_command
($cmd, errmsg
=> "rbd rm '$volname' error");
507 my ($class, $storeid, $scfg, $vmid, $vollist, $cache) = @_;
509 $cache->{rbd
} = rbd_ls
($scfg, $storeid) if !$cache->{rbd
};
510 my $pool = $scfg->{pool
} ?
$scfg->{pool
} : 'rbd';
514 if (my $dat = $cache->{rbd
}->{$pool}) {
515 foreach my $image (keys %$dat) {
517 my $info = $dat->{$image};
519 my $volname = $info->{name
};
520 my $parent = $info->{parent
};
521 my $owner = $info->{vmid
};
523 if ($parent && $parent =~ m/^(base-\d+-\S+)\@__base__$/) {
524 $info->{volid
} = "$storeid:$1/$volname";
526 $info->{volid
} = "$storeid:$volname";
530 my $found = grep { $_ eq $info->{volid
} } @$vollist;
533 next if defined ($vmid) && ($owner ne $vmid);
536 $info->{format
} = 'raw';
546 my ($class, $storeid, $scfg, $cache) = @_;
549 my $rados = &$librados_connect($scfg, $storeid);
550 my $df = $rados->mon_command({ prefix
=> 'df', format
=> 'json' });
552 my ($d) = grep { $_->{name
} eq $scfg->{pool
} } @{$df->{pools
}};
554 # max_avail -> max available space for data w/o replication in the pool
555 # bytes_used -> data w/o replication in the pool
556 my $free = $d->{stats
}->{max_avail
};
557 my $used = $d->{stats
}->{stored
} // $d->{stats
}->{bytes_used
};
558 my $total = $used + $free;
561 return ($total, $free, $used, $active);
# Storage activation hook; receives class, storage id, storage config and a cache.
# NOTE(review): nothing beyond the argument unpacking is visible here.
564 sub activate_storage
{
565 my ($class, $storeid, $scfg, $cache) = @_;
# Storage deactivation hook; receives class, storage id, storage config and a cache.
# NOTE(review): nothing beyond the argument unpacking is visible here.
569 sub deactivate_storage
{
570 my ($class, $storeid, $scfg, $cache) = @_;
# Build the device path "/dev/rbd/<pool>/<name>" for a pool and image name.
574 my $get_kernel_device_name = sub {
575 my ($pool, $name) = @_;
577 return "/dev/rbd/$pool/$name";
581 my ($class, $storeid, $scfg, $volname, $snapname) = @_;
583 my ($vtype, $name, $vmid) = $class->parse_volname($volname);
584 $name .= '@'.$snapname if $snapname;
586 my $pool = $scfg->{pool
} ?
$scfg->{pool
} : 'rbd';
588 my $kerneldev = $get_kernel_device_name->($pool, $name);
590 return $kerneldev if -b
$kerneldev; # already mapped
592 $krbd_feature_update->($scfg, $storeid, $name) if !$snapname;
594 my $cmd = &$rbd_cmd($scfg, $storeid, 'map', $name);
595 run_rbd_command
($cmd, errmsg
=> "can't map rbd volume $name");
601 my ($class, $storeid, $scfg, $volname, $snapname) = @_;
603 my ($vtype, $name, $vmid) = $class->parse_volname($volname);
604 $name .= '@'.$snapname if $snapname;
606 my $pool = $scfg->{pool
} ?
$scfg->{pool
} : 'rbd';
608 my $kerneldev = $get_kernel_device_name->($pool, $name);
611 my $cmd = &$rbd_cmd($scfg, $storeid, 'unmap', $kerneldev);
612 run_rbd_command
($cmd, errmsg
=> "can't unmap rbd device $kerneldev");
# Activate a volume, or one of its snapshots when $snapname is given.
# Only storages with the 'krbd' option set trigger work here: the volume is mapped
# via map_volume. $cache is not used in the lines shown here.
618 sub activate_volume
{
619 my ($class, $storeid, $scfg, $volname, $snapname, $cache) = @_;
621 $class->map_volume($storeid, $scfg, $volname, $snapname) if $scfg->{krbd
};
# Deactivate a volume, or one of its snapshots when $snapname is given.
# Unlike activate_volume, the visible call to unmap_volume is not conditional on the
# 'krbd' option. $cache is not used in the lines shown here.
626 sub deactivate_volume
{
627 my ($class, $storeid, $scfg, $volname, $snapname, $cache) = @_;
629 $class->unmap_volume($storeid, $scfg, $volname, $snapname);
# Look up the size of a volume.
# The image name is extracted from $volname via parse_volname, then the first element
# of rbd_volume_info's return list (size) is taken. $timeout is not used in the lines
# shown here.
# NOTE(review): the return statement is not visible here; presumably $size - confirm.
634 sub volume_size_info
{
635 my ($class, $scfg, $storeid, $volname, $timeout) = @_;
637 my ($vtype, $name, $vmid) = $class->parse_volname($volname);
638 my ($size, undef) = rbd_volume_info
($scfg, $storeid, $name);
643 my ($class, $scfg, $storeid, $volname, $size, $running) = @_;
645 return 1 if $running && !$scfg->{krbd
}; # FIXME???
647 my ($vtype, $name, $vmid) = $class->parse_volname($volname);
649 my $cmd = &$rbd_cmd($scfg, $storeid, 'resize', '--allow-shrink', '--size', ($size/1024/1024), $name);
650 run_rbd_command
($cmd, errmsg
=> "rbd resize '$volname' error");
# Create snapshot $snap of a volume by running 'rbd snap create --snap <snap> <image>'.
# The image name is extracted from $volname via parse_volname.
# Only five arguments are unpacked; a sixth one passed by a caller is ignored.
654 sub volume_snapshot
{
655 my ($class, $scfg, $storeid, $volname, $snap) = @_;
657 my ($vtype, $name, $vmid) = $class->parse_volname($volname);
659 my $cmd = &$rbd_cmd($scfg, $storeid, 'snap', 'create', '--snap', $snap, $name);
660 run_rbd_command
($cmd, errmsg
=> "rbd snapshot '$volname' error");
# Roll a volume back to snapshot $snap by running
# 'rbd snap rollback --snap <snap> <image>'.
# The image name is extracted from $volname via parse_volname.
664 sub volume_snapshot_rollback
{
665 my ($class, $scfg, $storeid, $volname, $snap) = @_;
667 my ($vtype, $name, $vmid) = $class->parse_volname($volname);
669 my $cmd = &$rbd_cmd($scfg, $storeid, 'snap', 'rollback', '--snap', $snap, $name);
670 run_rbd_command
($cmd, errmsg
=> "rbd snapshot $volname to '$snap' error");
# Delete snapshot $snap of a volume.
# Visible steps: deactivate the snapshot, read its 'protected' flag, unprotect it,
# then remove it with 'rbd snap rm'.
673 sub volume_snapshot_delete
{
674 my ($class, $scfg, $storeid, $volname, $snap, $running) = @_;
# Returns 1 without doing anything when $running is set and 'krbd' is not.
676 return 1 if $running && !$scfg->{krbd
}; # FIXME: ????
678 $class->deactivate_volume($storeid, $scfg, $volname, $snap, {});
680 my ($vtype, $name, $vmid) = $class->parse_volname($volname);
# The fourth element of rbd_volume_info's return list is the 'protected' flag.
682 my (undef, undef, undef, $protected) = rbd_volume_info
($scfg, $storeid, $name, $snap);
# NOTE(review): presumably only executed when $protected is set; the guard is not
# visible here - confirm.
684 my $cmd = &$rbd_cmd($scfg, $storeid, 'snap', 'unprotect', $name, '--snap', $snap);
685 run_rbd_command
($cmd, errmsg
=> "rbd unprotect $name snap '$snap' error");
688 my $cmd = &$rbd_cmd($scfg, $storeid, 'snap', 'rm', '--snap', $snap, $name);
690 run_rbd_command
($cmd, errmsg
=> "rbd snapshot '$volname' error");
695 sub volume_has_feature
{
696 my ($class, $scfg, $feature, $storeid, $volname, $snapname, $running) = @_;
699 snapshot
=> { current
=> 1, snap
=> 1},
700 clone
=> { base
=> 1, snap
=> 1},
701 template
=> { current
=> 1},
702 copy
=> { base
=> 1, current
=> 1, snap
=> 1},
703 sparseinit
=> { base
=> 1, current
=> 1},
706 my ($vtype, $name, $vmid, $basename, $basevmid, $isBase) =
707 $class->parse_volname($volname);
713 $key = $isBase ?
'base' : 'current';
715 return 1 if $features->{$feature}->{$key};