]> git.proxmox.com Git - pve-storage.git/blame - PVE/Storage/LVMPlugin.pm
rbd: use add/delete hooks
[pve-storage.git] / PVE / Storage / LVMPlugin.pm
CommitLineData
1dc01b9f
DM
1package PVE::Storage::LVMPlugin;
2
3use strict;
4use warnings;
3e44cd84 5use Data::Dumper;
1dc01b9f
DM
6use IO::File;
7use PVE::Tools qw(run_command trim);
8use PVE::Storage::Plugin;
9use PVE::JSONSchema qw(get_standard_option);
10
11use base qw(PVE::Storage::Plugin);
12
13# lvm helper functions
14
# Look up LVM physical-volume details for a device.
#
# The device is first probed with file(1); if its output does not mention
# "LVM2" the function returns undef. Otherwise pvs is run for that device
# (sizes requested with '--units k') and a hash reference with the keys
# pvname, size, vgname and uuid is returned.
#
# Dies when no device is given, or when pvs reports more than one line for
# the device.
sub lvm_pv_info {
    my ($device) = @_;

    die "no device specified" if !$device;

    my $labelled = 0;
    run_command(
        ['/usr/bin/file', '-L', '-s', $device],
        outfunc => sub {
            my ($output) = @_;
            $labelled = 1 if $output =~ m/LVM2/;
        },
    );

    return undef if !$labelled;

    my @pvs = (
        '/sbin/pvs', '--separator', ':', '--noheadings', '--units', 'k',
        '--unbuffered', '--nosuffix', '--options',
        'pv_name,pv_size,vg_name,pv_uuid', $device,
    );

    my $info;
    my $parse_line = sub {
        my ($output) = @_;

        my ($pv, $kib, $vg, $pv_uuid) = split(':', trim($output));

        # a second output line means the device maps to several PVs
        die "found multiple pvs entries for device '$device'\n"
            if $info;

        $info = {
            pvname => $pv,
            size => int($kib),
            vgname => $vg,
            uuid => $pv_uuid,
        };
    };
    run_command(\@pvs, outfunc => $parse_line);

    return $info;
}
55
# Overwrite the first 512 bytes of a device with NUL bytes.
#
# Best effort: if the device cannot be opened for writing nothing happens
# and no error is raised.
sub clear_first_sector {
    my ($dev) = shift;

    if (my $fh = IO::File->new($dev, "w")) {
        # "\0" x 512 is 512 NUL bytes; the previous `0 x 512` produced the
        # string "000...0" (ASCII 0x30), which does not zero the sector.
        my $buf = "\0" x 512;
        syswrite $fh, $buf;
        $fh->close();
    }
}
65
# Create a volume group $vgname on $device.
#
# Returns early if the device already belongs to $vgname; dies if it
# belongs to a different volume group. Otherwise the first sector is
# cleared, then pvcreate and vgcreate are run. $shared is accepted but
# currently not used.
sub lvm_create_volume_group {
    my ($device, $vgname, $shared) = @_;

    my $pv = lvm_pv_info($device);

    if (my $current = $pv->{vgname}) {
        return if $current eq $vgname; # already created
        die "device '$device' is already used by volume group '$current'\n";
    }

    clear_first_sector($device); # else pvcreate fails

    # we use --metadatasize 250k, which results in "pe_start = 512"
    # so pe_start is aligned on a 128k boundary (advantage for SSDs)
    run_command(
        ['/sbin/pvcreate', '--metadatasize', '250k', $device],
        errmsg => "pvcreate '$device' error",
    );

    my @vgcreate = ('/sbin/vgcreate', $vgname, $device);
    # push @vgcreate, '-c', 'y' if $shared; # we do not use this yet

    run_command(\@vgcreate, errmsg => "vgcreate $vgname $device error");
}
89
# List all volume groups known to LVM.
#
# Runs vgs with '--units b' and returns a hash reference keyed by volume
# group name; each value is { size => ..., free => ... } with integer values.
# A failing vgs only produces a warning; whatever was parsed up to that
# point is still returned.
sub lvm_vgs {
    my %group;

    my $collect = sub {
        my ($output) = @_;

        my ($vg, $total, $avail) = split(':', trim($output));

        $group{$vg} = { size => int($total), free => int($avail) };
    };

    eval {
        run_command(
            [
                '/sbin/vgs', '--separator', ':', '--noheadings', '--units', 'b',
                '--unbuffered', '--nosuffix', '--options',
                'vg_name,vg_size,vg_free',
            ],
            outfunc => $collect,
        );
    };

    # just warn (vgs return error code 5 if clvmd does not run)
    # but output is still OK (list without clustered VGs)
    warn $@ if $@;

    return \%group;
}
116
# List logical volumes, optionally restricted to one volume group.
#
# Runs lvs with '--units b' and returns a two-level hash reference:
#   $lvs->{$vg_name}->{$lv_name} = { lv_size, lv_type, [pool_lv], [tags], [used] }
# lv_type is the first character of the lv_attr column. 'used' is only set
# for entries whose lv_type is 't' and is derived from data_percent.
sub lvm_list_volumes {
    my ($vgname) = @_;

    my @lvs_cmd = (
        '/sbin/lvs', '--separator', ':', '--noheadings', '--units', 'b',
        '--unbuffered', '--nosuffix', '--options',
        'vg_name,lv_name,lv_size,lv_attr,pool_lv,data_percent,metadata_percent,snap_percent,uuid,tags',
    );
    push @lvs_cmd, $vgname if $vgname;

    my $result = {};

    my $parse_line = sub {
        my ($output) = @_;

        my ($vg, $lv, $bytes, $attr, $pool, $data_pct, $meta_pct, $snap_pct, $uuid, $tags) =
            split(':', trim($output));

        # skip lines that do not name both a VG and an LV
        return if !$vg;
        return if !$lv;

        my $kind = substr($attr, 0, 1);

        my $entry = {
            lv_size => int($bytes),
            lv_type => $kind,
        };
        $entry->{pool_lv} = $pool if $pool;
        $entry->{tags} = $tags if $tags;

        if ($kind eq 't') {
            $data_pct ||= 0;
            $meta_pct ||= 0;
            $snap_pct ||= 0;
            $entry->{used} = int(($data_pct * $bytes)/100);
        }

        $result->{$vg}->{$lv} = $entry;
    };

    run_command(\@lvs_cmd, outfunc => $parse_line);

    return $result;
}
156
5c687bd9 157# Configuration
1dc01b9f 158
1dc01b9f
DM
# Storage type identifier of this plugin.
sub type {
    my $plugin_type = 'lvm';
    return $plugin_type;
}
162
# Static plugin metadata.
#
# 'content' is a two-element list of hashes: the first lists images and
# rootdir, the second lists images only.
sub plugindata {
    my %first = (images => 1, rootdir => 1);
    my %second = (images => 1);

    return {
        content => [ \%first, \%second ],
    };
}
168
# Schema of the configuration properties introduced by this plugin.
# Returns a hash reference mapping property name to its schema definition.
sub properties {
    my %schema;

    $schema{vgname} = {
        description => "Volume group name.",
        type => 'string',
        format => 'pve-storage-vgname',
    };

    $schema{base} = {
        description => "Base volume. This volume is automatically activated.",
        type => 'string',
        format => 'pve-volume-id',
    };

    $schema{saferemove} = {
        description => "Zero-out data when removing LVs.",
        type => 'boolean',
    };

    $schema{saferemove_throughput} = {
        description => "Wipe throughput (cstream -t parameter value).",
        type => 'string',
    };

    $schema{tagged_only} = {
        description => "Only use logical volumes tagged with 'pve-vm-ID'.",
        type => 'boolean',
    };

    return \%schema;
}
193
# Options accepted by this storage type.
# vgname is fixed (and mandatory), base is fixed but optional, everything
# else is optional.
sub options {
    my %opts = map { $_ => { optional => 1 } } qw(
        nodes shared disable saferemove saferemove_throughput
        content tagged_only bwlimit
    );

    $opts{vgname} = { fixed => 1 };
    $opts{base} = { fixed => 1, optional => 1 };

    return \%opts;
}
208
209# Storage implementation
210
# Split a volume name of the form "vm-<vmid>-<suffix>" into its parts.
#
# The name is first handed to PVE::Storage::Plugin::parse_lvm_name().
# Returns the list ('images', $name, $vmid, undef, undef, undef, 'raw');
# dies if the name does not have the expected form.
sub parse_volname {
    my ($class, $volname) = @_;

    PVE::Storage::Plugin::parse_lvm_name($volname);

    die "unable to parse lvm volume name '$volname'\n"
        if $volname !~ m/^(vm-(\d+)-\S+)$/;

    # $1 is the full LV name, $2 the numeric owner id
    return ('images', $1, $2, undef, undef, undef, 'raw');
}
222
# Map a volume name to its device node below /dev/<vgname>/.
#
# In list context returns ($path, $vmid, $vtype), otherwise just $path.
# Dies when a snapshot name is given.
sub filesystem_path {
    my ($class, $scfg, $volname, $snapname) = @_;

    die "lvm snapshot is not implemented"if defined($snapname);

    my ($vtype, $name, $vmid) = $class->parse_volname($volname);

    my $path = "/dev/$scfg->{vgname}/$name";

    return $path if !wantarray;
    return ($path, $vmid, $vtype);
}
236
5eab0272
DM
# Base images are not supported on this storage type; always dies.
sub create_base {
    my $class = shift;
    my ($storeid, $scfg, $volname) = @_;

    die "can't create base images in lvm storage\n";
}
242
# Cloning is not supported on this storage type; always dies.
sub clone_image {
    my $class = shift;
    my ($scfg, $storeid, $volname, $vmid, $snap) = @_;

    die "can't clone images in lvm storage\n";
}
248
b1378461
DM
# Pick the first unused "vm-<vmid>-disk-<n>" name in volume group $vg.
#
# $lvs is a hash reference of the form $lvs->{$vg}->{$lv_name}. Indices 1
# through 99 are tried in order; dies if all of them are taken.
sub lvm_find_free_diskname {
    my ($lvs, $vg, $storeid, $vmid) = @_;

    foreach my $index (1 .. 99) {
        my $candidate = "vm-$vmid-disk-$index";
        return $candidate if !defined($lvs->{$vg}->{$candidate});
    }

    die "unable to allocate an image name for ID $vmid in storage '$storeid'\n";
}
267
1dc01b9f
DM
# Allocate a new logical volume for guest $vmid.
#
# Parameters:
#   $fmt  - must be 'raw'
#   $name - optional LV name; must start with "vm-$vmid-". When omitted a
#           free "vm-$vmid-disk-N" name is chosen.
#   $size - requested size in KiB (it is passed to lvcreate as "${size}k")
#
# Returns the name of the created LV. Dies on an unsupported format, an
# illegal name, a missing volume group, insufficient free space, or when
# lvcreate fails.
sub alloc_image {
    my ($class, $storeid, $scfg, $vmid, $fmt, $name, $size) = @_;

    die "unsupported format '$fmt'" if $fmt ne 'raw';

    die "illegal name '$name' - sould be 'vm-$vmid-*'\n"
        if $name && $name !~ m/^vm-$vmid-/;

    my $vgs = lvm_vgs();

    my $vg = $scfg->{vgname};

    die "no such volume group '$vg'\n" if !defined ($vgs->{$vg});

    # lvm_vgs() queries vgs with '--units b', so 'free' is in bytes while
    # $size is in KiB. Convert before comparing; comparing the raw numbers
    # made this check pass for almost any request.
    my $free = int($vgs->{$vg}->{free});
    my $needed = $size * 1024;

    die "not enough free space ($free < $needed)\n" if $free < $needed;

    $name = lvm_find_free_diskname(lvm_list_volumes($vg), $vg, $storeid, $vmid)
        if !$name;

    my $cmd = ['/sbin/lvcreate', '-aly', '--addtag', "pve-vm-$vmid", '--size', "${size}k", '--name', $name, $vg];

    # report the LV that was being created, not the tag
    run_command($cmd, errmsg => "lvcreate '$vg/$name' error");

    return $name;
}
295
# Remove a logical volume.
#
# The LV is activated first. Without the 'saferemove' storage option it is
# removed right away and undef is returned. With 'saferemove' the LV is only
# renamed to "del-<volname>" here, and a code reference is returned that,
# when called, overwrites the renamed LV with zeros via cstream and then
# removes it under the cluster storage lock.
sub free_image {
    my ($class, $storeid, $scfg, $volname, $isBase) = @_;

    my $vg = $scfg->{vgname};
    my $lv = "$vg/$volname";
    my $doomed = "$vg/del-$volname";

    # we need to zero out LVM data for security reasons
    # and to allow thin provisioning
    my $wipe_and_remove = sub {
        print "zero-out data on image $volname (/dev/$doomed)\n";

        # wipe throughput up to 10MB/s by default; may be overwritten with saferemove_throughput
        my $rate = $scfg->{saferemove_throughput} || '-10485760';

        my @wipe = (
            '/usr/bin/cstream',
            '-i', '/dev/zero',
            '-o', "/dev/$doomed",
            '-T', '10',
            '-v', '1',
            '-b', '1048576',
            '-t', "$rate",
        );
        # a cstream failure only produces a warning; removal still proceeds
        eval { run_command(\@wipe, errmsg => "zero out finished (note: 'No space left on device' is ok here)"); };
        warn $@ if $@;

        $class->cluster_lock_storage($storeid, $scfg->{shared}, undef, sub {
            run_command(['/sbin/lvremove', '-f', $doomed], errmsg => "lvremove '$doomed' error");
        });
        print "successfully removed volume $volname ($doomed)\n";
    };

    run_command(
        ['/sbin/lvchange', '-aly', $lv],
        errmsg => "can't activate LV '$lv' to zero-out its data",
    );

    if (!$scfg->{saferemove}) {
        run_command(['/sbin/lvremove', '-f', $lv], errmsg => "lvremove '$lv' error");
        return undef;
    }

    # avoid long running task, so we only rename here
    run_command(
        ['/sbin/lvrename', $vg, $volname, "del-$volname"],
        errmsg => "lvrename '$lv' error",
    );

    return $wipe_and_remove;
}
348
7a9dd119
FG
# True when the comma-separated tag list contains a tag of the form
# "pve-vm-<digits>"; false for an undefined tag list.
my $check_tags = sub {
    my $tags = shift;

    return defined($tags) && $tags =~ /(^|,)pve-vm-\d+(,|$)/;
};
354
1dc01b9f
DM
# List the guest images stored in this storage's volume group.
#
# Uses $cache->{lvs} when present, otherwise fills it from
# lvm_list_volumes(). Only LVs named "vm-<id>-..." whose lv_type is '-' are
# considered; with the 'tagged_only' option they must also carry a
# pve-vm-<id> tag. When $vollist is given only the listed volume ids are
# returned, otherwise the result is optionally filtered by $vmid.
#
# Returns an array reference of { volid, format, size, vmid } hashes.
sub list_images {
    my ($class, $storeid, $scfg, $vmid, $vollist, $cache) = @_;

    my $vgname = $scfg->{vgname};

    $cache->{lvs} ||= lvm_list_volumes();

    my $res = [];

    my $dat = $cache->{lvs}->{$vgname};
    return $res if !$dat;

    foreach my $volname (keys %$dat) {
        next if $volname !~ m/^vm-(\d+)-/;
        my $owner = $1;

        my $info = $dat->{$volname};

        next if $scfg->{tagged_only} && !$check_tags->($info->{tags});

        next if $info->{lv_type} ne '-';

        my $volid = "$storeid:$volname";

        if ($vollist) {
            next if !grep { $_ eq $volid } @$vollist;
        } else {
            next if defined($vmid) && ($owner ne $vmid);
        }

        push @$res, {
            volid => $volid,
            format => 'raw',
            size => $info->{lv_size},
            vmid => $owner,
        };
    }

    return $res;
}
394
# Report usage of the storage's volume group.
#
# Uses $cache->{vgs} when present, otherwise fills it from lvm_vgs().
# Returns ($total, $free, $used, 1), or undef when the volume group is not
# in the list.
sub status {
    my ($class, $storeid, $scfg, $cache) = @_;

    $cache->{vgs} ||= lvm_vgs();

    my $info = $cache->{vgs}->{$scfg->{vgname}};
    return undef if !$info;

    my ($total, $avail) = @{$info}{qw(size free)};

    return ($total, $avail, $total - $avail, 1);
}
408
# Make sure the storage's volume group is visible.
#
# Fills $cache->{vgs} from lvm_vgs() if needed. When the configured volume
# group is not in that list, vgscan is run at most once per cache (tracked
# via $cache->{vgscaned}); a vgscan failure only produces a warning.
sub activate_storage {
    my ($class, $storeid, $scfg, $cache) = @_;

    $cache->{vgs} ||= lvm_vgs();

    # In LVM2, vgscans take place automatically;
    # this is just to be sure
    if ($cache->{vgs} && !$cache->{vgscaned} && !$cache->{vgs}->{$scfg->{vgname}}) {
        $cache->{vgscaned} = 1;
        eval {
            run_command(
                ['/sbin/vgscan', '--ignorelockingfailure', '--mknodes'],
                outfunc => sub {},
            );
        };
        warn $@ if $@;
    }

    # we do not activate any volumes here ('vgchange -aly')
    # instead, volumes are activated individually later
}
427
# Deactivate the storage's whole volume group with 'vgchange -aln'.
sub deactivate_storage {
    my ($class, $storeid, $scfg, $cache) = @_;

    my $vg = $scfg->{vgname};

    run_command(
        ['/sbin/vgchange', '-aln', $vg],
        errmsg => "can't deactivate VG '$vg'",
    );
}
434
# Activate a single logical volume with 'lvchange -aey'.
#
# The device path is obtained from $class->path(). volume_export and
# volume_import in this file call path() as ($scfg, $volname, $storeid), so
# the storage id goes third and the snapshot name fourth; previously the
# snapshot name was passed in the storage-id position.
# NOTE(review): path() is inherited and not visible here -- confirm its
# signature is ($scfg, $volname, $storeid, $snapname).
sub activate_volume {
    my ($class, $storeid, $scfg, $volname, $snapname, $cache) = @_;
    #fix me lvmchange is not provided on
    my $path = $class->path($scfg, $volname, $storeid, $snapname);

    my $lvm_activate_mode = 'ey';

    my $cmd = ['/sbin/lvchange', "-a$lvm_activate_mode", $path];
    run_command($cmd, errmsg => "can't activate LV '$path'");
}
445
# Deactivate a single logical volume with 'lvchange -aln'.
#
# Does nothing when the device path is not an existing block device.
# The device path is obtained from $class->path(). volume_export and
# volume_import in this file call path() as ($scfg, $volname, $storeid), so
# the storage id goes third and the snapshot name fourth; previously the
# snapshot name was passed in the storage-id position.
# NOTE(review): path() is inherited and not visible here -- confirm its
# signature is ($scfg, $volname, $storeid, $snapname).
sub deactivate_volume {
    my ($class, $storeid, $scfg, $volname, $snapname, $cache) = @_;

    my $path = $class->path($scfg, $volname, $storeid, $snapname);
    return if ! -b $path;

    my $cmd = ['/sbin/lvchange', '-aln', $path];
    run_command($cmd, errmsg => "can't deactivate LV '$path'");
}
455
530defb6
AD
# Grow a logical volume to $size via 'lvextend -L'.
#
# $size is divided by 1024*1024 and passed to lvextend with an "M" suffix.
# Returns 1 on success.
sub volume_resize {
    my ($class, $scfg, $storeid, $volname, $size, $running) = @_;

    my $target = ($size/1024/1024) . "M";

    my $path = $class->path($scfg, $volname);

    run_command(
        ['/sbin/lvextend', '-L', $target, $path],
        errmsg => "error resizing volume '$path'",
    );

    return 1;
}
467
# Snapshots are not supported on this storage type; always dies.
sub volume_snapshot {
    my $class = shift;
    my ($scfg, $storeid, $volname, $snap) = @_;

    die "lvm snapshot is not implemented";
}
473
051e85b8
AD
# Snapshot rollback is not supported on this storage type; always dies.
sub volume_snapshot_rollback {
    my $class = shift;
    my ($scfg, $storeid, $volname, $snap) = @_;

    die "lvm snapshot rollback is not implemented";
}
479
f57e796b
AD
# Snapshot deletion is not supported on this storage type; always dies.
sub volume_snapshot_delete {
    my $class = shift;
    my ($scfg, $storeid, $volname, $snap) = @_;

    die "lvm snapshot delete is not implemented";
}
485
f7d4064f
AD
# Tell whether $feature is available for the given volume.
#
# Only 'copy' is known, and only for the 'base' and 'current' states; a
# volume addressed with a snapshot name is looked up under 'snap', for which
# nothing is listed. Returns 1 when available, undef otherwise.
sub volume_has_feature {
    my ($class, $scfg, $feature, $storeid, $volname, $snapname, $running) = @_;

    my %supported = (
        copy => { base => 1, current => 1},
    );

    my ($vtype, $name, $vmid, $basename, $basevmid, $isBase) =
        $class->parse_volname($volname);

    my $state = $snapname ? 'snap'
              : $isBase   ? 'base'
              :             'current';

    return $supported{$feature}->{$state} ? 1 : undef;
}
506
5cbbc78f
WB
# Export formats available for a volume.
#
# Nothing can be exported from a snapshot; otherwise the answer is whatever
# volume_import_formats() reports for the same arguments.
sub volume_export_formats {
    my ($class, $scfg, $storeid, $volname, $snapshot, $base_snapshot, $with_snapshots) = @_;

    # lvm-thin only
    if (defined($snapshot)) {
        return ();
    }

    return volume_import_formats($class, $scfg, $storeid, $volname, $base_snapshot, $with_snapshots);
}
512
# Stream a volume to the file handle $fh in 'raw+size' format.
#
# The device size is read with 'blockdev --getsize64', written to $fh via
# PVE::Storage::Plugin::write_common_header(), and then the device content
# is copied to $fh with dd. Dies for any other format, and for snapshot,
# incremental or with-snapshots requests.
sub volume_export {
    my ($class, $scfg, $storeid, $fh, $volname, $format, $snapshot, $base_snapshot, $with_snapshots) = @_;

    die "volume export format $format not available for $class\n"
        if $format ne 'raw+size';
    die "cannot export volumes together with their snapshots in $class\n"
        if $with_snapshots;
    die "cannot export a snapshot in $class\n" if defined($snapshot);
    die "cannot export an incremental stream in $class\n" if defined($base_snapshot);

    my $device = $class->path($scfg, $volname, $storeid);

    # should be faster than querying LVM, also checks for the device file's availability
    my $bytes;
    my $read_size = sub {
        my ($line) = @_;
        die "unexpected output from /sbin/blockdev: $line\n" if $line !~ /^(\d+)$/;
        $bytes = int($1);
    };
    run_command(['/sbin/blockdev', '--getsize64', $device], outfunc => $read_size);

    PVE::Storage::Plugin::write_common_header($fh, $bytes);

    # dd writes directly to the descriptor behind $fh
    run_command(['dd', "if=$device", "bs=64k"], output => '>&'.fileno($fh));
}
532
# Import formats accepted for a volume: 'raw+size' only, and nothing at all
# when snapshots or an incremental base snapshot are requested.
sub volume_import_formats {
    my ($class, $scfg, $storeid, $volname, $base_snapshot, $with_snapshots) = @_;

    # neither snapshots nor incremental streams are supported
    if ($with_snapshots) {
        return ();
    }
    if (defined($base_snapshot)) {
        return ();
    }

    return ('raw+size');
}
539
# Create a volume from a 'raw+size' stream read from the file handle $fh.
#
# Dies up front for an unsupported format, snapshot or incremental requests,
# a volume name whose format is not 'raw', or an LV that already exists.
# The size is taken from the stream header (divided by 1024 for
# alloc_image), the LV is allocated and filled with dd. If allocation or
# the copy fails, the volume is freed again and the original error is
# re-thrown.
sub volume_import {
    my ($class, $scfg, $storeid, $fh, $volname, $format, $base_snapshot, $with_snapshots) = @_;

    die "volume import format $format not available for $class\n"
        if $format ne 'raw+size';
    die "cannot import volumes together with their snapshots in $class\n"
        if $with_snapshots;
    die "cannot import an incremental stream in $class\n" if defined($base_snapshot);

    my ($vtype, $name, $vmid, $basename, $basevmid, $isBase, $file_format) =
        $class->parse_volname($volname);
    die "cannot import format $format into a file of format $file_format\n"
        if $file_format ne 'raw';

    my $vg = $scfg->{vgname};
    my $existing = lvm_list_volumes($vg);
    die "volume $vg/$volname already exists\n"
        if $existing->{$vg}->{$volname};

    my ($header_size) = PVE::Storage::Plugin::read_common_header($fh);
    my $size = int($header_size/1024);

    eval {
        my $allocated = $class->alloc_image($storeid, $scfg, $vmid, 'raw', $name, $size);
        if ($allocated ne $volname) {
            my $requested = $volname;
            $volname = $allocated; # Let the cleanup code know what to free
            die "internal error: unexpected allocated name: '$allocated' != '$requested'\n";
        }
        my $device = $class->path($scfg, $volname, $storeid)
            or die "internal error: failed to get path to newly allocated volume $volname\n";
        # dd reads directly from the descriptor behind $fh
        run_command(['dd', "of=$device", 'conv=sparse', 'bs=64k'],
            input => '<&'.fileno($fh));
    };
    if (my $err = $@) {
        # cleanup is best effort: a failure to free only warns
        eval { $class->free_image($storeid, $scfg, $volname, 0) };
        warn $@ if $@;
        die $err;
    }
}
579
1dc01b9f 5801;