]> git.proxmox.com Git - pve-storage.git/blame - PVE/Storage/LVMPlugin.pm
next diskname: start ids with 0 to honor MAX_VOLUMES_PER_GUEST
[pve-storage.git] / PVE / Storage / LVMPlugin.pm
CommitLineData
1dc01b9f
DM
1package PVE::Storage::LVMPlugin;
2
3use strict;
4use warnings;
074b2cb4 5
1dc01b9f 6use IO::File;
074b2cb4 7
1dc01b9f
DM
8use PVE::Tools qw(run_command trim);
9use PVE::Storage::Plugin;
10use PVE::JSONSchema qw(get_standard_option);
11
12use base qw(PVE::Storage::Plugin);
13
14# lvm helper functions
15
# Look up LVM physical-volume details for a single device.
#
# First asks file(1) whether the device carries an "LVM2" signature; if it
# does not, undef is returned. Otherwise pvs(8) is queried and a hash
# reference with the keys pvname, size (integer, reported with --units k),
# vgname and uuid is returned.
#
# Dies when no device is given or when pvs prints more than one line.
sub lvm_pv_info {
    my ($device) = @_;

    die "no device specified" if !$device;

    my $has_label = 0;
    my $detect_label = sub {
        my ($line) = @_;
        $has_label = 1 if $line =~ m/LVM2/;
    };
    run_command(['/usr/bin/file', '-L', '-s', $device], outfunc => $detect_label);

    return undef if !$has_label;

    my $pvs_cmd = [
        '/sbin/pvs', '--separator', ':', '--noheadings', '--units', 'k',
        '--unbuffered', '--nosuffix', '--options',
        'pv_name,pv_size,vg_name,pv_uuid', $device,
    ];

    my $pvinfo;
    my $parse_pvs_line = sub {
        my ($line) = @_;

        my $trimmed = trim($line);
        my ($pvname, $size, $vgname, $uuid) = split(':', $trimmed);

        # a second output line means the device maps to more than one PV entry
        die "found multiple pvs entries for device '$device'\n"
            if $pvinfo;

        $pvinfo = {
            pvname => $pvname,
            size => int($size),
            vgname => $vgname,
            uuid => $uuid,
        };
    };
    run_command($pvs_cmd, outfunc => $parse_pvs_line);

    return $pvinfo;
}
56
# Overwrite the first 512 bytes of $dev with NUL bytes.
#
# Best effort: if the device cannot be opened for writing nothing happens and
# no error is raised. The write result is not checked either.
sub clear_first_sector {
    my ($dev) = @_;

    my $fh = IO::File->new($dev, "w");
    return if !$fh;

    # "\0" x 512 yields real zero bytes; the numeric form (0 x 512) would
    # produce 512 ASCII '0' characters instead.
    my $buf = "\0" x 512;
    syswrite($fh, $buf);
    $fh->close();

    return;
}
66
# Create volume group $vgname on $device.
#
# Returns early when the device already belongs to $vgname and dies when it
# belongs to a different volume group. Otherwise the first sector is cleared,
# then pvcreate and vgcreate are run. $shared is accepted but currently not
# used.
sub lvm_create_volume_group {
    my ($device, $vgname, $shared) = @_;

    my $pv = lvm_pv_info($device);

    if ($pv->{vgname}) {
        # nothing to do if the device is already part of the requested VG
        return if $pv->{vgname} eq $vgname;
        die "device '$device' is already used by volume group '$pv->{vgname}'\n";
    }

    # pvcreate fails unless the first sector has been wiped
    clear_first_sector($device);

    # --metadatasize 250k results in "pe_start = 512", so pe_start is
    # aligned on a 128k boundary (advantage for SSDs)
    run_command(
        ['/sbin/pvcreate', '--metadatasize', '250k', $device],
        errmsg => "pvcreate '$device' error",
    );

    # clustered VGs ('-c y' when $shared) are not used yet
    run_command(
        ['/sbin/vgcreate', $vgname, $device],
        errmsg => "vgcreate $vgname $device error",
    );
}
90
# List volume groups via vgs(8).
#
# Returns a hash reference keyed by VG name; each value holds size, free
# (both requested with --units b) and lvcount as integers. When $includepvs
# is true the PV columns are requested too and every VG entry gets a 'pvs'
# list of { name, size, free } hashes.
#
# A failing vgs call only produces a warning; whatever was parsed so far is
# still returned.
sub lvm_vgs {
    my ($includepvs) = @_;

    my @columns = qw(vg_name vg_size vg_free lv_count);
    push @columns, qw(pv_name pv_size pv_free) if $includepvs;

    my $cmd = [
        '/sbin/vgs', '--separator', ':', '--noheadings', '--units', 'b',
        '--unbuffered', '--nosuffix', '--options', join(',', @columns),
    ];

    my $vgs = {};
    my $collect = sub {
        my ($line) = @_;

        $line = trim($line);

        my ($name, $size, $free, $lvcount, $pvname, $pvsize, $pvfree) = split(':', $line);

        # with PV columns a VG shows up once per PV; keep the first VG record
        if (!$vgs->{$name}) {
            $vgs->{$name} = {
                size => int($size),
                free => int($free),
                lvcount => int($lvcount),
            };
        }

        if (defined($pvname) && defined($pvsize) && defined($pvfree)) {
            my $pv = {
                name => $pvname,
                size => int($pvsize),
                free => int($pvfree),
            };
            push @{$vgs->{$name}->{pvs}}, $pv;
        }
    };

    eval { run_command($cmd, outfunc => $collect); };

    # just warn (vgs return error code 5 if clvmd does not run)
    # but output is still OK (list without clustered VGs)
    if (my $err = $@) {
        warn $err;
    }

    return $vgs;
}
134
# List logical volumes via lvs(8), optionally restricted to $vgname.
#
# Returns a two-level hash reference: { $vg_name => { $lv_name => $info } }.
# $info always has lv_size (integer, --units b) and lv_type (first character
# of lv_attr); pool_lv and tags are added when non-empty. For lv_type 't'
# the keys metadata_size, metadata_used and used are computed from the
# reported percentages.
sub lvm_list_volumes {
    my ($vgname) = @_;

    my @fields = qw(
        vg_name lv_name lv_size lv_attr pool_lv data_percent
        metadata_percent snap_percent uuid tags metadata_size
    );

    my $cmd = [
        '/sbin/lvs', '--separator', ':', '--noheadings', '--units', 'b',
        '--unbuffered', '--nosuffix', '--options', join(',', @fields),
    ];
    push @$cmd, $vgname if $vgname;

    my $lvs = {};
    my $parse_lv_line = sub {
        my ($line) = @_;

        $line = trim($line);

        my (
            $vg_name, $lv_name, $lv_size, $lv_attr, $pool_lv, $data_percent,
            $meta_percent, $snap_percent, $uuid, $tags, $meta_size,
        ) = split(':', $line);

        return if !$vg_name;
        return if !$lv_name;

        my $lv_type = substr($lv_attr, 0, 1);

        my $entry = {
            lv_size => int($lv_size),
            lv_type => $lv_type,
        };
        $entry->{pool_lv} = $pool_lv if $pool_lv;
        $entry->{tags} = $tags if $tags;

        if ($lv_type eq 't') {
            # empty percentage columns count as zero
            $data_percent ||= 0;
            $meta_percent ||= 0;
            $snap_percent ||= 0;

            $entry->{metadata_size} = int($meta_size);
            $entry->{metadata_used} = int(($meta_percent * $meta_size)/100);
            $entry->{used} = int(($data_percent * $lv_size)/100);
        }

        $lvs->{$vg_name}->{$lv_name} = $entry;
    };

    run_command($cmd, outfunc => $parse_lv_line);

    return $lvs;
}
176
5c687bd9 177# Configuration
1dc01b9f 178
1dc01b9f
DM
# Storage type identifier of this plugin.
sub type {
    my $plugin_type = 'lvm';
    return $plugin_type;
}
182
# Static plugin description: a 'content' entry made of two content-type sets.
# NOTE(review): presumably the first set lists the allowed content types and
# the second the default ones - confirm against the plugin base class.
sub plugindata {
    my $first_set = { images => 1, rootdir => 1 };
    my $second_set = { images => 1 };

    return {
        content => [ $first_set, $second_set ],
    };
}
188
# Schema of the configuration properties introduced by this plugin.
# Returns a fresh hash reference mapping property name to its schema.
sub properties {
    my %schema;

    $schema{vgname} = {
        description => "Volume group name.",
        type => 'string',
        format => 'pve-storage-vgname',
    };

    $schema{base} = {
        description => "Base volume. This volume is automatically activated.",
        type => 'string',
        format => 'pve-volume-id',
    };

    $schema{saferemove} = {
        description => "Zero-out data when removing LVs.",
        type => 'boolean',
    };

    $schema{saferemove_throughput} = {
        description => "Wipe throughput (cstream -t parameter value).",
        type => 'string',
    };

    $schema{tagged_only} = {
        description => "Only use logical volumes tagged with 'pve-vm-ID'.",
        type => 'boolean',
    };

    return \%schema;
}
213
# Options accepted for storages of this type. Returns a hash reference
# mapping option name to its flags ('fixed' and/or 'optional').
sub options {
    # everything that is merely optional
    my @optional_only = qw(
        nodes shared disable saferemove saferemove_throughput
        content tagged_only bwlimit
    );

    my %opts = map { $_ => { optional => 1 } } @optional_only;

    $opts{vgname} = { fixed => 1 };
    $opts{base} = { fixed => 1, optional => 1 };

    return \%opts;
}
228
229# Storage implementation
230
f9602323
TL
# Hook run when a storage of this type is added.
#
# Only acts when the storage configuration has a 'base' volume: the base
# storage must exist and be of type 'iscsi'; it is activated and the volume
# group $scfg->{vgname} is created on the base volume's path.
sub on_add_hook {
    my ($class, $storeid, $scfg, %param) = @_;

    my $base = $scfg->{base};
    return if !$base;

    my ($baseid, $volname) = PVE::Storage::parse_volume_id($base);

    my $cfg = PVE::Storage::config();
    my $basecfg = PVE::Storage::storage_config ($cfg, $baseid, 1);
    if (!$basecfg) {
        die "base storage ID '$baseid' does not exist\n";
    }

    # we only support iscsi for now
    if ($basecfg->{type} ne 'iscsi') {
        die "unsupported base type '$basecfg->{type}'";
    }

    my $path = PVE::Storage::path($cfg, $base);

    PVE::Storage::activate_storage($cfg, $baseid);

    lvm_create_volume_group($path, $scfg->{vgname}, $scfg->{shared});
}
252
1dc01b9f
DM
# Split a volume name of the form 'vm-<vmid>-<rest>' into its parts.
#
# Returns the list ('images', $name, $vmid, undef, undef, undef, 'raw').
# The name is first passed to PVE::Storage::Plugin::parse_lvm_name; dies
# when it does not match the expected pattern.
sub parse_volname {
    my ($class, $volname) = @_;

    PVE::Storage::Plugin::parse_lvm_name($volname);

    my ($name, $vmid) = $volname =~ m/^(vm-(\d+)-\S+)$/
        or die "unable to parse lvm volume name '$volname'\n";

    return ('images', $name, $vmid, undef, undef, undef, 'raw');
}
264
# Map a volume name to its device node below /dev/<vgname>/.
#
# In list context returns ($path, $vmid, $vtype), in scalar context only the
# path. Dies when a snapshot name is given.
sub filesystem_path {
    my ($class, $scfg, $volname, $snapname) = @_;

    if (defined($snapname)) {
        die "lvm snapshot is not implemented";
    }

    my ($vtype, $name, $vmid) = $class->parse_volname($volname);

    my $path = join('/', '/dev', $scfg->{vgname}, $name);

    return $path if !wantarray;
    return ($path, $vmid, $vtype);
}
278
5eab0272
DM
# Base images are not supported by this plugin; always dies.
sub create_base {
    my ($class, $storeid, $scfg, $volname) = @_;

    my $reason = "can't create base images in lvm storage\n";
    die $reason;
}
284
# Cloning is not supported by this plugin; always dies.
sub clone_image {
    my ($class, $scfg, $storeid, $volname, $vmid, $snap) = @_;

    my $reason = "can't clone images in lvm storage\n";
    die $reason;
}
290
b1378461
DM
# Pick the first unused 'vm-<vmid>-disk-<n>' name (n = 1..99) in a VG.
#
# $lvs     - volume listing shaped like { $vg => { $lv_name => ... } }
# $vg      - volume group to inspect
# $storeid - only used in the error message
# $vmid    - guest ID the disk is allocated for
#
# Returns the free name; dies when all ids from 1 to 99 are taken.
sub lvm_find_free_diskname {
    my ($lvs, $vg, $storeid, $vmid) = @_;

    # fall back to an empty hash so a missing VG entry is neither an error
    # nor autovivified into the caller's structure
    my $volumes = $lvs->{$vg} || {};

    my $disk_ids = {};
    foreach my $vol (keys %$volumes) {
        # anchored at the start: only real 'vm-'/'base-' volumes of this
        # guest reserve an id, not names that merely contain such a string
        if ($vol =~ m/^(?:vm|base)-\Q$vmid\E-disk-(\d+)/) {
            $disk_ids->{$1} = 1;
        }
    }

    foreach my $i (1 .. 99) {
        return "vm-$vmid-disk-$i" if !$disk_ids->{$i};
    }

    die "unable to allocate an image name for ID $vmid in storage '$storeid'\n";
}
312
1dc01b9f
DM
# Allocate a new raw logical volume for guest $vmid.
#
# $fmt  - must be 'raw'
# $name - optional; must start with 'vm-$vmid-' when given, otherwise the
#         next free 'vm-$vmid-disk-N' name is chosen
# $size - requested size; handed to lvcreate with a 'k' suffix
#
# The LV is created active and tagged 'pve-vm-$vmid'. Returns the volume
# name. Dies on unsupported format, illegal name, unknown volume group,
# insufficient free space or lvcreate failure.
sub alloc_image {
    my ($class, $storeid, $scfg, $vmid, $fmt, $name, $size) = @_;

    die "unsupported format '$fmt'" if $fmt ne 'raw';

    die "illegal name '$name' - sould be 'vm-$vmid-*'\n"
        if $name && $name !~ m/^vm-$vmid-/;

    my $vgs = lvm_vgs();

    my $vg = $scfg->{vgname};

    die "no such volume group '$vg'\n" if !defined ($vgs->{$vg});

    # lvm_vgs() queries vgs with '--units b', while $size is passed to
    # lvcreate as "${size}k" - convert before comparing so both sides are
    # in bytes
    my $free = int($vgs->{$vg}->{free});
    my $size_bytes = $size * 1024;

    die "not enough free space ($free < $size_bytes)\n" if $free < $size_bytes;

    $name = lvm_find_free_diskname(lvm_list_volumes($vg), $vg, $storeid, $vmid)
        if !$name;

    my $cmd = ['/sbin/lvcreate', '-aly', '--addtag', "pve-vm-$vmid", '--size', "${size}k", '--name', $name, $vg];

    run_command($cmd, errmsg => "lvcreate '$vg/pve-vm-$vmid' error");

    return $name;
}
340
# Remove a logical volume.
#
# The LV is activated first. Without 'saferemove' it is removed right away
# and undef is returned. With 'saferemove' it is only renamed to
# 'del-<volname>' and a code reference is returned; calling that reference
# overwrites the renamed LV with zeros via cstream (throughput taken from
# 'saferemove_throughput', default '-10485760') and then removes it while
# holding the cluster storage lock.
sub free_image {
    my ($class, $storeid, $scfg, $volname, $isBase) = @_;

    my $vg = $scfg->{vgname};

    # we need to zero out LVM data for security reasons
    # and to allow thin provisioning
    my $zero_out_worker = sub {
        print "zero-out data on image $volname (/dev/$vg/del-$volname)\n";

        # wipe throughput up to 10MB/s by default; may be overwritten with saferemove_throughput
        my $throughput = $scfg->{saferemove_throughput} || '-10485760';

        my @wipe = (
            '/usr/bin/cstream',
            '-i', '/dev/zero',
            '-o', "/dev/$vg/del-$volname",
            '-T', '10',
            '-v', '1',
            '-b', '1048576',
            '-t', "$throughput",
        );
        eval { run_command(\@wipe, errmsg => "zero out finished (note: 'No space left on device' is ok here)"); };
        warn $@ if $@;

        my $remove_renamed = sub {
            run_command(
                ['/sbin/lvremove', '-f', "$vg/del-$volname"],
                errmsg => "lvremove '$vg/del-$volname' error",
            );
        };
        $class->cluster_lock_storage($storeid, $scfg->{shared}, undef, $remove_renamed);

        print "successfully removed volume $volname ($vg/del-$volname)\n";
    };

    run_command(
        ['/sbin/lvchange', '-aly', "$vg/$volname"],
        errmsg => "can't activate LV '$vg/$volname' to zero-out its data",
    );

    if (!$scfg->{saferemove}) {
        run_command(
            ['/sbin/lvremove', '-f', "$vg/$volname"],
            errmsg => "lvremove '$vg/$volname' error",
        );
        return undef;
    }

    # avoid long running task, so we only rename here
    run_command(
        ['/sbin/lvrename', $vg, $volname, "del-$volname"],
        errmsg => "lvrename '$vg/$volname' error",
    );

    return $zero_out_worker;
}
393
7a9dd119
FG
# True when the comma separated tag list contains a 'pve-vm-<digits>' tag;
# false for an undefined tag list.
my $check_tags = sub {
    my $tag_list = shift;

    return defined($tag_list) && $tag_list =~ /(^|,)pve-vm-\d+(,|$)/;
};
399
1dc01b9f
DM
# List the images of this storage.
#
# Uses $cache->{lvs} (filled from lvm_list_volumes() when empty). Only LVs
# named 'vm-<id>-...' with lv_type '-' are considered; with 'tagged_only'
# set they must also pass the tag check. When $vollist is given only the
# listed volume IDs are returned, otherwise $vmid (if defined) filters by
# owner. Returns an array reference of { volid, format, size, vmid }.
sub list_images {
    my ($class, $storeid, $scfg, $vmid, $vollist, $cache) = @_;

    my $vgname = $scfg->{vgname};

    $cache->{lvs} = lvm_list_volumes() if !$cache->{lvs};

    my $res = [];

    my $dat = $cache->{lvs}->{$vgname};
    return $res if !$dat;

    # membership lookup for the explicit volume list, if one was passed
    my %wanted;
    %wanted = map { $_ => 1 } @$vollist if $vollist;

    foreach my $volname (keys %$dat) {
        my ($owner) = $volname =~ m/^vm-(\d+)-/;
        next if !defined($owner);

        my $info = $dat->{$volname};

        next if $scfg->{tagged_only} && !$check_tags->($info->{tags});

        next if $info->{lv_type} ne '-';

        my $volid = "$storeid:$volname";

        if ($vollist) {
            next if !$wanted{$volid};
        } elsif (defined($vmid)) {
            next if $owner ne $vmid;
        }

        push @$res, {
            volid => $volid,
            format => 'raw',
            size => $info->{lv_size},
            vmid => $owner,
        };
    }

    return $res;
}
439
# Report usage of the storage's volume group.
#
# Uses $cache->{vgs} (filled from lvm_vgs() when empty). Returns the list
# (size, free, size - free, 1) for the configured volume group, or undef
# when the volume group is not known.
# NOTE(review): the trailing 1 is presumably an "active" flag - confirm
# against the callers.
sub status {
    my ($class, $storeid, $scfg, $cache) = @_;

    $cache->{vgs} = lvm_vgs() if !$cache->{vgs};

    my $info = $cache->{vgs}->{$scfg->{vgname}};
    return undef if !$info;

    my ($total, $avail) = ($info->{size}, $info->{free});

    return ($total, $avail, $total - $avail, 1);
}
453
# Make sure the storage's volume group is visible.
#
# Fills $cache->{vgs} when empty. If the configured volume group is not in
# that list and no scan was recorded in $cache->{vgscaned} yet, vgscan is
# run once (failures only warn). No volumes are activated here.
sub activate_storage {
    my ($class, $storeid, $scfg, $cache) = @_;

    $cache->{vgs} = lvm_vgs() if !$cache->{vgs};

    my $known_vgs = $cache->{vgs};

    # In LVM2, vgscans take place automatically;
    # this is just to be sure
    my $need_scan = $known_vgs
        && !$cache->{vgscaned}
        && !$known_vgs->{$scfg->{vgname}};

    if ($need_scan) {
        $cache->{vgscaned} = 1;
        eval {
            run_command(
                ['/sbin/vgscan', '--ignorelockingfailure', '--mknodes'],
                outfunc => sub {},
            );
        };
        warn $@ if $@;
    }

    # we do not activate any volumes here ('vgchange -aly')
    # instead, volumes are activated individually later
}
472
# Deactivate the storage's volume group with 'vgchange -aln'.
# Error handling is left to run_command, which receives the message below.
sub deactivate_storage {
    my ($class, $storeid, $scfg, $cache) = @_;

    my $vg = $scfg->{vgname};

    run_command(
        ['/sbin/vgchange', '-aln', $vg],
        errmsg => "can't deactivate VG '$vg'",
    );
}
479
# Activate a single logical volume with 'lvchange -aey'.
# Error handling is left to run_command, which receives the message below.
sub activate_volume {
    my ($class, $storeid, $scfg, $volname, $snapname, $cache) = @_;

    # Pass the storage ID before the snapshot name, matching the other
    # path() calls in this file, which pass $storeid as third argument.
    # NOTE(review): confirm the parameter order of the inherited path().
    my $path = $class->path($scfg, $volname, $storeid, $snapname);

    #fix me lvmchange is not provided on
    my $lvm_activate_mode = 'ey';

    my $cmd = ['/sbin/lvchange', "-a$lvm_activate_mode", $path];
    run_command($cmd, errmsg => "can't activate LV '$path'");
}
490
# Deactivate a single logical volume with 'lvchange -aln'.
# Does nothing when the volume's path is not a block device.
sub deactivate_volume {
    my ($class, $storeid, $scfg, $volname, $snapname, $cache) = @_;

    # Pass the storage ID before the snapshot name, matching the other
    # path() calls in this file, which pass $storeid as third argument.
    # NOTE(review): confirm the parameter order of the inherited path().
    my $path = $class->path($scfg, $volname, $storeid, $snapname);
    return if ! -b $path;

    my $cmd = ['/sbin/lvchange', '-aln', $path];
    run_command($cmd, errmsg => "can't deactivate LV '$path'");
}
500
530defb6
AD
# Grow a logical volume to $size with lvextend.
#
# $size is divided by 1024 twice and passed to 'lvextend -L' with an 'M'
# suffix. Returns 1; failures are reported through run_command.
sub volume_resize {
    my ($class, $scfg, $storeid, $volname, $size, $running) = @_;

    my $size_arg = ($size/1024/1024) . "M";

    my $path = $class->path($scfg, $volname);

    run_command(
        ['/sbin/lvextend', '-L', $size_arg, $path],
        errmsg => "error resizing volume '$path'",
    );

    return 1;
}
512
# Snapshots are not supported by this plugin; always dies.
sub volume_snapshot {
    my ($class, $scfg, $storeid, $volname, $snap) = @_;

    my $reason = "lvm snapshot is not implemented";
    die $reason;
}
518
051e85b8
AD
# Snapshot rollback is not supported by this plugin; always dies.
sub volume_snapshot_rollback {
    my ($class, $scfg, $storeid, $volname, $snap) = @_;

    my $reason = "lvm snapshot rollback is not implemented";
    die $reason;
}
524
f57e796b
AD
# Snapshot deletion is not supported by this plugin; always dies.
sub volume_snapshot_delete {
    my ($class, $scfg, $storeid, $volname, $snap) = @_;

    my $reason = "lvm snapshot delete is not implemented";
    die $reason;
}
530
f7d4064f
AD
# Tell whether $feature is available for the given volume state.
#
# The only known feature is 'copy', available for base and current volumes
# but not for snapshots. Returns 1 when supported, undef otherwise.
sub volume_has_feature {
    my ($class, $scfg, $feature, $storeid, $volname, $snapname, $running) = @_;

    my %supported = (
        copy => { base => 1, current => 1 },
    );

    my ($vtype, $name, $vmid, $basename, $basevmid, $isBase) =
        $class->parse_volname($volname);

    # pick the volume state the feature table is indexed by
    my $state;
    if ($snapname) {
        $state = 'snap';
    } elsif ($isBase) {
        $state = 'base';
    } else {
        $state = 'current';
    }

    return 1 if $supported{$feature}->{$state};

    return undef;
}
551
5cbbc78f
WB
# Formats a volume can be exported in.
#
# Returns the empty list when a snapshot is requested (lvm-thin only);
# otherwise the same list as volume_import_formats().
sub volume_export_formats {
    my ($class, $scfg, $storeid, $volname, $snapshot, $base_snapshot, $with_snapshots) = @_;

    if (defined($snapshot)) {
        return ();
    }

    return volume_import_formats($class, $scfg, $storeid, $volname, $base_snapshot, $with_snapshots);
}
557
# Stream a volume to the file handle $fh in 'raw+size' format.
#
# The device size is read with 'blockdev --getsize64', written through
# PVE::Storage::Plugin::write_common_header, and then the device content is
# copied to $fh with dd. Dies for any other format, for snapshot or
# incremental exports, and on unexpected blockdev output.
sub volume_export {
    my ($class, $scfg, $storeid, $fh, $volname, $format, $snapshot, $base_snapshot, $with_snapshots) = @_;

    if ($format ne 'raw+size') {
        die "volume export format $format not available for $class\n";
    }
    if ($with_snapshots) {
        die "cannot export volumes together with their snapshots in $class\n";
    }
    if (defined($snapshot)) {
        die "cannot export a snapshot in $class\n";
    }
    if (defined($base_snapshot)) {
        die "cannot export an incremental stream in $class\n";
    }

    my $file = $class->path($scfg, $volname, $storeid);

    my $size;
    my $read_size = sub {
        my ($line) = @_;
        die "unexpected output from /sbin/blockdev: $line\n" if $line !~ /^(\d+)$/;
        $size = int($1);
    };

    # should be faster than querying LVM, also checks for the device file's availability
    run_command(['/sbin/blockdev', '--getsize64', $file], outfunc => $read_size);

    PVE::Storage::Plugin::write_common_header($fh, $size);

    # hand our output handle to dd as its stdout
    my $target = '>&'.fileno($fh);
    run_command(['dd', "if=$file", "bs=64k"], output => $target);
}
577
# Formats a volume can be imported from.
#
# Returns ('raw+size') unless snapshots or an incremental base snapshot are
# requested, in which case the empty list is returned.
sub volume_import_formats {
    my ($class, $scfg, $storeid, $volname, $base_snapshot, $with_snapshots) = @_;

    # neither snapshots nor incremental streams are supported
    my $unsupported = $with_snapshots || defined($base_snapshot);

    return $unsupported ? () : ('raw+size');
}
584
# Create a volume from a 'raw+size' stream read from $fh.
#
# Dies for any other format, for snapshot or incremental imports, and when
# the target volume already exists. The size from the stream header is
# divided by 1024 and used to allocate the LV, then the payload is written
# to it with dd. If anything fails after the header was read, free_image is
# called for cleanup and the original error is re-thrown.
sub volume_import {
    my ($class, $scfg, $storeid, $fh, $volname, $format, $base_snapshot, $with_snapshots) = @_;

    if ($format ne 'raw+size') {
        die "volume import format $format not available for $class\n";
    }
    if ($with_snapshots) {
        die "cannot import volumes together with their snapshots in $class\n";
    }
    if (defined($base_snapshot)) {
        die "cannot import an incremental stream in $class\n";
    }

    my ($vtype, $name, $vmid, $basename, $basevmid, $isBase, $file_format) =
        $class->parse_volname($volname);
    if ($file_format ne 'raw') {
        die "cannot import format $format into a file of format $file_format\n";
    }

    my $vg = $scfg->{vgname};
    my $existing = lvm_list_volumes($vg);
    if ($existing->{$vg}->{$volname}) {
        die "volume $vg/$volname already exists\n";
    }

    my ($size) = PVE::Storage::Plugin::read_common_header($fh);
    $size = int($size/1024);

    my $write_volume = sub {
        my $allocname = $class->alloc_image($storeid, $scfg, $vmid, 'raw', $name, $size);
        if ($allocname ne $volname) {
            my $oldname = $volname;
            $volname = $allocname; # Let the cleanup code know what to free
            die "internal error: unexpected allocated name: '$allocname' != '$oldname'\n";
        }

        my $file = $class->path($scfg, $volname, $storeid)
            or die "internal error: failed to get path to newly allocated volume $volname\n";

        # feed our input handle to dd as its stdin
        my $source = '<&'.fileno($fh);
        run_command(['dd', "of=$file", 'conv=sparse', 'bs=64k'], input => $source);
    };

    eval { $write_volume->(); };
    if (my $err = $@) {
        eval { $class->free_image($storeid, $scfg, $volname, 0) };
        warn $@ if $@;
        die $err;
    }
}
624
1dc01b9f 6251;