]> git.proxmox.com Git - pve-storage.git/blame - PVE/Storage/ZFSPoolPlugin.pm
allow --allow-shrink on RBD resize
[pve-storage.git] / PVE / Storage / ZFSPoolPlugin.pm
CommitLineData
85fda4dd 1package PVE::Storage::ZFSPoolPlugin;
5bb8e010
DM
2
3use strict;
4use warnings;
5use IO::File;
6use POSIX;
7use PVE::Tools qw(run_command);
8use PVE::Storage::Plugin;
21430e50 9use PVE::RPCEnvironment;
5bb8e010
DM
10
11use base qw(PVE::Storage::Plugin);
12
# Returns the type identifier of this storage plugin.
sub type {
    my $plugin_type = 'zfspool';
    return $plugin_type;
}
16
# Returns the static plugin description: a hash reference with the keys
# 'content' and 'format'. Each value is a two element array.
# NOTE(review): presumably [ allowed values, default ] as expected by
# PVE::Storage::Plugin - confirm against the base class.
sub plugindata {
    my %content_types = (images => 1, rootdir => 1);
    my %formats = (raw => 1, subvol => 1);

    my $data = {
        content => [ { %content_types }, { %content_types } ],
        format => [ { %formats }, 'raw' ],
    };

    return $data;
}
5bb8e010 23
7730694e
DM
# Returns the schema of the configuration properties introduced by this
# plugin: 'blocksize' (string) and 'sparse' (boolean).
sub properties {
    my %blocksize = (
        description => "block size",
        type => 'string',
    );
    my %sparse = (
        description => "use sparse volumes",
        type => 'boolean',
    );

    return {
        blocksize => \%blocksize,
        sparse => \%sparse,
    };
}
36
5bb8e010
DM
# Returns the configuration options accepted by this plugin. 'pool' is
# marked as fixed, all other options are marked as optional.
sub options {
    my %opts = (pool => { fixed => 1 });

    foreach my $key (qw(blocksize sparse nodes disable content)) {
        $opts{$key} = { optional => 1 };
    }

    return \%opts;
}
47
7730694e
DM
48# static zfs helper methods
49
060ef890
DM
# Convert a size string (e.g. "10", "1.5G") into a plain number.
#
# $text - decimal number, optionally with a fractional part, optionally
#         followed by one of the unit suffixes K, M, G, T, P or E. Every
#         suffix is a power of 1024.
#
# Returns the scaled size, rounded up to a whole number when the input had
# a fractional part. Returns 0 if $text is empty/false. For any other
# input that cannot be parsed a warning is emitted and 0 is returned.
sub zfs_parse_size {
    my ($text) = @_;

    return 0 if !$text;

    # power of 1024 selected by each unit suffix
    my $exponent_of = { K => 1, M => 2, G => 3, T => 4, P => 5, E => 6 };

    if ($text =~ m/^(\d+(\.\d+)?)([KMGTPE])?$/) {
        my ($size, $fraction, $unit) = ($1, $2, $3);

        $size *= 1024 ** $exponent_of->{$unit} if $unit;

        # only an input with a fractional part can yield a non-integer
        $size = ceil($size) if $fraction;

        return $size;
    }

    warn "unable to parse zfs size '$text'\n";

    return 0;
}
85
7730694e
DM
# Parse whitespace separated dataset lines with the columns
#   name, volsize, origin, type, refquota
# (the column set requested by zfs_list_zvol).
#
# Only datasets of type 'volume' or 'filesystem' that live below a pool
# (pool/name) and whose last path component looks like
# (vm|base|subvol|basevol)-<vmid>-<suffix> are kept. Lines with too few
# columns are skipped.
#
# Returns an array reference of hashes with the keys owner, pool, name,
# size, format ('subvol' for filesystems, 'raw' for volumes) and - unless
# the origin column is '-' - origin. Returns undef if $text is empty or no
# line qualified.
sub zfs_parse_zvol_list {
    my ($text) = @_;

    # intentionally left undefined until the first entry is pushed
    my $list;

    return $list if !$text;

    foreach my $line (split /\n/, $text) {
        my ($dataset, $size, $origin, $type, $refquota) = split(/\s+/, $line);

        # a line without a type column cannot be classified
        next if !defined($type);
        next if !($type eq 'volume' || $type eq 'filesystem');

        my @parts = split /\//, $dataset;
        next if scalar(@parts) < 2; # we need pool/name
        my $name = pop @parts;
        my $pool = join('/', @parts);

        next unless $name =~ m!^(vm|base|subvol|basevol)-(\d+)-(\S+)$!;

        my $zvol = {
            owner => $2,
            pool => $pool,
            name => $name,
        };

        if ($type eq 'filesystem') {
            # a missing refquota column is treated like 'none'
            if (!defined($refquota) || $refquota eq 'none') {
                $zvol->{size} = 0;
            } else {
                $zvol->{size} = zfs_parse_size($refquota);
            }
            $zvol->{format} = 'subvol';
        } else {
            $zvol->{size} = zfs_parse_size($size);
            $zvol->{format} = 'raw';
        }

        if ($origin !~ /^-$/) {
            $zvol->{origin} = $origin;
        }

        push @$list, $zvol;
    }

    return $list;
}
128
cc80ed9c
WL
# Split a volume name into its components.
#
# Accepted forms are "<name>" and "<basename>/<name>", where <name> is
# (base|basevol|vm|subvol)-<vmid>-<suffix> and <basename> is
# (base|basevol)-<vmid>-<suffix>.
#
# Returns the list
#   ('images', $name, $vmid, $basename, $basevmid, $isBase, $format)
# $basename and $basevmid are undef when there is no "<basename>/" part,
# $isBase is true for base/basevol names and $format is 'subvol' for
# subvol/basevol names, 'raw' otherwise.
#
# Dies if $volname has neither of the accepted forms.
sub parse_volname {
    my ($class, $volname) = @_;

    my @captures = $volname =~ m/^(((base|basevol)-(\d+)-\S+)\/)?((base|basevol|vm|subvol)-(\d+)-\S+)$/;

    die "unable to parse zfs volume name '$volname'\n" if !@captures;

    # capture groups 1 and 3 are only needed for grouping
    my (undef, $basename, undef, $basevmid, $name, $prefix, $vmid) = @captures;

    my $isBase = ($prefix eq 'base' || $prefix eq 'basevol');
    my $format = ($prefix eq 'subvol' || $prefix eq 'basevol') ? 'subvol' : 'raw';

    return ('images', $name, $vmid, $basename, $basevmid, $isBase, $format);
}
140
7730694e
DM
141# virtual zfs methods (subclass can overwrite them)
142
# Compute the filesystem path for a volume (or one of its snapshots).
#
# Names starting with 'subvol-' or 'basevol-' map to "/<pool>/<name>",
# everything else to "/dev/zvol/<pool>/<name>". "@<snapname>" is appended
# when $snapname is defined.
#
# Returns ($path, $vmid, $vtype). Dies if parse_volname reports a volume
# type other than 'images'.
sub path {
    my ($class, $scfg, $volname, $storeid, $snapname) = @_;

    my ($vtype, $name, $vmid) = $class->parse_volname($volname);

    die "$vtype is not allowed in ZFSPool!" if $vtype ne "images";

    my $is_subvol = ($name =~ m/^subvol-/ || $name =~ m/^basevol-/);

    # fixme: we currently assume standard mount point?!
    my $root = $is_subvol ? "/" : "/dev/zvol/";

    my $path = "$root$scfg->{pool}/$name";
    $path .= "\@$snapname" if defined($snapname);

    return ($path, $vmid, $vtype);
}
164
7730694e
DM
# Run a zfs (or zpool) command and return its collected output.
#
# $timeout - passed on to run_command; when false it defaults to 60*60 if
#            PVE::RPCEnvironment::is_worker() is true, and to 5 otherwise
# $method  - zfs sub command; the special value 'zpool_list' runs
#            'zpool list' instead
# @params  - further command line arguments
#
# Returns every output line handed to the output callback, each terminated
# by a newline, as one string. Errors are raised by run_command, which is
# called with the error message prefix "zfs error".
sub zfs_request {
    my ($class, $scfg, $timeout, $method, @params) = @_;

    if (!$timeout) {
        $timeout = PVE::RPCEnvironment::is_worker() ? 60*60 : 5;
    }

    my @cmd = $method eq 'zpool_list' ? ('zpool', 'list') : ('zfs', $method);
    push @cmd, @params;

    my $msg = '';
    my $collect = sub {
        my ($line) = @_;
        $msg .= "$line\n";
    };

    run_command(\@cmd, errmsg => "zfs error", outfunc => $collect, timeout => $timeout);

    return $msg;
}
192
b3ba95e4
WL
# Allocate a new volume and return its name.
#
# $fmt  - 'raw' creates a zvol, 'subvol' creates a filesystem dataset
# $name - optional volume name; when empty a free name is obtained from
#         zfs_find_free_diskname
# $size - passed on unchanged to zfs_create_zvol / zfs_create_subvol
#
# The resulting name has to start with "vm-<vmid>-" for 'raw' and with
# "subvol-<vmid>-" for 'subvol'. For 'raw' volumes udev is triggered and
# 'udevadm settle' waits up to 10 seconds for the device node below
# /dev/zvol to show up.
#
# Dies on an unsupported format or an illegal name.
sub alloc_image {
    my ($class, $storeid, $scfg, $vmid, $fmt, $name, $size) = @_;

    my $prefix_of = { raw => 'vm', subvol => 'subvol' };
    my $prefix = $prefix_of->{$fmt};

    die "unsupported format '$fmt'" if !$prefix;

    my $volname = $name;
    $volname = $class->zfs_find_free_diskname($storeid, $scfg, $vmid, $fmt)
        if !$volname;

    # one check covers caller supplied and generated names alike
    die "illegal name '$volname' - should be '$prefix-$vmid-*'\n"
        if $volname !~ m/^\Q$prefix\E-\Q$vmid\E-/;

    if ($fmt eq 'raw') {
        $class->zfs_create_zvol($scfg, $volname, $size);

        my $devname = "/dev/zvol/$scfg->{pool}/$volname";

        run_command("udevadm trigger --subsystem-match block");
        system('udevadm', 'settle', '--timeout', '10', "--exit-if-exists=${devname}");
    } else {
        $class->zfs_create_subvol($scfg, $volname, $size);
    }

    return $volname;
}
229
e9565df5
WL
# Remove a volume: the dataset name is taken from parse_volname and handed
# to zfs_delete_zvol. Always returns undef.
sub free_image {
    my ($class, $storeid, $scfg, $volname, $isBase) = @_;

    my $name = ($class->parse_volname($volname))[1];

    $class->zfs_delete_zvol($scfg, $name);

    return undef;
}
239
ca04180f
WL
# List the volumes of the configured pool.
#
# The dataset list is read from $cache->{zfs}; it is filled via
# zfs_list_zvol when not yet present. Every returned entry gets a 'volid'
# of the form "<storeid>:<name>", or "<storeid>:<basename>/<name>" when
# its parent is a "<basename>@__base__" snapshot.
#
# $vollist - when set, only entries whose volid is contained are returned
# $vmid    - otherwise, when defined, only entries owned by that guest
#
# Returns an array reference of the (modified) cache entries.
sub list_images {
    my ($class, $storeid, $scfg, $vmid, $vollist, $cache) = @_;

    $cache->{zfs} = $class->zfs_list_zvol($scfg) if !$cache->{zfs};

    my $res = [];

    my $dat = $cache->{zfs}->{$scfg->{pool}};
    return $res if !$dat;

    foreach my $image (keys %$dat) {
        my $info = $dat->{$image};

        my $volname = $info->{name};
        my $parent = $info->{parent};
        my $owner = $info->{vmid};

        my $volid = "$storeid:$volname";
        if ($parent && $parent =~ m/^(\S+)\@__base__$/) {
            $volid = "$storeid:$1/$volname";
        }
        $info->{volid} = $volid;

        if ($vollist) {
            my $found = grep { $_ eq $volid } @$vollist;
            next if !$found;
        } elsif (defined($vmid)) {
            next if $owner ne $vmid;
        }

        push @$res, $info;
    }

    return $res;
}
276
7730694e
DM
# Query the 'available' and 'used' properties of the configured pool.
#
# The first output line of 'zfs get -o value -Hp available,used <pool>' is
# taken as 'available', the second one as 'used'. A line that is missing
# or does not consist of digits only leaves the respective value at 0.
#
# Returns ($available, $used).
sub zfs_get_pool_stats {
    my ($class, $scfg) = @_;

    my $available = 0;
    my $used = 0;

    my $text = $class->zfs_request($scfg, undef, 'get', '-o', 'value', '-Hp',
        'available,used', $scfg->{pool});

    my @lines = split /\n/, (defined($text) ? $text : '');

    # the output may be shorter than expected, so check before matching
    if (defined($lines[0]) && $lines[0] =~ /^(\d+)$/) {
        $available = $1;
    }

    if (defined($lines[1]) && $lines[1] =~ /^(\d+)$/) {
        $used = $1;
    }

    return ($available, $used);
}
298
7730694e
DM
# Create the zvol "<pool>/<zvol>" with a volume size of "<size>k".
# '-s' is added when the 'sparse' option is set, '-b <blocksize>' when the
# 'blocksize' option is set.
sub zfs_create_zvol {
    my ($class, $scfg, $zvol, $size) = @_;

    my @flags = (
        $scfg->{sparse} ? ('-s') : (),
        $scfg->{blocksize} ? ('-b', $scfg->{blocksize}) : (),
    );

    my $dataset = "$scfg->{pool}/$zvol";

    $class->zfs_request($scfg, undef, 'create', @flags, '-V', "${size}k", $dataset);
}
312
1ccae449
DM
# Create the filesystem dataset "<pool>/<volname>" with the properties
# acltype=posixacl, xattr=sa and refquota="<size>k".
sub zfs_create_subvol {
    my ($class, $scfg, $volname, $size) = @_;

    my @properties = ('acltype=posixacl', 'xattr=sa', "refquota=${size}k");

    # every property is passed as its own '-o' option
    my @args = ('create', (map { ('-o', $_) } @properties), "$scfg->{pool}/$volname");

    $class->zfs_request($scfg, undef, @args);
}
323
7730694e
DM
# Recursively destroy the dataset "<pool>/<zvol>".
#
# Up to six attempts are made: a "dataset is busy" error is followed by a
# one second pause and another attempt, a "dataset does not exist" error
# counts as success, any other error is raised immediately. The last
# "busy" error is raised when all attempts failed.
sub zfs_delete_zvol {
    my ($class, $scfg, $zvol) = @_;

    my $err;

    foreach my $attempt (1 .. 6) {
        eval { $class->zfs_request($scfg, undef, 'destroy', '-r', "$scfg->{pool}/$zvol"); };
        $err = $@;

        last if !$err;

        if ($err =~ m/^zfs error:(.*): dataset is busy.*/) {
            sleep(1);
            next;
        }

        if ($err =~ m/^zfs error:.*: dataset does not exist.*$/) {
            # nothing left to delete
            $err = undef;
            last;
        }

        die $err;
    }

    die $err if $err;
}
348
# List volumes and filesystems, grouped by the pool they live in.
#
# The output of 'zfs list' is parsed by zfs_parse_zvol_list.
#
# Returns undef if the parser found nothing, otherwise a hash reference
#   $list->{$pool}->{$name} = { name, size, parent, format, vmid }
# 'parent' is the origin of the dataset; the leading "<pool>/" of the
# configured pool is removed from it.
sub zfs_list_zvol {
    my ($class, $scfg) = @_;

    my $text = $class->zfs_request($scfg, 10, 'list', '-o', 'name,volsize,origin,type,refquota', '-t', 'volume,filesystem', '-Hr');
    my $zvols = zfs_parse_zvol_list($text);
    return undef if !$zvols;

    my $list;
    foreach my $zvol (@$zvols) {
        my $pool = $zvol->{pool};
        my $name = $zvol->{name};

        my $parent = $zvol->{origin};
        # \Q..\E: the pool name is literal text, not a pattern
        if ($parent && $parent =~ m/^\Q$scfg->{pool}\E\/(\S+)$/) {
            $parent = $1;
        }

        $list->{$pool}->{$name} = {
            name => $name,
            size => $zvol->{size},
            parent => $parent,
            format => $zvol->{format},
            vmid => $zvol->{owner},
        };
    }

    return $list;
}
376
# Find an unused disk name for the guest $vmid.
#
# All datasets of the configured pool named like
# (vm|base|subvol|basevol)-<vmid>-disk-<n> reserve the number <n>. The
# first number from 1 to 99 that is not reserved is used.
#
# Returns "subvol-<vmid>-disk-<n>" if $format is 'subvol', otherwise
# "vm-<vmid>-disk-<n>". Dies if all numbers are taken.
sub zfs_find_free_diskname {
    my ($class, $storeid, $scfg, $vmid, $format) = @_;

    my $volumes = $class->zfs_list_zvol($scfg);
    my $dat = $volumes->{$scfg->{pool}};

    my %taken;
    foreach my $image (keys %$dat) {
        my $volname = $dat->{$image}->{name};
        $taken{$2} = 1 if $volname =~ m/(vm|base|subvol|basevol)-$vmid-disk-(\d+)/;
    }

    my $prefix = $format eq 'subvol' ? 'subvol' : 'vm';

    foreach my $i (1 .. 99) {
        return "$prefix-$vmid-disk-$i" if !$taken{$i};
    }

    die "unable to allocate an image name for VM $vmid in storage '$storeid'\n";
}
401
2fc59177
DM
# Determine the name of the most recently created snapshot of a volume.
#
# Snapshots are listed sorted by creation time ('-s creation'), so the
# last line that belongs to the volume wins. A line only belongs to the
# volume if it starts with exactly "<pool>/<name>@"; this keeps e.g.
# "vm-100-disk-1" from picking up the snapshots of "vm-100-disk-10".
#
# Returns the snapshot name (the part after '@'), or undef if no listed
# snapshot belongs to the volume.
sub zfs_get_latest_snapshot {
    my ($class, $scfg, $volname) = @_;

    my $vname = ($class->parse_volname($volname))[1];

    # abort rollback if snapshot is not the latest
    my @params = ('-t', 'snapshot', '-o', 'name', '-s', 'creation');
    my $text = $class->zfs_request($scfg, undef, 'list', @params);

    my $dataset = "$scfg->{pool}/$vname";

    my $recentsnap;
    foreach my $line (split(/\n/, $text)) {
        # \Q..\E: the dataset name is literal text, not a pattern
        if ($line =~ m/^\Q$dataset\E\@(.+)$/) {
            $recentsnap = $1;
        }
    }

    return $recentsnap;
}
422
b5e5f7e3
DM
# Report the usage of the storage.
#
# Returns ($total, $free, $used, $active), where $total is the sum of the
# free and used values reported by zfs_get_pool_stats. If that call dies
# the error is only printed as a warning and all four values stay 0.
sub status {
    my ($class, $storeid, $scfg, $cache) = @_;

    my %stat = (total => 0, free => 0, used => 0, active => 0);

    eval {
        @stat{qw(free used)} = $class->zfs_get_pool_stats($scfg);
        $stat{active} = 1;
        $stat{total} = $stat{free} + $stat{used};
    };
    if (my $err = $@) {
        warn $err;
    }

    return @stat{qw(total free used active)};
}
440
# Return the size of a volume: the value of the 'refquota' property for
# the 'subvol' format, of the 'volsize' property otherwise, as printed by
# 'zfs get -Hp'.
#
# Dies if the property value cannot be found in the command output.
sub volume_size_info {
    my ($class, $scfg, $storeid, $volname, $timeout) = @_;

    my @parsed = $class->parse_volname($volname);
    my ($vname, $format) = @parsed[1, 6];

    my $attr = 'volsize';
    $attr = 'refquota' if $format eq 'subvol';

    my $text = $class->zfs_request($scfg, undef, 'get', '-Hp', $attr, "$scfg->{pool}/$vname");

    my ($size) = $text =~ /\s$attr\s(\d+)\s/;
    die "Could not get zfs volume size\n" if !defined($size);

    return $size;
}
455
# Create the snapshot "<pool>/<name>@<snap>" of a volume.
sub volume_snapshot {
    my ($class, $scfg, $storeid, $volname, $snap) = @_;

    my (undef, $vname) = $class->parse_volname($volname);

    my $target = "$scfg->{pool}/$vname\@$snap";

    $class->zfs_request($scfg, undef, 'snapshot', $target);
}
463
# Delete the snapshot "<pool>/<name>@<snap>" of a volume. deactivate_volume
# is called for the snapshot first.
sub volume_snapshot_delete {
    my ($class, $scfg, $storeid, $volname, $snap, $running) = @_;

    my (undef, $vname) = $class->parse_volname($volname);

    $class->deactivate_volume($storeid, $scfg, $vname, $snap, {});

    my $target = "$scfg->{pool}/$vname\@$snap";

    $class->zfs_request($scfg, undef, 'destroy', $target);
}
472
2b40ffae
WL
# Roll a volume back to the snapshot "<pool>/<name>@<snap>".
sub volume_snapshot_rollback {
    my ($class, $scfg, $storeid, $volname, $snap) = @_;

    my (undef, $vname) = $class->parse_volname($volname);

    my $target = "$scfg->{pool}/$vname\@$snap";

    $class->zfs_request($scfg, undef, 'rollback', $target);
}
480
# Check whether a volume can be rolled back to the snapshot $snap, which
# is only the case if $snap is the snapshot reported by
# zfs_get_latest_snapshot.
#
# Returns 1 if the rollback is possible. Dies if no snapshot was found for
# the volume or if $snap is not the latest one.
sub volume_rollback_is_possible {
    my ($class, $scfg, $storeid, $volname, $snap) = @_;

    my $recentsnap = $class->zfs_get_latest_snapshot($scfg, $volname);

    # undef means that no snapshot of this volume was found at all
    die "can't rollback, no snapshot found for volume '$volname'\n"
        if !defined($recentsnap);

    die "can't rollback, more recent snapshots exist\n"
        if $snap ne $recentsnap;

    return 1;
}
491
0a3d992f
DM
# Make sure the pool of this storage is imported.
#
# The names printed by 'zpool list -o name -H' are compared literally with
# the pool part of the 'pool' option. If the pool is not listed,
# 'zpool import -d /dev/disk/by-id/ -a' is run.
#
# Always returns 1.
sub activate_storage {
    my ($class, $storeid, $scfg, $cache) = @_;

    my @param = ('-o', 'name', '-H');

    my $text = $class->zfs_request($scfg, undef, 'zpool_list', @param);

    # Note: $scfg->{pool} can include dataset <pool>/<dataset>
    my $pool = $scfg->{pool};
    $pool =~ s!/.*$!!;

    # compare whole names: a pattern match would accept pool "tank" when
    # only "tank2" is imported
    my $imported = 0;
    foreach my $line (split(/\n/, $text)) {
        $line =~ s/\s+$//;
        if ($line eq $pool) {
            $imported = 1;
            last;
        }
    }

    if (!$imported) {
        run_command("zpool import -d /dev/disk/by-id/ -a");
    }

    return 1;
}
508
# Nothing is done when the storage is deactivated; always returns 1.
sub deactivate_storage {
    my ($class, $storeid, $scfg, $cache) = @_;

    my $done = 1;
    return $done;
}
513
# Nothing is done to activate a volume; always returns 1.
sub activate_volume {
    my ($class, $storeid, $scfg, $volname, $snapname, $cache) = @_;

    my $done = 1;
    return $done;
}
518
# Nothing is done to deactivate a volume; always returns 1.
sub deactivate_volume {
    my ($class, $storeid, $scfg, $volname, $snapname, $cache) = @_;

    my $done = 1;
    return $done;
}
5bb8e010 523
d3a282e8
WL
# Create a clone of a base volume for the guest $vmid.
#
# $snap - snapshot of the base volume to clone from, '__base__' if unset
#
# The clone gets a free name from zfs_find_free_diskname. For the
# 'subvol' format the refquota of the base volume is read and set on the
# clone as well.
#
# Returns "<basename>/<name>". Dies if $volname is not a base volume.
sub clone_image {
    my ($class, $scfg, $storeid, $volname, $vmid, $snap) = @_;

    $snap = '__base__' if !$snap;

    my @parsed = $class->parse_volname($volname);
    my ($basename, $isBase, $format) = @parsed[1, 5, 6];

    die "clone_image only works on base images\n" if !$isBase;

    my $name = $class->zfs_find_free_diskname($storeid, $scfg, $vmid, $format);

    my @clone = ('clone', "$scfg->{pool}/$basename\@$snap", "$scfg->{pool}/$name");

    if ($format eq 'subvol') {
        my $size = $class->zfs_request($scfg, undef, 'list', '-H', '-o', 'refquota', "$scfg->{pool}/$basename");
        chomp($size);
        push @clone, '-o', "refquota=$size";
    }

    $class->zfs_request($scfg, undef, @clone);

    return "$basename/$name";
}
546
# Convert a volume into a base volume.
#
# The dataset is renamed ('subvol-' becomes 'basevol-' for the 'subvol'
# format, 'vm-' becomes 'base-' otherwise) and the snapshot '__base__' is
# created on the renamed dataset.
#
# Returns the new volume name, prefixed with "<basename>/" if the
# original name had such a prefix. Dies if the volume already is a base
# volume.
sub create_base {
    my ($class, $storeid, $scfg, $volname) = @_;

    my $snap = '__base__';

    my @parsed = $class->parse_volname($volname);
    my ($name, $basename, $isBase, $format) = @parsed[1, 3, 5, 6];

    die "create_base not possible with base image\n" if $isBase;

    my $newname = $name;
    $newname =~ s/^subvol-/basevol-/ if $format eq 'subvol';
    $newname =~ s/^vm-/base-/ if $format ne 'subvol';

    my $newvolname = $newname;
    $newvolname = "$basename/$newname" if $basename;

    $class->zfs_request($scfg, undef, 'rename', "$scfg->{pool}/$name", "$scfg->{pool}/$newname");

    # fixme : is create_base always offline ? (no 'running' state is passed)
    $class->volume_snapshot($scfg, $storeid, $newname, $snap, undef);

    return $newvolname;
}
573
a4034b9f
WL
# Resize a volume by setting 'refquota' (format 'subvol') or 'volsize'
# (any other format) to "<n>k", where <n> is $size divided by 1024 and
# truncated to an integer.
# NOTE(review): $size is presumably given in bytes - confirm with callers.
#
# Returns <n>, i.e. the new size in units of 1024.
sub volume_resize {
    my ($class, $scfg, $storeid, $volname, $size, $running) = @_;

    my $new_size = int($size/1024);

    my @parsed = $class->parse_volname($volname);
    my ($vname, $format) = @parsed[1, 6];

    my $attr = 'volsize';
    $attr = 'refquota' if $format eq 'subvol';

    my $dataset = "$scfg->{pool}/$vname";

    $class->zfs_request($scfg, undef, 'set', "$attr=${new_size}k", $dataset);

    return $new_size;
}
588
2b40ffae
WL
# Tell whether $feature is available for a volume.
#
# The volume is looked at as 'snap' if $snapname is set, as 'base' if
# parse_volname reports a base volume, and as 'current' otherwise.
#
# Returns 1 if the feature table lists the feature for that state and
# undef if not.
sub volume_has_feature {
    my ($class, $scfg, $feature, $storeid, $volname, $snapname, $running) = @_;

    my $features = {
        snapshot => { current => 1, snap => 1},
        clone => { base => 1},
        template => { current => 1},
        copy => { base => 1, current => 1},
        sparseinit => { base => 1, current => 1},
    };

    my @parsed = $class->parse_volname($volname);
    my $isBase = $parsed[5];

    my $key = $snapname ? 'snap' : ($isBase ? 'base' : 'current');

    return $features->{$feature}->{$key} ? 1 : undef;
}
615
5bb8e010 6161;